347 lines
9.0 KiB
C
347 lines
9.0 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
#include <assert.h>
|
|
#include <errno.h>
|
|
#include <error.h>
|
|
#include <fcntl.h>
|
|
#include <inttypes.h>
|
|
#include <limits.h>
|
|
#include <stdlib.h>
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <unistd.h>
|
|
#include <ynl.h>
|
|
|
|
#include <arpa/inet.h>
|
|
#include <netinet/in.h>
|
|
|
|
#include <sys/epoll.h>
|
|
#include <sys/ioctl.h>
|
|
#include <sys/socket.h>
|
|
#include <sys/types.h>
|
|
|
|
#include <linux/genetlink.h>
|
|
#include <linux/netlink.h>
|
|
|
|
#include "netdev-user.h"
|
|
|
|
/* The below ifdef blob is required because:
|
|
*
|
|
* - sys/epoll.h does not (yet) have the ioctl definitions included. So,
|
|
* systems with older glibcs will not have them available. However,
|
|
* sys/epoll.h does include the type definition for epoll_data, which is
|
|
* needed by the user program (e.g. epoll_event.data.fd)
|
|
*
|
|
* - linux/eventpoll.h does not define the epoll_data type, it is simply an
|
|
* opaque __u64. It does, however, include the ioctl definition.
|
|
*
|
|
* Including both headers is impossible (types would be redefined), so I've
|
|
* opted instead to take sys/epoll.h, and include the blob below.
|
|
*
|
|
* Someday, when glibc is globally up to date, the blob below can be removed.
|
|
*/
|
|
#if !defined(EPOLL_IOC_TYPE)
|
|
struct epoll_params {
|
|
uint32_t busy_poll_usecs;
|
|
uint16_t busy_poll_budget;
|
|
uint8_t prefer_busy_poll;
|
|
|
|
/* pad the struct to a multiple of 64bits */
|
|
uint8_t __pad;
|
|
};
|
|
|
|
#define EPOLL_IOC_TYPE 0x8A
|
|
#define EPIOCSPARAMS _IOW(EPOLL_IOC_TYPE, 0x01, struct epoll_params)
|
|
#define EPIOCGPARAMS _IOR(EPOLL_IOC_TYPE, 0x02, struct epoll_params)
|
|
#endif
|
|
|
|
static uint32_t cfg_port = 8000;
|
|
static struct in_addr cfg_bind_addr = { .s_addr = INADDR_ANY };
|
|
static char *cfg_outfile;
|
|
static int cfg_max_events = 8;
|
|
static int cfg_ifindex;
|
|
|
|
/* busy poll params */
|
|
static uint32_t cfg_busy_poll_usecs;
|
|
static uint32_t cfg_busy_poll_budget;
|
|
static uint32_t cfg_prefer_busy_poll;
|
|
|
|
/* IRQ params */
|
|
static uint32_t cfg_defer_hard_irqs;
|
|
static uint64_t cfg_gro_flush_timeout;
|
|
static uint64_t cfg_irq_suspend_timeout;
|
|
|
|
static void usage(const char *filepath)
|
|
{
|
|
error(1, 0,
|
|
"Usage: %s -p<port> -b<addr> -m<max_events> -u<busy_poll_usecs> -P<prefer_busy_poll> -g<busy_poll_budget> -o<outfile> -d<defer_hard_irqs> -r<gro_flush_timeout> -s<irq_suspend_timeout> -i<ifindex>",
|
|
filepath);
|
|
}
|
|
|
|
static void parse_opts(int argc, char **argv)
|
|
{
|
|
int ret;
|
|
int c;
|
|
|
|
if (argc <= 1)
|
|
usage(argv[0]);
|
|
|
|
while ((c = getopt(argc, argv, "p:m:b:u:P:g:o:d:r:s:i:")) != -1) {
|
|
switch (c) {
|
|
case 'u':
|
|
cfg_busy_poll_usecs = strtoul(optarg, NULL, 0);
|
|
if (cfg_busy_poll_usecs == ULONG_MAX ||
|
|
cfg_busy_poll_usecs > UINT32_MAX)
|
|
error(1, ERANGE, "busy_poll_usecs too large");
|
|
break;
|
|
case 'P':
|
|
cfg_prefer_busy_poll = strtoul(optarg, NULL, 0);
|
|
if (cfg_prefer_busy_poll == ULONG_MAX ||
|
|
cfg_prefer_busy_poll > 1)
|
|
error(1, ERANGE,
|
|
"prefer busy poll should be 0 or 1");
|
|
break;
|
|
case 'g':
|
|
cfg_busy_poll_budget = strtoul(optarg, NULL, 0);
|
|
if (cfg_busy_poll_budget == ULONG_MAX ||
|
|
cfg_busy_poll_budget > UINT16_MAX)
|
|
error(1, ERANGE,
|
|
"busy poll budget must be [0, UINT16_MAX]");
|
|
break;
|
|
case 'p':
|
|
cfg_port = strtoul(optarg, NULL, 0);
|
|
if (cfg_port > UINT16_MAX)
|
|
error(1, ERANGE, "port must be <= 65535");
|
|
break;
|
|
case 'b':
|
|
ret = inet_aton(optarg, &cfg_bind_addr);
|
|
if (ret == 0)
|
|
error(1, errno,
|
|
"bind address %s invalid", optarg);
|
|
break;
|
|
case 'o':
|
|
cfg_outfile = strdup(optarg);
|
|
if (!cfg_outfile)
|
|
error(1, 0, "outfile invalid");
|
|
break;
|
|
case 'm':
|
|
cfg_max_events = strtol(optarg, NULL, 0);
|
|
|
|
if (cfg_max_events == LONG_MIN ||
|
|
cfg_max_events == LONG_MAX ||
|
|
cfg_max_events <= 0)
|
|
error(1, ERANGE,
|
|
"max events must be > 0 and < LONG_MAX");
|
|
break;
|
|
case 'd':
|
|
cfg_defer_hard_irqs = strtoul(optarg, NULL, 0);
|
|
|
|
if (cfg_defer_hard_irqs == ULONG_MAX ||
|
|
cfg_defer_hard_irqs > INT32_MAX)
|
|
error(1, ERANGE,
|
|
"defer_hard_irqs must be <= INT32_MAX");
|
|
break;
|
|
case 'r':
|
|
cfg_gro_flush_timeout = strtoull(optarg, NULL, 0);
|
|
|
|
if (cfg_gro_flush_timeout == ULLONG_MAX)
|
|
error(1, ERANGE,
|
|
"gro_flush_timeout must be < ULLONG_MAX");
|
|
break;
|
|
case 's':
|
|
cfg_irq_suspend_timeout = strtoull(optarg, NULL, 0);
|
|
|
|
if (cfg_irq_suspend_timeout == ULLONG_MAX)
|
|
error(1, ERANGE,
|
|
"irq_suspend_timeout must be < ULLONG_MAX");
|
|
break;
|
|
case 'i':
|
|
cfg_ifindex = strtoul(optarg, NULL, 0);
|
|
if (cfg_ifindex == ULONG_MAX)
|
|
error(1, ERANGE,
|
|
"ifindex must be < ULONG_MAX");
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (!cfg_ifindex)
|
|
usage(argv[0]);
|
|
|
|
if (optind != argc)
|
|
usage(argv[0]);
|
|
}
|
|
|
|
static void epoll_ctl_add(int epfd, int fd, uint32_t events)
|
|
{
|
|
struct epoll_event ev;
|
|
|
|
ev.events = events;
|
|
ev.data.fd = fd;
|
|
if (epoll_ctl(epfd, EPOLL_CTL_ADD, fd, &ev) == -1)
|
|
error(1, errno, "epoll_ctl add fd: %d", fd);
|
|
}
|
|
|
|
static void setnonblock(int sockfd)
|
|
{
|
|
int flags;
|
|
|
|
flags = fcntl(sockfd, F_GETFL, 0);
|
|
|
|
if (fcntl(sockfd, F_SETFL, flags | O_NONBLOCK) == -1)
|
|
error(1, errno, "unable to set socket to nonblocking mode");
|
|
}
|
|
|
|
static void write_chunk(int fd, char *buf, ssize_t buflen)
|
|
{
|
|
ssize_t remaining = buflen;
|
|
char *buf_offset = buf;
|
|
ssize_t writelen = 0;
|
|
ssize_t write_result;
|
|
|
|
while (writelen < buflen) {
|
|
write_result = write(fd, buf_offset, remaining);
|
|
if (write_result == -1)
|
|
error(1, errno, "unable to write data to outfile");
|
|
|
|
writelen += write_result;
|
|
remaining -= write_result;
|
|
buf_offset += write_result;
|
|
}
|
|
}
|
|
|
|
static void setup_queue(void)
|
|
{
|
|
struct netdev_napi_get_list *napi_list = NULL;
|
|
struct netdev_napi_get_req_dump *req = NULL;
|
|
struct netdev_napi_set_req *set_req = NULL;
|
|
struct ynl_sock *ys;
|
|
struct ynl_error yerr;
|
|
uint32_t napi_id;
|
|
|
|
ys = ynl_sock_create(&ynl_netdev_family, &yerr);
|
|
if (!ys)
|
|
error(1, 0, "YNL: %s", yerr.msg);
|
|
|
|
req = netdev_napi_get_req_dump_alloc();
|
|
netdev_napi_get_req_dump_set_ifindex(req, cfg_ifindex);
|
|
napi_list = netdev_napi_get_dump(ys, req);
|
|
|
|
/* assume there is 1 NAPI configured and take the first */
|
|
if (napi_list->obj._present.id)
|
|
napi_id = napi_list->obj.id;
|
|
else
|
|
error(1, 0, "napi ID not present?");
|
|
|
|
set_req = netdev_napi_set_req_alloc();
|
|
netdev_napi_set_req_set_id(set_req, napi_id);
|
|
netdev_napi_set_req_set_defer_hard_irqs(set_req, cfg_defer_hard_irqs);
|
|
netdev_napi_set_req_set_gro_flush_timeout(set_req,
|
|
cfg_gro_flush_timeout);
|
|
netdev_napi_set_req_set_irq_suspend_timeout(set_req,
|
|
cfg_irq_suspend_timeout);
|
|
|
|
if (netdev_napi_set(ys, set_req))
|
|
error(1, 0, "can't set NAPI params: %s\n", yerr.msg);
|
|
|
|
netdev_napi_get_list_free(napi_list);
|
|
netdev_napi_get_req_dump_free(req);
|
|
netdev_napi_set_req_free(set_req);
|
|
ynl_sock_destroy(ys);
|
|
}
|
|
|
|
static void run_poller(void)
|
|
{
|
|
struct epoll_event events[cfg_max_events];
|
|
struct epoll_params epoll_params = {0};
|
|
struct sockaddr_in server_addr;
|
|
int i, epfd, nfds;
|
|
ssize_t readlen;
|
|
int outfile_fd;
|
|
char buf[1024];
|
|
int sockfd;
|
|
int conn;
|
|
int val;
|
|
|
|
outfile_fd = open(cfg_outfile, O_WRONLY | O_CREAT, 0644);
|
|
if (outfile_fd == -1)
|
|
error(1, errno, "unable to open outfile: %s", cfg_outfile);
|
|
|
|
sockfd = socket(AF_INET, SOCK_STREAM, IPPROTO_TCP);
|
|
if (sockfd == -1)
|
|
error(1, errno, "unable to create listen socket");
|
|
|
|
server_addr.sin_family = AF_INET;
|
|
server_addr.sin_port = htons(cfg_port);
|
|
server_addr.sin_addr = cfg_bind_addr;
|
|
|
|
/* these values are range checked during parse_opts, so casting is safe
|
|
* here
|
|
*/
|
|
epoll_params.busy_poll_usecs = cfg_busy_poll_usecs;
|
|
epoll_params.busy_poll_budget = (uint16_t)cfg_busy_poll_budget;
|
|
epoll_params.prefer_busy_poll = (uint8_t)cfg_prefer_busy_poll;
|
|
epoll_params.__pad = 0;
|
|
|
|
val = 1;
|
|
if (setsockopt(sockfd, SOL_SOCKET, SO_REUSEADDR, &val, sizeof(val)))
|
|
error(1, errno, "poller setsockopt reuseaddr");
|
|
|
|
setnonblock(sockfd);
|
|
|
|
if (bind(sockfd, (struct sockaddr *)&server_addr,
|
|
sizeof(struct sockaddr_in)))
|
|
error(0, errno, "poller bind to port: %d\n", cfg_port);
|
|
|
|
if (listen(sockfd, 1))
|
|
error(1, errno, "poller listen");
|
|
|
|
epfd = epoll_create1(0);
|
|
if (ioctl(epfd, EPIOCSPARAMS, &epoll_params) == -1)
|
|
error(1, errno, "unable to set busy poll params");
|
|
|
|
epoll_ctl_add(epfd, sockfd, EPOLLIN | EPOLLOUT | EPOLLET);
|
|
|
|
for (;;) {
|
|
nfds = epoll_wait(epfd, events, cfg_max_events, -1);
|
|
for (i = 0; i < nfds; i++) {
|
|
if (events[i].data.fd == sockfd) {
|
|
conn = accept(sockfd, NULL, NULL);
|
|
if (conn == -1)
|
|
error(1, errno,
|
|
"accepting incoming connection failed");
|
|
|
|
setnonblock(conn);
|
|
epoll_ctl_add(epfd, conn,
|
|
EPOLLIN | EPOLLET | EPOLLRDHUP |
|
|
EPOLLHUP);
|
|
} else if (events[i].events & EPOLLIN) {
|
|
for (;;) {
|
|
readlen = read(events[i].data.fd, buf,
|
|
sizeof(buf));
|
|
if (readlen > 0)
|
|
write_chunk(outfile_fd, buf,
|
|
readlen);
|
|
else
|
|
break;
|
|
}
|
|
} else {
|
|
/* spurious event ? */
|
|
}
|
|
if (events[i].events & (EPOLLRDHUP | EPOLLHUP)) {
|
|
epoll_ctl(epfd, EPOLL_CTL_DEL,
|
|
events[i].data.fd, NULL);
|
|
close(events[i].data.fd);
|
|
close(outfile_fd);
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
int main(int argc, char *argv[])
|
|
{
|
|
parse_opts(argc, argv);
|
|
setup_queue();
|
|
run_poller();
|
|
return 0;
|
|
}
|