Files
vpp/src/plugins/snort/daq_vpp.c
Alexander Skorichenko a7e01a83be snort: add timestamps to packets
Type: improvement

Change-Id: I810679c8a73c4d1b3fc2cc2300ded46a30d68e8f
Signed-off-by: Alexander Skorichenko <askorichenko@netgate.com>
2024-10-11 14:06:15 +00:00

724 lines
17 KiB
C

/* SPDX-License-Identifier: Apache-2.0
* Copyright(c) 2021 Cisco Systems, Inc.
*/
#define _GNU_SOURCE
#include <string.h>
#include <stdio.h>
#include <stdlib.h>
#include <stdbool.h>
#include <sys/socket.h>
#include <sys/un.h>
#include <sys/mman.h>
#include <sys/time.h>
#include <errno.h>
#include <sys/epoll.h>
#include <vppinfra/cache.h>
#include <daq_dlt.h>
#include <daq_module_api.h>
#include "daq_vpp.h"
#define DAQ_VPP_VERSION 1
#if __x86_64__
#define VPP_DAQ_PAUSE() __builtin_ia32_pause ()
#elif defined(__aarch64__) || defined(__arm__)
#define VPP_DAQ_PAUSE() __asm__("yield")
#else
#define VPP_DAQ_PAUSE()
#endif
static DAQ_VariableDesc_t vpp_variable_descriptions[] = {
{ "debug", "Enable debugging output to stdout",
DAQ_VAR_DESC_FORBIDS_ARGUMENT },
};
static DAQ_BaseAPI_t daq_base_api;
#define SET_ERROR(modinst, ...) daq_base_api.set_errbuf (modinst, __VA_ARGS__)
typedef struct _vpp_msg_pool
{
DAQ_MsgPoolInfo_t info;
} VPPMsgPool;
typedef struct _vpp_desc_data
{
uint32_t index;
uint32_t qpair_index;
DAQ_Msg_t msg;
DAQ_PktHdr_t pkthdr;
} VPPDescData;
typedef struct _vpp_bpool
{
int fd;
uint32_t size;
void *base;
} VPPBufferPool;
typedef struct _vpp_qpair
{
CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
uint32_t queue_size;
daq_vpp_desc_t *descs;
uint32_t *enq_ring;
uint32_t *deq_ring;
volatile uint32_t *enq_head;
volatile uint32_t *deq_head;
uint32_t next_desc;
int enq_fd;
int deq_fd;
VPPDescData *desc_data;
volatile int lock;
} VPPQueuePair;
typedef enum
{
DAQ_VPP_INPUT_MODE_INTERRUPT = 0,
DAQ_VPP_INPUT_MODE_POLLING,
} daq_vpp_input_mode_t;
typedef struct _vpp_context
{
/* config */
bool debug;
/* state */
uint32_t intf_count;
DAQ_ModuleInstance_h modinst;
VPPMsgPool pool;
/* socket */
int sock_fd;
/* shared memory */
uint32_t shm_size;
void *shm_base;
int shm_fd;
/* queue pairs */
uint8_t num_qpairs;
VPPQueuePair *qpairs;
uint32_t next_qpair;
/* epoll */
struct epoll_event *epoll_events;
int epoll_fd;
/* buffer pools */
uint8_t num_bpools;
VPPBufferPool *bpools;
daq_vpp_input_mode_t input_mode;
const char *socket_name;
volatile bool interrupted;
} VPP_Context_t;
static VPP_Context_t *global_vpp_ctx = 0;
static int
vpp_daq_qpair_lock (VPPQueuePair *p)
{
int free = 0;
while (!__atomic_compare_exchange_n (&p->lock, &free, 1, 0, __ATOMIC_ACQUIRE,
__ATOMIC_RELAXED))
{
while (__atomic_load_n (&p->lock, __ATOMIC_RELAXED))
VPP_DAQ_PAUSE ();
free = 0;
}
return 0;
}
static void
vpp_daq_qpair_unlock (VPPQueuePair *p)
{
__atomic_store_n (&p->lock, 0, __ATOMIC_RELEASE);
}
static int
vpp_daq_module_load (const DAQ_BaseAPI_t *base_api)
{
if (base_api->api_version != DAQ_BASE_API_VERSION ||
base_api->api_size != sizeof (DAQ_BaseAPI_t))
return DAQ_ERROR;
daq_base_api = *base_api;
return DAQ_SUCCESS;
}
static int
vpp_daq_module_unload (void)
{
memset (&daq_base_api, 0, sizeof (daq_base_api));
return DAQ_SUCCESS;
}
static int
vpp_daq_get_variable_descs (const DAQ_VariableDesc_t **var_desc_table)
{
*var_desc_table = vpp_variable_descriptions;
return sizeof (vpp_variable_descriptions) / sizeof (DAQ_VariableDesc_t);
}
static int
vpp_daq_recvmsg (int fd, daq_vpp_msg_t *msg, int n_fds, int *fds)
{
const int ctl_sz =
CMSG_SPACE (sizeof (int) * n_fds) + CMSG_SPACE (sizeof (struct ucred));
char ctl[ctl_sz];
struct msghdr mh = {};
struct iovec iov[1];
struct cmsghdr *cmsg;
iov[0].iov_base = (void *) msg;
iov[0].iov_len = sizeof (daq_vpp_msg_t);
mh.msg_iov = iov;
mh.msg_iovlen = 1;
mh.msg_control = ctl;
mh.msg_controllen = ctl_sz;
memset (ctl, 0, ctl_sz);
int rv;
if ((rv = recvmsg (fd, &mh, 0)) != sizeof (daq_vpp_msg_t))
return DAQ_ERROR_NODEV;
cmsg = CMSG_FIRSTHDR (&mh);
while (cmsg)
{
if (cmsg->cmsg_level == SOL_SOCKET)
{
if (cmsg->cmsg_type == SCM_CREDENTIALS)
{
/* Do nothing */;
}
else if (cmsg->cmsg_type == SCM_RIGHTS)
{
memcpy (fds, CMSG_DATA (cmsg), n_fds * sizeof (int));
}
}
cmsg = CMSG_NXTHDR (&mh, cmsg);
}
return DAQ_SUCCESS;
}
static void
vpp_daq_destroy (void *handle)
{
VPP_Context_t *vc = (VPP_Context_t *) handle;
if (vc->shm_base != MAP_FAILED)
munmap (vc->shm_base, vc->shm_size);
if (vc->shm_fd != -1)
close (vc->shm_fd);
if (vc->bpools)
{
for (int i = 0; i < vc->num_bpools; i++)
{
VPPBufferPool *bp = vc->bpools + i;
if (bp->fd != -1)
close (bp->fd);
if (bp->base && bp->base != MAP_FAILED)
munmap (bp->base, bp->size);
}
free (vc->bpools);
}
if (vc->qpairs)
{
for (int i = 0; i < vc->num_qpairs; i++)
{
VPPQueuePair *qp = vc->qpairs + i;
if (qp->enq_fd != -1)
close (qp->enq_fd);
if (qp->deq_fd != -1)
close (qp->deq_fd);
if (qp->desc_data)
free (qp->desc_data);
}
free (vc->qpairs);
}
free (vc->epoll_events);
close (vc->sock_fd);
if (vc->epoll_fd != -1)
close (vc->epoll_fd);
free (vc);
}
#define ERR(rv, ...) \
{ \
SET_ERROR (modinst, __VA_ARGS__); \
rval = rv; \
goto err; \
}
static int
vpp_daq_instantiate (const DAQ_ModuleConfig_h modcfg,
DAQ_ModuleInstance_h modinst, void **ctxt_ptr)
{
VPP_Context_t *vc = 0;
int rval = DAQ_ERROR;
daq_vpp_msg_t msg;
struct sockaddr_un sun = { .sun_family = AF_UNIX };
int i, fd = -1, shm_fd = -1;
const char *input;
uint8_t *base;
if (global_vpp_ctx)
{
*ctxt_ptr = global_vpp_ctx;
return DAQ_SUCCESS;
}
vc = calloc (1, sizeof (VPP_Context_t));
if (!vc)
ERR (DAQ_ERROR_NOMEM,
"%s: Couldn't allocate memory for the new VPP context!", __func__);
const char *varKey, *varValue;
daq_base_api.config_first_variable (modcfg, &varKey, &varValue);
while (varKey)
{
if (!strcmp (varKey, "debug"))
vc->debug = true;
else if (!strcmp (varKey, "input_mode"))
{
if (!strcmp (varValue, "interrupt"))
vc->input_mode = DAQ_VPP_INPUT_MODE_INTERRUPT;
else if (!strcmp (varValue, "polling"))
vc->input_mode = DAQ_VPP_INPUT_MODE_POLLING;
}
else if (!strcmp (varKey, "socket_name"))
{
vc->socket_name = varValue;
}
daq_base_api.config_next_variable (modcfg, &varKey, &varValue);
}
input = daq_base_api.config_get_input (modcfg);
if (!vc->socket_name)
/* try to use default socket path */
vc->socket_name = DAQ_VPP_DEFAULT_SOCKET_PATH;
if ((fd = socket (AF_UNIX, SOCK_SEQPACKET, 0)) < 0)
ERR (DAQ_ERROR_NODEV, "%s: Couldn't create socket!", __func__);
strncpy (sun.sun_path, vc->socket_name, sizeof (sun.sun_path) - 1);
if (connect (fd, (struct sockaddr *) &sun, sizeof (struct sockaddr_un)) != 0)
ERR (DAQ_ERROR_NODEV, "%s: Couldn't connect to socket! '%s'", __func__,
vc->socket_name);
/* craft and send connect message */
msg.type = DAQ_VPP_MSG_TYPE_HELLO;
snprintf ((char *) &msg.hello.inst_name, DAQ_VPP_INST_NAME_LEN - 1, "%s",
input);
if (send (fd, &msg, sizeof (msg), 0) != sizeof (msg))
ERR (DAQ_ERROR_NODEV, "%s: Couldn't send connect message!", __func__);
/* receive config message */
rval = vpp_daq_recvmsg (fd, &msg, 1, &shm_fd);
if (rval != DAQ_SUCCESS || msg.type != DAQ_VPP_MSG_TYPE_CONFIG ||
shm_fd == -1)
ERR (DAQ_ERROR_NODEV, "%s: Couldn't receive config message!", __func__);
vc->modinst = modinst;
vc->sock_fd = fd;
vc->epoll_fd = -1;
vc->intf_count = 1;
vc->num_bpools = msg.config.num_bpools;
vc->num_qpairs = msg.config.num_qpairs;
vc->shm_size = msg.config.shm_size;
vc->shm_fd = shm_fd;
vc->bpools = calloc (vc->num_bpools, sizeof (VPPBufferPool));
vc->qpairs = calloc (vc->num_qpairs, sizeof (VPPQueuePair));
vc->epoll_events = calloc (vc->num_qpairs, sizeof (struct epoll_event));
if (vc->bpools == 0 || vc->qpairs == 0)
ERR (DAQ_ERROR_NOMEM,
"%s: Couldn't allocate memory for the new VPP context!", __func__);
for (i = 0; i < vc->num_bpools; i++)
vc->bpools[i].fd = -1;
base =
mmap (0, vc->shm_size, PROT_READ | PROT_WRITE, MAP_SHARED, vc->shm_fd, 0);
if (base == MAP_FAILED)
ERR (DAQ_ERROR_NOMEM,
"%s: Couldn't map shared memory for the new VPP context!", __func__);
vc->shm_base = base;
if (vc->debug)
{
printf ("[%s]\n", input);
printf (" Shared memory size: %u\n", vc->shm_size);
printf (" Number of buffer pools: %u\n", vc->num_bpools);
printf (" Number of queue pairs: %u\n", vc->num_qpairs);
}
/* receive buffer pools */
for (int i = 0; i < vc->num_bpools; i++)
{
VPPBufferPool *bp = vc->bpools + i;
rval = vpp_daq_recvmsg (fd, &msg, 1, &bp->fd);
if (rval != DAQ_SUCCESS || msg.type != DAQ_VPP_MSG_TYPE_BPOOL ||
bp->fd == -1)
ERR (DAQ_ERROR_NODEV,
"%s: Failed to receive buffer pool message for the new "
"VPP context!",
__func__);
bp->size = msg.bpool.size;
bp->base = mmap (0, bp->size, PROT_READ, MAP_SHARED, bp->fd, 0);
if (bp->base == MAP_FAILED)
ERR (DAQ_ERROR_NOMEM,
"%s: Couldn't map shared memory for the new VPP context!",
__func__);
if (vc->debug)
printf (" Buffer pool %u size: %u\n", i, bp->size);
}
if ((vc->epoll_fd = epoll_create (1)) == -1)
ERR (DAQ_ERROR_NODEV,
"%s: Couldn't create epoll fd for the new VPP context!", __func__);
/* receive queue pairs */
for (int i = 0; i < vc->num_qpairs; i++)
{
struct epoll_event ev = { .events = EPOLLIN };
int fds[2] = { -1, -1 };
uint32_t qsz;
VPPQueuePair *qp = vc->qpairs + i;
rval = vpp_daq_recvmsg (fd, &msg, 2, fds);
if (rval != DAQ_SUCCESS || msg.type != DAQ_VPP_MSG_TYPE_QPAIR ||
fds[0] == -1 || fds[1] == -1)
ERR (DAQ_ERROR_NODEV,
"%s: Failed to receive queu pair message for the new "
"VPP context!",
__func__);
qp->queue_size = 1 << msg.qpair.log2_queue_size;
qp->descs = (daq_vpp_desc_t *) (base + msg.qpair.desc_table_offset);
qp->enq_ring = (uint32_t *) (base + msg.qpair.enq_ring_offset);
qp->deq_ring = (uint32_t *) (base + msg.qpair.deq_ring_offset);
qp->enq_head = (uint32_t *) (base + msg.qpair.enq_head_offset);
qp->deq_head = (uint32_t *) (base + msg.qpair.deq_head_offset);
qp->enq_fd = fds[0];
qp->deq_fd = fds[1];
ev.data.u32 = i;
if (epoll_ctl (vc->epoll_fd, EPOLL_CTL_ADD, qp->enq_fd, &ev) == -1)
ERR (DAQ_ERROR_NODEV,
"%s: Failed to dequeue fd to epoll instance for the new "
"VPP context!",
__func__);
qsz = qp->queue_size;
qp->desc_data = calloc (qsz, sizeof (VPPDescData));
if (!qp->desc_data)
ERR (DAQ_ERROR_NOMEM,
"%s: Couldn't allocate memory for the new VPP context!",
__func__);
for (int j = 0; j < qsz; j++)
{
VPPDescData *dd = qp->desc_data + j;
DAQ_PktHdr_t *pkthdr = &dd->pkthdr;
DAQ_Msg_t *msg = &dd->msg;
dd->index = j;
dd->qpair_index = i;
pkthdr->ingress_group = DAQ_PKTHDR_UNKNOWN;
pkthdr->egress_group = DAQ_PKTHDR_UNKNOWN;
msg->type = DAQ_MSG_TYPE_PACKET;
msg->hdr_len = sizeof (DAQ_PktHdr_t);
msg->hdr = pkthdr;
msg->owner = vc->modinst;
msg->priv = dd;
}
if (vc->debug)
{
printf (" Queue pair %u:\n", i);
printf (" Size: %u\n", qp->queue_size);
printf (" Enqueue fd: %u\n", qp->enq_fd);
printf (" Dequeue fd: %u\n", qp->deq_fd);
}
}
*ctxt_ptr = global_vpp_ctx = vc;
return DAQ_SUCCESS;
err:
if (vc)
vpp_daq_destroy (vc);
else if (fd != -1)
close (fd);
return rval;
}
static int
vpp_daq_start (void *handle)
{
return DAQ_SUCCESS;
}
static int
vpp_daq_interrupt (void *handle)
{
VPP_Context_t *vc = (VPP_Context_t *) handle;
vc->interrupted = true;
return DAQ_SUCCESS;
}
static int
vpp_daq_get_stats (void *handle, DAQ_Stats_t *stats)
{
memset (stats, 0, sizeof (DAQ_Stats_t));
return DAQ_SUCCESS;
}
static void
vpp_daq_reset_stats (void *handle)
{
}
static uint32_t
vpp_daq_get_capabilities (void *handle)
{
uint32_t capabilities = DAQ_CAPA_BLOCK | DAQ_CAPA_UNPRIV_START;
return capabilities;
}
static int
vpp_daq_get_datalink_type (void *handle)
{
return DLT_IPV4;
}
static inline uint32_t
vpp_daq_msg_receive_one (VPP_Context_t *vc, VPPQueuePair *qp,
const DAQ_Msg_t *msgs[], unsigned max_recv)
{
uint32_t n_recv, n_left;
uint32_t head, next, mask = qp->queue_size - 1;
struct timeval tv;
if (max_recv == 0)
return 0;
vpp_daq_qpair_lock (qp);
next = qp->next_desc;
head = __atomic_load_n (qp->enq_head, __ATOMIC_ACQUIRE);
n_recv = n_left = head - next;
if (n_left > max_recv)
{
n_left = n_recv = max_recv;
}
gettimeofday (&tv, NULL);
while (n_left--)
{
uint32_t desc_index = qp->enq_ring[next & mask];
daq_vpp_desc_t *d = qp->descs + desc_index;
VPPDescData *dd = qp->desc_data + desc_index;
dd->pkthdr.ts.tv_sec = tv.tv_sec;
dd->pkthdr.ts.tv_usec = tv.tv_usec;
dd->pkthdr.pktlen = d->length;
dd->pkthdr.address_space_id = d->address_space_id;
dd->msg.data = vc->bpools[d->buffer_pool].base + d->offset;
dd->msg.data_len = d->length;
next = next + 1;
msgs[0] = &dd->msg;
msgs++;
}
qp->next_desc = next;
vpp_daq_qpair_unlock (qp);
return n_recv;
}
static unsigned
vpp_daq_msg_receive (void *handle, const unsigned max_recv,
const DAQ_Msg_t *msgs[], DAQ_RecvStatus *rstat)
{
VPP_Context_t *vc = (VPP_Context_t *) handle;
uint32_t n_qpairs_left = vc->num_qpairs;
uint32_t n, n_recv = 0;
int32_t n_events;
/* If the receive has been interrupted, break out of loop and return. */
if (vc->interrupted)
{
vc->interrupted = false;
*rstat = DAQ_RSTAT_INTERRUPTED;
return 0;
}
/* first, we visit all qpairs. If we find any work there then we can give
* it back immediatelly. To avoid bias towards qpair 0 we remeber what
* next qpair */
while (n_qpairs_left)
{
VPPQueuePair *qp = vc->qpairs + vc->next_qpair;
if ((n = vpp_daq_msg_receive_one (vc, qp, msgs, max_recv - n_recv)))
{
msgs += n;
n_recv += n;
}
/* next */
vc->next_qpair++;
if (vc->next_qpair == vc->num_qpairs)
vc->next_qpair = 0;
n_qpairs_left--;
}
if (vc->input_mode == DAQ_VPP_INPUT_MODE_POLLING)
{
*rstat = DAQ_RSTAT_OK;
return n_recv;
}
if (n_recv)
{
*rstat = DAQ_RSTAT_OK;
return n_recv;
}
n_events = epoll_wait (vc->epoll_fd, vc->epoll_events, vc->num_qpairs, 1000);
if (n_events == 0)
{
*rstat = DAQ_RSTAT_TIMEOUT;
return 0;
}
if (n_events < 0)
{
*rstat = errno == EINTR ? DAQ_RSTAT_TIMEOUT : DAQ_RSTAT_ERROR;
return 0;
}
for (int i = 0; i < n_events; i++)
{
uint64_t ctr;
VPPQueuePair *qp = vc->qpairs + vc->epoll_events[i].data.u32;
if ((n = vpp_daq_msg_receive_one (vc, qp, msgs, max_recv - n_recv)))
{
msgs += n;
n_recv += n;
}
ssize_t __clib_unused size = read (qp->enq_fd, &ctr, sizeof (ctr));
}
*rstat = DAQ_RSTAT_OK;
return n_recv;
}
static int
vpp_daq_msg_finalize (void *handle, const DAQ_Msg_t *msg, DAQ_Verdict verdict)
{
VPP_Context_t *vc = (VPP_Context_t *) handle;
VPPDescData *dd = msg->priv;
VPPQueuePair *qp = vc->qpairs + dd->qpair_index;
daq_vpp_desc_t *d;
uint32_t mask, head;
uint64_t counter_increment = 1;
int rv, retv = DAQ_SUCCESS;
vpp_daq_qpair_lock (qp);
mask = qp->queue_size - 1;
head = *qp->deq_head;
d = qp->descs + dd->index;
if (verdict == DAQ_VERDICT_PASS)
d->action = DAQ_VPP_ACTION_FORWARD;
else
d->action = DAQ_VPP_ACTION_DROP;
qp->deq_ring[head & mask] = dd->index;
head = head + 1;
__atomic_store_n (qp->deq_head, head, __ATOMIC_RELEASE);
if (vc->input_mode == DAQ_VPP_INPUT_MODE_INTERRUPT)
{
rv = write (qp->deq_fd, &counter_increment, sizeof (counter_increment));
if (rv != sizeof (counter_increment))
retv = DAQ_ERROR;
}
vpp_daq_qpair_unlock (qp);
return retv;
}
static int
vpp_daq_get_msg_pool_info (void *handle, DAQ_MsgPoolInfo_t *info)
{
VPP_Context_t *vc = (VPP_Context_t *) handle;
vc->pool.info.available = 128;
vc->pool.info.size = 256;
*info = vc->pool.info;
return DAQ_SUCCESS;
}
DAQ_SO_PUBLIC
const DAQ_ModuleAPI_t DAQ_MODULE_DATA = {
/* .api_version = */ DAQ_MODULE_API_VERSION,
/* .api_size = */ sizeof (DAQ_ModuleAPI_t),
/* .module_version = */ DAQ_VPP_VERSION,
/* .name = */ "vpp",
/* .type = */ DAQ_TYPE_INTF_CAPABLE | DAQ_TYPE_INLINE_CAPABLE |
DAQ_TYPE_MULTI_INSTANCE,
/* .load = */ vpp_daq_module_load,
/* .unload = */ vpp_daq_module_unload,
/* .get_variable_descs = */ vpp_daq_get_variable_descs,
/* .instantiate = */ vpp_daq_instantiate,
/* .destroy = */ vpp_daq_destroy,
/* .set_filter = */ NULL,
/* .start = */ vpp_daq_start,
/* .inject = */ NULL,
/* .inject_relative = */ NULL,
/* .interrupt = */ vpp_daq_interrupt,
/* .stop = */ NULL,
/* .ioctl = */ NULL,
/* .get_stats = */ vpp_daq_get_stats,
/* .reset_stats = */ vpp_daq_reset_stats,
/* .get_snaplen = */ NULL,
/* .get_capabilities = */ vpp_daq_get_capabilities,
/* .get_datalink_type = */ vpp_daq_get_datalink_type,
/* .config_load = */ NULL,
/* .config_swap = */ NULL,
/* .config_free = */ NULL,
/* .msg_receive = */ vpp_daq_msg_receive,
/* .msg_finalize = */ vpp_daq_msg_finalize,
/* .get_msg_pool_info = */ vpp_daq_get_msg_pool_info,
};