Type: refactor Change-Id: I5235bf3e9aff58af6ba2c14e8c6529c4fc9ec86c Signed-off-by: Damjan Marion <damarion@cisco.com>
955 lines
27 KiB
C
955 lines
27 KiB
C
/*
|
|
* Copyright (c) 2020 Doc.ai and/or its affiliates.
|
|
* Copyright (c) 2020 Cisco and/or its affiliates.
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at:
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include <vlib/vlib.h>
|
|
#include <vnet/vnet.h>
|
|
#include <vppinfra/error.h>
|
|
|
|
#include <wireguard/wireguard.h>
|
|
#include <wireguard/wireguard_send.h>
|
|
|
|
#define foreach_wg_output_error \
|
|
_ (NONE, "No error") \
|
|
_ (PEER, "Peer error") \
|
|
_ (KEYPAIR, "Keypair error") \
|
|
_ (NO_BUFFERS, "No buffers") \
|
|
_ (CRYPTO_ENGINE_ERROR, "crypto engine error (packet dropped)")
|
|
|
|
typedef enum
|
|
{
|
|
#define _(sym,str) WG_OUTPUT_ERROR_##sym,
|
|
foreach_wg_output_error
|
|
#undef _
|
|
WG_OUTPUT_N_ERROR,
|
|
} wg_output_error_t;
|
|
|
|
static char *wg_output_error_strings[] = {
|
|
#define _(sym,string) string,
|
|
foreach_wg_output_error
|
|
#undef _
|
|
};
|
|
|
|
typedef enum
|
|
{
|
|
WG_OUTPUT_NEXT_ERROR,
|
|
WG_OUTPUT_NEXT_HANDOFF,
|
|
WG_OUTPUT_NEXT_INTERFACE_OUTPUT,
|
|
WG_OUTPUT_N_NEXT,
|
|
} wg_output_next_t;
|
|
|
|
typedef struct
|
|
{
|
|
index_t peer;
|
|
u8 header[sizeof (ip6_udp_header_t)];
|
|
u8 is_ip4;
|
|
} wg_output_tun_trace_t;
|
|
|
|
typedef struct
|
|
{
|
|
index_t peer;
|
|
u32 next_index;
|
|
} wg_output_tun_post_trace_t;
|
|
|
|
u8 *
|
|
format_ip4_udp_header (u8 * s, va_list * args)
|
|
{
|
|
ip4_udp_header_t *hdr4 = va_arg (*args, ip4_udp_header_t *);
|
|
|
|
s = format (s, "%U:$U", format_ip4_header, &hdr4->ip4, format_udp_header,
|
|
&hdr4->udp);
|
|
return (s);
|
|
}
|
|
|
|
u8 *
|
|
format_ip6_udp_header (u8 *s, va_list *args)
|
|
{
|
|
ip6_udp_header_t *hdr6 = va_arg (*args, ip6_udp_header_t *);
|
|
|
|
s = format (s, "%U:$U", format_ip6_header, &hdr6->ip6, format_udp_header,
|
|
&hdr6->udp);
|
|
return (s);
|
|
}
|
|
|
|
/* packet trace format function */
|
|
static u8 *
|
|
format_wg_output_tun_trace (u8 * s, va_list * args)
|
|
{
|
|
CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
|
|
CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
|
|
|
|
wg_output_tun_trace_t *t = va_arg (*args, wg_output_tun_trace_t *);
|
|
|
|
s = format (s, "peer: %d\n", t->peer);
|
|
s = format (s, " Encrypted packet: ");
|
|
|
|
s = t->is_ip4 ? format (s, "%U", format_ip4_udp_header, t->header) :
|
|
format (s, "%U", format_ip6_udp_header, t->header);
|
|
return s;
|
|
}
|
|
|
|
/* post node - packet trace format function */
|
|
static u8 *
|
|
format_wg_output_tun_post_trace (u8 *s, va_list *args)
|
|
{
|
|
CLIB_UNUSED (vlib_main_t * vm) = va_arg (*args, vlib_main_t *);
|
|
CLIB_UNUSED (vlib_node_t * node) = va_arg (*args, vlib_node_t *);
|
|
|
|
wg_output_tun_post_trace_t *t = va_arg (*args, wg_output_tun_post_trace_t *);
|
|
|
|
s = format (s, "peer: %d\n", t->peer);
|
|
s = format (s, " wg-post: next node index %u", t->next_index);
|
|
return s;
|
|
}
|
|
|
|
static_always_inline void
|
|
wg_output_chain_crypto (vlib_main_t *vm, wg_per_thread_data_t *ptd,
|
|
vlib_buffer_t *b, vlib_buffer_t *lb, u8 *start,
|
|
u32 start_len, u16 *n_ch)
|
|
{
|
|
vnet_crypto_op_chunk_t *ch;
|
|
vlib_buffer_t *cb = b;
|
|
u32 n_chunks = 1;
|
|
|
|
vec_add2 (ptd->chunks, ch, 1);
|
|
ch->len = start_len;
|
|
ch->src = ch->dst = start;
|
|
cb = vlib_get_buffer (vm, cb->next_buffer);
|
|
|
|
while (1)
|
|
{
|
|
vec_add2 (ptd->chunks, ch, 1);
|
|
n_chunks += 1;
|
|
if (lb == cb)
|
|
ch->len = cb->current_length - NOISE_AUTHTAG_LEN;
|
|
else
|
|
ch->len = cb->current_length;
|
|
|
|
ch->src = ch->dst = vlib_buffer_get_current (cb);
|
|
|
|
if (!(cb->flags & VLIB_BUFFER_NEXT_PRESENT))
|
|
break;
|
|
|
|
cb = vlib_get_buffer (vm, cb->next_buffer);
|
|
}
|
|
|
|
if (n_ch)
|
|
*n_ch = n_chunks;
|
|
}
|
|
|
|
static_always_inline void
|
|
wg_prepare_sync_enc_op (vlib_main_t *vm, wg_per_thread_data_t *ptd,
|
|
vlib_buffer_t *b, vlib_buffer_t *lb,
|
|
vnet_crypto_op_t **crypto_ops, u8 *src, u32 src_len,
|
|
u8 *dst, u8 *aad, u32 aad_len, u64 nonce,
|
|
vnet_crypto_key_index_t key_index, u32 bi, u8 *iv)
|
|
{
|
|
vnet_crypto_op_t _op, *op = &_op;
|
|
u8 src_[] = {};
|
|
|
|
clib_memset (iv, 0, 4);
|
|
clib_memcpy (iv + 4, &nonce, sizeof (nonce));
|
|
|
|
vec_add2_aligned (crypto_ops[0], op, 1, CLIB_CACHE_LINE_BYTES);
|
|
vnet_crypto_op_init (op, VNET_CRYPTO_OP_CHACHA20_POLY1305_ENC);
|
|
|
|
op->tag_len = NOISE_AUTHTAG_LEN;
|
|
op->tag = vlib_buffer_get_tail (lb) - NOISE_AUTHTAG_LEN;
|
|
op->key_index = key_index;
|
|
op->aad = aad;
|
|
op->aad_len = aad_len;
|
|
op->iv = iv;
|
|
op->user_data = bi;
|
|
|
|
if (b != lb)
|
|
{
|
|
/* Chained buffers */
|
|
op->flags |= VNET_CRYPTO_OP_FLAG_CHAINED_BUFFERS;
|
|
op->chunk_index = vec_len (ptd->chunks);
|
|
wg_output_chain_crypto (vm, ptd, b, lb, src, src_len, &op->n_chunks);
|
|
}
|
|
else
|
|
{
|
|
op->src = !src ? src_ : src;
|
|
op->len = src_len;
|
|
op->dst = dst;
|
|
}
|
|
}
|
|
|
|
static_always_inline void
|
|
wg_output_process_chained_ops (vlib_main_t *vm, vlib_node_runtime_t *node,
|
|
vnet_crypto_op_t *ops, vlib_buffer_t *b[],
|
|
u16 *nexts, vnet_crypto_op_chunk_t *chunks,
|
|
u16 drop_next)
|
|
{
|
|
u32 n_fail, n_ops = vec_len (ops);
|
|
vnet_crypto_op_t *op = ops;
|
|
|
|
if (n_ops == 0)
|
|
return;
|
|
|
|
n_fail = n_ops - vnet_crypto_process_chained_ops (vm, op, chunks, n_ops);
|
|
|
|
while (n_fail)
|
|
{
|
|
ASSERT (op - ops < n_ops);
|
|
|
|
if (op->status != VNET_CRYPTO_OP_STATUS_COMPLETED)
|
|
{
|
|
u32 bi = op->user_data;
|
|
b[bi]->error = node->errors[WG_OUTPUT_ERROR_CRYPTO_ENGINE_ERROR];
|
|
nexts[bi] = drop_next;
|
|
n_fail--;
|
|
}
|
|
op++;
|
|
}
|
|
}
|
|
|
|
static_always_inline void
|
|
wg_output_process_ops (vlib_main_t *vm, vlib_node_runtime_t *node,
|
|
vnet_crypto_op_t *ops, vlib_buffer_t *b[], u16 *nexts,
|
|
u16 drop_next)
|
|
{
|
|
u32 n_fail, n_ops = vec_len (ops);
|
|
vnet_crypto_op_t *op = ops;
|
|
|
|
if (n_ops == 0)
|
|
return;
|
|
|
|
n_fail = n_ops - vnet_crypto_process_ops (vm, op, n_ops);
|
|
|
|
while (n_fail)
|
|
{
|
|
ASSERT (op - ops < n_ops);
|
|
|
|
if (op->status != VNET_CRYPTO_OP_STATUS_COMPLETED)
|
|
{
|
|
u32 bi = op->user_data;
|
|
b[bi]->error = node->errors[WG_OUTPUT_ERROR_CRYPTO_ENGINE_ERROR];
|
|
nexts[bi] = drop_next;
|
|
n_fail--;
|
|
}
|
|
op++;
|
|
}
|
|
}
|
|
|
|
static_always_inline void
|
|
wg_output_tun_add_to_frame (vlib_main_t *vm, vnet_crypto_async_frame_t *f,
|
|
u32 key_index, u32 crypto_len,
|
|
i16 crypto_start_offset, u32 buffer_index,
|
|
u16 next_node, u8 *iv, u8 *tag, u8 flags)
|
|
{
|
|
vnet_crypto_async_frame_elt_t *fe;
|
|
u16 index;
|
|
|
|
ASSERT (f->n_elts < VNET_CRYPTO_FRAME_SIZE);
|
|
|
|
index = f->n_elts;
|
|
fe = &f->elts[index];
|
|
f->n_elts++;
|
|
fe->key_index = key_index;
|
|
fe->crypto_total_length = crypto_len;
|
|
fe->crypto_start_offset = crypto_start_offset;
|
|
fe->iv = iv;
|
|
fe->tag = tag;
|
|
fe->flags = flags;
|
|
f->buffer_indices[index] = buffer_index;
|
|
f->next_node_index[index] = next_node;
|
|
}
|
|
|
|
static_always_inline enum noise_state_crypt
|
|
wg_output_tun_process (vlib_main_t *vm, wg_per_thread_data_t *ptd,
|
|
vlib_buffer_t *b, vlib_buffer_t *lb,
|
|
vnet_crypto_op_t **crypto_ops, noise_remote_t *r,
|
|
uint32_t *r_idx, uint64_t *nonce, uint8_t *src,
|
|
size_t srclen, uint8_t *dst, u32 bi, u8 *iv, f64 time)
|
|
{
|
|
noise_keypair_t *kp;
|
|
enum noise_state_crypt ret = SC_FAILED;
|
|
|
|
if ((kp = r->r_current) == NULL)
|
|
goto error;
|
|
|
|
/* We confirm that our values are within our tolerances. We want:
|
|
* - a valid keypair
|
|
* - our keypair to be less than REJECT_AFTER_TIME seconds old
|
|
* - our receive counter to be less than REJECT_AFTER_MESSAGES
|
|
* - our send counter to be less than REJECT_AFTER_MESSAGES
|
|
*/
|
|
if (!kp->kp_valid ||
|
|
wg_birthdate_has_expired_opt (kp->kp_birthdate, REJECT_AFTER_TIME,
|
|
time) ||
|
|
kp->kp_ctr.c_recv >= REJECT_AFTER_MESSAGES ||
|
|
((*nonce = noise_counter_send (&kp->kp_ctr)) > REJECT_AFTER_MESSAGES))
|
|
goto error;
|
|
|
|
/* We encrypt into the same buffer, so the caller must ensure that buf
|
|
* has NOISE_AUTHTAG_LEN bytes to store the MAC. The nonce and index
|
|
* are passed back out to the caller through the provided data pointer. */
|
|
*r_idx = kp->kp_remote_index;
|
|
|
|
wg_prepare_sync_enc_op (vm, ptd, b, lb, crypto_ops, src, srclen, dst, NULL,
|
|
0, *nonce, kp->kp_send_index, bi, iv);
|
|
|
|
/* If our values are still within tolerances, but we are approaching
|
|
* the tolerances, we notify the caller with ESTALE that they should
|
|
* establish a new keypair. The current keypair can continue to be used
|
|
* until the tolerances are hit. We notify if:
|
|
* - our send counter is valid and not less than REKEY_AFTER_MESSAGES
|
|
* - we're the initiator and our keypair is older than
|
|
* REKEY_AFTER_TIME seconds */
|
|
ret = SC_KEEP_KEY_FRESH;
|
|
if ((kp->kp_valid && *nonce >= REKEY_AFTER_MESSAGES) ||
|
|
(kp->kp_is_initiator && wg_birthdate_has_expired_opt (
|
|
kp->kp_birthdate, REKEY_AFTER_TIME, time)))
|
|
goto error;
|
|
|
|
ret = SC_OK;
|
|
error:
|
|
return ret;
|
|
}
|
|
|
|
static_always_inline enum noise_state_crypt
|
|
wg_add_to_async_frame (vlib_main_t *vm, wg_per_thread_data_t *ptd,
|
|
vnet_crypto_async_frame_t **async_frame,
|
|
vlib_buffer_t *b, vlib_buffer_t *lb, u8 *payload,
|
|
u32 payload_len, u32 bi, u16 next, u16 async_next,
|
|
noise_remote_t *r, uint32_t *r_idx, uint64_t *nonce,
|
|
u8 *iv, f64 time)
|
|
{
|
|
wg_post_data_t *post = wg_post_data (b);
|
|
u8 flag = 0;
|
|
u8 *tag;
|
|
noise_keypair_t *kp;
|
|
|
|
post->next_index = next;
|
|
|
|
/* crypto */
|
|
enum noise_state_crypt ret = SC_FAILED;
|
|
|
|
if ((kp = r->r_current) == NULL)
|
|
goto error;
|
|
|
|
/* We confirm that our values are within our tolerances. We want:
|
|
* - a valid keypair
|
|
* - our keypair to be less than REJECT_AFTER_TIME seconds old
|
|
* - our receive counter to be less than REJECT_AFTER_MESSAGES
|
|
* - our send counter to be less than REJECT_AFTER_MESSAGES
|
|
*/
|
|
if (!kp->kp_valid ||
|
|
wg_birthdate_has_expired_opt (kp->kp_birthdate, REJECT_AFTER_TIME,
|
|
time) ||
|
|
kp->kp_ctr.c_recv >= REJECT_AFTER_MESSAGES ||
|
|
((*nonce = noise_counter_send (&kp->kp_ctr)) > REJECT_AFTER_MESSAGES))
|
|
goto error;
|
|
|
|
/* We encrypt into the same buffer, so the caller must ensure that buf
|
|
* has NOISE_AUTHTAG_LEN bytes to store the MAC. The nonce and index
|
|
* are passed back out to the caller through the provided data pointer. */
|
|
*r_idx = kp->kp_remote_index;
|
|
|
|
clib_memset (iv, 0, 4);
|
|
clib_memcpy (iv + 4, nonce, sizeof (*nonce));
|
|
|
|
/* get a frame for this op if we don't yet have one or it's full */
|
|
if (NULL == *async_frame || vnet_crypto_async_frame_is_full (*async_frame))
|
|
{
|
|
*async_frame = vnet_crypto_async_get_frame (
|
|
vm, VNET_CRYPTO_OP_CHACHA20_POLY1305_TAG16_AAD0_ENC);
|
|
if (PREDICT_FALSE (NULL == *async_frame))
|
|
goto error;
|
|
/* Save the frame to the list we'll submit at the end */
|
|
vec_add1 (ptd->async_frames, *async_frame);
|
|
}
|
|
|
|
if (b != lb)
|
|
flag |= VNET_CRYPTO_OP_FLAG_CHAINED_BUFFERS;
|
|
|
|
tag = vlib_buffer_get_tail (lb) - NOISE_AUTHTAG_LEN;
|
|
|
|
/* this always succeeds because we know the frame is not full */
|
|
wg_output_tun_add_to_frame (vm, *async_frame, kp->kp_send_index, payload_len,
|
|
payload - b->data, bi, async_next, iv, tag,
|
|
flag);
|
|
|
|
/* If our values are still within tolerances, but we are approaching
|
|
* the tolerances, we notify the caller with ESTALE that they should
|
|
* establish a new keypair. The current keypair can continue to be used
|
|
* until the tolerances are hit. We notify if:
|
|
* - our send counter is valid and not less than REKEY_AFTER_MESSAGES
|
|
* - we're the initiator and our keypair is older than
|
|
* REKEY_AFTER_TIME seconds */
|
|
ret = SC_KEEP_KEY_FRESH;
|
|
if ((kp->kp_valid && *nonce >= REKEY_AFTER_MESSAGES) ||
|
|
(kp->kp_is_initiator && wg_birthdate_has_expired_opt (
|
|
kp->kp_birthdate, REKEY_AFTER_TIME, time)))
|
|
goto error;
|
|
|
|
ret = SC_OK;
|
|
error:
|
|
return ret;
|
|
}
|
|
|
|
static_always_inline void
|
|
wg_calc_checksum (vlib_main_t *vm, vlib_buffer_t *b)
|
|
{
|
|
int bogus = 0;
|
|
u8 ip_ver_out = (*((u8 *) vlib_buffer_get_current (b)) >> 4);
|
|
|
|
/* IPv6 UDP checksum is mandatory */
|
|
if (ip_ver_out == 6)
|
|
{
|
|
ip6_header_t *ip6 =
|
|
(ip6_header_t *) ((u8 *) vlib_buffer_get_current (b));
|
|
udp_header_t *udp = ip6_next_header (ip6);
|
|
udp->checksum = ip6_tcp_udp_icmp_compute_checksum (vm, b, ip6, &bogus);
|
|
}
|
|
}
|
|
|
|
/* is_ip4 - inner header flag */
|
|
always_inline uword
|
|
wg_output_tun_inline (vlib_main_t *vm, vlib_node_runtime_t *node,
|
|
vlib_frame_t *frame, u8 is_ip4, u16 async_next_node)
|
|
{
|
|
wg_main_t *wmp = &wg_main;
|
|
wg_per_thread_data_t *ptd =
|
|
vec_elt_at_index (wmp->per_thread_data, vm->thread_index);
|
|
u32 *from = vlib_frame_vector_args (frame);
|
|
u32 n_left_from = frame->n_vectors;
|
|
ip4_udp_wg_header_t *hdr4_out = NULL;
|
|
ip6_udp_wg_header_t *hdr6_out = NULL;
|
|
message_data_t *message_data_wg = NULL;
|
|
vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs;
|
|
vlib_buffer_t *lb;
|
|
vnet_crypto_op_t **crypto_ops;
|
|
u16 nexts[VLIB_FRAME_SIZE], *next = nexts;
|
|
vlib_buffer_t *sync_bufs[VLIB_FRAME_SIZE];
|
|
u32 thread_index = vm->thread_index;
|
|
u16 n_sync = 0;
|
|
const u16 drop_next = WG_OUTPUT_NEXT_ERROR;
|
|
const u8 is_async = wg_op_mode_is_set_ASYNC ();
|
|
vnet_crypto_async_frame_t *async_frame = NULL;
|
|
u16 n_async = 0;
|
|
u16 noop_nexts[VLIB_FRAME_SIZE], *noop_next = noop_nexts, n_noop = 0;
|
|
u16 err = !0;
|
|
u32 sync_bi[VLIB_FRAME_SIZE];
|
|
u32 noop_bi[VLIB_FRAME_SIZE];
|
|
|
|
vlib_get_buffers (vm, from, bufs, n_left_from);
|
|
vec_reset_length (ptd->crypto_ops);
|
|
vec_reset_length (ptd->chained_crypto_ops);
|
|
vec_reset_length (ptd->chunks);
|
|
vec_reset_length (ptd->async_frames);
|
|
|
|
wg_peer_t *peer = NULL;
|
|
u32 adj_index = 0;
|
|
u32 last_adj_index = ~0;
|
|
index_t peeri = INDEX_INVALID;
|
|
|
|
f64 time = clib_time_now (&vm->clib_time) + vm->time_offset;
|
|
|
|
while (n_left_from > 0)
|
|
{
|
|
u8 iph_offset = 0;
|
|
u8 is_ip4_out = 1;
|
|
u8 *plain_data;
|
|
u16 plain_data_len;
|
|
u16 plain_data_len_total;
|
|
u16 n_bufs;
|
|
u16 b_space_left_at_beginning;
|
|
u32 bi = from[b - bufs];
|
|
|
|
if (n_left_from > 2)
|
|
{
|
|
u8 *p;
|
|
vlib_prefetch_buffer_header (b[2], LOAD);
|
|
p = vlib_buffer_get_current (b[1]);
|
|
CLIB_PREFETCH (p, CLIB_CACHE_LINE_BYTES, LOAD);
|
|
CLIB_PREFETCH (vlib_buffer_get_tail (b[1]), CLIB_CACHE_LINE_BYTES,
|
|
LOAD);
|
|
}
|
|
|
|
noop_next[0] = WG_OUTPUT_NEXT_ERROR;
|
|
err = WG_OUTPUT_NEXT_ERROR;
|
|
|
|
adj_index = vnet_buffer (b[0])->ip.adj_index[VLIB_TX];
|
|
|
|
if (PREDICT_FALSE (last_adj_index != adj_index))
|
|
{
|
|
peeri = wg_peer_get_by_adj_index (adj_index);
|
|
if (peeri == INDEX_INVALID)
|
|
{
|
|
b[0]->error = node->errors[WG_OUTPUT_ERROR_PEER];
|
|
goto out;
|
|
}
|
|
peer = wg_peer_get (peeri);
|
|
}
|
|
|
|
if (!peer || wg_peer_is_dead (peer))
|
|
{
|
|
b[0]->error = node->errors[WG_OUTPUT_ERROR_PEER];
|
|
goto out;
|
|
}
|
|
if (PREDICT_FALSE (~0 == peer->output_thread_index))
|
|
{
|
|
/* this is the first packet to use this peer, claim the peer
|
|
* for this thread.
|
|
*/
|
|
clib_atomic_cmp_and_swap (&peer->output_thread_index, ~0,
|
|
wg_peer_assign_thread (thread_index));
|
|
}
|
|
|
|
if (PREDICT_FALSE (thread_index != peer->output_thread_index))
|
|
{
|
|
noop_next[0] = WG_OUTPUT_NEXT_HANDOFF;
|
|
err = WG_OUTPUT_NEXT_HANDOFF;
|
|
goto next;
|
|
}
|
|
|
|
if (PREDICT_FALSE (!peer->remote.r_current))
|
|
{
|
|
wg_send_handshake_from_mt (peeri, false);
|
|
b[0]->error = node->errors[WG_OUTPUT_ERROR_KEYPAIR];
|
|
goto out;
|
|
}
|
|
|
|
lb = b[0];
|
|
n_bufs = vlib_buffer_chain_linearize (vm, b[0]);
|
|
if (n_bufs == 0)
|
|
{
|
|
b[0]->error = node->errors[WG_OUTPUT_ERROR_NO_BUFFERS];
|
|
goto out;
|
|
}
|
|
|
|
if (n_bufs > 1)
|
|
{
|
|
/* Find last buffer in the chain */
|
|
while (lb->flags & VLIB_BUFFER_NEXT_PRESENT)
|
|
lb = vlib_get_buffer (vm, lb->next_buffer);
|
|
}
|
|
|
|
/* Ensure there is enough free space at the beginning of the first buffer
|
|
* to write ethernet header (e.g. IPv6 VxLAN over IPv6 Wireguard will
|
|
* trigger this)
|
|
*/
|
|
ASSERT ((signed) b[0]->current_data >=
|
|
(signed) -VLIB_BUFFER_PRE_DATA_SIZE);
|
|
b_space_left_at_beginning =
|
|
b[0]->current_data + VLIB_BUFFER_PRE_DATA_SIZE;
|
|
if (PREDICT_FALSE (b_space_left_at_beginning <
|
|
sizeof (ethernet_header_t)))
|
|
{
|
|
u32 size_diff =
|
|
sizeof (ethernet_header_t) - b_space_left_at_beginning;
|
|
|
|
/* Can only move buffer when it's single and has enough free space*/
|
|
if (lb == b[0] &&
|
|
vlib_buffer_space_left_at_end (vm, b[0]) >= size_diff)
|
|
{
|
|
vlib_buffer_move (vm, b[0],
|
|
b[0]->current_data + (signed) size_diff);
|
|
}
|
|
else
|
|
{
|
|
b[0]->error = node->errors[WG_OUTPUT_ERROR_NO_BUFFERS];
|
|
goto out;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Ensure there is enough free space at the end of the last buffer to
|
|
* write auth tag */
|
|
if (PREDICT_FALSE (vlib_buffer_space_left_at_end (vm, lb) <
|
|
NOISE_AUTHTAG_LEN))
|
|
{
|
|
u32 tmp_bi = 0;
|
|
if (vlib_buffer_alloc (vm, &tmp_bi, 1) != 1)
|
|
{
|
|
b[0]->error = node->errors[WG_OUTPUT_ERROR_NO_BUFFERS];
|
|
goto out;
|
|
}
|
|
lb = vlib_buffer_chain_buffer (vm, lb, tmp_bi);
|
|
}
|
|
|
|
iph_offset = vnet_buffer (b[0])->ip.save_rewrite_length;
|
|
plain_data = vlib_buffer_get_current (b[0]) + iph_offset;
|
|
plain_data_len = b[0]->current_length - iph_offset;
|
|
plain_data_len_total =
|
|
vlib_buffer_length_in_chain (vm, b[0]) - iph_offset;
|
|
size_t encrypted_packet_len = message_data_len (plain_data_len_total);
|
|
vlib_buffer_chain_increase_length (b[0], lb, NOISE_AUTHTAG_LEN);
|
|
u8 *iv_data = b[0]->pre_data;
|
|
|
|
is_ip4_out = ip46_address_is_ip4 (&peer->src.addr);
|
|
if (is_ip4_out)
|
|
{
|
|
hdr4_out = vlib_buffer_get_current (b[0]);
|
|
message_data_wg = &hdr4_out->wg;
|
|
}
|
|
else
|
|
{
|
|
hdr6_out = vlib_buffer_get_current (b[0]);
|
|
message_data_wg = &hdr6_out->wg;
|
|
}
|
|
|
|
if (PREDICT_FALSE (last_adj_index != adj_index))
|
|
{
|
|
wg_timers_any_authenticated_packet_sent_opt (peer, time);
|
|
wg_timers_data_sent_opt (peer, time);
|
|
wg_timers_any_authenticated_packet_traversal (peer);
|
|
last_adj_index = adj_index;
|
|
}
|
|
|
|
/* Here we are sure that can send packet to next node */
|
|
next[0] = WG_OUTPUT_NEXT_INTERFACE_OUTPUT;
|
|
|
|
if (lb != b[0])
|
|
crypto_ops = &ptd->chained_crypto_ops;
|
|
else
|
|
crypto_ops = &ptd->crypto_ops;
|
|
|
|
enum noise_state_crypt state;
|
|
|
|
if (is_async)
|
|
{
|
|
state = wg_add_to_async_frame (
|
|
vm, ptd, &async_frame, b[0], lb, plain_data, plain_data_len_total,
|
|
bi, next[0], async_next_node, &peer->remote,
|
|
&message_data_wg->receiver_index, &message_data_wg->counter,
|
|
iv_data, time);
|
|
}
|
|
else
|
|
{
|
|
state = wg_output_tun_process (
|
|
vm, ptd, b[0], lb, crypto_ops, &peer->remote,
|
|
&message_data_wg->receiver_index, &message_data_wg->counter,
|
|
plain_data, plain_data_len, plain_data, n_sync, iv_data, time);
|
|
}
|
|
|
|
if (PREDICT_FALSE (state == SC_KEEP_KEY_FRESH))
|
|
{
|
|
wg_send_handshake_from_mt (peeri, false);
|
|
}
|
|
else if (PREDICT_FALSE (state == SC_FAILED))
|
|
{
|
|
// TODO: Maybe wrong
|
|
wg_send_handshake_from_mt (peeri, false);
|
|
wg_peer_update_flags (peeri, WG_PEER_ESTABLISHED, false);
|
|
noop_next[0] = WG_OUTPUT_NEXT_ERROR;
|
|
goto out;
|
|
}
|
|
|
|
err = WG_OUTPUT_NEXT_INTERFACE_OUTPUT;
|
|
|
|
if (is_ip4_out)
|
|
{
|
|
hdr4_out->wg.header.type = MESSAGE_DATA;
|
|
hdr4_out->udp.length = clib_host_to_net_u16 (encrypted_packet_len +
|
|
sizeof (udp_header_t));
|
|
ip4_header_set_len_w_chksum (
|
|
&hdr4_out->ip4, clib_host_to_net_u16 (encrypted_packet_len +
|
|
sizeof (ip4_udp_header_t)));
|
|
}
|
|
else
|
|
{
|
|
hdr6_out->wg.header.type = MESSAGE_DATA;
|
|
hdr6_out->ip6.payload_length = hdr6_out->udp.length =
|
|
clib_host_to_net_u16 (encrypted_packet_len +
|
|
sizeof (udp_header_t));
|
|
}
|
|
|
|
out:
|
|
if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE)
|
|
&& (b[0]->flags & VLIB_BUFFER_IS_TRACED)))
|
|
{
|
|
wg_output_tun_trace_t *t =
|
|
vlib_add_trace (vm, node, b[0], sizeof (*t));
|
|
|
|
t->peer = peeri;
|
|
t->is_ip4 = is_ip4_out;
|
|
if (hdr4_out)
|
|
clib_memcpy (t->header, hdr4_out, sizeof (ip4_udp_header_t));
|
|
else if (hdr6_out)
|
|
clib_memcpy (t->header, hdr6_out, sizeof (ip6_udp_header_t));
|
|
}
|
|
|
|
next:
|
|
if (PREDICT_FALSE (err != WG_OUTPUT_NEXT_INTERFACE_OUTPUT))
|
|
{
|
|
noop_bi[n_noop] = bi;
|
|
n_noop++;
|
|
noop_next++;
|
|
goto next_left;
|
|
}
|
|
if (!is_async)
|
|
{
|
|
sync_bi[n_sync] = bi;
|
|
sync_bufs[n_sync] = b[0];
|
|
n_sync += 1;
|
|
next += 1;
|
|
}
|
|
else
|
|
{
|
|
n_async++;
|
|
}
|
|
next_left:
|
|
n_left_from -= 1;
|
|
b += 1;
|
|
}
|
|
|
|
if (n_sync)
|
|
{
|
|
/* wg-output-process-ops */
|
|
wg_output_process_ops (vm, node, ptd->crypto_ops, sync_bufs, nexts,
|
|
drop_next);
|
|
wg_output_process_chained_ops (vm, node, ptd->chained_crypto_ops,
|
|
sync_bufs, nexts, ptd->chunks, drop_next);
|
|
|
|
int n_left_from_sync_bufs = n_sync;
|
|
while (n_left_from_sync_bufs > 0)
|
|
{
|
|
n_left_from_sync_bufs--;
|
|
wg_calc_checksum (vm, sync_bufs[n_left_from_sync_bufs]);
|
|
}
|
|
|
|
vlib_buffer_enqueue_to_next (vm, node, sync_bi, nexts, n_sync);
|
|
}
|
|
if (n_async)
|
|
{
|
|
/* submit all of the open frames */
|
|
vnet_crypto_async_frame_t **async_frame;
|
|
|
|
vec_foreach (async_frame, ptd->async_frames)
|
|
{
|
|
if (PREDICT_FALSE (
|
|
vnet_crypto_async_submit_open_frame (vm, *async_frame) < 0))
|
|
{
|
|
u32 n_drop = (*async_frame)->n_elts;
|
|
u32 *bi = (*async_frame)->buffer_indices;
|
|
u16 index = n_noop;
|
|
while (n_drop--)
|
|
{
|
|
noop_bi[index] = bi[0];
|
|
vlib_buffer_t *b = vlib_get_buffer (vm, bi[0]);
|
|
noop_nexts[index] = drop_next;
|
|
b->error = node->errors[WG_OUTPUT_ERROR_CRYPTO_ENGINE_ERROR];
|
|
bi++;
|
|
index++;
|
|
}
|
|
n_noop += (*async_frame)->n_elts;
|
|
|
|
vnet_crypto_async_reset_frame (*async_frame);
|
|
vnet_crypto_async_free_frame (vm, *async_frame);
|
|
}
|
|
}
|
|
}
|
|
if (n_noop)
|
|
{
|
|
vlib_buffer_enqueue_to_next (vm, node, noop_bi, noop_nexts, n_noop);
|
|
}
|
|
|
|
return frame->n_vectors;
|
|
}
|
|
|
|
always_inline uword
|
|
wg_output_tun_post (vlib_main_t *vm, vlib_node_runtime_t *node,
|
|
vlib_frame_t *frame)
|
|
{
|
|
vlib_buffer_t *bufs[VLIB_FRAME_SIZE], **b = bufs;
|
|
u16 nexts[VLIB_FRAME_SIZE], *next = nexts;
|
|
u32 *from = vlib_frame_vector_args (frame);
|
|
u32 n_left = frame->n_vectors;
|
|
|
|
index_t peeri = ~0;
|
|
|
|
vlib_get_buffers (vm, from, b, n_left);
|
|
|
|
if (n_left >= 4)
|
|
{
|
|
vlib_prefetch_buffer_header (b[0], LOAD);
|
|
vlib_prefetch_buffer_header (b[1], LOAD);
|
|
vlib_prefetch_buffer_header (b[2], LOAD);
|
|
vlib_prefetch_buffer_header (b[3], LOAD);
|
|
}
|
|
|
|
while (n_left > 8)
|
|
{
|
|
vlib_prefetch_buffer_header (b[4], LOAD);
|
|
vlib_prefetch_buffer_header (b[5], LOAD);
|
|
vlib_prefetch_buffer_header (b[6], LOAD);
|
|
vlib_prefetch_buffer_header (b[7], LOAD);
|
|
|
|
next[0] = (wg_post_data (b[0]))->next_index;
|
|
next[1] = (wg_post_data (b[1]))->next_index;
|
|
next[2] = (wg_post_data (b[2]))->next_index;
|
|
next[3] = (wg_post_data (b[3]))->next_index;
|
|
|
|
wg_calc_checksum (vm, b[0]);
|
|
wg_calc_checksum (vm, b[1]);
|
|
wg_calc_checksum (vm, b[2]);
|
|
wg_calc_checksum (vm, b[3]);
|
|
|
|
if (PREDICT_FALSE (node->flags & VLIB_NODE_FLAG_TRACE))
|
|
{
|
|
if (b[0]->flags & VLIB_BUFFER_IS_TRACED)
|
|
{
|
|
wg_output_tun_post_trace_t *tr =
|
|
vlib_add_trace (vm, node, b[0], sizeof (*tr));
|
|
peeri = wg_peer_get_by_adj_index (
|
|
vnet_buffer (b[0])->ip.adj_index[VLIB_TX]);
|
|
tr->peer = peeri;
|
|
tr->next_index = next[0];
|
|
}
|
|
if (b[1]->flags & VLIB_BUFFER_IS_TRACED)
|
|
{
|
|
wg_output_tun_post_trace_t *tr =
|
|
vlib_add_trace (vm, node, b[1], sizeof (*tr));
|
|
peeri = wg_peer_get_by_adj_index (
|
|
vnet_buffer (b[1])->ip.adj_index[VLIB_TX]);
|
|
tr->next_index = next[1];
|
|
}
|
|
if (b[2]->flags & VLIB_BUFFER_IS_TRACED)
|
|
{
|
|
wg_output_tun_post_trace_t *tr =
|
|
vlib_add_trace (vm, node, b[2], sizeof (*tr));
|
|
peeri = wg_peer_get_by_adj_index (
|
|
vnet_buffer (b[2])->ip.adj_index[VLIB_TX]);
|
|
tr->next_index = next[2];
|
|
}
|
|
if (b[3]->flags & VLIB_BUFFER_IS_TRACED)
|
|
{
|
|
wg_output_tun_post_trace_t *tr =
|
|
vlib_add_trace (vm, node, b[3], sizeof (*tr));
|
|
peeri = wg_peer_get_by_adj_index (
|
|
vnet_buffer (b[3])->ip.adj_index[VLIB_TX]);
|
|
tr->next_index = next[3];
|
|
}
|
|
}
|
|
|
|
b += 4;
|
|
next += 4;
|
|
n_left -= 4;
|
|
}
|
|
|
|
while (n_left > 0)
|
|
{
|
|
wg_calc_checksum (vm, b[0]);
|
|
|
|
next[0] = (wg_post_data (b[0]))->next_index;
|
|
if (PREDICT_FALSE ((node->flags & VLIB_NODE_FLAG_TRACE) &&
|
|
(b[0]->flags & VLIB_BUFFER_IS_TRACED)))
|
|
{
|
|
wg_output_tun_post_trace_t *tr =
|
|
vlib_add_trace (vm, node, b[0], sizeof (*tr));
|
|
peeri = wg_peer_get_by_adj_index (
|
|
vnet_buffer (b[0])->ip.adj_index[VLIB_TX]);
|
|
tr->next_index = next[0];
|
|
}
|
|
|
|
b += 1;
|
|
next += 1;
|
|
n_left -= 1;
|
|
}
|
|
|
|
vlib_buffer_enqueue_to_next (vm, node, from, nexts, frame->n_vectors);
|
|
return frame->n_vectors;
|
|
}
|
|
|
|
VLIB_REGISTER_NODE (wg4_output_tun_post_node) = {
|
|
.name = "wg4-output-tun-post-node",
|
|
.vector_size = sizeof (u32),
|
|
.format_trace = format_wg_output_tun_post_trace,
|
|
.type = VLIB_NODE_TYPE_INTERNAL,
|
|
.sibling_of = "wg4-output-tun",
|
|
.n_errors = ARRAY_LEN (wg_output_error_strings),
|
|
.error_strings = wg_output_error_strings,
|
|
};
|
|
|
|
VLIB_REGISTER_NODE (wg6_output_tun_post_node) = {
|
|
.name = "wg6-output-tun-post-node",
|
|
.vector_size = sizeof (u32),
|
|
.format_trace = format_wg_output_tun_post_trace,
|
|
.type = VLIB_NODE_TYPE_INTERNAL,
|
|
.sibling_of = "wg6-output-tun",
|
|
.n_errors = ARRAY_LEN (wg_output_error_strings),
|
|
.error_strings = wg_output_error_strings,
|
|
};
|
|
|
|
VLIB_NODE_FN (wg4_output_tun_post_node)
|
|
(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *from_frame)
|
|
{
|
|
return wg_output_tun_post (vm, node, from_frame);
|
|
}
|
|
|
|
VLIB_NODE_FN (wg6_output_tun_post_node)
|
|
(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *from_frame)
|
|
{
|
|
return wg_output_tun_post (vm, node, from_frame);
|
|
}
|
|
|
|
VLIB_NODE_FN (wg4_output_tun_node)
|
|
(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
|
|
{
|
|
return wg_output_tun_inline (vm, node, frame, /* is_ip4 */ 1,
|
|
wg_encrypt_async_next.wg4_post_next);
|
|
}
|
|
|
|
VLIB_NODE_FN (wg6_output_tun_node)
|
|
(vlib_main_t *vm, vlib_node_runtime_t *node, vlib_frame_t *frame)
|
|
{
|
|
return wg_output_tun_inline (vm, node, frame, /* is_ip4 */ 0,
|
|
wg_encrypt_async_next.wg6_post_next);
|
|
}
|
|
|
|
VLIB_REGISTER_NODE (wg4_output_tun_node) =
|
|
{
|
|
.name = "wg4-output-tun",
|
|
.vector_size = sizeof (u32),
|
|
.format_trace = format_wg_output_tun_trace,
|
|
.type = VLIB_NODE_TYPE_INTERNAL,
|
|
.n_errors = ARRAY_LEN (wg_output_error_strings),
|
|
.error_strings = wg_output_error_strings,
|
|
.n_next_nodes = WG_OUTPUT_N_NEXT,
|
|
.next_nodes = {
|
|
[WG_OUTPUT_NEXT_HANDOFF] = "wg4-output-tun-handoff",
|
|
[WG_OUTPUT_NEXT_INTERFACE_OUTPUT] = "adj-midchain-tx",
|
|
[WG_OUTPUT_NEXT_ERROR] = "error-drop",
|
|
},
|
|
};
|
|
|
|
VLIB_REGISTER_NODE (wg6_output_tun_node) =
|
|
{
|
|
.name = "wg6-output-tun",
|
|
.vector_size = sizeof (u32),
|
|
.format_trace = format_wg_output_tun_trace,
|
|
.type = VLIB_NODE_TYPE_INTERNAL,
|
|
.n_errors = ARRAY_LEN (wg_output_error_strings),
|
|
.error_strings = wg_output_error_strings,
|
|
.n_next_nodes = WG_OUTPUT_N_NEXT,
|
|
.next_nodes = {
|
|
[WG_OUTPUT_NEXT_HANDOFF] = "wg6-output-tun-handoff",
|
|
[WG_OUTPUT_NEXT_INTERFACE_OUTPUT] = "adj-midchain-tx",
|
|
[WG_OUTPUT_NEXT_ERROR] = "error-drop",
|
|
},
|
|
};
|
|
|
|
/*
|
|
* fd.io coding-style-patch-verification: ON
|
|
*
|
|
* Local Variables:
|
|
* eval: (c-set-style "gnu")
|
|
* End:
|
|
*/
|