memif: jumbo frames support

Current memif interface supports frame size up to 2048. This patch is to
enhance memif to support jumbo frames.

On tx (writing buffers to the ring), keep reading the next buffer in vlib
when the flag VLIB_BUFFER_NEXT_PRESENT and merge it to the same ring entry.
Use descriptor chaining if the buffer is not big enough.

On rx (reading buffers from the ring), if the packet is greater than 2048,
create multiple vlib buffers, chained with the VLIB_BUFFER_NEXT_PRESENT.

Testing:
Because the ping command provided by VPP does not support jumbo frames,
I have to use linux ping. Here is the set up that I use for testing.

VM1 --- vhost ---- VPP1 --- memif --- VPP2 --- vhost --- VM2

Create vhost-user interfaces between VM1 and VPP1 and between VPP2 and VM2

VM configuration:
Set the interface mtu on the VM, e.g 9216 to support jumbo frames.
create static route and static arp on VM1 to VM2 and vice versa.
Use iperf3 or ping -s 8000 from VM1 to VM2 or vice versa.

Sample run
sluong@ubuntu:~$ ping 131.1.1.1 -c1 -s 8000
ping 131.1.1.1 -c1 -s 8000
PING 131.1.1.1 (131.1.1.1) 8000(8028) bytes of data.
8008 bytes from 131.1.1.1: icmp_seq=1 ttl=62 time=0.835 ms

--- 131.1.1.1 ping statistics ---
1 packets transmitted, 1 received, 0% packet loss, time 0ms
rtt min/avg/max/mdev = 0.835/0.835/0.835/0.000 ms
sluong@ubuntu:~$

DBGvpp# sh interface memif0
              Name               Idx       State          Counter          Count
memif0                            1         up       rx packets                     1
                                                     rx bytes                    8042
                                                     tx packets                     1
                                                     tx bytes                    8042
                                                     ip4                            1
DBGvpp#

Change-Id: I469bece3d45a790dceaee1d6a8e976bd018feee2
Signed-off-by: Steven <sluong@cisco.com>
This commit is contained in:
Steven
2017-06-08 12:52:29 -07:00
committed by Damjan Marion
parent f89d1859b1
commit 0657c165d9
2 changed files with 275 additions and 151 deletions

View File

@ -30,6 +30,7 @@
#define foreach_memif_tx_func_error \
_(NO_FREE_SLOTS, "no free tx slots") \
_(TRUNC_PACKET, "packet > buffer size -- truncated in tx ring") \
_(PENDING_MSGS, "pending msgs in tx ring")
typedef enum
@ -86,6 +87,70 @@ memif_prefetch_buffer_and_data (vlib_main_t * vm, u32 bi)
CLIB_PREFETCH (b->data, CLIB_CACHE_LINE_BYTES, LOAD);
}
/**
* @brief Copy buffer to tx ring
*
* @param * vm (in)
* @param * node (in)
* @param * mif (in) pointer to memif interface
* @param bi (in) vlib buffer index
* @param * ring (in) pointer to memif ring
* @param * head (in/out) ring head
* @param mask (in) ring size - 1
*/
static_always_inline void
memif_copy_buffer_to_tx_ring (vlib_main_t * vm, vlib_node_runtime_t * node,
memif_if_t * mif, u32 bi, memif_ring_t * ring,
u16 * head, u16 mask)
{
vlib_buffer_t *b0;
void *mb0;
u32 total = 0, len;
mb0 = memif_get_buffer (mif, ring, *head);
ring->desc[*head].flags = 0;
do
{
b0 = vlib_get_buffer (vm, bi);
len = b0->current_length;
if (PREDICT_FALSE (ring->desc[*head].buffer_length < (total + len)))
{
if (PREDICT_TRUE (total))
{
ring->desc[*head].length = total;
total = 0;
ring->desc[*head].flags |= MEMIF_DESC_FLAG_NEXT;
*head = (*head + 1) & mask;
mb0 = memif_get_buffer (mif, ring, *head);
ring->desc[*head].flags = 0;
}
}
if (PREDICT_TRUE (ring->desc[*head].buffer_length >= (total + len)))
{
clib_memcpy (mb0 + total, vlib_buffer_get_current (b0),
CLIB_CACHE_LINE_BYTES);
if (len > CLIB_CACHE_LINE_BYTES)
clib_memcpy (mb0 + CLIB_CACHE_LINE_BYTES + total,
vlib_buffer_get_current (b0) + CLIB_CACHE_LINE_BYTES,
len - CLIB_CACHE_LINE_BYTES);
total += len;
}
else
{
vlib_error_count (vm, node->node_index, MEMIF_TX_ERROR_TRUNC_PACKET,
1);
break;
}
}
while ((bi = (b0->flags & VLIB_BUFFER_NEXT_PRESENT) ? b0->next_buffer : 0));
if (PREDICT_TRUE (total))
{
ring->desc[*head].length = total;
*head = (*head + 1) & mask;
}
}
static_always_inline uword
memif_interface_tx_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
vlib_frame_t * frame, memif_if_t * mif,
@ -152,32 +217,10 @@ memif_interface_tx_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
memif_prefetch_buffer_and_data (vm, buffers[2]);
memif_prefetch_buffer_and_data (vm, buffers[3]);
vlib_buffer_t *b0 = vlib_get_buffer (vm, buffers[0]);
vlib_buffer_t *b1 = vlib_get_buffer (vm, buffers[1]);
void *mb0 = memif_get_buffer (mif, ring, head);
clib_memcpy (mb0, vlib_buffer_get_current (b0), CLIB_CACHE_LINE_BYTES);
ring->desc[head].length = b0->current_length;
head = (head + 1) & mask;
void *mb1 = memif_get_buffer (mif, ring, head);
clib_memcpy (mb1, vlib_buffer_get_current (b1), CLIB_CACHE_LINE_BYTES);
ring->desc[head].length = b1->current_length;
head = (head + 1) & mask;
if (b0->current_length > CLIB_CACHE_LINE_BYTES)
{
clib_memcpy (mb0 + CLIB_CACHE_LINE_BYTES,
vlib_buffer_get_current (b0) + CLIB_CACHE_LINE_BYTES,
b0->current_length - CLIB_CACHE_LINE_BYTES);
}
if (b1->current_length > CLIB_CACHE_LINE_BYTES)
{
clib_memcpy (mb1 + CLIB_CACHE_LINE_BYTES,
vlib_buffer_get_current (b1) + CLIB_CACHE_LINE_BYTES,
b1->current_length - CLIB_CACHE_LINE_BYTES);
}
memif_copy_buffer_to_tx_ring (vm, node, mif, buffers[0], ring, &head,
mask);
memif_copy_buffer_to_tx_ring (vm, node, mif, buffers[1], ring, &head,
mask);
buffers += 2;
n_left -= 2;
@ -186,19 +229,8 @@ memif_interface_tx_inline (vlib_main_t * vm, vlib_node_runtime_t * node,
while (n_left && free_slots)
{
vlib_buffer_t *b0 = vlib_get_buffer (vm, buffers[0]);
void *mb0 = memif_get_buffer (mif, ring, head);
clib_memcpy (mb0, vlib_buffer_get_current (b0), CLIB_CACHE_LINE_BYTES);
if (b0->current_length > CLIB_CACHE_LINE_BYTES)
{
clib_memcpy (mb0 + CLIB_CACHE_LINE_BYTES,
vlib_buffer_get_current (b0) + CLIB_CACHE_LINE_BYTES,
b0->current_length - CLIB_CACHE_LINE_BYTES);
}
ring->desc[head].length = b0->current_length;
head = (head + 1) & mask;
memif_copy_buffer_to_tx_ring (vm, node, mif, buffers[0], ring, &head,
mask);
buffers++;
n_left--;
free_slots--;

File diff suppressed because it is too large Load Diff