Type: refactor Change-Id: I5235bf3e9aff58af6ba2c14e8c6529c4fc9ec86c Signed-off-by: Damjan Marion <damarion@cisco.com>
975 lines
28 KiB
C
975 lines
28 KiB
C
/*
|
|
* Copyright (c) 2018 Cisco and/or its affiliates.
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at:
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include <vppinfra/types.h>
|
|
#include <vlib/vlib.h>
|
|
#include <vlib/pci/pci.h>
|
|
#include <vnet/ethernet/ethernet.h>
|
|
#include <vnet/plugin/plugin.h>
|
|
#include <vpp/app/version.h>
|
|
#include <vnet/interface/rx_queue_funcs.h>
|
|
#include <vnet/interface/tx_queue_funcs.h>
|
|
#include <vmxnet3/vmxnet3.h>
|
|
|
|
#define PCI_VENDOR_ID_VMWARE 0x15ad
|
|
#define PCI_DEVICE_ID_VMWARE_VMXNET3 0x07b0
|
|
|
|
vmxnet3_main_t vmxnet3_main;
|
|
|
|
static pci_device_id_t vmxnet3_pci_device_ids[] = {
|
|
{
|
|
.vendor_id = PCI_VENDOR_ID_VMWARE,
|
|
.device_id = PCI_DEVICE_ID_VMWARE_VMXNET3},
|
|
{0},
|
|
};
|
|
|
|
static clib_error_t *
|
|
vmxnet3_interface_admin_up_down (vnet_main_t * vnm, u32 hw_if_index,
|
|
u32 flags)
|
|
{
|
|
vnet_hw_interface_t *hi = vnet_get_hw_interface (vnm, hw_if_index);
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
vmxnet3_device_t *vd = vec_elt_at_index (vmxm->devices, hi->dev_instance);
|
|
uword is_up = (flags & VNET_SW_INTERFACE_FLAG_ADMIN_UP) != 0;
|
|
|
|
if (vd->flags & VMXNET3_DEVICE_F_ERROR)
|
|
return clib_error_return (0, "device is in error state");
|
|
|
|
if (is_up)
|
|
{
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index,
|
|
VNET_HW_INTERFACE_FLAG_LINK_UP);
|
|
vd->flags |= VMXNET3_DEVICE_F_ADMIN_UP;
|
|
}
|
|
else
|
|
{
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index, 0);
|
|
vd->flags &= ~VMXNET3_DEVICE_F_ADMIN_UP;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static clib_error_t *
|
|
vmxnet3_interface_rx_mode_change (vnet_main_t * vnm, u32 hw_if_index, u32 qid,
|
|
vnet_hw_if_rx_mode mode)
|
|
{
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
|
|
vmxnet3_device_t *vd = pool_elt_at_index (vmxm->devices, hw->dev_instance);
|
|
vmxnet3_rxq_t *rxq = vec_elt_at_index (vd->rxqs, qid);
|
|
vmxnet3_per_thread_data_t *ptd;
|
|
|
|
if (mode == rxq->mode)
|
|
return 0;
|
|
if ((mode != VNET_HW_IF_RX_MODE_POLLING) &&
|
|
(mode != VNET_HW_IF_RX_MODE_INTERRUPT))
|
|
return clib_error_return (0, "Rx mode %U not supported",
|
|
format_vnet_hw_if_rx_mode, mode);
|
|
rxq->mode = mode;
|
|
ptd = vec_elt_at_index (vmxm->per_thread_data, rxq->thread_index);
|
|
if (rxq->mode == VNET_HW_IF_RX_MODE_POLLING)
|
|
ptd->polling_q_count++;
|
|
else
|
|
{
|
|
ASSERT (ptd->polling_q_count != 0);
|
|
ptd->polling_q_count--;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
vmxnet3_set_interface_next_node (vnet_main_t * vnm, u32 hw_if_index,
|
|
u32 node_index)
|
|
{
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
vnet_hw_interface_t *hw = vnet_get_hw_interface (vnm, hw_if_index);
|
|
vmxnet3_device_t *vd = pool_elt_at_index (vmxm->devices, hw->dev_instance);
|
|
|
|
/* Shut off redirection */
|
|
if (node_index == ~0)
|
|
{
|
|
vd->per_interface_next_index = node_index;
|
|
return;
|
|
}
|
|
|
|
vd->per_interface_next_index =
|
|
vlib_node_add_next (vlib_get_main (), vmxnet3_input_node.index,
|
|
node_index);
|
|
}
|
|
|
|
static void
|
|
vmxnet3_clear_hw_interface_counters (u32 instance)
|
|
{
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
vmxnet3_device_t *vd = pool_elt_at_index (vmxm->devices, instance);
|
|
vmxnet3_tx_queue *tx = VMXNET3_TX_START (vd);
|
|
vmxnet3_rx_queue *rx = VMXNET3_RX_START (vd);
|
|
u16 qid;
|
|
|
|
/*
|
|
* Set the "last_cleared_stats" to the current stats, so that
|
|
* things appear to clear from a display perspective.
|
|
*/
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_GET_STATS);
|
|
|
|
vec_foreach_index (qid, vd->txqs)
|
|
{
|
|
vmxnet3_tx_stats *txs = vec_elt_at_index (vd->tx_stats, qid);
|
|
clib_memcpy (txs, &tx->stats, sizeof (*txs));
|
|
tx++;
|
|
}
|
|
vec_foreach_index (qid, vd->rxqs)
|
|
{
|
|
vmxnet3_rx_stats *rxs = vec_elt_at_index (vd->rx_stats, qid);
|
|
clib_memcpy (rxs, &rx->stats, sizeof (*rxs));
|
|
rx++;
|
|
}
|
|
}
|
|
|
|
static char *vmxnet3_tx_func_error_strings[] = {
|
|
#define _(n,s) s,
|
|
foreach_vmxnet3_tx_func_error
|
|
#undef _
|
|
};
|
|
|
|
VNET_DEVICE_CLASS (vmxnet3_device_class,) =
|
|
{
|
|
.name = "VMXNET3 interface",
|
|
.format_device = format_vmxnet3_device,
|
|
.format_device_name = format_vmxnet3_device_name,
|
|
.admin_up_down_function = vmxnet3_interface_admin_up_down,
|
|
.clear_counters = vmxnet3_clear_hw_interface_counters,
|
|
.rx_mode_change_function = vmxnet3_interface_rx_mode_change,
|
|
.rx_redirect_to_node = vmxnet3_set_interface_next_node,
|
|
.tx_function_n_errors = VMXNET3_TX_N_ERROR,
|
|
.tx_function_error_strings = vmxnet3_tx_func_error_strings,
|
|
};
|
|
|
|
static u32
|
|
vmxnet3_flag_change (vnet_main_t * vnm, vnet_hw_interface_t * hw, u32 flags)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
vmxnet3_write_mac (vmxnet3_device_t * vd)
|
|
{
|
|
u32 val;
|
|
|
|
memcpy (&val, vd->mac_addr, 4);
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_MACL, val);
|
|
|
|
val = 0;
|
|
memcpy (&val, vd->mac_addr + 4, 2);
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_MACH, val);
|
|
}
|
|
|
|
static clib_error_t *
|
|
vmxnet3_provision_driver_shared (vlib_main_t * vm, vmxnet3_device_t * vd)
|
|
{
|
|
vmxnet3_shared *shared;
|
|
u64 shared_dma;
|
|
u16 qid, rid;
|
|
vmxnet3_tx_queue *tx = VMXNET3_TX_START (vd);
|
|
vmxnet3_rx_queue *rx = VMXNET3_RX_START (vd);
|
|
|
|
vd->driver_shared =
|
|
vlib_physmem_alloc_aligned_on_numa (vm, sizeof (*vd->driver_shared), 512,
|
|
vd->numa_node);
|
|
if (vd->driver_shared == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (vd->driver_shared, 0, sizeof (*vd->driver_shared));
|
|
|
|
vec_foreach_index (qid, vd->txqs)
|
|
{
|
|
vmxnet3_txq_t *txq = vec_elt_at_index (vd->txqs, qid);
|
|
|
|
tx->cfg.desc_address = vmxnet3_dma_addr (vm, vd, txq->tx_desc);
|
|
tx->cfg.comp_address = vmxnet3_dma_addr (vm, vd, txq->tx_comp);
|
|
tx->cfg.num_desc = txq->size;
|
|
tx->cfg.num_comp = txq->size;
|
|
tx++;
|
|
}
|
|
|
|
vec_foreach_index (qid, vd->rxqs)
|
|
{
|
|
vmxnet3_rxq_t *rxq = vec_elt_at_index (vd->rxqs, qid);
|
|
|
|
for (rid = 0; rid < VMXNET3_RX_RING_SIZE; rid++)
|
|
{
|
|
rx->cfg.desc_address[rid] = vmxnet3_dma_addr (vm, vd,
|
|
rxq->rx_desc[rid]);
|
|
rx->cfg.num_desc[rid] = rxq->size;
|
|
}
|
|
rx->cfg.comp_address = vmxnet3_dma_addr (vm, vd, rxq->rx_comp);
|
|
rx->cfg.num_comp = rxq->size;
|
|
rx->cfg.intr_index = qid;
|
|
rx++;
|
|
}
|
|
|
|
shared = vd->driver_shared;
|
|
shared->magic = VMXNET3_SHARED_MAGIC;
|
|
shared->misc.version = VMXNET3_VERSION_MAGIC;
|
|
if (sizeof (void *) == 4)
|
|
shared->misc.guest_info = VMXNET3_GOS_BITS_32;
|
|
else
|
|
shared->misc.guest_info = VMXNET3_GOS_BITS_64;
|
|
shared->misc.guest_info |= VMXNET3_GOS_TYPE_LINUX;
|
|
shared->misc.version_support = VMXNET3_VERSION_SELECT;
|
|
shared->misc.upt_features = VMXNET3_F_RXCSUM;
|
|
if (vd->gso_enable)
|
|
shared->misc.upt_features |= VMXNET3_F_LRO;
|
|
if (vd->num_rx_queues > 1)
|
|
{
|
|
shared->misc.upt_features |= VMXNET3_F_RSS;
|
|
shared->rss.version = 1;
|
|
shared->rss.address = vmxnet3_dma_addr (vm, vd, vd->rss);
|
|
shared->rss.length = sizeof (*vd->rss);
|
|
}
|
|
shared->misc.max_num_rx_sg = 0;
|
|
shared->misc.upt_version_support = VMXNET3_UPT_VERSION_SELECT;
|
|
shared->misc.queue_desc_address = vmxnet3_dma_addr (vm, vd, vd->queues);
|
|
shared->misc.queue_desc_len = sizeof (*tx) * vd->num_tx_queues +
|
|
sizeof (*rx) * vd->num_rx_queues;
|
|
shared->misc.mtu = VMXNET3_MTU;
|
|
shared->misc.num_tx_queues = vd->num_tx_queues;
|
|
shared->misc.num_rx_queues = vd->num_rx_queues;
|
|
shared->interrupt.num_intrs = vd->num_intrs;
|
|
shared->interrupt.event_intr_index = vd->num_rx_queues;
|
|
shared->interrupt.control = VMXNET3_IC_DISABLE_ALL;
|
|
shared->rx_filter.mode = VMXNET3_RXMODE_UCAST | VMXNET3_RXMODE_BCAST |
|
|
VMXNET3_RXMODE_ALL_MULTI | VMXNET3_RXMODE_PROMISC;
|
|
shared_dma = vmxnet3_dma_addr (vm, vd, shared);
|
|
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_DSAL, shared_dma);
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_DSAH, shared_dma >> 32);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static inline void
|
|
vmxnet3_enable_interrupt (vmxnet3_device_t * vd)
|
|
{
|
|
int i;
|
|
vmxnet3_shared *shared = vd->driver_shared;
|
|
|
|
shared->interrupt.control &= ~VMXNET3_IC_DISABLE_ALL;
|
|
for (i = 0; i < vd->num_intrs; i++)
|
|
vmxnet3_reg_write (vd, 0, VMXNET3_REG_IMR + i * 8, 0);
|
|
}
|
|
|
|
static inline void
|
|
vmxnet3_disable_interrupt (vmxnet3_device_t * vd)
|
|
{
|
|
int i;
|
|
vmxnet3_shared *shared = vd->driver_shared;
|
|
|
|
shared->interrupt.control |= VMXNET3_IC_DISABLE_ALL;
|
|
for (i = 0; i < vd->num_intrs; i++)
|
|
vmxnet3_reg_write (vd, 0, VMXNET3_REG_IMR + i * 8, 1);
|
|
}
|
|
|
|
static clib_error_t *
|
|
vmxnet3_rxq_init (vlib_main_t * vm, vmxnet3_device_t * vd, u16 qid, u16 qsz)
|
|
{
|
|
vmxnet3_rxq_t *rxq;
|
|
vmxnet3_rx_stats *rxs;
|
|
u16 rid;
|
|
|
|
vec_validate (vd->rx_stats, qid);
|
|
rxs = vec_elt_at_index (vd->rx_stats, qid);
|
|
clib_memset (rxs, 0, sizeof (*rxs));
|
|
|
|
vec_validate_aligned (vd->rxqs, qid, CLIB_CACHE_LINE_BYTES);
|
|
rxq = vec_elt_at_index (vd->rxqs, qid);
|
|
clib_memset (rxq, 0, sizeof (*rxq));
|
|
rxq->size = qsz;
|
|
rxq->mode = VNET_HW_IF_RX_MODE_POLLING;
|
|
for (rid = 0; rid < VMXNET3_RX_RING_SIZE; rid++)
|
|
{
|
|
rxq->rx_desc[rid] = vlib_physmem_alloc_aligned_on_numa
|
|
(vm, qsz * sizeof (*rxq->rx_desc[rid]), 512, vd->numa_node);
|
|
|
|
if (rxq->rx_desc[rid] == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (rxq->rx_desc[rid], 0, qsz * sizeof (*rxq->rx_desc[rid]));
|
|
}
|
|
rxq->rx_comp =
|
|
vlib_physmem_alloc_aligned_on_numa (vm, qsz * sizeof (*rxq->rx_comp), 512,
|
|
vd->numa_node);
|
|
if (rxq->rx_comp == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (rxq->rx_comp, 0, qsz * sizeof (*rxq->rx_comp));
|
|
for (rid = 0; rid < VMXNET3_RX_RING_SIZE; rid++)
|
|
{
|
|
vmxnet3_rx_ring *ring;
|
|
|
|
ring = &rxq->rx_ring[rid];
|
|
ring->gen = VMXNET3_RXF_GEN;
|
|
ring->rid = rid;
|
|
vec_validate_aligned (ring->bufs, rxq->size, CLIB_CACHE_LINE_BYTES);
|
|
}
|
|
rxq->rx_comp_ring.gen = VMXNET3_RXCF_GEN;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static clib_error_t *
|
|
vmxnet3_txq_init (vlib_main_t * vm, vmxnet3_device_t * vd, u16 qid, u16 qsz)
|
|
{
|
|
vmxnet3_txq_t *txq;
|
|
vmxnet3_tx_stats *txs;
|
|
u32 size;
|
|
|
|
vec_validate_aligned (vd->txqs, qid, CLIB_CACHE_LINE_BYTES);
|
|
txq = vec_elt_at_index (vd->txqs, qid);
|
|
clib_memset (txq, 0, sizeof (*txq));
|
|
clib_spinlock_init (&txq->lock);
|
|
|
|
vec_validate (vd->tx_stats, qid);
|
|
txs = vec_elt_at_index (vd->tx_stats, qid);
|
|
clib_memset (txs, 0, sizeof (*txs));
|
|
|
|
txq->size = qsz;
|
|
txq->reg_txprod = qid * 8 + VMXNET3_REG_TXPROD;
|
|
|
|
size = qsz * sizeof (*txq->tx_desc);
|
|
txq->tx_desc =
|
|
vlib_physmem_alloc_aligned_on_numa (vm, size, 512, vd->numa_node);
|
|
if (txq->tx_desc == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (txq->tx_desc, 0, size);
|
|
|
|
size = qsz * sizeof (*txq->tx_comp);
|
|
txq->tx_comp =
|
|
vlib_physmem_alloc_aligned_on_numa (vm, size, 512, vd->numa_node);
|
|
if (txq->tx_comp == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (txq->tx_comp, 0, size);
|
|
vec_validate_aligned (txq->tx_ring.bufs, txq->size, CLIB_CACHE_LINE_BYTES);
|
|
txq->tx_ring.gen = VMXNET3_TXF_GEN;
|
|
txq->tx_comp_ring.gen = VMXNET3_TXCF_GEN;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static const u8 vmxnet3_rss_key[VMXNET3_RSS_MAX_KEY_SZ] = {
|
|
0x3b, 0x56, 0xd1, 0x56, 0x13, 0x4a, 0xe7, 0xac,
|
|
0xe8, 0x79, 0x09, 0x75, 0xe8, 0x65, 0x79, 0x28,
|
|
0x35, 0x12, 0xb9, 0x56, 0x7c, 0x76, 0x4b, 0x70,
|
|
0xd8, 0x56, 0xa3, 0x18, 0x9b, 0x0a, 0xee, 0xf3,
|
|
0x96, 0xa6, 0x9f, 0x8f, 0x9e, 0x8c, 0x90, 0xc9,
|
|
};
|
|
|
|
static clib_error_t *
|
|
vmxnet3_rss_init (vlib_main_t * vm, vmxnet3_device_t * vd)
|
|
{
|
|
vmxnet3_rss_shared *rss;
|
|
size_t size = sizeof (*rss);
|
|
u8 i;
|
|
|
|
vd->rss = vlib_physmem_alloc_aligned_on_numa (vm, size, 512, vd->numa_node);
|
|
if (vd->rss == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (vd->rss, 0, size);
|
|
rss = vd->rss;
|
|
rss->hash_type =
|
|
VMXNET3_RSS_HASH_TYPE_IPV4 | VMXNET3_RSS_HASH_TYPE_TCP_IPV4 |
|
|
VMXNET3_RSS_HASH_TYPE_IPV6 | VMXNET3_RSS_HASH_TYPE_TCP_IPV6;
|
|
rss->hash_func = VMXNET3_RSS_HASH_FUNC_TOEPLITZ;
|
|
rss->hash_key_sz = VMXNET3_RSS_MAX_KEY_SZ;
|
|
rss->ind_table_sz = VMXNET3_RSS_MAX_IND_TABLE_SZ;
|
|
clib_memcpy (rss->hash_key, vmxnet3_rss_key, VMXNET3_RSS_MAX_KEY_SZ);
|
|
for (i = 0; i < rss->ind_table_sz; i++)
|
|
rss->ind_table[i] = i % vd->num_rx_queues;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static clib_error_t *
|
|
vmxnet3_device_init (vlib_main_t * vm, vmxnet3_device_t * vd,
|
|
vmxnet3_create_if_args_t * args)
|
|
{
|
|
clib_error_t *error = 0;
|
|
u32 ret, i, size;
|
|
|
|
/* Quiesce the device */
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_QUIESCE_DEV);
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_CMD);
|
|
if (ret != 0)
|
|
{
|
|
error = clib_error_return (0, "error on quiescing device rc (%u)", ret);
|
|
return error;
|
|
}
|
|
|
|
/* Reset the device */
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_RESET_DEV);
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_CMD);
|
|
if (ret != 0)
|
|
{
|
|
error = clib_error_return (0, "error on resetting device rc (%u)", ret);
|
|
return error;
|
|
}
|
|
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_VRRS);
|
|
vd->version = count_leading_zeros (ret);
|
|
vd->version = uword_bits - vd->version;
|
|
|
|
if (vd->version == 0)
|
|
{
|
|
error = clib_error_return (0, "unsupported hardware version %u",
|
|
vd->version);
|
|
return error;
|
|
}
|
|
|
|
/* cap support version to 3 */
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_VRRS,
|
|
1 << (clib_min (3, vd->version) - 1));
|
|
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_UVRS);
|
|
if (ret & 1)
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_UVRS, 1);
|
|
else
|
|
{
|
|
error = clib_error_return (0, "unsupported upt version %u", ret);
|
|
return error;
|
|
}
|
|
|
|
/* GSO is only supported for version >= 3 */
|
|
if (args->enable_gso)
|
|
{
|
|
if (vd->version >= 3)
|
|
vd->gso_enable = 1;
|
|
else
|
|
{
|
|
error =
|
|
clib_error_return (0,
|
|
"GSO is not supported because hardware version"
|
|
" is %u. It must be >= 3", vd->version);
|
|
return error;
|
|
}
|
|
}
|
|
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_GET_LINK);
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_CMD);
|
|
if (ret & 1)
|
|
{
|
|
vd->flags |= VMXNET3_DEVICE_F_LINK_UP;
|
|
vd->link_speed = ret >> 16;
|
|
}
|
|
else
|
|
vd->flags &= ~VMXNET3_DEVICE_F_LINK_UP;
|
|
|
|
/* Get the mac address */
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_MACL);
|
|
clib_memcpy (vd->mac_addr, &ret, 4);
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_MACH);
|
|
clib_memcpy (vd->mac_addr + 4, &ret, 2);
|
|
|
|
size = sizeof (vmxnet3_rx_queue) * vd->num_rx_queues +
|
|
sizeof (vmxnet3_tx_queue) * vd->num_tx_queues;
|
|
|
|
vd->queues =
|
|
vlib_physmem_alloc_aligned_on_numa (vm, size, 512, vd->numa_node);
|
|
if (vd->queues == 0)
|
|
return vlib_physmem_last_error (vm);
|
|
|
|
clib_memset (vd->queues, 0, size);
|
|
|
|
if (vd->num_rx_queues > 1)
|
|
{
|
|
error = vmxnet3_rss_init (vm, vd);
|
|
if (error)
|
|
return error;
|
|
}
|
|
|
|
for (i = 0; i < vd->num_rx_queues; i++)
|
|
{
|
|
error = vmxnet3_rxq_init (vm, vd, i, args->rxq_size);
|
|
if (error)
|
|
return error;
|
|
}
|
|
|
|
for (i = 0; i < vd->num_tx_queues; i++)
|
|
{
|
|
error = vmxnet3_txq_init (vm, vd, i, args->txq_size);
|
|
if (error)
|
|
return error;
|
|
}
|
|
|
|
error = vmxnet3_provision_driver_shared (vm, vd);
|
|
if (error)
|
|
return error;
|
|
|
|
vmxnet3_write_mac (vd);
|
|
|
|
/* Activate device */
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_ACTIVATE_DEV);
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_CMD);
|
|
if (ret != 0)
|
|
{
|
|
error =
|
|
clib_error_return (0, "error on activating device rc (%u)", ret);
|
|
return error;
|
|
}
|
|
|
|
return error;
|
|
}
|
|
|
|
static void
|
|
vmxnet3_rxq_irq_handler (vlib_main_t * vm, vlib_pci_dev_handle_t h, u16 line)
|
|
{
|
|
vnet_main_t *vnm = vnet_get_main ();
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
uword pd = vlib_pci_get_private_data (vm, h);
|
|
vmxnet3_device_t *vd = pool_elt_at_index (vmxm->devices, pd);
|
|
u16 qid = line;
|
|
vmxnet3_rxq_t *rxq = vec_elt_at_index (vd->rxqs, qid);
|
|
|
|
if (vec_len (vd->rxqs) > qid && (rxq->mode != VNET_HW_IF_RX_MODE_POLLING))
|
|
{
|
|
vmxnet3_per_thread_data_t *ptd =
|
|
vec_elt_at_index (vmxm->per_thread_data, rxq->thread_index);
|
|
if (ptd->polling_q_count == 0)
|
|
vnet_hw_if_rx_queue_set_int_pending (vnm, rxq->queue_index);
|
|
}
|
|
}
|
|
|
|
static void
|
|
vmxnet3_event_irq_handler (vlib_main_t * vm, vlib_pci_dev_handle_t h,
|
|
u16 line)
|
|
{
|
|
vnet_main_t *vnm = vnet_get_main ();
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
uword pd = vlib_pci_get_private_data (vm, h);
|
|
vmxnet3_device_t *vd = pool_elt_at_index (vmxm->devices, pd);
|
|
u32 ret;
|
|
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_GET_LINK);
|
|
ret = vmxnet3_reg_read (vd, 1, VMXNET3_REG_CMD);
|
|
if (ret & 1)
|
|
{
|
|
vd->flags |= VMXNET3_DEVICE_F_LINK_UP;
|
|
vd->link_speed = ret >> 16;
|
|
vnet_hw_interface_set_link_speed (
|
|
vnm, vd->hw_if_index,
|
|
(vd->link_speed == UINT32_MAX) ? UINT32_MAX : vd->link_speed * 1000);
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index,
|
|
VNET_HW_INTERFACE_FLAG_LINK_UP);
|
|
}
|
|
else
|
|
{
|
|
vd->flags &= ~VMXNET3_DEVICE_F_LINK_UP;
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index, 0);
|
|
}
|
|
}
|
|
|
|
static u8
|
|
vmxnet3_queue_size_valid (u16 qsz)
|
|
{
|
|
if (qsz < 64 || qsz > 4096)
|
|
return 0;
|
|
if ((qsz % 64) != 0)
|
|
return 0;
|
|
return 1;
|
|
}
|
|
|
|
static u8
|
|
vmxnet3_tx_queue_num_valid (u16 num)
|
|
{
|
|
vlib_thread_main_t *tm = vlib_get_thread_main ();
|
|
|
|
if ((num > VMXNET3_TXQ_MAX) || (num > tm->n_vlib_mains))
|
|
return 0;
|
|
return 1;
|
|
}
|
|
|
|
static u8
|
|
vmxnet3_rx_queue_num_valid (u16 num)
|
|
{
|
|
if (num > VMXNET3_RXQ_MAX)
|
|
return 0;
|
|
return 1;
|
|
}
|
|
|
|
void
|
|
vmxnet3_create_if (vlib_main_t * vm, vmxnet3_create_if_args_t * args)
|
|
{
|
|
vnet_main_t *vnm = vnet_get_main ();
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
vnet_eth_interface_registration_t eir = {};
|
|
|
|
vmxnet3_device_t *vd;
|
|
vlib_pci_dev_handle_t h;
|
|
vnet_hw_if_caps_change_t cc = {};
|
|
clib_error_t *error = 0;
|
|
u16 qid;
|
|
u32 num_intr;
|
|
|
|
if (args->txq_num == 0)
|
|
args->txq_num = 1;
|
|
if (args->rxq_num == 0)
|
|
args->rxq_num = 1;
|
|
if (!vmxnet3_rx_queue_num_valid (args->rxq_num))
|
|
{
|
|
args->rv = VNET_API_ERROR_INVALID_VALUE;
|
|
args->error =
|
|
clib_error_return (error, "number of rx queues must be <= %u",
|
|
VMXNET3_RXQ_MAX);
|
|
vlib_log (VLIB_LOG_LEVEL_ERR, vmxm->log_default, "%U: %s",
|
|
format_vlib_pci_addr, &args->addr,
|
|
"number of rx queues must be <= %u", VMXNET3_RXQ_MAX);
|
|
return;
|
|
}
|
|
|
|
if (!vmxnet3_tx_queue_num_valid (args->txq_num))
|
|
{
|
|
args->rv = VNET_API_ERROR_INVALID_VALUE;
|
|
args->error =
|
|
clib_error_return (error,
|
|
"number of tx queues must be <= %u and <= number of "
|
|
"CPU's assigned to VPP", VMXNET3_TXQ_MAX);
|
|
vlib_log (VLIB_LOG_LEVEL_ERR, vmxm->log_default, "%U: %s",
|
|
format_vlib_pci_addr, &args->addr,
|
|
"number of tx queues must be <= %u and <= number of "
|
|
"CPU's assigned to VPP", VMXNET3_TXQ_MAX);
|
|
return;
|
|
}
|
|
if (args->rxq_size == 0)
|
|
args->rxq_size = VMXNET3_NUM_RX_DESC;
|
|
if (args->txq_size == 0)
|
|
args->txq_size = VMXNET3_NUM_TX_DESC;
|
|
|
|
if (!vmxnet3_queue_size_valid (args->rxq_size) ||
|
|
!vmxnet3_queue_size_valid (args->txq_size))
|
|
{
|
|
args->rv = VNET_API_ERROR_INVALID_VALUE;
|
|
args->error =
|
|
clib_error_return (error,
|
|
"queue size must be <= 4096, >= 64, "
|
|
"and multiples of 64");
|
|
vlib_log (VLIB_LOG_LEVEL_ERR, vmxm->log_default, "%U: %s",
|
|
format_vlib_pci_addr, &args->addr,
|
|
"queue size must be <= 4096, >= 64, and multiples of 64");
|
|
return;
|
|
}
|
|
|
|
pool_foreach (vd, vmxm->devices) {
|
|
if (vd->pci_addr.as_u32 == args->addr.as_u32)
|
|
{
|
|
args->rv = VNET_API_ERROR_ADDRESS_IN_USE;
|
|
args->error =
|
|
clib_error_return (error, "%U: %s", format_vlib_pci_addr,
|
|
&args->addr, "pci address in use");
|
|
vlib_log (VLIB_LOG_LEVEL_ERR, vmxm->log_default, "%U: %s",
|
|
format_vlib_pci_addr, &args->addr, "pci address in use");
|
|
return;
|
|
}
|
|
}
|
|
|
|
if (args->bind)
|
|
{
|
|
error = vlib_pci_bind_to_uio (vm, &args->addr, (char *) "auto",
|
|
VMXNET3_BIND_FORCE == args->bind);
|
|
if (error)
|
|
{
|
|
args->rv = VNET_API_ERROR_INVALID_INTERFACE;
|
|
args->error =
|
|
clib_error_return (error, "%U: %s", format_vlib_pci_addr,
|
|
&args->addr,
|
|
"error encountered on binding pci device");
|
|
vlib_log (VLIB_LOG_LEVEL_ERR, vmxm->log_default, "%U: %s",
|
|
format_vlib_pci_addr, &args->addr,
|
|
"error encountered on binding pci devicee");
|
|
return;
|
|
}
|
|
}
|
|
|
|
if ((error =
|
|
vlib_pci_device_open (vm, &args->addr, vmxnet3_pci_device_ids, &h)))
|
|
{
|
|
args->rv = VNET_API_ERROR_INVALID_INTERFACE;
|
|
args->error =
|
|
clib_error_return (error, "%U: %s", format_vlib_pci_addr,
|
|
&args->addr,
|
|
"error encountered on pci device open");
|
|
vlib_log (VLIB_LOG_LEVEL_ERR, vmxm->log_default, "%U: %s",
|
|
format_vlib_pci_addr, &args->addr,
|
|
"error encountered on pci device open");
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* Do not use vmxnet3_log_error prior to this line since the macro
|
|
* references vd->pci_dev_handle
|
|
*/
|
|
pool_get (vmxm->devices, vd);
|
|
vd->num_tx_queues = args->txq_num;
|
|
vd->num_rx_queues = args->rxq_num;
|
|
vd->dev_instance = vd - vmxm->devices;
|
|
vd->per_interface_next_index = ~0;
|
|
vd->pci_addr = args->addr;
|
|
|
|
if (args->enable_elog)
|
|
vd->flags |= VMXNET3_DEVICE_F_ELOG;
|
|
|
|
vd->pci_dev_handle = h;
|
|
vd->numa_node = vlib_pci_get_numa_node (vm, h);
|
|
vd->num_intrs = vd->num_rx_queues + 1; // +1 for the event interrupt
|
|
|
|
vlib_pci_set_private_data (vm, h, vd->dev_instance);
|
|
|
|
if ((error = vlib_pci_bus_master_enable (vm, h)))
|
|
{
|
|
vmxnet3_log_error (vd, "error encountered on pci bus master enable");
|
|
goto error;
|
|
}
|
|
|
|
if ((error = vlib_pci_map_region (vm, h, 0, (void **) &vd->bar[0])))
|
|
{
|
|
vmxnet3_log_error (vd, "error encountered on pci map region for bar 0");
|
|
goto error;
|
|
}
|
|
|
|
if ((error = vlib_pci_map_region (vm, h, 1, (void **) &vd->bar[1])))
|
|
{
|
|
vmxnet3_log_error (vd, "error encountered on pci map region for bar 1");
|
|
goto error;
|
|
}
|
|
|
|
num_intr = vlib_pci_get_num_msix_interrupts (vm, h);
|
|
if (num_intr < vd->num_rx_queues + 1)
|
|
{
|
|
vmxnet3_log_error (vd,
|
|
"No sufficient interrupt lines (%u) for rx queues",
|
|
num_intr);
|
|
error =
|
|
clib_error_return (0,
|
|
"No sufficient interrupt lines (%u) for rx queues",
|
|
num_intr);
|
|
goto error;
|
|
}
|
|
if ((error = vlib_pci_register_msix_handler (vm, h, 0, vd->num_rx_queues,
|
|
&vmxnet3_rxq_irq_handler)))
|
|
{
|
|
vmxnet3_log_error (vd,
|
|
"error encountered on pci register msix handler 0");
|
|
goto error;
|
|
}
|
|
|
|
if ((error = vlib_pci_register_msix_handler (vm, h, vd->num_rx_queues, 1,
|
|
&vmxnet3_event_irq_handler)))
|
|
{
|
|
vmxnet3_log_error (vd,
|
|
"error encountered on pci register msix handler 1");
|
|
goto error;
|
|
}
|
|
|
|
if ((error = vlib_pci_enable_msix_irq (vm, h, 0, vd->num_rx_queues + 1)))
|
|
{
|
|
vmxnet3_log_error (vd, "error encountered on pci enable msix irq");
|
|
goto error;
|
|
}
|
|
|
|
if ((error = vlib_pci_intr_enable (vm, h)))
|
|
{
|
|
vmxnet3_log_error (vd, "error encountered on pci interrupt enable");
|
|
goto error;
|
|
}
|
|
|
|
if ((error = vmxnet3_device_init (vm, vd, args)))
|
|
{
|
|
vmxnet3_log_error (vd, "error encountered on device init");
|
|
goto error;
|
|
}
|
|
|
|
/* create interface */
|
|
eir.dev_class_index = vmxnet3_device_class.index;
|
|
eir.dev_instance = vd->dev_instance;
|
|
eir.address = vd->mac_addr;
|
|
eir.cb.flag_change = vmxnet3_flag_change;
|
|
vd->hw_if_index = vnet_eth_register_interface (vnm, &eir);
|
|
|
|
vnet_sw_interface_t *sw = vnet_get_hw_sw_interface (vnm, vd->hw_if_index);
|
|
vd->sw_if_index = sw->sw_if_index;
|
|
args->sw_if_index = sw->sw_if_index;
|
|
|
|
cc.mask = VNET_HW_IF_CAP_INT_MODE | VNET_HW_IF_CAP_TCP_GSO |
|
|
VNET_HW_IF_CAP_TX_TCP_CKSUM | VNET_HW_IF_CAP_TX_UDP_CKSUM;
|
|
if (vd->gso_enable)
|
|
cc.val = cc.mask;
|
|
else
|
|
cc.val = VNET_HW_IF_CAP_INT_MODE;
|
|
|
|
vnet_hw_if_change_caps (vnm, vd->hw_if_index, &cc);
|
|
|
|
vnet_hw_if_set_input_node (vnm, vd->hw_if_index, vmxnet3_input_node.index);
|
|
/* Disable interrupts */
|
|
vmxnet3_disable_interrupt (vd);
|
|
vec_foreach_index (qid, vd->rxqs)
|
|
{
|
|
vmxnet3_rxq_t *rxq = vec_elt_at_index (vd->rxqs, qid);
|
|
u32 qi, fi;
|
|
vmxnet3_per_thread_data_t *ptd;
|
|
|
|
qi = vnet_hw_if_register_rx_queue (vnm, vd->hw_if_index, qid,
|
|
VNET_HW_IF_RXQ_THREAD_ANY);
|
|
fi = vlib_pci_get_msix_file_index (vm, vd->pci_dev_handle, qid);
|
|
vnet_hw_if_set_rx_queue_file_index (vnm, qi, fi);
|
|
rxq->queue_index = qi;
|
|
rxq->thread_index =
|
|
vnet_hw_if_get_rx_queue_thread_index (vnm, rxq->queue_index);
|
|
if (rxq->mode == VNET_HW_IF_RX_MODE_POLLING)
|
|
{
|
|
ptd = vec_elt_at_index (vmxm->per_thread_data, rxq->thread_index);
|
|
ptd->polling_q_count++;
|
|
}
|
|
rxq->buffer_pool_index =
|
|
vnet_hw_if_get_rx_queue_numa_node (vnm, rxq->queue_index);
|
|
vmxnet3_rxq_refill_ring0 (vm, vd, rxq);
|
|
vmxnet3_rxq_refill_ring1 (vm, vd, rxq);
|
|
}
|
|
|
|
vec_foreach_index (qid, vd->txqs)
|
|
{
|
|
vmxnet3_txq_t *txq = vec_elt_at_index (vd->txqs, qid);
|
|
txq->queue_index =
|
|
vnet_hw_if_register_tx_queue (vnm, vd->hw_if_index, qid);
|
|
}
|
|
for (u32 i = 0; i < vlib_get_n_threads (); i++)
|
|
{
|
|
u32 qi = vd->txqs[i % vd->num_tx_queues].queue_index;
|
|
vnet_hw_if_tx_queue_assign_thread (vnm, qi, i);
|
|
}
|
|
vnet_hw_if_update_runtime_data (vnm, vd->hw_if_index);
|
|
|
|
vd->flags |= VMXNET3_DEVICE_F_INITIALIZED;
|
|
vmxnet3_enable_interrupt (vd);
|
|
|
|
vnet_hw_interface_set_link_speed (
|
|
vnm, vd->hw_if_index,
|
|
(vd->link_speed == UINT32_MAX) ? UINT32_MAX : vd->link_speed * 1000);
|
|
if (vd->flags & VMXNET3_DEVICE_F_LINK_UP)
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index,
|
|
VNET_HW_INTERFACE_FLAG_LINK_UP);
|
|
else
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index, 0);
|
|
return;
|
|
|
|
error:
|
|
vmxnet3_delete_if (vm, vd);
|
|
args->rv = VNET_API_ERROR_INVALID_INTERFACE;
|
|
args->error = error;
|
|
}
|
|
|
|
void
|
|
vmxnet3_delete_if (vlib_main_t * vm, vmxnet3_device_t * vd)
|
|
{
|
|
vnet_main_t *vnm = vnet_get_main ();
|
|
vmxnet3_main_t *vmxm = &vmxnet3_main;
|
|
u32 i, bi;
|
|
u16 desc_idx;
|
|
|
|
/* Quiesce the device */
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_QUIESCE_DEV);
|
|
|
|
/* Reset the device */
|
|
vmxnet3_reg_write (vd, 1, VMXNET3_REG_CMD, VMXNET3_CMD_RESET_DEV);
|
|
|
|
if (vd->hw_if_index)
|
|
{
|
|
vnet_hw_interface_set_flags (vnm, vd->hw_if_index, 0);
|
|
ethernet_delete_interface (vnm, vd->hw_if_index);
|
|
}
|
|
|
|
vlib_pci_device_close (vm, vd->pci_dev_handle);
|
|
|
|
vec_foreach_index (i, vd->rxqs)
|
|
{
|
|
vmxnet3_rxq_t *rxq = vec_elt_at_index (vd->rxqs, i);
|
|
u16 mask = rxq->size - 1;
|
|
u16 rid;
|
|
vmxnet3_per_thread_data_t *ptd =
|
|
vec_elt_at_index (vmxm->per_thread_data, rxq->thread_index);
|
|
|
|
if (rxq->mode == VNET_HW_IF_RX_MODE_POLLING)
|
|
{
|
|
ASSERT (ptd->polling_q_count != 0);
|
|
ptd->polling_q_count--;
|
|
}
|
|
for (rid = 0; rid < VMXNET3_RX_RING_SIZE; rid++)
|
|
{
|
|
vmxnet3_rx_ring *ring;
|
|
|
|
ring = &rxq->rx_ring[rid];
|
|
desc_idx = (ring->consume + 1) & mask;
|
|
vlib_buffer_free_from_ring (vm, ring->bufs, desc_idx, rxq->size,
|
|
ring->fill);
|
|
vec_free (ring->bufs);
|
|
vlib_physmem_free (vm, rxq->rx_desc[rid]);
|
|
}
|
|
vlib_physmem_free (vm, rxq->rx_comp);
|
|
}
|
|
vec_free (vd->rxqs);
|
|
vec_free (vd->rx_stats);
|
|
|
|
vec_foreach_index (i, vd->txqs)
|
|
{
|
|
vmxnet3_txq_t *txq = vec_elt_at_index (vd->txqs, i);
|
|
u16 mask = txq->size - 1;
|
|
u16 end_idx;
|
|
|
|
desc_idx = txq->tx_ring.consume;
|
|
end_idx = txq->tx_ring.produce;
|
|
while (desc_idx != end_idx)
|
|
{
|
|
bi = txq->tx_ring.bufs[desc_idx];
|
|
vlib_buffer_free_no_next (vm, &bi, 1);
|
|
desc_idx++;
|
|
desc_idx &= mask;
|
|
}
|
|
clib_spinlock_free (&txq->lock);
|
|
vec_free (txq->tx_ring.bufs);
|
|
vlib_physmem_free (vm, txq->tx_desc);
|
|
vlib_physmem_free (vm, txq->tx_comp);
|
|
}
|
|
vec_free (vd->txqs);
|
|
vec_free (vd->tx_stats);
|
|
|
|
vlib_physmem_free (vm, vd->driver_shared);
|
|
vlib_physmem_free (vm, vd->queues);
|
|
vlib_physmem_free (vm, vd->rss);
|
|
|
|
clib_error_free (vd->error);
|
|
clib_memset (vd, 0, sizeof (*vd));
|
|
pool_put (vmxm->devices, vd);
|
|
|
|
}
|
|
|
|
/*
|
|
* fd.io coding-style-patch-verification: ON
|
|
*
|
|
* Local Variables:
|
|
* eval: (c-set-style "gnu")
|
|
* End:
|
|
*/
|