f-stack/dpdk/drivers/net/gve/gve_ethdev.c

694 lines
16 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright(C) 2022 Intel Corporation
*/
#include "gve_ethdev.h"
#include "base/gve_adminq.h"
#include "base/gve_register.h"
#include "rte_ether.h"
const char gve_version_str[] = GVE_VERSION;
static const char gve_version_prefix[] = GVE_VERSION_PREFIX;
static void
gve_write_version(uint8_t *driver_version_register)
{
const char *c = gve_version_prefix;
while (*c) {
writeb(*c, driver_version_register);
c++;
}
c = gve_version_str;
while (*c) {
writeb(*c, driver_version_register);
c++;
}
writeb('\n', driver_version_register);
}
static int
gve_alloc_queue_page_list(struct gve_priv *priv, uint32_t id, uint32_t pages)
{
char z_name[RTE_MEMZONE_NAMESIZE];
struct gve_queue_page_list *qpl;
const struct rte_memzone *mz;
dma_addr_t page_bus;
uint32_t i;
if (priv->num_registered_pages + pages >
priv->max_registered_pages) {
PMD_DRV_LOG(ERR, "Pages %" PRIu64 " > max registered pages %" PRIu64,
priv->num_registered_pages + pages,
priv->max_registered_pages);
return -EINVAL;
}
qpl = &priv->qpl[id];
snprintf(z_name, sizeof(z_name), "gve_%s_qpl%d", priv->pci_dev->device.name, id);
mz = rte_memzone_reserve_aligned(z_name, pages * PAGE_SIZE,
rte_socket_id(),
RTE_MEMZONE_IOVA_CONTIG, PAGE_SIZE);
if (mz == NULL) {
PMD_DRV_LOG(ERR, "Failed to alloc %s.", z_name);
return -ENOMEM;
}
qpl->page_buses = rte_zmalloc("qpl page buses", pages * sizeof(dma_addr_t), 0);
if (qpl->page_buses == NULL) {
PMD_DRV_LOG(ERR, "Failed to alloc qpl %u page buses", id);
return -ENOMEM;
}
page_bus = mz->iova;
for (i = 0; i < pages; i++) {
qpl->page_buses[i] = page_bus;
page_bus += PAGE_SIZE;
}
qpl->id = id;
qpl->mz = mz;
qpl->num_entries = pages;
priv->num_registered_pages += pages;
return 0;
}
static void
gve_free_qpls(struct gve_priv *priv)
{
uint16_t nb_txqs = priv->max_nb_txq;
uint16_t nb_rxqs = priv->max_nb_rxq;
uint32_t i;
for (i = 0; i < nb_txqs + nb_rxqs; i++) {
if (priv->qpl[i].mz != NULL)
rte_memzone_free(priv->qpl[i].mz);
rte_free(priv->qpl[i].page_buses);
}
rte_free(priv->qpl);
}
static int
gve_dev_configure(struct rte_eth_dev *dev)
{
struct gve_priv *priv = dev->data->dev_private;
if (dev->data->dev_conf.rxmode.mq_mode & RTE_ETH_MQ_RX_RSS_FLAG)
dev->data->dev_conf.rxmode.offloads |= RTE_ETH_RX_OFFLOAD_RSS_HASH;
if (dev->data->dev_conf.rxmode.offloads & RTE_ETH_RX_OFFLOAD_TCP_LRO)
priv->enable_rsc = 1;
return 0;
}
static int
gve_refill_pages(struct gve_rx_queue *rxq)
{
struct rte_mbuf *nmb;
uint16_t i;
int diag;
diag = rte_pktmbuf_alloc_bulk(rxq->mpool, &rxq->sw_ring[0], rxq->nb_rx_desc);
if (diag < 0) {
for (i = 0; i < rxq->nb_rx_desc - 1; i++) {
nmb = rte_pktmbuf_alloc(rxq->mpool);
if (!nmb)
break;
rxq->sw_ring[i] = nmb;
}
if (i < rxq->nb_rx_desc - 1)
return -ENOMEM;
}
rxq->nb_avail = 0;
rxq->next_avail = rxq->nb_rx_desc - 1;
for (i = 0; i < rxq->nb_rx_desc; i++) {
if (rxq->is_gqi_qpl) {
rxq->rx_data_ring[i].addr = rte_cpu_to_be_64(i * PAGE_SIZE);
} else {
if (i == rxq->nb_rx_desc - 1)
break;
nmb = rxq->sw_ring[i];
rxq->rx_data_ring[i].addr = rte_cpu_to_be_64(rte_mbuf_data_iova(nmb));
}
}
rte_write32(rte_cpu_to_be_32(rxq->next_avail), rxq->qrx_tail);
return 0;
}
static int
gve_link_update(struct rte_eth_dev *dev, __rte_unused int wait_to_complete)
{
struct gve_priv *priv = dev->data->dev_private;
struct rte_eth_link link;
int err;
memset(&link, 0, sizeof(link));
link.link_duplex = RTE_ETH_LINK_FULL_DUPLEX;
link.link_autoneg = RTE_ETH_LINK_AUTONEG;
if (!dev->data->dev_started) {
link.link_status = RTE_ETH_LINK_DOWN;
link.link_speed = RTE_ETH_SPEED_NUM_NONE;
} else {
link.link_status = RTE_ETH_LINK_UP;
PMD_DRV_LOG(DEBUG, "Get link status from hw");
err = gve_adminq_report_link_speed(priv);
if (err) {
PMD_DRV_LOG(ERR, "Failed to get link speed.");
priv->link_speed = RTE_ETH_SPEED_NUM_UNKNOWN;
}
link.link_speed = priv->link_speed;
}
return rte_eth_linkstatus_set(dev, &link);
}
static int
gve_dev_start(struct rte_eth_dev *dev)
{
uint16_t num_queues = dev->data->nb_tx_queues;
struct gve_priv *priv = dev->data->dev_private;
struct gve_tx_queue *txq;
struct gve_rx_queue *rxq;
uint16_t i;
int err;
priv->txqs = (struct gve_tx_queue **)dev->data->tx_queues;
err = gve_adminq_create_tx_queues(priv, num_queues);
if (err) {
PMD_DRV_LOG(ERR, "failed to create %u tx queues.", num_queues);
return err;
}
for (i = 0; i < num_queues; i++) {
txq = priv->txqs[i];
txq->qtx_tail =
&priv->db_bar2[rte_be_to_cpu_32(txq->qres->db_index)];
txq->qtx_head =
&priv->cnt_array[rte_be_to_cpu_32(txq->qres->counter_index)];
rte_write32(rte_cpu_to_be_32(GVE_IRQ_MASK), txq->ntfy_addr);
}
num_queues = dev->data->nb_rx_queues;
priv->rxqs = (struct gve_rx_queue **)dev->data->rx_queues;
err = gve_adminq_create_rx_queues(priv, num_queues);
if (err) {
PMD_DRV_LOG(ERR, "failed to create %u rx queues.", num_queues);
goto err_tx;
}
for (i = 0; i < num_queues; i++) {
rxq = priv->rxqs[i];
rxq->qrx_tail =
&priv->db_bar2[rte_be_to_cpu_32(rxq->qres->db_index)];
rte_write32(rte_cpu_to_be_32(GVE_IRQ_MASK), rxq->ntfy_addr);
err = gve_refill_pages(rxq);
if (err) {
PMD_DRV_LOG(ERR, "Failed to refill for RX");
goto err_rx;
}
}
dev->data->dev_started = 1;
gve_link_update(dev, 0);
return 0;
err_rx:
gve_stop_rx_queues(dev);
err_tx:
gve_stop_tx_queues(dev);
return err;
}
static int
gve_dev_stop(struct rte_eth_dev *dev)
{
dev->data->dev_link.link_status = RTE_ETH_LINK_DOWN;
gve_stop_tx_queues(dev);
gve_stop_rx_queues(dev);
dev->data->dev_started = 0;
return 0;
}
static int
gve_dev_close(struct rte_eth_dev *dev)
{
struct gve_priv *priv = dev->data->dev_private;
int err = 0;
uint16_t i;
if (dev->data->dev_started) {
err = gve_dev_stop(dev);
if (err != 0)
PMD_DRV_LOG(ERR, "Failed to stop dev.");
}
for (i = 0; i < dev->data->nb_tx_queues; i++)
gve_tx_queue_release(dev, i);
for (i = 0; i < dev->data->nb_rx_queues; i++)
gve_rx_queue_release(dev, i);
gve_free_qpls(priv);
rte_free(priv->adminq);
dev->data->mac_addrs = NULL;
return err;
}
static int
gve_dev_info_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *dev_info)
{
struct gve_priv *priv = dev->data->dev_private;
dev_info->device = dev->device;
dev_info->max_mac_addrs = 1;
dev_info->max_rx_queues = priv->max_nb_rxq;
dev_info->max_tx_queues = priv->max_nb_txq;
dev_info->min_rx_bufsize = GVE_RX_MIN_BUF_SIZE_GQI;
dev_info->max_rx_pktlen = priv->max_mtu + RTE_ETHER_HDR_LEN;
dev_info->max_mtu = priv->max_mtu;
dev_info->min_mtu = RTE_ETHER_MIN_MTU;
dev_info->rx_offload_capa = 0;
dev_info->tx_offload_capa =
RTE_ETH_TX_OFFLOAD_MULTI_SEGS |
RTE_ETH_TX_OFFLOAD_UDP_CKSUM |
RTE_ETH_TX_OFFLOAD_TCP_CKSUM |
RTE_ETH_TX_OFFLOAD_SCTP_CKSUM |
RTE_ETH_TX_OFFLOAD_TCP_TSO;
if (priv->queue_format == GVE_DQO_RDA_FORMAT)
dev_info->rx_offload_capa |= RTE_ETH_RX_OFFLOAD_TCP_LRO;
dev_info->default_rxconf = (struct rte_eth_rxconf) {
.rx_free_thresh = GVE_DEFAULT_RX_FREE_THRESH,
.rx_drop_en = 0,
.offloads = 0,
};
dev_info->default_txconf = (struct rte_eth_txconf) {
.tx_free_thresh = GVE_DEFAULT_TX_FREE_THRESH,
.offloads = 0,
};
dev_info->default_rxportconf.ring_size = priv->rx_desc_cnt;
dev_info->rx_desc_lim = (struct rte_eth_desc_lim) {
.nb_max = priv->rx_desc_cnt,
.nb_min = priv->rx_desc_cnt,
.nb_align = 1,
};
dev_info->default_txportconf.ring_size = priv->tx_desc_cnt;
dev_info->tx_desc_lim = (struct rte_eth_desc_lim) {
.nb_max = priv->tx_desc_cnt,
.nb_min = priv->tx_desc_cnt,
.nb_align = 1,
};
return 0;
}
static int
gve_dev_mtu_set(struct rte_eth_dev *dev, uint16_t mtu)
{
struct gve_priv *priv = dev->data->dev_private;
int err;
if (mtu < RTE_ETHER_MIN_MTU || mtu > priv->max_mtu) {
PMD_DRV_LOG(ERR, "MIN MTU is %u, MAX MTU is %u",
RTE_ETHER_MIN_MTU, priv->max_mtu);
return -EINVAL;
}
/* mtu setting is forbidden if port is start */
if (dev->data->dev_started) {
PMD_DRV_LOG(ERR, "Port must be stopped before configuration");
return -EBUSY;
}
err = gve_adminq_set_mtu(priv, mtu);
if (err) {
PMD_DRV_LOG(ERR, "Failed to set mtu as %u err = %d", mtu, err);
return err;
}
return 0;
}
static const struct eth_dev_ops gve_eth_dev_ops = {
.dev_configure = gve_dev_configure,
.dev_start = gve_dev_start,
.dev_stop = gve_dev_stop,
.dev_close = gve_dev_close,
.dev_infos_get = gve_dev_info_get,
.rx_queue_setup = gve_rx_queue_setup,
.tx_queue_setup = gve_tx_queue_setup,
.rx_queue_release = gve_rx_queue_release,
.tx_queue_release = gve_tx_queue_release,
.link_update = gve_link_update,
.mtu_set = gve_dev_mtu_set,
};
static void
gve_free_counter_array(struct gve_priv *priv)
{
rte_memzone_free(priv->cnt_array_mz);
priv->cnt_array = NULL;
}
static void
gve_free_irq_db(struct gve_priv *priv)
{
rte_memzone_free(priv->irq_dbs_mz);
priv->irq_dbs = NULL;
}
static void
gve_teardown_device_resources(struct gve_priv *priv)
{
int err;
/* Tell device its resources are being freed */
if (gve_get_device_resources_ok(priv)) {
err = gve_adminq_deconfigure_device_resources(priv);
if (err)
PMD_DRV_LOG(ERR, "Could not deconfigure device resources: err=%d", err);
}
gve_free_counter_array(priv);
gve_free_irq_db(priv);
gve_clear_device_resources_ok(priv);
}
static uint8_t
pci_dev_find_capability(struct rte_pci_device *pdev, int cap)
{
uint8_t pos, id;
uint16_t ent;
int loops;
int ret;
ret = rte_pci_read_config(pdev, &pos, sizeof(pos), PCI_CAPABILITY_LIST);
if (ret != sizeof(pos))
return 0;
loops = (PCI_CFG_SPACE_SIZE - PCI_STD_HEADER_SIZEOF) / PCI_CAP_SIZEOF;
while (pos && loops--) {
ret = rte_pci_read_config(pdev, &ent, sizeof(ent), pos);
if (ret != sizeof(ent))
return 0;
id = ent & 0xff;
if (id == 0xff)
break;
if (id == cap)
return pos;
pos = (ent >> 8);
}
return 0;
}
static int
pci_dev_msix_vec_count(struct rte_pci_device *pdev)
{
uint8_t msix_cap = pci_dev_find_capability(pdev, PCI_CAP_ID_MSIX);
uint16_t control;
int ret;
if (!msix_cap)
return 0;
ret = rte_pci_read_config(pdev, &control, sizeof(control), msix_cap + PCI_MSIX_FLAGS);
if (ret != sizeof(control))
return 0;
return (control & PCI_MSIX_FLAGS_QSIZE) + 1;
}
static int
gve_setup_device_resources(struct gve_priv *priv)
{
char z_name[RTE_MEMZONE_NAMESIZE];
const struct rte_memzone *mz;
int err = 0;
snprintf(z_name, sizeof(z_name), "gve_%s_cnt_arr", priv->pci_dev->device.name);
mz = rte_memzone_reserve_aligned(z_name,
priv->num_event_counters * sizeof(*priv->cnt_array),
rte_socket_id(), RTE_MEMZONE_IOVA_CONTIG,
PAGE_SIZE);
if (mz == NULL) {
PMD_DRV_LOG(ERR, "Could not alloc memzone for count array");
return -ENOMEM;
}
priv->cnt_array = (rte_be32_t *)mz->addr;
priv->cnt_array_mz = mz;
snprintf(z_name, sizeof(z_name), "gve_%s_irqmz", priv->pci_dev->device.name);
mz = rte_memzone_reserve_aligned(z_name,
sizeof(*priv->irq_dbs) * (priv->num_ntfy_blks),
rte_socket_id(), RTE_MEMZONE_IOVA_CONTIG,
PAGE_SIZE);
if (mz == NULL) {
PMD_DRV_LOG(ERR, "Could not alloc memzone for irq_dbs");
err = -ENOMEM;
goto free_cnt_array;
}
priv->irq_dbs = (struct gve_irq_db *)mz->addr;
priv->irq_dbs_mz = mz;
err = gve_adminq_configure_device_resources(priv,
priv->cnt_array_mz->iova,
priv->num_event_counters,
priv->irq_dbs_mz->iova,
priv->num_ntfy_blks);
if (unlikely(err)) {
PMD_DRV_LOG(ERR, "Could not config device resources: err=%d", err);
goto free_irq_dbs;
}
return 0;
free_irq_dbs:
gve_free_irq_db(priv);
free_cnt_array:
gve_free_counter_array(priv);
return err;
}
static int
gve_init_priv(struct gve_priv *priv, bool skip_describe_device)
{
uint16_t pages;
int num_ntfy;
uint32_t i;
int err;
/* Set up the adminq */
err = gve_adminq_alloc(priv);
if (err) {
PMD_DRV_LOG(ERR, "Failed to alloc admin queue: err=%d", err);
return err;
}
if (skip_describe_device)
goto setup_device;
/* Get the initial information we need from the device */
err = gve_adminq_describe_device(priv);
if (err) {
PMD_DRV_LOG(ERR, "Could not get device information: err=%d", err);
goto free_adminq;
}
num_ntfy = pci_dev_msix_vec_count(priv->pci_dev);
if (num_ntfy <= 0) {
PMD_DRV_LOG(ERR, "Could not count MSI-x vectors");
err = -EIO;
goto free_adminq;
} else if (num_ntfy < GVE_MIN_MSIX) {
PMD_DRV_LOG(ERR, "GVE needs at least %d MSI-x vectors, but only has %d",
GVE_MIN_MSIX, num_ntfy);
err = -EINVAL;
goto free_adminq;
}
priv->num_registered_pages = 0;
/* gvnic has one Notification Block per MSI-x vector, except for the
* management vector
*/
priv->num_ntfy_blks = (num_ntfy - 1) & ~0x1;
priv->mgmt_msix_idx = priv->num_ntfy_blks;
priv->max_nb_txq = RTE_MIN(priv->max_nb_txq, priv->num_ntfy_blks / 2);
priv->max_nb_rxq = RTE_MIN(priv->max_nb_rxq, priv->num_ntfy_blks / 2);
if (priv->default_num_queues > 0) {
priv->max_nb_txq = RTE_MIN(priv->default_num_queues, priv->max_nb_txq);
priv->max_nb_rxq = RTE_MIN(priv->default_num_queues, priv->max_nb_rxq);
}
PMD_DRV_LOG(INFO, "Max TX queues %d, Max RX queues %d",
priv->max_nb_txq, priv->max_nb_rxq);
/* In GQI_QPL queue format:
* Allocate queue page lists according to max queue number
* tx qpl id should start from 0 while rx qpl id should start
* from priv->max_nb_txq
*/
if (priv->queue_format == GVE_GQI_QPL_FORMAT) {
priv->qpl = rte_zmalloc("gve_qpl",
(priv->max_nb_txq + priv->max_nb_rxq) *
sizeof(struct gve_queue_page_list), 0);
if (priv->qpl == NULL) {
PMD_DRV_LOG(ERR, "Failed to alloc qpl.");
err = -ENOMEM;
goto free_adminq;
}
for (i = 0; i < priv->max_nb_txq + priv->max_nb_rxq; i++) {
if (i < priv->max_nb_txq)
pages = priv->tx_pages_per_qpl;
else
pages = priv->rx_data_slot_cnt;
err = gve_alloc_queue_page_list(priv, i, pages);
if (err != 0) {
PMD_DRV_LOG(ERR, "Failed to alloc qpl %u.", i);
goto err_qpl;
}
}
}
setup_device:
err = gve_setup_device_resources(priv);
if (!err)
return 0;
err_qpl:
gve_free_qpls(priv);
free_adminq:
gve_adminq_free(priv);
return err;
}
static void
gve_teardown_priv_resources(struct gve_priv *priv)
{
gve_teardown_device_resources(priv);
gve_adminq_free(priv);
}
static int
gve_dev_init(struct rte_eth_dev *eth_dev)
{
struct gve_priv *priv = eth_dev->data->dev_private;
int max_tx_queues, max_rx_queues;
struct rte_pci_device *pci_dev;
struct gve_registers *reg_bar;
rte_be32_t *db_bar;
int err;
eth_dev->dev_ops = &gve_eth_dev_ops;
if (rte_eal_process_type() != RTE_PROC_PRIMARY)
return 0;
pci_dev = RTE_DEV_TO_PCI(eth_dev->device);
reg_bar = pci_dev->mem_resource[GVE_REG_BAR].addr;
if (!reg_bar) {
PMD_DRV_LOG(ERR, "Failed to map pci bar!");
return -ENOMEM;
}
db_bar = pci_dev->mem_resource[GVE_DB_BAR].addr;
if (!db_bar) {
PMD_DRV_LOG(ERR, "Failed to map doorbell bar!");
return -ENOMEM;
}
gve_write_version(&reg_bar->driver_version);
/* Get max queues to alloc etherdev */
max_tx_queues = ioread32be(&reg_bar->max_tx_queues);
max_rx_queues = ioread32be(&reg_bar->max_rx_queues);
priv->reg_bar0 = reg_bar;
priv->db_bar2 = db_bar;
priv->pci_dev = pci_dev;
priv->state_flags = 0x0;
priv->max_nb_txq = max_tx_queues;
priv->max_nb_rxq = max_rx_queues;
err = gve_init_priv(priv, false);
if (err)
return err;
if (gve_is_gqi(priv)) {
eth_dev->rx_pkt_burst = gve_rx_burst;
eth_dev->tx_pkt_burst = gve_tx_burst;
} else {
PMD_DRV_LOG(ERR, "DQO_RDA is not implemented and will be added in the future");
}
eth_dev->data->mac_addrs = &priv->dev_addr;
return 0;
}
static int
gve_dev_uninit(struct rte_eth_dev *eth_dev)
{
struct gve_priv *priv = eth_dev->data->dev_private;
gve_teardown_priv_resources(priv);
eth_dev->data->mac_addrs = NULL;
return 0;
}
static int
gve_pci_probe(__rte_unused struct rte_pci_driver *pci_drv,
struct rte_pci_device *pci_dev)
{
return rte_eth_dev_pci_generic_probe(pci_dev, sizeof(struct gve_priv), gve_dev_init);
}
static int
gve_pci_remove(struct rte_pci_device *pci_dev)
{
return rte_eth_dev_pci_generic_remove(pci_dev, gve_dev_uninit);
}
static const struct rte_pci_id pci_id_gve_map[] = {
{ RTE_PCI_DEVICE(GOOGLE_VENDOR_ID, GVE_DEV_ID) },
{ .device_id = 0 },
};
static struct rte_pci_driver rte_gve_pmd = {
.id_table = pci_id_gve_map,
.drv_flags = RTE_PCI_DRV_NEED_MAPPING,
.probe = gve_pci_probe,
.remove = gve_pci_remove,
};
RTE_PMD_REGISTER_PCI(net_gve, rte_gve_pmd);
RTE_PMD_REGISTER_PCI_TABLE(net_gve, pci_id_gve_map);
RTE_PMD_REGISTER_KMOD_DEP(net_gve, "* igb_uio | vfio-pci");
RTE_LOG_REGISTER_SUFFIX(gve_logtype_driver, driver, NOTICE);