freebsd-dev/sys/dev/gve/gve_utils.c
Shailend Chand 54dfc97b0b Add gve, the driver for Google Virtual NIC (gVNIC)
gVNIC is a virtual network interface designed specifically for
Google Compute Engine (GCE). It is required to support per-VM Tier_1
networking performance, and for using certain VM shapes on GCE.

The NIC supports TSO, Rx and Tx checksum offloads, RSS, and jumbo frames.
It does not currently do hardware LRO, so the software LRO in the host
is used instead.

For each queue, the driver negotiates a set of pages with the NIC to
serve as a fixed bounce buffer; this precludes the use of iflib.

Reviewed-by: 		markj
MFC-after:		2 weeks
Differential Revision: https://reviews.freebsd.org/D39873
2023-06-02 14:31:54 -07:00

/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (c) 2023 Google LLC
 *
 * Redistribution and use in source and binary forms, with or without modification,
 * are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * 3. Neither the name of the copyright holder nor the names of its contributors
 *    may be used to endorse or promote products derived from this software without
 *    specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
 * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
#include "gve.h"
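
/*
 * The gVNIC register and doorbell BARs are big-endian, so these accessors
 * byte-swap between host and device byte order.
 */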
uint32_t
gve_reg_bar_read_4(struct gve_priv *priv, bus_size_t offset)
{
	return (be32toh(bus_read_4(priv->reg_bar, offset)));
}

void
gve_reg_bar_write_4(struct gve_priv *priv, bus_size_t offset, uint32_t val)
{
	bus_write_4(priv->reg_bar, offset, htobe32(val));
}

void
gve_db_bar_write_4(struct gve_priv *priv, bus_size_t offset, uint32_t val)
{
	bus_write_4(priv->db_bar, offset, htobe32(val));
}

void
gve_alloc_counters(counter_u64_t *stat, int num_stats)
{
	int i;

	for (i = 0; i < num_stats; i++)
		stat[i] = counter_u64_alloc(M_WAITOK);
}

void
gve_free_counters(counter_u64_t *stat, int num_stats)
{
	int i;

	for (i = 0; i < num_stats; i++)
		counter_u64_free(stat[i]);
}

/* Currently assumes a single segment. */
static void
gve_dmamap_load_callback(void *arg, bus_dma_segment_t *segs, int nseg,
    int error)
{
	if (error == 0)
		*(bus_addr_t *) arg = segs[0].ds_addr;
}

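/*
 * Creates a single-segment DMA tag, allocates zeroed coherent DMA memory of
 * the given size and alignment, and loads it, recording the kernel virtual
 * and bus addresses in the handle. On failure the handle's tag is left NULL.
 */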
int
gve_dma_alloc_coherent(struct gve_priv *priv, int size, int align,
    struct gve_dma_handle *dma)
{
	int err;
	device_t dev = priv->dev;

	err = bus_dma_tag_create(
	    bus_get_dma_tag(dev),	/* parent */
	    align, 0,			/* alignment, bounds */
	    BUS_SPACE_MAXADDR,		/* lowaddr */
	    BUS_SPACE_MAXADDR,		/* highaddr */
	    NULL, NULL,			/* filter, filterarg */
	    size,			/* maxsize */
	    1,				/* nsegments */
	    size,			/* maxsegsize */
	    BUS_DMA_ALLOCNOW,		/* flags */
	    NULL,			/* lockfunc */
	    NULL,			/* lockarg */
	    &dma->tag);
	if (err != 0) {
		device_printf(dev, "%s: bus_dma_tag_create failed: %d\n",
		    __func__, err);
		goto clear_tag;
	}

	err = bus_dmamem_alloc(dma->tag, (void **) &dma->cpu_addr,
	    BUS_DMA_WAITOK | BUS_DMA_COHERENT | BUS_DMA_ZERO,
	    &dma->map);
	if (err != 0) {
		device_printf(dev, "%s: bus_dmamem_alloc(%ju) failed: %d\n",
		    __func__, (uintmax_t)size, err);
		goto destroy_tag;
	}

	/* An address set by the callback will never be -1 */
	dma->bus_addr = (bus_addr_t)-1;
	err = bus_dmamap_load(dma->tag, dma->map, dma->cpu_addr, size,
	    gve_dmamap_load_callback, &dma->bus_addr, BUS_DMA_NOWAIT);
	if (err != 0 || dma->bus_addr == (bus_addr_t)-1) {
		device_printf(dev, "%s: bus_dmamap_load failed: %d\n",
		    __func__, err);
		goto free_mem;
	}
	return (0);

free_mem:
	bus_dmamem_free(dma->tag, dma->cpu_addr, dma->map);
destroy_tag:
	bus_dma_tag_destroy(dma->tag);
clear_tag:
	dma->tag = NULL;
	return (err);
}

void
gve_dma_free_coherent(struct gve_dma_handle *dma)
{
	bus_dmamap_sync(dma->tag, dma->map,
	    BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
	bus_dmamap_unload(dma->tag, dma->map);
	bus_dmamem_free(dma->tag, dma->cpu_addr, dma->map);
	bus_dma_tag_destroy(dma->tag);
}

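/*
 * Unlike gve_dma_alloc_coherent(), this does not allocate memory: it creates
 * a tag and map for a buffer the caller has already stored in dma->cpu_addr
 * and loads it to obtain the bus address.
 */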
int
gve_dmamap_create(struct gve_priv *priv, int size, int align,
    struct gve_dma_handle *dma)
{
	int err;
	device_t dev = priv->dev;

	err = bus_dma_tag_create(
	    bus_get_dma_tag(dev),	/* parent */
	    align, 0,			/* alignment, bounds */
	    BUS_SPACE_MAXADDR,		/* lowaddr */
	    BUS_SPACE_MAXADDR,		/* highaddr */
	    NULL, NULL,			/* filter, filterarg */
	    size,			/* maxsize */
	    1,				/* nsegments */
	    size,			/* maxsegsize */
	    BUS_DMA_ALLOCNOW,		/* flags */
	    NULL,			/* lockfunc */
	    NULL,			/* lockarg */
	    &dma->tag);
	if (err != 0) {
		device_printf(dev, "%s: bus_dma_tag_create failed: %d\n",
		    __func__, err);
		goto clear_tag;
	}

	err = bus_dmamap_create(dma->tag, BUS_DMA_COHERENT, &dma->map);
	if (err != 0) {
		device_printf(dev, "%s: bus_dmamap_create failed: %d\n",
		    __func__, err);
		goto destroy_tag;
	}

	/* An address set by the callback will never be -1 */
	dma->bus_addr = (bus_addr_t)-1;
	err = bus_dmamap_load(dma->tag, dma->map, dma->cpu_addr, size,
	    gve_dmamap_load_callback, &dma->bus_addr, BUS_DMA_WAITOK);
	if (err != 0 || dma->bus_addr == (bus_addr_t)-1) {
		device_printf(dev, "%s: bus_dmamap_load failed: %d\n",
		    __func__, err);
		goto destroy_map;
	}
	return (0);

destroy_map:
	bus_dmamap_destroy(dma->tag, dma->map);
destroy_tag:
	bus_dma_tag_destroy(dma->tag);
clear_tag:
	dma->tag = NULL;
	return (err);
}

void
gve_dmamap_destroy(struct gve_dma_handle *dma)
{
	bus_dmamap_sync(dma->tag, dma->map,
	    BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
	bus_dmamap_unload(dma->tag, dma->map);
	bus_dmamap_destroy(dma->tag, dma->map);
	bus_dma_tag_destroy(dma->tag);
}

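/*
 * Filter routine for the management vector: all work is deferred to the
 * service taskqueue.
 */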
static int
gve_mgmnt_intr(void *arg)
{
	struct gve_priv *priv = arg;

	taskqueue_enqueue(priv->service_tq, &priv->service_task);
	return (FILTER_HANDLED);
}

void
gve_free_irqs(struct gve_priv *priv)
{
	struct gve_irq *irq;
	int num_irqs;
	int rid;
	int rc;
	int i;

	if (priv->irq_tbl == NULL) {
		device_printf(priv->dev, "No irq table, nothing to free\n");
		return;
	}

	num_irqs = priv->tx_cfg.num_queues + priv->rx_cfg.num_queues + 1;

	for (i = 0; i < num_irqs; i++) {
		irq = &priv->irq_tbl[i];
		if (irq->res == NULL)
			continue;

		rid = rman_get_rid(irq->res);

		rc = bus_teardown_intr(priv->dev, irq->res, irq->cookie);
		if (rc != 0)
			device_printf(priv->dev, "Failed to teardown irq num %d\n",
			    rid);

		rc = bus_release_resource(priv->dev, SYS_RES_IRQ,
		    rid, irq->res);
		if (rc != 0)
			device_printf(priv->dev, "Failed to release irq num %d\n",
			    rid);

		irq->res = NULL;
		irq->cookie = NULL;
	}

	free(priv->irq_tbl, M_GVE);
	priv->irq_tbl = NULL;

	/* Safe to call even if msix was never alloced */
	pci_release_msi(priv->dev);
}

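/*
 * Allocates one MSI-X vector per Tx queue, one per Rx queue, and a final
 * vector for the management interrupt; the rid requested for each vector is
 * its index in the irq table plus one. Anything partially set up is torn
 * down on error.
 */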
int
gve_alloc_irqs(struct gve_priv *priv)
{
	int num_tx = priv->tx_cfg.num_queues;
	int num_rx = priv->rx_cfg.num_queues;
	int req_nvecs = num_tx + num_rx + 1;
	int got_nvecs = req_nvecs;
	struct gve_irq *irq;
	int i, j, m;
	int rid;
	int err;
	struct gve_ring_com *com;
	struct gve_rx_ring *rx;
	struct gve_tx_ring *tx;

	if (pci_alloc_msix(priv->dev, &got_nvecs) != 0) {
		device_printf(priv->dev, "Failed to acquire any msix vectors\n");
		err = ENXIO;
		goto abort;
	} else if (got_nvecs != req_nvecs) {
		device_printf(priv->dev, "Tried to acquire %d msix vectors, got only %d\n",
		    req_nvecs, got_nvecs);
		err = ENOSPC;
		goto abort;
	}

	if (bootverbose)
		device_printf(priv->dev, "Enabled MSIX with %d vectors\n", got_nvecs);

	priv->irq_tbl = malloc(sizeof(struct gve_irq) * req_nvecs, M_GVE,
	    M_WAITOK | M_ZERO);

	for (i = 0; i < num_tx; i++) {
		irq = &priv->irq_tbl[i];
		tx = &priv->tx[i];
		com = &tx->com;
		rid = i + 1;

		irq->res = bus_alloc_resource_any(priv->dev, SYS_RES_IRQ,
		    &rid, RF_ACTIVE);
		if (irq->res == NULL) {
			device_printf(priv->dev, "Failed to alloc irq %d for Tx queue %d\n",
			    rid, i);
			err = ENOMEM;
			goto abort;
		}

		err = bus_setup_intr(priv->dev, irq->res, INTR_TYPE_NET | INTR_MPSAFE,
		    gve_tx_intr, NULL, &priv->tx[i], &irq->cookie);
		if (err != 0) {
			device_printf(priv->dev, "Failed to setup irq %d for Tx queue %d, "
			    "err: %d\n", rid, i, err);
			goto abort;
		}

		bus_describe_intr(priv->dev, irq->res, irq->cookie, "tx%d", i);
		com->ntfy_id = i;
	}

	for (j = 0; j < num_rx; j++) {
		irq = &priv->irq_tbl[i + j];
		rx = &priv->rx[j];
		com = &rx->com;
		rid = i + j + 1;

		irq->res = bus_alloc_resource_any(priv->dev, SYS_RES_IRQ,
		    &rid, RF_ACTIVE);
		if (irq->res == NULL) {
			device_printf(priv->dev,
			    "Failed to alloc irq %d for Rx queue %d", rid, j);
			err = ENOMEM;
			goto abort;
		}

		err = bus_setup_intr(priv->dev, irq->res, INTR_TYPE_NET | INTR_MPSAFE,
		    gve_rx_intr, NULL, &priv->rx[j], &irq->cookie);
		if (err != 0) {
			device_printf(priv->dev, "Failed to setup irq %d for Rx queue %d, "
			    "err: %d\n", rid, j, err);
			goto abort;
		}

		bus_describe_intr(priv->dev, irq->res, irq->cookie, "rx%d", j);
		com->ntfy_id = i + j;
	}

	m = i + j;
	rid = m + 1;
	irq = &priv->irq_tbl[m];

	irq->res = bus_alloc_resource_any(priv->dev, SYS_RES_IRQ,
	    &rid, RF_ACTIVE);
	if (irq->res == NULL) {
		device_printf(priv->dev, "Failed to allocate irq %d for mgmnt queue\n", rid);
		err = ENOMEM;
		goto abort;
	}

	err = bus_setup_intr(priv->dev, irq->res, INTR_TYPE_NET | INTR_MPSAFE,
	    gve_mgmnt_intr, NULL, priv, &irq->cookie);
	if (err != 0) {
		device_printf(priv->dev, "Failed to setup irq %d for mgmnt queue, err: %d\n",
		    rid, err);
		goto abort;
	}

	bus_describe_intr(priv->dev, irq->res, irq->cookie, "mgmnt");

	return (0);

abort:
	gve_free_irqs(priv);
	return (err);
}

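/*
 * Writing 0 to a queue's interrupt doorbell unmasks its interrupt;
 * writing GVE_IRQ_MASK masks it.
 */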
void
gve_unmask_all_queue_irqs(struct gve_priv *priv)
{
	struct gve_tx_ring *tx;
	struct gve_rx_ring *rx;
	int idx;

	for (idx = 0; idx < priv->tx_cfg.num_queues; idx++) {
		tx = &priv->tx[idx];
		gve_db_bar_write_4(priv, tx->com.irq_db_offset, 0);
	}

	for (idx = 0; idx < priv->rx_cfg.num_queues; idx++) {
		rx = &priv->rx[idx];
		gve_db_bar_write_4(priv, rx->com.irq_db_offset, 0);
	}
}

void
gve_mask_all_queue_irqs(struct gve_priv *priv)
{
	for (int idx = 0; idx < priv->tx_cfg.num_queues; idx++) {
		struct gve_tx_ring *tx = &priv->tx[idx];

		gve_db_bar_write_4(priv, tx->com.irq_db_offset, GVE_IRQ_MASK);
	}
	for (int idx = 0; idx < priv->rx_cfg.num_queues; idx++) {
		struct gve_rx_ring *rx = &priv->rx[idx];

		gve_db_bar_write_4(priv, rx->com.irq_db_offset, GVE_IRQ_MASK);
	}
}