numam-dpdk/drivers/net/ark/ark_ethdev_tx.c
Ed Czeck 6c7f491e7f net/ark: generalize meta data between FPGA and PMD
In this commit we generalize the movement of user-specified
meta data between mbufs and FPGA AXIS tuser fields using
user-defined hook functions.

- Previous use of PMD dynfields are removed
- Remove emptied rte_pmd_ark.h
- Hook function added to ark_user_ext
- Add hook function calls in Rx and Tx paths
- Update guide with example of hook function use

Signed-off-by: Ed Czeck <ed.czeck@atomicrules.com>
2021-03-22 16:56:27 +01:00

475 lines
12 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright (c) 2015-2021 Atomic Rules LLC
*/
#include <unistd.h>
#include "ark_ethdev_tx.h"
#include "ark_global.h"
#include "ark_mpu.h"
#include "ark_ddm.h"
#include "ark_logs.h"
#define ARK_TX_META_SIZE 32
#define ARK_TX_META_OFFSET (RTE_PKTMBUF_HEADROOM - ARK_TX_META_SIZE)
#define ARK_TX_MAX_NOCHAIN (RTE_MBUF_DEFAULT_DATAROOM)
#ifndef RTE_LIBRTE_ARK_MIN_TX_PKTLEN
#define ARK_MIN_TX_PKTLEN 0
#else
#define ARK_MIN_TX_PKTLEN RTE_LIBRTE_ARK_MIN_TX_PKTLEN
#endif
/* ************************************************************************* */
struct ark_tx_queue {
union ark_tx_meta *meta_q;
struct rte_mbuf **bufs;
/* handles for hw objects */
struct ark_mpu_t *mpu;
struct ark_ddm_t *ddm;
/* Stats HW tracks bytes and packets, need to count send errors */
uint64_t tx_errors;
tx_user_meta_hook_fn tx_user_meta_hook;
void *ext_user_data;
uint32_t queue_size;
uint32_t queue_mask;
/* 3 indexes to the paired data rings. */
int32_t prod_index; /* where to put the next one */
int32_t free_index; /* mbuf has been freed */
/* The queue Id is used to identify the HW Q */
uint16_t phys_qid;
/* The queue Index within the dpdk device structures */
uint16_t queue_index;
/* next cache line - fields written by device */
RTE_MARKER cacheline1 __rte_cache_min_aligned;
volatile int32_t cons_index; /* hw is done, can be freed */
} __rte_cache_aligned;
/* Forward declarations */
static int eth_ark_tx_jumbo(struct ark_tx_queue *queue,
struct rte_mbuf *mbuf,
uint32_t *user_meta, uint8_t meta_cnt);
static int eth_ark_tx_hw_queue_config(struct ark_tx_queue *queue);
static void free_completed_tx(struct ark_tx_queue *queue);
static inline void
ark_tx_hw_queue_stop(struct ark_tx_queue *queue)
{
ark_mpu_stop(queue->mpu);
}
/* ************************************************************************* */
static inline void
eth_ark_tx_desc_fill(struct ark_tx_queue *queue,
struct rte_mbuf *mbuf,
uint8_t flags,
uint32_t *user_meta,
uint8_t meta_cnt /* 0 to 5 */
)
{
uint32_t tx_idx;
union ark_tx_meta *meta;
uint8_t m;
/* Header */
tx_idx = queue->prod_index & queue->queue_mask;
meta = &queue->meta_q[tx_idx];
meta->data_len = rte_pktmbuf_data_len(mbuf);
meta->flags = flags;
meta->meta_cnt = meta_cnt / 2;
meta->user1 = meta_cnt ? (*user_meta++) : 0;
queue->prod_index++;
queue->bufs[tx_idx] = mbuf;
/* 1 or 2 user meta data entries, user words 1,2 and 3,4 */
for (m = 1; m < meta_cnt; m += 2) {
tx_idx = queue->prod_index & queue->queue_mask;
meta = &queue->meta_q[tx_idx];
meta->usermeta0 = *user_meta++;
meta->usermeta1 = *user_meta++;
queue->prod_index++;
}
tx_idx = queue->prod_index & queue->queue_mask;
meta = &queue->meta_q[tx_idx];
meta->physaddr = rte_mbuf_data_iova(mbuf);
queue->prod_index++;
}
/* ************************************************************************* */
uint16_t
eth_ark_xmit_pkts_noop(void *vtxq __rte_unused,
struct rte_mbuf **tx_pkts __rte_unused,
uint16_t nb_pkts __rte_unused)
{
return 0;
}
/* ************************************************************************* */
uint16_t
eth_ark_xmit_pkts(void *vtxq, struct rte_mbuf **tx_pkts, uint16_t nb_pkts)
{
struct ark_tx_queue *queue;
struct rte_mbuf *mbuf;
uint32_t user_meta[5];
int stat;
int32_t prod_index_limit;
uint16_t nb;
uint8_t user_len = 0;
const uint32_t min_pkt_len = ARK_MIN_TX_PKTLEN;
tx_user_meta_hook_fn tx_user_meta_hook;
queue = (struct ark_tx_queue *)vtxq;
tx_user_meta_hook = queue->tx_user_meta_hook;
/* free any packets after the HW is done with them */
free_completed_tx(queue);
/* leave 4 elements mpu data */
prod_index_limit = queue->queue_size + queue->free_index - 4;
for (nb = 0;
(nb < nb_pkts) && (prod_index_limit - queue->prod_index) > 0;
++nb) {
mbuf = tx_pkts[nb];
if (min_pkt_len &&
unlikely(rte_pktmbuf_pkt_len(mbuf) < min_pkt_len)) {
/* this packet even if it is small can be split,
* be sure to add to the end mbuf
*/
uint16_t to_add = min_pkt_len -
rte_pktmbuf_pkt_len(mbuf);
char *appended =
rte_pktmbuf_append(mbuf, to_add);
if (appended == 0) {
/* This packet is in error,
* we cannot send it so just
* count it and delete it.
*/
queue->tx_errors += 1;
rte_pktmbuf_free(mbuf);
continue;
}
memset(appended, 0, to_add);
}
if (tx_user_meta_hook)
tx_user_meta_hook(mbuf, user_meta, &user_len,
queue->ext_user_data);
if (unlikely(mbuf->nb_segs != 1)) {
stat = eth_ark_tx_jumbo(queue, mbuf,
user_meta, user_len);
if (unlikely(stat != 0))
break; /* Queue is full */
} else {
eth_ark_tx_desc_fill(queue, mbuf,
ARK_DDM_SOP | ARK_DDM_EOP,
user_meta, user_len);
}
}
if (ARK_DEBUG_CORE && nb != nb_pkts) {
ARK_PMD_LOG(DEBUG, "TX: Failure to send:"
" req: %" PRIU32
" sent: %" PRIU32
" prod: %" PRIU32
" cons: %" PRIU32
" free: %" PRIU32 "\n",
nb_pkts, nb,
queue->prod_index,
queue->cons_index,
queue->free_index);
ark_mpu_dump(queue->mpu,
"TX Failure MPU: ",
queue->phys_qid);
}
/* let FPGA know producer index. */
if (likely(nb != 0))
ark_mpu_set_producer(queue->mpu, queue->prod_index);
return nb;
}
/* ************************************************************************* */
static int
eth_ark_tx_jumbo(struct ark_tx_queue *queue, struct rte_mbuf *mbuf,
uint32_t *user_meta, uint8_t meta_cnt)
{
struct rte_mbuf *next;
int32_t free_queue_space;
uint8_t flags = ARK_DDM_SOP;
free_queue_space = queue->queue_mask -
(queue->prod_index - queue->free_index);
/* We need up to 4 mbufs for first header and 2 for subsequent ones */
if (unlikely(free_queue_space < (2 + (2 * mbuf->nb_segs))))
return -1;
while (mbuf != NULL) {
next = mbuf->next;
flags |= (next == NULL) ? ARK_DDM_EOP : 0;
eth_ark_tx_desc_fill(queue, mbuf, flags, user_meta, meta_cnt);
flags &= ~ARK_DDM_SOP; /* drop SOP flags */
meta_cnt = 0; /* Meta only on SOP */
mbuf = next;
}
return 0;
}
/* ************************************************************************* */
int
eth_ark_tx_queue_setup(struct rte_eth_dev *dev,
uint16_t queue_idx,
uint16_t nb_desc,
unsigned int socket_id,
const struct rte_eth_txconf *tx_conf __rte_unused)
{
struct ark_adapter *ark = dev->data->dev_private;
struct ark_tx_queue *queue;
int status;
int qidx = queue_idx;
if (!rte_is_power_of_2(nb_desc)) {
ARK_PMD_LOG(ERR,
"DPDK Arkville configuration queue size"
" must be power of two %u (%s)\n",
nb_desc, __func__);
return -1;
}
/* Each packet requires at least 2 mpu elements - double desc count */
nb_desc = 2 * nb_desc;
/* Allocate queue struct */
queue = rte_zmalloc_socket("Ark_txqueue",
sizeof(struct ark_tx_queue),
64,
socket_id);
if (queue == 0) {
ARK_PMD_LOG(ERR, "Failed to allocate tx "
"queue memory in %s\n",
__func__);
return -ENOMEM;
}
/* we use zmalloc no need to initialize fields */
queue->queue_size = nb_desc;
queue->queue_mask = nb_desc - 1;
queue->phys_qid = qidx;
queue->queue_index = queue_idx;
dev->data->tx_queues[queue_idx] = queue;
queue->tx_user_meta_hook = ark->user_ext.tx_user_meta_hook;
queue->ext_user_data = ark->user_data[dev->data->port_id];
queue->meta_q =
rte_zmalloc_socket("Ark_txqueue meta",
nb_desc * sizeof(union ark_tx_meta),
64,
socket_id);
queue->bufs =
rte_zmalloc_socket("Ark_txqueue bufs",
nb_desc * sizeof(struct rte_mbuf *),
64,
socket_id);
if (queue->meta_q == 0 || queue->bufs == 0) {
ARK_PMD_LOG(ERR, "Failed to allocate "
"queue memory in %s\n", __func__);
rte_free(queue->meta_q);
rte_free(queue->bufs);
rte_free(queue);
return -ENOMEM;
}
queue->ddm = RTE_PTR_ADD(ark->ddm.v, qidx * ARK_DDM_QOFFSET);
queue->mpu = RTE_PTR_ADD(ark->mputx.v, qidx * ARK_MPU_QOFFSET);
status = eth_ark_tx_hw_queue_config(queue);
if (unlikely(status != 0)) {
rte_free(queue->meta_q);
rte_free(queue->bufs);
rte_free(queue);
return -1; /* ERROR CODE */
}
return 0;
}
/* ************************************************************************* */
static int
eth_ark_tx_hw_queue_config(struct ark_tx_queue *queue)
{
rte_iova_t queue_base, ring_base, cons_index_addr;
uint32_t write_interval_ns;
/* Verify HW -- MPU */
if (ark_mpu_verify(queue->mpu, sizeof(union ark_tx_meta)))
return -1;
queue_base = rte_malloc_virt2iova(queue);
ring_base = rte_malloc_virt2iova(queue->meta_q);
cons_index_addr =
queue_base + offsetof(struct ark_tx_queue, cons_index);
ark_mpu_stop(queue->mpu);
ark_mpu_reset(queue->mpu);
/* Stop and Reset and configure MPU */
ark_mpu_configure(queue->mpu, ring_base, queue->queue_size, 1);
/*
* Adjust the write interval based on queue size --
* increase pcie traffic when low mbuf count
* Queue sizes less than 128 are not allowed
*/
switch (queue->queue_size) {
case 128:
write_interval_ns = 500;
break;
case 256:
write_interval_ns = 500;
break;
case 512:
write_interval_ns = 1000;
break;
default:
write_interval_ns = 2000;
break;
}
/* Completion address in UDM */
ark_ddm_setup(queue->ddm, cons_index_addr, write_interval_ns);
return 0;
}
/* ************************************************************************* */
void
eth_ark_tx_queue_release(void *vtx_queue)
{
struct ark_tx_queue *queue;
queue = (struct ark_tx_queue *)vtx_queue;
ark_tx_hw_queue_stop(queue);
queue->cons_index = queue->prod_index;
free_completed_tx(queue);
rte_free(queue->meta_q);
rte_free(queue->bufs);
rte_free(queue);
}
/* ************************************************************************* */
int
eth_ark_tx_queue_stop(struct rte_eth_dev *dev, uint16_t queue_id)
{
struct ark_tx_queue *queue;
int cnt = 0;
queue = dev->data->tx_queues[queue_id];
/* Wait for DDM to send out all packets. */
while (queue->cons_index != queue->prod_index) {
usleep(100);
if (cnt++ > 10000)
return -1;
}
ark_mpu_stop(queue->mpu);
free_completed_tx(queue);
dev->data->tx_queue_state[queue_id] = RTE_ETH_QUEUE_STATE_STOPPED;
return 0;
}
int
eth_ark_tx_queue_start(struct rte_eth_dev *dev, uint16_t queue_id)
{
struct ark_tx_queue *queue;
queue = dev->data->tx_queues[queue_id];
if (dev->data->tx_queue_state[queue_id] == RTE_ETH_QUEUE_STATE_STARTED)
return 0;
ark_mpu_start(queue->mpu);
dev->data->tx_queue_state[queue_id] = RTE_ETH_QUEUE_STATE_STARTED;
return 0;
}
/* ************************************************************************* */
static void
free_completed_tx(struct ark_tx_queue *queue)
{
struct rte_mbuf *mbuf;
union ark_tx_meta *meta;
int32_t top_index;
top_index = queue->cons_index; /* read once */
while ((top_index - queue->free_index) > 0) {
meta = &queue->meta_q[queue->free_index & queue->queue_mask];
if (likely((meta->flags & ARK_DDM_SOP) != 0)) {
mbuf = queue->bufs[queue->free_index &
queue->queue_mask];
/* ref count of the mbuf is checked in this call. */
rte_pktmbuf_free(mbuf);
}
queue->free_index += (meta->meta_cnt + 2);
}
}
/* ************************************************************************* */
void
eth_tx_queue_stats_get(void *vqueue, struct rte_eth_stats *stats)
{
struct ark_tx_queue *queue;
struct ark_ddm_t *ddm;
uint64_t bytes, pkts;
queue = vqueue;
ddm = queue->ddm;
bytes = ark_ddm_queue_byte_count(ddm);
pkts = ark_ddm_queue_pkt_count(ddm);
stats->q_opackets[queue->queue_index] = pkts;
stats->q_obytes[queue->queue_index] = bytes;
stats->opackets += pkts;
stats->obytes += bytes;
stats->oerrors += queue->tx_errors;
}
void
eth_tx_queue_stats_reset(void *vqueue)
{
struct ark_tx_queue *queue;
struct ark_ddm_t *ddm;
queue = vqueue;
ddm = queue->ddm;
ark_ddm_queue_reset_stats(ddm);
queue->tx_errors = 0;
}