net/cnxk: enable PTP processing in vector Tx

Enable PTP offload in vector Tx burst function. Since, we can
no-longer use a single LMT line for burst of 4, split the LMT
into two and transmit twice.

Signed-off-by: Pavan Nikhilesh <pbhagavatula@marvell.com>
Acked-by: Nithin Dabilpuram <ndabilpuram@marvell.com>
This commit is contained in:
Pavan Nikhilesh 2021-06-29 13:14:21 +05:30 committed by Jerin Jacob
parent 3186a3a49c
commit 99fc1f6eef
6 changed files with 192 additions and 40 deletions

View File

@ -67,9 +67,7 @@ cn10k_eth_set_tx_function(struct rte_eth_dev *eth_dev)
#undef T
};
if (dev->scalar_ena ||
(dev->tx_offload_flags &
(NIX_TX_OFFLOAD_TSTAMP_F | NIX_TX_OFFLOAD_TSO_F)))
if (dev->scalar_ena || (dev->tx_offload_flags & NIX_TX_OFFLOAD_TSO_F))
pick_tx_func(eth_dev, nix_eth_tx_burst);
else
pick_tx_func(eth_dev, nix_eth_tx_vec_burst);

View File

@ -69,7 +69,9 @@ cn10k_nix_pkts_per_vec_brst(const uint16_t flags)
static __rte_always_inline uint8_t
cn10k_nix_tx_dwords_per_line(const uint16_t flags)
{
return (flags & NIX_TX_NEED_EXT_HDR) ? 6 : 8;
return (flags & NIX_TX_NEED_EXT_HDR) ?
((flags & NIX_TX_OFFLOAD_TSTAMP_F) ? 8 : 6) :
8;
}
static __rte_always_inline uint64_t
@ -695,13 +697,15 @@ cn10k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
uint64x2_t dataoff_iova0, dataoff_iova1, dataoff_iova2, dataoff_iova3;
uint64x2_t len_olflags0, len_olflags1, len_olflags2, len_olflags3;
uint64x2_t cmd0[NIX_DESCS_PER_LOOP], cmd1[NIX_DESCS_PER_LOOP],
cmd2[NIX_DESCS_PER_LOOP];
cmd2[NIX_DESCS_PER_LOOP], cmd3[NIX_DESCS_PER_LOOP];
uint64_t *mbuf0, *mbuf1, *mbuf2, *mbuf3, data, pa;
uint64x2_t senddesc01_w0, senddesc23_w0;
uint64x2_t senddesc01_w1, senddesc23_w1;
uint16_t left, scalar, burst, i, lmt_id;
uint64x2_t sendext01_w0, sendext23_w0;
uint64x2_t sendext01_w1, sendext23_w1;
uint64x2_t sendmem01_w0, sendmem23_w0;
uint64x2_t sendmem01_w1, sendmem23_w1;
uint64x2_t sgdesc01_w0, sgdesc23_w0;
uint64x2_t sgdesc01_w1, sgdesc23_w1;
struct cn10k_eth_txq *txq = tx_queue;
@ -733,6 +737,12 @@ cn10k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
sendext23_w0 = sendext01_w0;
sendext01_w1 = vdupq_n_u64(12 | 12U << 24);
sendext23_w1 = sendext01_w1;
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
sendmem01_w0 = vld1q_dup_u64(&txq->cmd[2]);
sendmem23_w0 = sendmem01_w0;
sendmem01_w1 = vld1q_dup_u64(&txq->cmd[3]);
sendmem23_w1 = sendmem01_w1;
}
}
/* Get LMT base address and LMT ID as lcore id */
@ -760,6 +770,17 @@ again:
sendext23_w1 = sendext01_w1;
}
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
/* Reset send mem alg to SETTSTMP from SUB*/
sendmem01_w0 = vbicq_u64(sendmem01_w0,
vdupq_n_u64(BIT_ULL(59)));
/* Reset send mem address to default. */
sendmem01_w1 =
vbicq_u64(sendmem01_w1, vdupq_n_u64(0xF));
sendmem23_w0 = sendmem01_w0;
sendmem23_w1 = sendmem01_w1;
}
/* Move mbufs to iova */
mbuf0 = (uint64_t *)tx_pkts[0];
mbuf1 = (uint64_t *)tx_pkts[1];
@ -1371,6 +1392,44 @@ again:
sendext23_w1 = vorrq_u64(sendext23_w1, ytmp128);
}
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
/* Tx ol_flag for timestam. */
const uint64x2_t olf = {PKT_TX_IEEE1588_TMST,
PKT_TX_IEEE1588_TMST};
/* Set send mem alg to SUB. */
const uint64x2_t alg = {BIT_ULL(59), BIT_ULL(59)};
/* Increment send mem address by 8. */
const uint64x2_t addr = {0x8, 0x8};
xtmp128 = vzip1q_u64(len_olflags0, len_olflags1);
ytmp128 = vzip1q_u64(len_olflags2, len_olflags3);
/* Check if timestamp is requested and generate inverted
* mask as we need not make any changes to default cmd
* value.
*/
xtmp128 = vmvnq_u32(vtstq_u64(olf, xtmp128));
ytmp128 = vmvnq_u32(vtstq_u64(olf, ytmp128));
/* Change send mem address to an 8 byte offset when
* TSTMP is disabled.
*/
sendmem01_w1 = vaddq_u64(sendmem01_w1,
vandq_u64(xtmp128, addr));
sendmem23_w1 = vaddq_u64(sendmem23_w1,
vandq_u64(ytmp128, addr));
/* Change send mem alg to SUB when TSTMP is disabled. */
sendmem01_w0 = vorrq_u64(sendmem01_w0,
vandq_u64(xtmp128, alg));
sendmem23_w0 = vorrq_u64(sendmem23_w0,
vandq_u64(ytmp128, alg));
cmd3[0] = vzip1q_u64(sendmem01_w0, sendmem01_w1);
cmd3[1] = vzip2q_u64(sendmem01_w0, sendmem01_w1);
cmd3[2] = vzip1q_u64(sendmem23_w0, sendmem23_w1);
cmd3[3] = vzip2q_u64(sendmem23_w0, sendmem23_w1);
}
if (flags & NIX_TX_OFFLOAD_MBUF_NOFF_F) {
/* Set don't free bit if reference count > 1 */
xmask01 = vdupq_n_u64(0);
@ -1458,19 +1517,39 @@ again:
if (flags & NIX_TX_NEED_EXT_HDR) {
/* Store the prepared send desc to LMT lines */
vst1q_u64(LMT_OFF(laddr, lnum, 0), cmd0[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 16), cmd2[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 32), cmd1[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 48), cmd0[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 64), cmd2[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 80), cmd1[1]);
lnum += 1;
vst1q_u64(LMT_OFF(laddr, lnum, 0), cmd0[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 16), cmd2[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 32), cmd1[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 48), cmd0[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 64), cmd2[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 80), cmd1[3]);
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
vst1q_u64(LMT_OFF(laddr, lnum, 0), cmd0[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 16), cmd2[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 32), cmd1[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 48), cmd3[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 64), cmd0[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 80), cmd2[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 96), cmd1[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 112), cmd3[1]);
lnum += 1;
vst1q_u64(LMT_OFF(laddr, lnum, 0), cmd0[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 16), cmd2[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 32), cmd1[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 48), cmd3[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 64), cmd0[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 80), cmd2[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 96), cmd1[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 112), cmd3[3]);
} else {
vst1q_u64(LMT_OFF(laddr, lnum, 0), cmd0[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 16), cmd2[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 32), cmd1[0]);
vst1q_u64(LMT_OFF(laddr, lnum, 48), cmd0[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 64), cmd2[1]);
vst1q_u64(LMT_OFF(laddr, lnum, 80), cmd1[1]);
lnum += 1;
vst1q_u64(LMT_OFF(laddr, lnum, 0), cmd0[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 16), cmd2[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 32), cmd1[2]);
vst1q_u64(LMT_OFF(laddr, lnum, 48), cmd0[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 64), cmd2[3]);
vst1q_u64(LMT_OFF(laddr, lnum, 80), cmd1[3]);
}
lnum += 1;
} else {
/* Store the prepared send desc to LMT lines */

View File

@ -13,9 +13,8 @@
{ \
uint64_t cmd[sz]; \
\
/* VLAN, TSTMP, TSO is not supported by vec */ \
if ((flags) & NIX_TX_OFFLOAD_TSTAMP_F || \
(flags) & NIX_TX_OFFLOAD_TSO_F) \
/* TSO is not supported by vec */ \
if ((flags) & NIX_TX_OFFLOAD_TSO_F) \
return 0; \
return cn10k_nix_xmit_pkts_vector(tx_queue, tx_pkts, pkts, cmd,\
(flags)); \

View File

@ -66,9 +66,7 @@ cn9k_eth_set_tx_function(struct rte_eth_dev *eth_dev)
#undef T
};
if (dev->scalar_ena ||
(dev->tx_offload_flags &
(NIX_TX_OFFLOAD_TSTAMP_F | NIX_TX_OFFLOAD_TSO_F)))
if (dev->scalar_ena || (dev->tx_offload_flags & NIX_TX_OFFLOAD_TSO_F))
pick_tx_func(eth_dev, nix_eth_tx_burst);
else
pick_tx_func(eth_dev, nix_eth_tx_vec_burst);

View File

@ -553,12 +553,14 @@ cn9k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
uint64x2_t dataoff_iova0, dataoff_iova1, dataoff_iova2, dataoff_iova3;
uint64x2_t len_olflags0, len_olflags1, len_olflags2, len_olflags3;
uint64x2_t cmd0[NIX_DESCS_PER_LOOP], cmd1[NIX_DESCS_PER_LOOP],
cmd2[NIX_DESCS_PER_LOOP];
cmd2[NIX_DESCS_PER_LOOP], cmd3[NIX_DESCS_PER_LOOP];
uint64_t *mbuf0, *mbuf1, *mbuf2, *mbuf3;
uint64x2_t senddesc01_w0, senddesc23_w0;
uint64x2_t senddesc01_w1, senddesc23_w1;
uint64x2_t sendext01_w0, sendext23_w0;
uint64x2_t sendext01_w1, sendext23_w1;
uint64x2_t sendmem01_w0, sendmem23_w0;
uint64x2_t sendmem01_w1, sendmem23_w1;
uint64x2_t sgdesc01_w0, sgdesc23_w0;
uint64x2_t sgdesc01_w1, sgdesc23_w1;
struct cn9k_eth_txq *txq = tx_queue;
@ -597,6 +599,12 @@ cn9k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
sendext23_w1 = sendext01_w1;
sgdesc01_w0 = vld1q_dup_u64(&txq->cmd[4]);
sgdesc23_w0 = sgdesc01_w0;
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
sendmem01_w0 = vld1q_dup_u64(&txq->cmd[6]);
sendmem23_w0 = sendmem01_w0;
sendmem01_w1 = vld1q_dup_u64(&txq->cmd[7]);
sendmem23_w1 = sendmem01_w1;
}
} else {
sgdesc01_w0 = vld1q_dup_u64(&txq->cmd[2]);
sgdesc23_w0 = sgdesc01_w0;
@ -618,6 +626,17 @@ cn9k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
sendext23_w1 = sendext01_w1;
}
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
/* Reset send mem alg to SETTSTMP from SUB*/
sendmem01_w0 = vbicq_u64(sendmem01_w0,
vdupq_n_u64(BIT_ULL(59)));
/* Reset send mem address to default. */
sendmem01_w1 =
vbicq_u64(sendmem01_w1, vdupq_n_u64(0xF));
sendmem23_w0 = sendmem01_w0;
sendmem23_w1 = sendmem01_w1;
}
/* Move mbufs to iova */
mbuf0 = (uint64_t *)tx_pkts[0];
mbuf1 = (uint64_t *)tx_pkts[1];
@ -1229,6 +1248,44 @@ cn9k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
sendext23_w1 = vorrq_u64(sendext23_w1, ytmp128);
}
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
/* Tx ol_flag for timestam. */
const uint64x2_t olf = {PKT_TX_IEEE1588_TMST,
PKT_TX_IEEE1588_TMST};
/* Set send mem alg to SUB. */
const uint64x2_t alg = {BIT_ULL(59), BIT_ULL(59)};
/* Increment send mem address by 8. */
const uint64x2_t addr = {0x8, 0x8};
xtmp128 = vzip1q_u64(len_olflags0, len_olflags1);
ytmp128 = vzip1q_u64(len_olflags2, len_olflags3);
/* Check if timestamp is requested and generate inverted
* mask as we need not make any changes to default cmd
* value.
*/
xtmp128 = vmvnq_u32(vtstq_u64(olf, xtmp128));
ytmp128 = vmvnq_u32(vtstq_u64(olf, ytmp128));
/* Change send mem address to an 8 byte offset when
* TSTMP is disabled.
*/
sendmem01_w1 = vaddq_u64(sendmem01_w1,
vandq_u64(xtmp128, addr));
sendmem23_w1 = vaddq_u64(sendmem23_w1,
vandq_u64(ytmp128, addr));
/* Change send mem alg to SUB when TSTMP is disabled. */
sendmem01_w0 = vorrq_u64(sendmem01_w0,
vandq_u64(xtmp128, alg));
sendmem23_w0 = vorrq_u64(sendmem23_w0,
vandq_u64(ytmp128, alg));
cmd3[0] = vzip1q_u64(sendmem01_w0, sendmem01_w1);
cmd3[1] = vzip2q_u64(sendmem01_w0, sendmem01_w1);
cmd3[2] = vzip1q_u64(sendmem23_w0, sendmem23_w1);
cmd3[3] = vzip2q_u64(sendmem23_w0, sendmem23_w1);
}
if (flags & NIX_TX_OFFLOAD_MBUF_NOFF_F) {
/* Set don't free bit if reference count > 1 */
xmask01 = vdupq_n_u64(0);
@ -1327,22 +1384,44 @@ cn9k_nix_xmit_pkts_vector(void *tx_queue, struct rte_mbuf **tx_pkts,
* Split and Tx twice.
*/
do {
vst1q_u64(lmt_addr, cmd0[0]);
vst1q_u64(lmt_addr + 2, cmd2[0]);
vst1q_u64(lmt_addr + 4, cmd1[0]);
vst1q_u64(lmt_addr + 6, cmd0[1]);
vst1q_u64(lmt_addr + 8, cmd2[1]);
vst1q_u64(lmt_addr + 10, cmd1[1]);
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
vst1q_u64(lmt_addr, cmd0[0]);
vst1q_u64(lmt_addr + 2, cmd2[0]);
vst1q_u64(lmt_addr + 4, cmd1[0]);
vst1q_u64(lmt_addr + 6, cmd3[0]);
vst1q_u64(lmt_addr + 8, cmd0[1]);
vst1q_u64(lmt_addr + 10, cmd2[1]);
vst1q_u64(lmt_addr + 12, cmd1[1]);
vst1q_u64(lmt_addr + 14, cmd3[1]);
} else {
vst1q_u64(lmt_addr, cmd0[0]);
vst1q_u64(lmt_addr + 2, cmd2[0]);
vst1q_u64(lmt_addr + 4, cmd1[0]);
vst1q_u64(lmt_addr + 6, cmd0[1]);
vst1q_u64(lmt_addr + 8, cmd2[1]);
vst1q_u64(lmt_addr + 10, cmd1[1]);
}
lmt_status = roc_lmt_submit_ldeor(io_addr);
} while (lmt_status == 0);
do {
vst1q_u64(lmt_addr, cmd0[2]);
vst1q_u64(lmt_addr + 2, cmd2[2]);
vst1q_u64(lmt_addr + 4, cmd1[2]);
vst1q_u64(lmt_addr + 6, cmd0[3]);
vst1q_u64(lmt_addr + 8, cmd2[3]);
vst1q_u64(lmt_addr + 10, cmd1[3]);
if (flags & NIX_TX_OFFLOAD_TSTAMP_F) {
vst1q_u64(lmt_addr, cmd0[2]);
vst1q_u64(lmt_addr + 2, cmd2[2]);
vst1q_u64(lmt_addr + 4, cmd1[2]);
vst1q_u64(lmt_addr + 6, cmd3[2]);
vst1q_u64(lmt_addr + 8, cmd0[3]);
vst1q_u64(lmt_addr + 10, cmd2[3]);
vst1q_u64(lmt_addr + 12, cmd1[3]);
vst1q_u64(lmt_addr + 14, cmd3[3]);
} else {
vst1q_u64(lmt_addr, cmd0[2]);
vst1q_u64(lmt_addr + 2, cmd2[2]);
vst1q_u64(lmt_addr + 4, cmd1[2]);
vst1q_u64(lmt_addr + 6, cmd0[3]);
vst1q_u64(lmt_addr + 8, cmd2[3]);
vst1q_u64(lmt_addr + 10, cmd1[3]);
}
lmt_status = roc_lmt_submit_ldeor(io_addr);
} while (lmt_status == 0);
} else {

View File

@ -13,9 +13,8 @@
{ \
uint64_t cmd[sz]; \
\
/* VLAN, TSTMP, TSO is not supported by vec */ \
if ((flags) & NIX_TX_OFFLOAD_TSTAMP_F || \
(flags) & NIX_TX_OFFLOAD_TSO_F) \
/* TSO is not supported by vec */ \
if ((flags) & NIX_TX_OFFLOAD_TSO_F) \
return 0; \
return cn9k_nix_xmit_pkts_vector(tx_queue, tx_pkts, pkts, cmd, \
(flags)); \