net/iavf: add offload path for Rx AVX512 flex descriptor
Add a specific path for Rx AVX512 (flexible descriptor). In this path, support the HW offload features checksum, VLAN stripping and RSS hash. This path is chosen automatically according to the configuration.

The common receive code is marked 'inline', so the duplicated (offload and non-offload) code is generated by the compiler.

Signed-off-by: Wenzhuo Lu <wenzhuo.lu@intel.com>
Acked-by: Qi Zhang <qi.z.zhang@intel.com>
parent eff56a7b9f
commit 9c9aa00403
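The 'inline' remark in the commit message is the mechanism to notice in the diff below: the common raw receive routine gains a constant bool offload argument and is forced inline, so the compiler emits two independent specialized copies and neither exported burst function carries a runtime offload branch. A minimal, self-contained sketch of the idea (the function and macro names here are illustrative, not the driver's):

    #include <stdint.h>
    #include <stdbool.h>

    /* Force inlining so each wrapper becomes its own specialized copy,
     * mirroring __rte_always_inline in the diff below.
     */
    #define force_inline inline __attribute__((always_inline))

    static force_inline uint16_t
    recv_raw(uint16_t nb_pkts, bool offload)
    {
        uint16_t received = 0;

        for (uint16_t i = 0; i < nb_pkts; i++) {
            /* ...descriptor parsing shared by both paths... */
            if (offload) {
                /* checksum/VLAN/RSS flag extraction; this block is
                 * dead code the compiler deletes when offload is a
                 * compile-time false
                 */
            }
            received++;
        }
        return received;
    }

    /* Two exported burst functions; no 'offload' test survives in either. */
    uint16_t recv_pkts(uint16_t n)         { return recv_raw(n, false); }
    uint16_t recv_pkts_offload(uint16_t n) { return recv_raw(n, true); }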
@@ -119,6 +119,10 @@ New Features

   Updated the Intel iavf driver with new features and improvements, including:

   * Added flow filter to support GTPU inner L3/L4 fields matching.
+  * In AVX512 code, added the new RX and TX paths to use the HW offload
+    features. When the HW offload features are configured to be used, the
+    offload paths are chosen automatically. In parallel the support of HW
+    offload features was removed from the legacy AVX512 paths.

 * **Updated Intel ice driver.**

@@ -2420,11 +2420,8 @@ iavf_set_rx_function(struct rte_eth_dev *dev)
 			goto normal;

 	if (vf->vf_res->vf_cap_flags &
-	    VIRTCHNL_VF_OFFLOAD_RX_FLEX_DESC) {
+	    VIRTCHNL_VF_OFFLOAD_RX_FLEX_DESC)
 		use_flex = true;
-		if (use_avx512 && check_ret == IAVF_VECTOR_OFFLOAD_PATH)
-			use_flex = false;
-	}

 	for (i = 0; i < dev->data->nb_rx_queues; i++) {
 		rxq = dev->data->rx_queues[i];

@@ -2452,9 +2449,14 @@ iavf_set_rx_function(struct rte_eth_dev *dev)
 				iavf_recv_scattered_pkts_vec_avx2_flex_rxd :
 				iavf_recv_scattered_pkts_vec_flex_rxd;
 #ifdef CC_AVX512_SUPPORT
-			if (use_avx512)
-				dev->rx_pkt_burst =
-					iavf_recv_scattered_pkts_vec_avx512_flex_rxd;
+			if (use_avx512) {
+				if (check_ret == IAVF_VECTOR_PATH)
+					dev->rx_pkt_burst =
+						iavf_recv_scattered_pkts_vec_avx512_flex_rxd;
+				else
+					dev->rx_pkt_burst =
+						iavf_recv_scattered_pkts_vec_avx512_flex_rxd_offload;
+			}
 #endif
 		} else {
 			dev->rx_pkt_burst = use_avx2 ?

@@ -2491,9 +2493,14 @@ iavf_set_rx_function(struct rte_eth_dev *dev)
 				iavf_recv_pkts_vec_avx2_flex_rxd :
 				iavf_recv_pkts_vec_flex_rxd;
 #ifdef CC_AVX512_SUPPORT
-			if (use_avx512)
-				dev->rx_pkt_burst =
-					iavf_recv_pkts_vec_avx512_flex_rxd;
+			if (use_avx512) {
+				if (check_ret == IAVF_VECTOR_PATH)
+					dev->rx_pkt_burst =
+						iavf_recv_pkts_vec_avx512_flex_rxd;
+				else
+					dev->rx_pkt_burst =
+						iavf_recv_pkts_vec_avx512_flex_rxd_offload;
+			}
 #endif
 		} else {
 			dev->rx_pkt_burst = use_avx2 ?

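With the hunks above, iavf_set_rx_function() no longer falls back from the flexible descriptor when Rx offloads are requested; instead, when AVX512 is usable, check_ret selects between the lean and the offload flex burst functions. Reduced to its shape (a sketch only; the enum values and function-pointer type are stand-ins for the driver's own):

    #include <stdint.h>

    enum { VECTOR_PATH, VECTOR_OFFLOAD_PATH };

    typedef uint16_t (*rx_burst_fn)(void *rxq, void **mbufs, uint16_t n);

    /* Pick the flex-descriptor AVX512 burst function: the plain loop when
     * no Rx offloads are configured, the offload specialization otherwise.
     */
    rx_burst_fn
    pick_rx_avx512_flex(int check_ret, rx_burst_fn plain, rx_burst_fn offload)
    {
        return check_ret == VECTOR_PATH ? plain : offload;
    }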
@@ -496,6 +496,9 @@ uint16_t iavf_recv_pkts_vec_avx512_offload(void *rx_queue,
 uint16_t iavf_recv_pkts_vec_avx512_flex_rxd(void *rx_queue,
 					    struct rte_mbuf **rx_pkts,
 					    uint16_t nb_pkts);
+uint16_t iavf_recv_pkts_vec_avx512_flex_rxd_offload(void *rx_queue,
+						    struct rte_mbuf **rx_pkts,
+						    uint16_t nb_pkts);
 uint16_t iavf_recv_scattered_pkts_vec_avx512(void *rx_queue,
 					     struct rte_mbuf **rx_pkts,
 					     uint16_t nb_pkts);

@@ -505,6 +508,9 @@ uint16_t iavf_recv_scattered_pkts_vec_avx512_offload(void *rx_queue,
 uint16_t iavf_recv_scattered_pkts_vec_avx512_flex_rxd(void *rx_queue,
 						      struct rte_mbuf **rx_pkts,
 						      uint16_t nb_pkts);
+uint16_t iavf_recv_scattered_pkts_vec_avx512_flex_rxd_offload(void *rx_queue,
+							      struct rte_mbuf **rx_pkts,
+							      uint16_t nb_pkts);
 uint16_t iavf_xmit_pkts_vec_avx512(void *tx_queue, struct rte_mbuf **tx_pkts,
 				   uint16_t nb_pkts);
 uint16_t iavf_xmit_pkts_vec_avx512_offload(void *tx_queue,

@@ -684,7 +684,7 @@ _iavf_recv_raw_pkts_vec_avx512(struct iavf_rx_queue *rxq,
 	return received;
 }

-static inline __m256i
+static __rte_always_inline __m256i
 flex_rxd_to_fdir_flags_vec_avx512(const __m256i fdir_id0_7)
 {
 #define FDID_MIS_MAGIC 0xFFFFFFFF

@@ -703,12 +703,16 @@ flex_rxd_to_fdir_flags_vec_avx512(const __m256i fdir_id0_7)
 	return fdir_flags;
 }

-static inline uint16_t
+static __rte_always_inline uint16_t
 _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 					struct rte_mbuf **rx_pkts,
-					uint16_t nb_pkts, uint8_t *split_packet)
+					uint16_t nb_pkts,
+					uint8_t *split_packet,
+					bool offload)
 {
+#ifdef IAVF_RX_PTYPE_OFFLOAD
 	const uint32_t *type_table = rxq->vsi->adapter->ptype_tbl;
+#endif

 	const __m256i mbuf_init = _mm256_set_epi64x(0, 0, 0,
 						    rxq->mbuf_initializer);

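Besides the new constant offload selector, the hunk above makes type_table conditional: when the IAVF_RX_PTYPE_OFFLOAD blocks further down are compiled out, the table would otherwise sit unused. The guard pattern in isolation (a sketch; everything except the macro name is scaffolding):

    #include <stdint.h>

    #define IAVF_RX_PTYPE_OFFLOAD  /* drop this to build the lean variant */

    uint32_t parse_ptype(uint32_t raw)
    {
    #ifdef IAVF_RX_PTYPE_OFFLOAD
        /* defined only when the code that reads it is compiled in */
        static const uint32_t type_table[4] = { 0, 10, 20, 30 };
    #endif
        uint32_t ptype = 0;

    #ifdef IAVF_RX_PTYPE_OFFLOAD
        ptype = type_table[raw & 0x3];
    #endif
        return ptype;
    }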
@@ -812,71 +816,6 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 	RTE_BUILD_BUG_ON(offsetof(struct rte_mbuf, hash) !=
 			 offsetof(struct rte_mbuf, rx_descriptor_fields1) + 12);

-	/* Status/Error flag masks */
-	/**
-	 * mask everything except Checksum Reports, RSS indication
-	 * and VLAN indication.
-	 * bit6:4 for IP/L4 checksum errors.
-	 * bit12 is for RSS indication.
-	 * bit13 is for VLAN indication.
-	 */
-	const __m256i flags_mask =
-		_mm256_set1_epi32((7 << 4) | (1 << 12) | (1 << 13));
-	/**
-	 * data to be shuffled by the result of the flags mask shifted by 4
-	 * bits. This gives use the l3_l4 flags.
-	 */
-	const __m256i l3_l4_flags_shuf = _mm256_set_epi8(0, 0, 0, 0, 0, 0, 0, 0,
-		/* shift right 1 bit to make sure it not exceed 255 */
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
-		 PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
-		 PKT_RX_IP_CKSUM_GOOD) >> 1,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
-		 PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
-		 PKT_RX_IP_CKSUM_GOOD) >> 1,
-		(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_GOOD) >> 1,
-		(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_GOOD) >> 1,
-		/* second 128-bits */
-		0, 0, 0, 0, 0, 0, 0, 0,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
-		 PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
-		 PKT_RX_IP_CKSUM_GOOD) >> 1,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
-		 PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
-		 PKT_RX_IP_CKSUM_GOOD) >> 1,
-		(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_GOOD) >> 1,
-		(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_BAD) >> 1,
-		(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_GOOD) >> 1);
-	const __m256i cksum_mask =
-		_mm256_set1_epi32(PKT_RX_IP_CKSUM_GOOD | PKT_RX_IP_CKSUM_BAD |
-				  PKT_RX_L4_CKSUM_GOOD | PKT_RX_L4_CKSUM_BAD |
-				  PKT_RX_OUTER_IP_CKSUM_BAD);
-	/**
-	 * data to be shuffled by result of flag mask, shifted down 12.
-	 * If RSS(bit12)/VLAN(bit13) are set,
-	 * shuffle moves appropriate flags in place.
-	 */
-	const __m256i rss_vlan_flags_shuf = _mm256_set_epi8(0, 0, 0, 0,
-			0, 0, 0, 0,
-			0, 0, 0, 0,
-			PKT_RX_RSS_HASH | PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
-			PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
-			PKT_RX_RSS_HASH, 0,
-			/* end up 128-bits */
-			0, 0, 0, 0,
-			0, 0, 0, 0,
-			0, 0, 0, 0,
-			PKT_RX_RSS_HASH | PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
-			PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
-			PKT_RX_RSS_HASH, 0);
-
 	uint16_t i, received;

 	for (i = 0, received = 0; i < nb_pkts;

@@ -940,6 +879,7 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 		__m512i mb4_7 = _mm512_shuffle_epi8(raw_desc4_7, shuf_msk);

 		mb4_7 = _mm512_add_epi32(mb4_7, crc_adjust);
+#ifdef IAVF_RX_PTYPE_OFFLOAD
 		/**
 		 * to get packet types, ptype is located in bit16-25
 		 * of each 128bits

@@ -961,6 +901,7 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 			 0, 0, 0, type_table[ptype5],
 			 0, 0, 0, type_table[ptype4]);
 		mb4_7 = _mm512_mask_blend_epi32(0x1111, mb4_7, ptype4_7);
+#endif

 		/**
 		 * convert descriptors 0-3 into mbufs, re-arrange fields.

@@ -969,6 +910,7 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 		__m512i mb0_3 = _mm512_shuffle_epi8(raw_desc0_3, shuf_msk);

 		mb0_3 = _mm512_add_epi32(mb0_3, crc_adjust);
+#ifdef IAVF_RX_PTYPE_OFFLOAD
 		/**
 		 * to get packet types, ptype is located in bit16-25
 		 * of each 128bits

@@ -988,6 +930,7 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 			 0, 0, 0, type_table[ptype1],
 			 0, 0, 0, type_table[ptype0]);
 		mb0_3 = _mm512_mask_blend_epi32(0x1111, mb0_3, ptype0_3);
+#endif

 		/**
 		 * use permute/extract to get status content

@@ -1007,9 +950,87 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,

 		/* now do flag manipulation */

+		/* merge flags */
+		__m256i mbuf_flags = _mm256_set1_epi32(0);
+
+		if (offload) {
+#if defined(IAVF_RX_CSUM_OFFLOAD) || defined(IAVF_RX_VLAN_OFFLOAD) || defined(IAVF_RX_RSS_OFFLOAD)
+			/* Status/Error flag masks */
+			/**
+			 * mask everything except Checksum Reports, RSS indication
+			 * and VLAN indication.
+			 * bit6:4 for IP/L4 checksum errors.
+			 * bit12 is for RSS indication.
+			 * bit13 is for VLAN indication.
+			 */
+			const __m256i flags_mask =
+				_mm256_set1_epi32((7 << 4) | (1 << 12) | (1 << 13));
+#endif
+#ifdef IAVF_RX_CSUM_OFFLOAD
+			/**
+			 * data to be shuffled by the result of the flags mask shifted by 4
+			 * bits. This gives use the l3_l4 flags.
+			 */
+			const __m256i l3_l4_flags_shuf = _mm256_set_epi8(0, 0, 0, 0, 0, 0, 0, 0,
+				/* shift right 1 bit to make sure it not exceed 255 */
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
+				 PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
+				 PKT_RX_IP_CKSUM_GOOD) >> 1,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
+				 PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
+				 PKT_RX_IP_CKSUM_GOOD) >> 1,
+				(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_GOOD) >> 1,
+				(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_GOOD) >> 1,
+				/* second 128-bits */
+				0, 0, 0, 0, 0, 0, 0, 0,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
+				 PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_BAD |
+				 PKT_RX_IP_CKSUM_GOOD) >> 1,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
+				 PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_OUTER_IP_CKSUM_BAD | PKT_RX_L4_CKSUM_GOOD |
+				 PKT_RX_IP_CKSUM_GOOD) >> 1,
+				(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_L4_CKSUM_BAD | PKT_RX_IP_CKSUM_GOOD) >> 1,
+				(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_BAD) >> 1,
+				(PKT_RX_L4_CKSUM_GOOD | PKT_RX_IP_CKSUM_GOOD) >> 1);
+			const __m256i cksum_mask =
+				_mm256_set1_epi32(PKT_RX_IP_CKSUM_GOOD | PKT_RX_IP_CKSUM_BAD |
+						  PKT_RX_L4_CKSUM_GOOD | PKT_RX_L4_CKSUM_BAD |
+						  PKT_RX_OUTER_IP_CKSUM_BAD);
+#endif
+#if defined(IAVF_RX_VLAN_OFFLOAD) || defined(IAVF_RX_RSS_OFFLOAD)
+			/**
+			 * data to be shuffled by result of flag mask, shifted down 12.
+			 * If RSS(bit12)/VLAN(bit13) are set,
+			 * shuffle moves appropriate flags in place.
+			 */
+			const __m256i rss_vlan_flags_shuf = _mm256_set_epi8(0, 0, 0, 0,
+					0, 0, 0, 0,
+					0, 0, 0, 0,
+					PKT_RX_RSS_HASH | PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
+					PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
+					PKT_RX_RSS_HASH, 0,
+					/* end up 128-bits */
+					0, 0, 0, 0,
+					0, 0, 0, 0,
+					0, 0, 0, 0,
+					PKT_RX_RSS_HASH | PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
+					PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED,
+					PKT_RX_RSS_HASH, 0);
+#endif
+
+#if defined(IAVF_RX_CSUM_OFFLOAD) || defined(IAVF_RX_VLAN_OFFLOAD) || defined(IAVF_RX_RSS_OFFLOAD)
 			/* get only flag/error bits we want */
 			const __m256i flag_bits =
 				_mm256_and_si256(status0_7, flags_mask);
+#endif
+#ifdef IAVF_RX_CSUM_OFFLOAD
 			/**
 			 * l3_l4_error flags, shuffle, then shift to correct adjustment
 			 * of flags in flags_shuf, and finally mask out extra bits

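The two _mm256_set_epi8() tables moved into the offload branch above are lookup tables implemented with a byte shuffle: the three checksum-error bits (descriptor bits 6:4) or the RSS/VLAN bits (12:13) act as per-lane indices, and each table entry is a ready-made set of mbuf flag bits. Entries of the checksum table are stored shifted right by 1 so the widest combination fits in a byte, then shifted back left after the shuffle. The same trick in scalar form, with illustrative flag values standing in for the PKT_RX_* constants:

    #include <stdint.h>
    #include <stdio.h>

    /* Illustrative stand-ins for the PKT_RX_* checksum flags. */
    #define IP_GOOD  (1u << 1)
    #define IP_BAD   (1u << 2)
    #define L4_GOOD  (1u << 3)
    #define L4_BAD   (1u << 4)
    #define EIP_BAD  (1u << 5)

    int main(void)
    {
        /* Index = descriptor error bits 6:4 (IPE, L4E, EIPE); each entry is
         * pre-shifted right by 1 so it stays <= 255, exactly what the
         * vector code feeds to _mm256_shuffle_epi8.
         */
        const uint8_t l3_l4_lut[8] = {
            (L4_GOOD | IP_GOOD) >> 1,
            (L4_GOOD | IP_BAD)  >> 1,
            (L4_BAD  | IP_GOOD) >> 1,
            (L4_BAD  | IP_BAD)  >> 1,
            (EIP_BAD | L4_GOOD | IP_GOOD) >> 1,
            (EIP_BAD | L4_GOOD | IP_BAD)  >> 1,
            (EIP_BAD | L4_BAD  | IP_GOOD) >> 1,
            (EIP_BAD | L4_BAD  | IP_BAD)  >> 1,
        };

        uint32_t status = 1u << 5;                      /* pretend: L4E set */
        uint32_t idx = (status >> 4) & 0x7;             /* the srli-by-4 step */
        uint32_t flags = (uint32_t)l3_l4_lut[idx] << 1; /* undo the >> 1 */

        printf("ol_flags = 0x%x\n", flags);             /* L4_BAD | IP_GOOD */
        return 0;
    }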
@@ -1018,17 +1039,25 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 						_mm256_srli_epi32(flag_bits, 4));
 			l3_l4_flags = _mm256_slli_epi32(l3_l4_flags, 1);
 			l3_l4_flags = _mm256_and_si256(l3_l4_flags, cksum_mask);
+#endif
+#if defined(IAVF_RX_VLAN_OFFLOAD) || defined(IAVF_RX_RSS_OFFLOAD)
 			/* set rss and vlan flags */
 			const __m256i rss_vlan_flag_bits =
 				_mm256_srli_epi32(flag_bits, 12);
 			const __m256i rss_vlan_flags =
 				_mm256_shuffle_epi8(rss_vlan_flags_shuf,
 						    rss_vlan_flag_bits);
+#endif

-			/* merge flags */
-			__m256i mbuf_flags = _mm256_or_si256(l3_l4_flags,
-							     rss_vlan_flags);
+#ifdef IAVF_RX_CSUM_OFFLOAD
+			mbuf_flags = _mm256_or_si256(mbuf_flags, l3_l4_flags);
+#endif
+#if defined(IAVF_RX_VLAN_OFFLOAD) || defined(IAVF_RX_RSS_OFFLOAD)
+			mbuf_flags = _mm256_or_si256(mbuf_flags, rss_vlan_flags);
+#endif
+		}

+#ifdef IAVF_RX_FDIR_OFFLOAD
 		if (rxq->fdir_enabled) {
 			const __m512i fdir_permute_mask = _mm512_set_epi32
 				(0, 0, 0, 0,

@@ -1070,6 +1099,7 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 			rx_pkts[i + 7]->hash.fdir.hi =
 				_mm256_extract_epi32(fdir_id0_7, 4);
 		} /* if() on fdir_enabled */
+#endif

 		__m256i mb4_5 = _mm512_extracti64x4_epi64(mb4_7, 0);
 		__m256i mb6_7 = _mm512_extracti64x4_epi64(mb4_7, 1);

@@ -1077,6 +1107,8 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 		__m256i mb2_3 = _mm512_extracti64x4_epi64(mb0_3, 1);

 #ifndef RTE_LIBRTE_IAVF_16BYTE_RX_DESC
+		if (offload) {
+#ifdef IAVF_RX_RSS_OFFLOAD
 		/**
 		 * needs to load 2nd 16B of each desc for RSS hash parsing,
 		 * will cause performance drop to get into this context.

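The warning in this hunk's comment is about descriptor width: the flexible Rx descriptor is 32 bytes, the hot loop needs only its first 16 bytes, and the RSS hash sits in the second half, so delivering the hash costs an extra 16-byte load per descriptor. A toy illustration of why the layout makes this path more expensive (offsets and field names here are made up, not the real descriptor):

    #include <stdint.h>

    /* Toy 32B write-back descriptor: the hot loop parses only the low
     * half; the RSS hash lives in the high half.
     */
    struct toy_rx_desc {
        uint8_t  low16[16];     /* length/ptype/status: always loaded */
        uint8_t  misc[12];
        uint32_t rss_hash;      /* read only when the offload needs it */
    };

    /* Extra load that exists only on the offload path. */
    static inline uint32_t
    toy_read_rss(const struct toy_rx_desc *d)
    {
        return d->rss_hash;     /* second 16B touched here */
    }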
@@ -1165,6 +1197,8 @@ _iavf_recv_raw_pkts_vec_avx512_flex_rxd(struct iavf_rx_queue *rxq,
 			mb0_1 = _mm256_or_si256(mb0_1, rss_hash0_1);
 		} /* if() on RSS hash parsing */
+#endif
+		}
 #endif

 		/**
 		 * At this point, we have the 8 sets of flags in the low 16-bits

@@ -1330,7 +1364,7 @@ iavf_recv_pkts_vec_avx512_flex_rxd(void *rx_queue, struct rte_mbuf **rx_pkts,
 				   uint16_t nb_pkts)
 {
 	return _iavf_recv_raw_pkts_vec_avx512_flex_rxd(rx_queue, rx_pkts,
-						       nb_pkts, NULL);
+						       nb_pkts, NULL, false);
 }

 /**

@@ -1412,17 +1446,18 @@ iavf_recv_scattered_pkts_vec_avx512(void *rx_queue, struct rte_mbuf **rx_pkts,
  * Notice:
  * - nb_pkts < IAVF_DESCS_PER_LOOP, just return no packet
  */
-static uint16_t
+static __rte_always_inline uint16_t
 iavf_recv_scattered_burst_vec_avx512_flex_rxd(void *rx_queue,
 					      struct rte_mbuf **rx_pkts,
-					      uint16_t nb_pkts)
+					      uint16_t nb_pkts,
+					      bool offload)
 {
 	struct iavf_rx_queue *rxq = rx_queue;
 	uint8_t split_flags[IAVF_VPMD_RX_MAX_BURST] = {0};

 	/* get some new buffers */
 	uint16_t nb_bufs = _iavf_recv_raw_pkts_vec_avx512_flex_rxd(rxq,
-					rx_pkts, nb_pkts, split_flags);
+					rx_pkts, nb_pkts, split_flags, offload);
 	if (nb_bufs == 0)
 		return 0;

@@ -1455,10 +1490,11 @@ iavf_recv_scattered_burst_vec_avx512_flex_rxd(void *rx_queue,
  * Notice:
  * - nb_pkts < IAVF_DESCS_PER_LOOP, just return no packet
  */
-uint16_t
-iavf_recv_scattered_pkts_vec_avx512_flex_rxd(void *rx_queue,
+static __rte_always_inline uint16_t
+iavf_recv_scattered_pkts_vec_avx512_flex_rxd_cmn(void *rx_queue,
 					     struct rte_mbuf **rx_pkts,
-					     uint16_t nb_pkts)
+					     uint16_t nb_pkts,
+					     bool offload)
 {
 	uint16_t retval = 0;

@@ -1466,14 +1502,25 @@ iavf_recv_scattered_pkts_vec_avx512_flex_rxd(void *rx_queue,
 		uint16_t burst =
 			iavf_recv_scattered_burst_vec_avx512_flex_rxd
 				(rx_queue, rx_pkts + retval,
-				 IAVF_VPMD_RX_MAX_BURST);
+				 IAVF_VPMD_RX_MAX_BURST, offload);
 		retval += burst;
 		nb_pkts -= burst;
 		if (burst < IAVF_VPMD_RX_MAX_BURST)
 			return retval;
 	}
 	return retval + iavf_recv_scattered_burst_vec_avx512_flex_rxd(rx_queue,
-				rx_pkts + retval, nb_pkts);
+				rx_pkts + retval, nb_pkts, offload);
 }

+uint16_t
+iavf_recv_scattered_pkts_vec_avx512_flex_rxd(void *rx_queue,
+					     struct rte_mbuf **rx_pkts,
+					     uint16_t nb_pkts)
+{
+	return iavf_recv_scattered_pkts_vec_avx512_flex_rxd_cmn(rx_queue,
+								rx_pkts,
+								nb_pkts,
+								false);
+}
+
 uint16_t

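The _cmn helper above retains the existing chunking pattern: requests larger than IAVF_VPMD_RX_MAX_BURST are fed to the burst routine in fixed-size slices, stopping early once a slice comes back short. The control flow on its own (a sketch; the constant's value and the callback type are assumptions, not the driver's definitions):

    #include <stdint.h>

    #define VPMD_RX_MAX_BURST 32   /* stand-in for IAVF_VPMD_RX_MAX_BURST */

    typedef uint16_t (*burst_fn)(void *rxq, void **mbufs, uint16_t n);

    uint16_t
    recv_chunked(void *rxq, void **mbufs, uint16_t nb_pkts, burst_fn burst)
    {
        uint16_t retval = 0;

        while (nb_pkts > VPMD_RX_MAX_BURST) {
            uint16_t n = burst(rxq, mbufs + retval, VPMD_RX_MAX_BURST);

            retval += n;
            nb_pkts -= n;
            /* a short slice means the ring had nothing more to give */
            if (n < VPMD_RX_MAX_BURST)
                return retval;
        }
        return retval + burst(rxq, mbufs + retval, nb_pkts);
    }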
@@ -1493,6 +1540,29 @@ iavf_recv_scattered_pkts_vec_avx512_offload(void *rx_queue,
 					    nb_pkts, true);
 }

+uint16_t
+iavf_recv_pkts_vec_avx512_flex_rxd_offload(void *rx_queue,
+					   struct rte_mbuf **rx_pkts,
+					   uint16_t nb_pkts)
+{
+	return _iavf_recv_raw_pkts_vec_avx512_flex_rxd(rx_queue,
+						       rx_pkts,
+						       nb_pkts,
+						       NULL,
+						       true);
+}
+
+uint16_t
+iavf_recv_scattered_pkts_vec_avx512_flex_rxd_offload(void *rx_queue,
+						     struct rte_mbuf **rx_pkts,
+						     uint16_t nb_pkts)
+{
+	return iavf_recv_scattered_pkts_vec_avx512_flex_rxd_cmn(rx_queue,
+								rx_pkts,
+								nb_pkts,
+								true);
+}
+
 static __rte_always_inline int
 iavf_tx_free_bufs_avx512(struct iavf_tx_queue *txq)
 {