2018-01-29 13:11:30 +00:00
|
|
|
/* SPDX-License-Identifier: BSD-3-Clause
|
|
|
|
* Copyright 2015 6WIND S.A.
|
2018-03-20 19:20:35 +00:00
|
|
|
* Copyright 2015 Mellanox Technologies, Ltd
|
2015-10-30 18:52:30 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include <stddef.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <stdint.h>
|
|
|
|
#include <stdlib.h>
|
2016-06-24 13:17:50 +00:00
|
|
|
#include <errno.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
|
|
|
|
#include <rte_malloc.h>
|
2021-01-29 16:48:19 +00:00
|
|
|
#include <ethdev_driver.h>
|
|
|
|
#include <ethdev_pci.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
#include <rte_pci.h>
|
2017-10-26 10:06:08 +00:00
|
|
|
#include <rte_bus_pci.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
#include <rte_common.h>
|
2016-06-24 13:17:50 +00:00
|
|
|
#include <rte_kvargs.h>
|
2018-05-24 14:36:49 +00:00
|
|
|
#include <rte_rwlock.h>
|
|
|
|
#include <rte_spinlock.h>
|
2018-07-10 16:04:48 +00:00
|
|
|
#include <rte_string_fns.h>
|
2019-07-16 14:34:55 +00:00
|
|
|
#include <rte_alarm.h>
|
2020-12-28 09:54:09 +00:00
|
|
|
#include <rte_cycles.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
|
2020-01-29 12:38:27 +00:00
|
|
|
#include <mlx5_glue.h>
|
|
|
|
#include <mlx5_devx_cmds.h>
|
2020-01-29 12:38:29 +00:00
|
|
|
#include <mlx5_common.h>
|
2020-06-19 07:30:08 +00:00
|
|
|
#include <mlx5_common_os.h>
|
2020-04-13 21:17:47 +00:00
|
|
|
#include <mlx5_common_mp.h>
|
2020-07-27 17:47:14 +00:00
|
|
|
#include <mlx5_common_pci.h>
|
2020-06-28 07:35:26 +00:00
|
|
|
#include <mlx5_malloc.h>
|
2020-01-29 12:38:27 +00:00
|
|
|
|
|
|
|
#include "mlx5_defs.h"
|
2015-10-30 18:52:30 +00:00
|
|
|
#include "mlx5.h"
|
|
|
|
#include "mlx5_utils.h"
|
2015-10-30 18:52:31 +00:00
|
|
|
#include "mlx5_rxtx.h"
|
2021-04-12 06:32:20 +00:00
|
|
|
#include "mlx5_rx.h"
|
2021-04-12 06:32:22 +00:00
|
|
|
#include "mlx5_tx.h"
|
2015-10-30 18:52:30 +00:00
|
|
|
#include "mlx5_autoconf.h"
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
#include "mlx5_mr.h"
|
2018-09-24 23:17:39 +00:00
|
|
|
#include "mlx5_flow.h"
|
2020-12-28 09:54:15 +00:00
|
|
|
#include "mlx5_flow_os.h"
|
2020-01-29 12:21:06 +00:00
|
|
|
#include "rte_pmd_mlx5.h"
|
2015-10-30 18:52:30 +00:00
|
|
|
|
2016-06-24 13:17:54 +00:00
|
|
|
/* Device parameter to enable RX completion queue compression. */
|
|
|
|
#define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en"
|
|
|
|
|
2019-01-15 17:38:58 +00:00
|
|
|
/* Device parameter to enable padding Rx packet to cacheline size. */
|
|
|
|
#define MLX5_RXQ_PKT_PAD_EN "rxq_pkt_pad_en"
|
|
|
|
|
2018-05-09 11:13:50 +00:00
|
|
|
/* Device parameter to enable Multi-Packet Rx queue. */
|
|
|
|
#define MLX5_RX_MPRQ_EN "mprq_en"
|
|
|
|
|
|
|
|
/* Device parameter to configure log 2 of the number of strides for MPRQ. */
|
|
|
|
#define MLX5_RX_MPRQ_LOG_STRIDE_NUM "mprq_log_stride_num"
|
|
|
|
|
2020-04-09 22:23:51 +00:00
|
|
|
/* Device parameter to configure log 2 of the stride size for MPRQ. */
|
|
|
|
#define MLX5_RX_MPRQ_LOG_STRIDE_SIZE "mprq_log_stride_size"
|
|
|
|
|
2018-05-09 11:13:50 +00:00
|
|
|
/* Device parameter to limit the size of memcpy'd packet for MPRQ. */
|
|
|
|
#define MLX5_RX_MPRQ_MAX_MEMCPY_LEN "mprq_max_memcpy_len"
|
|
|
|
|
|
|
|
/* Device parameter to set the minimum number of Rx queues to enable MPRQ. */
|
|
|
|
#define MLX5_RXQS_MIN_MPRQ "rxqs_min_mprq"
|
|
|
|
|
2019-07-21 14:24:53 +00:00
|
|
|
/* Device parameter to configure inline send. Deprecated, ignored. */
|
2016-06-24 13:17:56 +00:00
|
|
|
#define MLX5_TXQ_INLINE "txq_inline"
|
|
|
|
|
2019-07-21 14:24:54 +00:00
|
|
|
/* Device parameter to limit packet size to inline with ordinary SEND. */
|
|
|
|
#define MLX5_TXQ_INLINE_MAX "txq_inline_max"
|
|
|
|
|
|
|
|
/* Device parameter to configure minimal data size to inline. */
|
|
|
|
#define MLX5_TXQ_INLINE_MIN "txq_inline_min"
|
|
|
|
|
|
|
|
/* Device parameter to limit packet size to inline with Enhanced MPW. */
|
|
|
|
#define MLX5_TXQ_INLINE_MPW "txq_inline_mpw"
|
|
|
|
|
2016-06-24 13:17:56 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to configure the number of TX queues threshold for
|
|
|
|
* enabling inline send.
|
|
|
|
*/
|
|
|
|
#define MLX5_TXQS_MIN_INLINE "txqs_min_inline"
|
|
|
|
|
2018-11-01 17:20:32 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to configure the number of TX queues threshold for
|
2019-07-21 14:24:53 +00:00
|
|
|
* enabling vectorized Tx, deprecated, ignored (no vectorized Tx routines).
|
2018-11-01 17:20:32 +00:00
|
|
|
*/
|
|
|
|
#define MLX5_TXQS_MAX_VEC "txqs_max_vec"
|
|
|
|
|
2016-06-24 13:17:57 +00:00
|
|
|
/* Device parameter to enable multi-packet send WQEs. */
|
|
|
|
#define MLX5_TXQ_MPW_EN "txq_mpw_en"
|
|
|
|
|
2019-11-08 15:07:50 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to force doorbell register mapping
|
|
|
|
* to non-cached region eliminating the extra write memory barrier.
|
|
|
|
*/
|
|
|
|
#define MLX5_TX_DB_NC "tx_db_nc"
|
|
|
|
|
2019-07-21 14:24:53 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to include 2 dsegs in the title WQEBB.
|
|
|
|
* Deprecated, ignored.
|
|
|
|
*/
|
2017-03-15 23:55:44 +00:00
|
|
|
#define MLX5_TXQ_MPW_HDR_DSEG_EN "txq_mpw_hdr_dseg_en"
|
|
|
|
|
2019-07-21 14:24:53 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to limit the size of inlining packet.
|
|
|
|
* Deprecated, ignored.
|
|
|
|
*/
|
2017-03-15 23:55:44 +00:00
|
|
|
#define MLX5_TXQ_MAX_INLINE_LEN "txq_max_inline_len"
|
|
|
|
|
2020-07-16 08:23:05 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to enable Tx scheduling on timestamps
|
|
|
|
* and specify the packet pacing granularity in nanoseconds.
|
|
|
|
*/
|
|
|
|
#define MLX5_TX_PP "tx_pp"
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Device parameter to specify skew in nanoseconds on Tx datapath,
|
|
|
|
* it represents the time between SQ start WQE processing and
|
|
|
|
* appearing actual packet data on the wire.
|
|
|
|
*/
|
|
|
|
#define MLX5_TX_SKEW "tx_skew"
|
|
|
|
|
2019-07-21 14:24:53 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to enable hardware Tx vector.
|
|
|
|
* Deprecated, ignored (no vectorized Tx routines anymore).
|
|
|
|
*/
|
2017-08-02 15:32:56 +00:00
|
|
|
#define MLX5_TX_VEC_EN "tx_vec_en"
|
|
|
|
|
|
|
|
/* Device parameter to enable hardware Rx vector. */
|
|
|
|
#define MLX5_RX_VEC_EN "rx_vec_en"
|
|
|
|
|
2018-04-23 12:33:02 +00:00
|
|
|
/* Allow L3 VXLAN flow creation. */
|
|
|
|
#define MLX5_L3_VXLAN_EN "l3_vxlan_en"
|
|
|
|
|
2019-04-18 13:16:01 +00:00
|
|
|
/* Activate DV E-Switch flow steering. */
|
|
|
|
#define MLX5_DV_ESW_EN "dv_esw_en"
|
|
|
|
|
2018-09-24 23:17:54 +00:00
|
|
|
/* Activate DV flow steering. */
|
|
|
|
#define MLX5_DV_FLOW_EN "dv_flow_en"
|
|
|
|
|
net/mlx5: add devarg for extensive metadata support
The PMD parameter dv_xmeta_en is added to control extensive
metadata support. A nonzero value enables extensive flow
metadata support if device is capable and driver supports it.
This can enable extensive support of MARK and META item of
rte_flow. The newly introduced SET_TAG and SET_META actions
do not depend on dv_xmeta_en parameter, because there is
no compatibility issue for new entities. The dv_xmeta_en is
disabled by default.
There are some possible configurations, depending on parameter
value:
- 0, this is default value, defines the legacy mode, the MARK
and META related actions and items operate only within NIC Tx
and NIC Rx steering domains, no MARK and META information
crosses the domain boundaries. The MARK item is 24 bits wide,
the META item is 32 bits wide.
- 1, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The ``MARK`` item is 24 bits wide, the
META item width depends on kernel and firmware configurations
and might be 0, 16 or 32 bits. Within NIC Tx domain META data
width is 32 bits for compatibility, the actual width of data
transferred to the FDB domain depends on kernel configuration
and may vary. The actual supported width can be retrieved
in runtime by series of rte_flow_validate() trials.
- 2, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The META item is 32 bits wide, the MARK
item width depends on kernel and firmware configurations and
might be 0, 16 or 24 bits. The actual supported width can be
retrieved in runtime by series of rte_flow_validate() trials.
If there is no E-Switch configuration the ``dv_xmeta_en`` parameter is
ignored and the device is configured to operate in legacy mode (0).
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2019-11-07 17:09:54 +00:00
|
|
|
/* Enable extensive flow metadata support. */
|
|
|
|
#define MLX5_DV_XMETA_EN "dv_xmeta_en"
|
|
|
|
|
2020-06-23 08:41:07 +00:00
|
|
|
/* Device parameter to let the user manage the LACP traffic of a bonded device. */
|
|
|
|
#define MLX5_LACP_BY_USER "lacp_by_user"
|
|
|
|
|
2018-04-05 15:07:21 +00:00
|
|
|
/* Activate Netlink support in VF mode. */
|
|
|
|
#define MLX5_VF_NL_EN "vf_nl_en"
|
|
|
|
|
2019-04-01 21:17:54 +00:00
|
|
|
/* Enable extending memsegs when creating a MR. */
|
|
|
|
#define MLX5_MR_EXT_MEMSEG_EN "mr_ext_memseg_en"
|
|
|
|
|
2018-07-10 16:04:58 +00:00
|
|
|
/* Select port representors to instantiate. */
|
|
|
|
#define MLX5_REPRESENTOR "representor"
|
|
|
|
|
2019-05-30 10:20:32 +00:00
|
|
|
/* Device parameter to configure the maximum number of dump files per queue. */
|
|
|
|
#define MLX5_MAX_DUMP_FILES_NUM "max_dump_files_num"
|
|
|
|
|
2019-07-22 14:51:59 +00:00
|
|
|
/* Configure timeout of LRO session (in microseconds). */
|
|
|
|
#define MLX5_LRO_TIMEOUT_USEC "lro_timeout_usec"
|
|
|
|
|
2020-03-24 12:59:01 +00:00
|
|
|
/*
|
|
|
|
* Device parameter to configure the total data buffer size for a single
|
|
|
|
* hairpin queue (logarithm value).
|
|
|
|
*/
|
|
|
|
#define MLX5_HP_BUF_SIZE "hp_buf_log_sz"
|
|
|
|
|
net/mlx5: add reclaim memory mode
Currently, when flow destroyed, some memory resources may still be kept
as cached to help next time create flow more efficiently.
Some system may need the resources to be more flexible with flow create
and destroy. After peak time, with millions of flows destroyed, the
system would prefer the resources to be reclaimed completely, no cache
is needed. Then the resources can be allocated and used by other
components. The system is not so sensitive about the flow insertion
rate, but more care about the resources.
Both DPDK mlx5 PMD driver and the low level component rdma-core have
provided the flow resources to be configured cached or not, but there is
no APIs or parameters exposed to user to configure the flow resources
cache mode. In this case, introduce a new PMD devarg to let user
configure the flow resources cache mode will be helpful.
This commit is to add a new "reclaim_mem_mode" to help user configure if
the destroyed flows' cache resources should be kept or not.
There are three modes to choose from:
1. 0(none). It means the flow resources will be cached as usual. The
resources will be cached, helpful with flow insertion rate.
2. 1(light). It will only enable the DPDK PMD level resources reclaim.
3. 2(aggressive). Both DPDK PMD level and rdma-core low level will be
configured as reclaimed mode.
With these three mode, user can configure the resources cache mode with
different levels.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
2020-06-01 06:09:43 +00:00
|
|
|
/* Flow memory reclaim mode. */
|
|
|
|
#define MLX5_RECLAIM_MEM "reclaim_mem_mode"
|
|
|
|
|
net/mlx5: add option to allocate memory from system
Currently, for MLX5 PMD, once millions of flows created, the memory
consumption of the flows are also very huge. For the system with limited
memory, it means the system need to reserve most of the memory as huge
page memory to serve the flows in advance. And other normal applications
will have no chance to use this reserved memory any more. While most of
the time, the system will not have lots of flows, the reserved huge
page memory becomes a bit waste of memory at most of the time.
With the new sys_mem_en devarg set to true, the PMD allocates memory
from the system by default using the newly added mlx5 memory management
functions. Only when the MLX5_MEM_RTE flag is set is the memory
allocated from rte; otherwise, it is allocated from the system.
So in this case, the system with limited memory no need to reserve most
of the memory for hugepage. Only some needed memory for datapath objects
will be enough to allocated with explicitly flag. Other memory will be
allocated from system. For system with enough memory, no need to care
about the devarg, the memory will always be from rte hugepage.
One restriction is that for DPDK application with multiple PCI devices,
if the sys_mem_en devargs are different between the devices, the
sys_mem_en only gets the value from the first device devargs, and print
out a message to warn that.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2020-06-28 03:41:57 +00:00
|
|
|
/* The default memory allocator used in PMD. */
|
|
|
|
#define MLX5_SYS_MEM_EN "sys_mem_en"
|
2020-07-15 13:10:21 +00:00
|
|
|
/* Device parameter to specify whether decap will be used or not. */
|
|
|
|
#define MLX5_DECAP_EN "decap_en"
|
net/mlx5: add option to allocate memory from system
Currently, for MLX5 PMD, once millions of flows created, the memory
consumption of the flows are also very huge. For the system with limited
memory, it means the system need to reserve most of the memory as huge
page memory to serve the flows in advance. And other normal applications
will have no chance to use this reserved memory any more. While most of
the time, the system will not have lots of flows, the reserved huge
page memory becomes a bit waste of memory at most of the time.
With the new sys_mem_en devarg set to true, the PMD allocates memory
from the system by default using the newly added mlx5 memory management
functions. Only when the MLX5_MEM_RTE flag is set is the memory
allocated from rte; otherwise, it is allocated from the system.
So in this case, the system with limited memory no need to reserve most
of the memory for hugepage. Only some needed memory for datapath objects
will be enough to allocated with explicitly flag. Other memory will be
allocated from system. For system with enough memory, no need to care
about the devarg, the memory will always be from rte hugepage.
One restriction is that for DPDK application with multiple PCI devices,
if the sys_mem_en devargs are different between the devices, the
sys_mem_en only gets the value from the first device devargs, and print
out a message to warn that.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2020-06-28 03:41:57 +00:00
|
|
|
|
2021-07-06 08:12:27 +00:00
|
|
|
/* Device parameter to allow or prevent duplicate rule patterns. */
|
|
|
|
#define MLX5_ALLOW_DUPLICATE_PATTERN "allow_duplicate_pattern"
|
|
|
|
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
/* Shared memory between primary and secondary processes. */
|
|
|
|
struct mlx5_shared_data *mlx5_shared_data;
|
|
|
|
|
2020-07-19 10:18:15 +00:00
|
|
|
/** Driver-specific log messages type. */
|
|
|
|
int mlx5_logtype;
|
2018-03-13 09:23:56 +00:00
|
|
|
|
2020-06-10 09:32:27 +00:00
|
|
|
/* File-local list head whose elements are struct mlx5_dev_ctx_shared. */
static LIST_HEAD(, mlx5_dev_ctx_shared) mlx5_dev_ctx_list =
|
|
|
|
LIST_HEAD_INITIALIZER();
|
2020-12-28 12:32:59 +00:00
|
|
|
/*
 * NOTE(review): presumably serializes access to mlx5_dev_ctx_list - confirm
 * against its users. There is no static initializer here, so it is expected
 * to be initialized at run time before first use - TODO confirm.
 */
static pthread_mutex_t mlx5_dev_ctx_list_mutex;
|
2020-06-08 16:01:56 +00:00
|
|
|
static const struct mlx5_indexed_pool_config mlx5_ipool_cfg[] = {
|
2020-12-28 12:32:55 +00:00
|
|
|
#if defined(HAVE_IBV_FLOW_DV_SUPPORT) || !defined(HAVE_INFINIBAND_VERBS_H)
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_DECAP_ENCAP] = {
|
2020-04-16 02:42:02 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_dv_encap_decap_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 02:42:02 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:02 +00:00
|
|
|
.type = "mlx5_encap_decap_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_PUSH_VLAN] = {
|
2020-04-16 02:42:03 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_dv_push_vlan_action_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 02:42:03 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:03 +00:00
|
|
|
.type = "mlx5_push_vlan_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_TAG] = {
|
2020-04-16 02:42:04 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_dv_tag_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 02:42:04 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:04 +00:00
|
|
|
.type = "mlx5_tag_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_PORT_ID] = {
|
2020-04-16 02:42:05 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_dv_port_id_action_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 02:42:05 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:05 +00:00
|
|
|
.type = "mlx5_port_id_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_JUMP] = {
|
2020-04-16 02:42:06 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_tbl_data_entry),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 02:42:06 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:06 +00:00
|
|
|
.type = "mlx5_jump_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_SAMPLE] = {
|
2020-10-13 14:11:46 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_dv_sample_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-10-13 14:11:46 +00:00
|
|
|
.release_mem_en = 1,
|
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
|
|
|
.type = "mlx5_sample_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_DEST_ARRAY] = {
|
2020-10-13 14:11:50 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_dv_dest_array_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-10-13 14:11:50 +00:00
|
|
|
.release_mem_en = 1,
|
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
|
|
|
.type = "mlx5_dest_array_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_TUNNEL_ID] = {
|
|
|
|
.size = sizeof(struct mlx5_flow_tunnel),
|
2020-12-07 05:58:34 +00:00
|
|
|
.trunk_size = MLX5_MAX_TUNNELS,
|
2020-11-16 14:02:21 +00:00
|
|
|
.need_lock = 1,
|
|
|
|
.release_mem_en = 1,
|
|
|
|
.type = "mlx5_tunnel_offload",
|
|
|
|
},
|
|
|
|
[MLX5_IPOOL_TNL_TBL_ID] = {
|
|
|
|
.size = 0,
|
|
|
|
.need_lock = 1,
|
|
|
|
.type = "mlx5_flow_tnl_tbl_ipool",
|
|
|
|
},
|
2020-04-16 02:42:08 +00:00
|
|
|
#endif
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_MTR] = {
|
2021-04-20 10:55:10 +00:00
|
|
|
/**
|
|
|
|
* The ipool index should grow continually from small to big,
|
|
|
|
* for meter idx, so not set grow_trunk to avoid meter index
|
|
|
|
* not jump continually.
|
|
|
|
*/
|
2021-04-20 10:55:16 +00:00
|
|
|
.size = sizeof(struct mlx5_legacy_flow_meter),
|
2020-04-16 08:34:26 +00:00
|
|
|
.trunk_size = 64,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 08:34:26 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 08:34:26 +00:00
|
|
|
.type = "mlx5_meter_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_MCP] = {
|
2020-04-16 08:34:27 +00:00
|
|
|
.size = sizeof(struct mlx5_flow_mreg_copy_resource),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 08:34:27 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 08:34:27 +00:00
|
|
|
.type = "mlx5_mcp_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_HRXQ] = {
|
2020-04-16 02:42:07 +00:00
|
|
|
.size = (sizeof(struct mlx5_hrxq) + MLX5_RSS_HASH_KEY_LEN),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2020-04-16 02:42:07 +00:00
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:07 +00:00
|
|
|
.type = "mlx5_hrxq_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_MLX5_FLOW] = {
|
2020-06-08 16:01:56 +00:00
|
|
|
/*
|
|
|
|
* MLX5_IPOOL_MLX5_FLOW size varies for DV and VERBS flows.
|
|
|
|
* It set in run time according to PCI function configuration.
|
|
|
|
*/
|
|
|
|
.size = 0,
|
2020-04-16 02:42:08 +00:00
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
2020-10-28 09:33:20 +00:00
|
|
|
.need_lock = 1,
|
2021-07-13 08:44:39 +00:00
|
|
|
.release_mem_en = 0,
|
|
|
|
.per_core_cache = 1 << 19,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 02:42:08 +00:00
|
|
|
.type = "mlx5_flow_handle_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_RTE_FLOW] = {
|
2020-04-16 08:34:30 +00:00
|
|
|
.size = sizeof(struct rte_flow),
|
|
|
|
.trunk_size = 4096,
|
|
|
|
.need_lock = 1,
|
|
|
|
.release_mem_en = 1,
|
2020-06-28 07:35:26 +00:00
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
2020-04-16 08:34:30 +00:00
|
|
|
.type = "rte_flow_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_RSS_EXPANTION_FLOW_ID] = {
|
2020-10-28 09:33:24 +00:00
|
|
|
.size = 0,
|
|
|
|
.need_lock = 1,
|
|
|
|
.type = "mlx5_flow_rss_id_ipool",
|
|
|
|
},
|
2020-11-16 14:02:21 +00:00
|
|
|
[MLX5_IPOOL_RSS_SHARED_ACTIONS] = {
|
2020-11-01 17:57:50 +00:00
|
|
|
.size = sizeof(struct mlx5_shared_action_rss),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.grow_trunk = 3,
|
|
|
|
.grow_shift = 2,
|
|
|
|
.need_lock = 1,
|
|
|
|
.release_mem_en = 1,
|
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
|
|
|
.type = "mlx5_shared_action_rss",
|
|
|
|
},
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
[MLX5_IPOOL_MTR_POLICY] = {
|
|
|
|
/**
|
|
|
|
* The ipool index should grow continually from small to big,
|
|
|
|
* for policy idx, so not set grow_trunk to avoid policy index
|
|
|
|
* not jump continually.
|
|
|
|
*/
|
|
|
|
.size = sizeof(struct mlx5_flow_meter_sub_policy),
|
|
|
|
.trunk_size = 64,
|
|
|
|
.need_lock = 1,
|
|
|
|
.release_mem_en = 1,
|
|
|
|
.malloc = mlx5_malloc,
|
|
|
|
.free = mlx5_free,
|
|
|
|
.type = "mlx5_meter_policy_ipool",
|
|
|
|
},
|
2020-04-16 02:42:02 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
|
2019-10-30 23:53:21 +00:00
|
|
|
#define MLX5_FLOW_MIN_ID_POOL_SIZE 512
|
|
|
|
#define MLX5_ID_GENERATION_ARRAY_FACTOR 16
|
|
|
|
|
2019-11-08 15:23:08 +00:00
|
|
|
#define MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE 4096
|
|
|
|
|
net/mlx5: refactor bonding representor probing
To probe representor on 2nd PF of kernel bonding device, had to specify
PF1 BDF in devarg:
<PF1_BDF>,representor=0
When closing bonding device, all representors had to be closed together
and this implies all representors have to use primary PF of bonding
device. So after probing representor port on 2nd PF, when locating new
probed device using device argument, the filter used 2nd PF as PCI
address and failed to locate new device.
Conflict happened by using current representor devargs:
- Use PCI BDF to specify representor owner PF
- Use PCI BDF to locate probed representor device.
- PMD uses primary PCI BDF as PCI device.
To resolve such conflicts, new representor syntax is introduced here:
<primary BDF>,representor=pfXvfY
All representors must use primary PF as owner PCI device, PMD internally
locate owner PCI address by checking representor "pfX" part. To EAL, all
representors are registered to primary PCI device, the 2nd PF is hidden
to EAL, thus all search should be consistent.
Same to VF representor, HPF (host PF on BlueField) uses same syntax to
probe, example: representor=pf1vf[0-3,-1]
This patch also adds pf index into kernel bonding representor port name:
<BDF>_<ib_name>_representor_pf<X>vf<Y>
Signed-off-by: Xueming Li <xuemingl@nvidia.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@nvidia.com>
2021-03-28 13:48:10 +00:00
|
|
|
/**
|
|
|
|
* Decide whether representor ID is a HPF(host PF) port on BF2.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* Non-zero if HPF, otherwise 0.
|
|
|
|
*/
|
|
|
|
bool
|
|
|
|
mlx5_is_hpf(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
|
|
|
uint16_t repr = MLX5_REPRESENTOR_REPR(priv->representor_id);
|
|
|
|
int type = MLX5_REPRESENTOR_TYPE(priv->representor_id);
|
|
|
|
|
|
|
|
return priv->representor != 0 && type == RTE_ETH_REPRESENTOR_VF &&
|
|
|
|
MLX5_REPRESENTOR_REPR(-1) == repr;
|
|
|
|
}
|
|
|
|
|
2020-11-01 17:57:49 +00:00
|
|
|
/**
|
|
|
|
* Initialize the ASO aging management structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on success, a negative errno value otherwise and rte_errno is set.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
mlx5_flow_aso_age_mng_init(struct mlx5_dev_ctx_shared *sh)
|
|
|
|
{
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (sh->aso_age_mng)
|
|
|
|
return 0;
|
|
|
|
sh->aso_age_mng = mlx5_malloc(MLX5_MEM_ZERO, sizeof(*sh->aso_age_mng),
|
|
|
|
RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
|
|
|
|
if (!sh->aso_age_mng) {
|
|
|
|
DRV_LOG(ERR, "aso_age_mng allocation was failed.");
|
|
|
|
rte_errno = ENOMEM;
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
2021-04-20 10:55:17 +00:00
|
|
|
err = mlx5_aso_queue_init(sh, ASO_OPC_MOD_FLOW_HIT);
|
2020-11-01 17:57:49 +00:00
|
|
|
if (err) {
|
|
|
|
mlx5_free(sh->aso_age_mng);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
rte_spinlock_init(&sh->aso_age_mng->resize_sl);
|
|
|
|
rte_spinlock_init(&sh->aso_age_mng->free_sl);
|
|
|
|
LIST_INIT(&sh->aso_age_mng->free);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Close and release all the resources of the ASO aging management structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
mlx5_flow_aso_age_mng_close(struct mlx5_dev_ctx_shared *sh)
|
|
|
|
{
|
|
|
|
int i, j;
|
|
|
|
|
2021-04-20 10:55:17 +00:00
|
|
|
mlx5_aso_flow_hit_queue_poll_stop(sh);
|
|
|
|
mlx5_aso_queue_uninit(sh, ASO_OPC_MOD_FLOW_HIT);
|
2020-11-01 17:57:49 +00:00
|
|
|
if (sh->aso_age_mng->pools) {
|
|
|
|
struct mlx5_aso_age_pool *pool;
|
|
|
|
|
|
|
|
for (i = 0; i < sh->aso_age_mng->next; ++i) {
|
|
|
|
pool = sh->aso_age_mng->pools[i];
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy
|
|
|
|
(pool->flow_hit_aso_obj));
|
|
|
|
for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j)
|
|
|
|
if (pool->actions[j].dr_action)
|
|
|
|
claim_zero
|
2020-12-28 09:54:15 +00:00
|
|
|
(mlx5_flow_os_destroy_flow_action
|
|
|
|
(pool->actions[j].dr_action));
|
2020-11-01 17:57:49 +00:00
|
|
|
mlx5_free(pool);
|
|
|
|
}
|
|
|
|
mlx5_free(sh->aso_age_mng->pools);
|
|
|
|
}
|
2020-11-18 08:59:55 +00:00
|
|
|
mlx5_free(sh->aso_age_mng);
|
2020-11-01 17:57:49 +00:00
|
|
|
}
|
|
|
|
|
2020-04-29 02:25:09 +00:00
|
|
|
/**
|
|
|
|
* Initialize the shared aging list information per port.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object.
|
2020-04-29 02:25:09 +00:00
|
|
|
*/
|
|
|
|
static void
|
2020-06-03 15:05:55 +00:00
|
|
|
mlx5_flow_aging_init(struct mlx5_dev_ctx_shared *sh)
|
2020-04-29 02:25:09 +00:00
|
|
|
{
|
|
|
|
uint32_t i;
|
|
|
|
struct mlx5_age_info *age_info;
|
|
|
|
|
|
|
|
for (i = 0; i < sh->max_port; i++) {
|
|
|
|
age_info = &sh->port[i].age_info;
|
|
|
|
age_info->flags = 0;
|
|
|
|
TAILQ_INIT(&age_info->aged_counters);
|
2020-11-01 17:57:52 +00:00
|
|
|
LIST_INIT(&age_info->aged_aso);
|
2020-04-29 02:25:09 +00:00
|
|
|
rte_spinlock_init(&age_info->aged_sl);
|
|
|
|
MLX5_AGE_SET(age_info, MLX5_AGE_TRIGGER);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-07-16 14:34:53 +00:00
|
|
|
/**
|
|
|
|
* Initialize the counters management structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free
|
2019-07-16 14:34:53 +00:00
|
|
|
*/
|
|
|
|
static void
|
2020-06-03 15:05:55 +00:00
|
|
|
mlx5_flow_counters_mng_init(struct mlx5_dev_ctx_shared *sh)
|
2019-07-16 14:34:53 +00:00
|
|
|
{
|
2020-10-20 03:02:23 +00:00
|
|
|
int i;
|
2019-07-16 14:34:53 +00:00
|
|
|
|
2020-05-12 12:52:13 +00:00
|
|
|
memset(&sh->cmng, 0, sizeof(sh->cmng));
|
2019-07-16 14:34:53 +00:00
|
|
|
TAILQ_INIT(&sh->cmng.flow_counters);
|
2020-10-20 03:02:23 +00:00
|
|
|
sh->cmng.min_id = MLX5_CNT_BATCH_OFFSET;
|
|
|
|
sh->cmng.max_id = -1;
|
|
|
|
sh->cmng.last_pool_idx = POOL_IDX_INVALID;
|
2020-10-20 03:02:24 +00:00
|
|
|
rte_spinlock_init(&sh->cmng.pool_update_sl);
|
2020-10-20 03:02:23 +00:00
|
|
|
for (i = 0; i < MLX5_COUNTER_TYPE_MAX; i++) {
|
|
|
|
TAILQ_INIT(&sh->cmng.counters[i]);
|
|
|
|
rte_spinlock_init(&sh->cmng.csl[i]);
|
2020-04-29 02:25:09 +00:00
|
|
|
}
|
2019-07-16 14:34:53 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Destroy all the resources allocated for a counter memory management.
|
|
|
|
*
|
|
|
|
* @param[in] mng
|
|
|
|
* Pointer to the memory management structure.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
mlx5_flow_destroy_counter_stat_mem_mng(struct mlx5_counter_stats_mem_mng *mng)
|
|
|
|
{
|
|
|
|
uint8_t *mem = (uint8_t *)(uintptr_t)mng->raws[0].data;
|
|
|
|
|
|
|
|
LIST_REMOVE(mng, next);
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy(mng->dm));
|
2020-12-28 09:54:14 +00:00
|
|
|
claim_zero(mlx5_os_umem_dereg(mng->umem));
|
2020-06-28 07:35:26 +00:00
|
|
|
mlx5_free(mem);
|
2019-07-16 14:34:53 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Close and release all the resources of the counters management.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free.
|
2019-07-16 14:34:53 +00:00
|
|
|
*/
|
|
|
|
static void
|
2020-06-03 15:05:55 +00:00
|
|
|
mlx5_flow_counters_mng_close(struct mlx5_dev_ctx_shared *sh)
|
2019-07-16 14:34:53 +00:00
|
|
|
{
|
|
|
|
struct mlx5_counter_stats_mem_mng *mng;
|
2020-10-20 03:02:24 +00:00
|
|
|
int i, j;
|
2019-07-16 14:34:55 +00:00
|
|
|
int retries = 1024;
|
|
|
|
|
|
|
|
rte_errno = 0;
|
|
|
|
while (--retries) {
|
|
|
|
rte_eal_alarm_cancel(mlx5_flow_query_alarm, sh);
|
|
|
|
if (rte_errno != EINPROGRESS)
|
|
|
|
break;
|
|
|
|
rte_pause();
|
|
|
|
}
|
2020-10-20 03:02:23 +00:00
|
|
|
|
|
|
|
if (sh->cmng.pools) {
|
2020-05-12 12:52:13 +00:00
|
|
|
struct mlx5_flow_counter_pool *pool;
|
2020-10-20 03:02:24 +00:00
|
|
|
uint16_t n_valid = sh->cmng.n_valid;
|
2020-10-20 03:02:28 +00:00
|
|
|
bool fallback = sh->cmng.counter_fallback;
|
2020-05-12 12:52:13 +00:00
|
|
|
|
2020-10-20 03:02:24 +00:00
|
|
|
for (i = 0; i < n_valid; ++i) {
|
|
|
|
pool = sh->cmng.pools[i];
|
2020-10-20 03:02:28 +00:00
|
|
|
if (!fallback && pool->min_dcs)
|
2020-05-12 12:52:13 +00:00
|
|
|
claim_zero(mlx5_devx_cmd_destroy
|
|
|
|
(pool->min_dcs));
|
|
|
|
for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j) {
|
2020-10-20 03:02:28 +00:00
|
|
|
struct mlx5_flow_counter *cnt =
|
|
|
|
MLX5_POOL_GET_CNT(pool, j);
|
|
|
|
|
|
|
|
if (cnt->action)
|
2020-05-12 12:52:13 +00:00
|
|
|
claim_zero
|
2020-12-28 09:54:15 +00:00
|
|
|
(mlx5_flow_os_destroy_flow_action
|
2020-10-20 03:02:28 +00:00
|
|
|
(cnt->action));
|
|
|
|
if (fallback && MLX5_POOL_GET_CNT
|
|
|
|
(pool, j)->dcs_when_free)
|
2020-05-12 12:52:13 +00:00
|
|
|
claim_zero(mlx5_devx_cmd_destroy
|
2020-10-20 03:02:28 +00:00
|
|
|
(cnt->dcs_when_free));
|
2019-07-16 14:34:53 +00:00
|
|
|
}
|
2020-06-28 07:35:26 +00:00
|
|
|
mlx5_free(pool);
|
2019-07-16 14:34:53 +00:00
|
|
|
}
|
2020-10-20 03:02:23 +00:00
|
|
|
mlx5_free(sh->cmng.pools);
|
2019-07-16 14:34:53 +00:00
|
|
|
}
|
|
|
|
mng = LIST_FIRST(&sh->cmng.mem_mngs);
|
|
|
|
while (mng) {
|
|
|
|
mlx5_flow_destroy_counter_stat_mem_mng(mng);
|
|
|
|
mng = LIST_FIRST(&sh->cmng.mem_mngs);
|
|
|
|
}
|
|
|
|
memset(&sh->cmng, 0, sizeof(sh->cmng));
|
|
|
|
}
|
|
|
|
|
2021-04-20 10:55:17 +00:00
|
|
|
/**
|
|
|
|
* Initialize the aso flow meters management structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free
|
|
|
|
*/
|
|
|
|
int
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
mlx5_aso_flow_mtrs_mng_init(struct mlx5_dev_ctx_shared *sh)
|
2021-04-20 10:55:17 +00:00
|
|
|
{
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
if (!sh->mtrmng) {
|
|
|
|
sh->mtrmng = mlx5_malloc(MLX5_MEM_ZERO,
|
|
|
|
sizeof(*sh->mtrmng),
|
2021-04-20 10:55:17 +00:00
|
|
|
RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
if (!sh->mtrmng) {
|
|
|
|
DRV_LOG(ERR,
|
|
|
|
"meter management allocation was failed.");
|
2021-04-20 10:55:17 +00:00
|
|
|
rte_errno = ENOMEM;
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
if (sh->meter_aso_en) {
|
|
|
|
rte_spinlock_init(&sh->mtrmng->pools_mng.mtrsl);
|
|
|
|
LIST_INIT(&sh->mtrmng->pools_mng.meters);
|
|
|
|
}
|
|
|
|
sh->mtrmng->def_policy_id = MLX5_INVALID_POLICY_ID;
|
2021-04-20 10:55:17 +00:00
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Close and release all the resources of
|
|
|
|
* the ASO flow meter management structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
mlx5_aso_flow_mtrs_mng_close(struct mlx5_dev_ctx_shared *sh)
|
|
|
|
{
|
|
|
|
struct mlx5_aso_mtr_pool *mtr_pool;
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
struct mlx5_flow_mtr_mng *mtrmng = sh->mtrmng;
|
2021-04-20 10:55:17 +00:00
|
|
|
uint32_t idx;
|
2021-04-20 10:55:19 +00:00
|
|
|
#ifdef HAVE_MLX5_DR_CREATE_ACTION_ASO
|
|
|
|
struct mlx5_aso_mtr *aso_mtr;
|
|
|
|
int i;
|
|
|
|
#endif /* HAVE_MLX5_DR_CREATE_ACTION_ASO */
|
2021-04-20 10:55:17 +00:00
|
|
|
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
if (sh->meter_aso_en) {
|
|
|
|
mlx5_aso_queue_uninit(sh, ASO_OPC_MOD_POLICER);
|
|
|
|
idx = mtrmng->pools_mng.n_valid;
|
|
|
|
while (idx--) {
|
|
|
|
mtr_pool = mtrmng->pools_mng.pools[idx];
|
2021-04-20 10:55:19 +00:00
|
|
|
#ifdef HAVE_MLX5_DR_CREATE_ACTION_ASO
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
for (i = 0; i < MLX5_ASO_MTRS_PER_POOL; i++) {
|
|
|
|
aso_mtr = &mtr_pool->mtrs[i];
|
|
|
|
if (aso_mtr->fm.meter_action)
|
|
|
|
claim_zero
|
|
|
|
(mlx5_glue->destroy_flow_action
|
|
|
|
(aso_mtr->fm.meter_action));
|
|
|
|
}
|
2021-04-20 10:55:19 +00:00
|
|
|
#endif /* HAVE_MLX5_DR_CREATE_ACTION_ASO */
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
claim_zero(mlx5_devx_cmd_destroy
|
2021-04-20 10:55:17 +00:00
|
|
|
(mtr_pool->devx_obj));
|
net/mlx5: support meter policy operations
MLX5 PMD checks the validation of actions in policy while add
a new meter policy, if pass the validation, allocates the new
policy object from the meter policy indexed memory pool.
It is common to use the same policy for multiple meters.
MLX5 PMD supports two types of policy: termination policy and
no-termination policy.
Implement the next policy operations:
validate:
The driver doesn't support to configure actions in the flow
after the meter action except one case when the meter policy
is configured to do nothing in GREEN\YELLOW and only DROP action
in RED, this special policy is called non-terminated policy
and is handed as a singleton object internally.
For all the terminated policies, the next actions are supported:
GREEN - QUEUE, RSS, PORT_ID, JUMP, DROP, MARK and SET_TAG.
YELLOW - not supported at all -> must be empty.
RED - must include DROP action.
Hence, in ingress case, for example,
QUEUE\RSS\JUMP must be configured as last action for GREEN color.
All the above limitations will be validated.
create:
Validate the policy configuration.
Prepare the related tables and actions.
destroy:
Release the created policy resources.
Signed-off-by: Li Zhang <lizh@nvidia.com>
Acked-by: Matan Azrad <matan@nvidia.com>
2021-04-27 10:43:51 +00:00
|
|
|
mtrmng->pools_mng.n_valid--;
|
|
|
|
mlx5_free(mtr_pool);
|
|
|
|
}
|
|
|
|
mlx5_free(sh->mtrmng->pools_mng.pools);
|
2021-04-20 10:55:17 +00:00
|
|
|
}
|
|
|
|
mlx5_free(sh->mtrmng);
|
|
|
|
sh->mtrmng = NULL;
|
|
|
|
}
|
|
|
|
|
2020-11-01 17:57:49 +00:00
|
|
|
/* Send FLOW_AGED event if needed. */
|
|
|
|
void
|
|
|
|
mlx5_age_event_prepare(struct mlx5_dev_ctx_shared *sh)
|
|
|
|
{
|
|
|
|
struct mlx5_age_info *age_info;
|
|
|
|
uint32_t i;
|
|
|
|
|
|
|
|
for (i = 0; i < sh->max_port; i++) {
|
|
|
|
age_info = &sh->port[i].age_info;
|
|
|
|
if (!MLX5_AGE_GET(age_info, MLX5_AGE_EVENT_NEW))
|
|
|
|
continue;
|
2021-04-29 09:55:41 +00:00
|
|
|
MLX5_AGE_UNSET(age_info, MLX5_AGE_EVENT_NEW);
|
|
|
|
if (MLX5_AGE_GET(age_info, MLX5_AGE_TRIGGER)) {
|
|
|
|
MLX5_AGE_UNSET(age_info, MLX5_AGE_TRIGGER);
|
2020-11-01 17:57:49 +00:00
|
|
|
rte_eth_dev_callback_process
|
|
|
|
(&rte_eth_devices[sh->port[i].devx_ih_port_id],
|
|
|
|
RTE_ETH_EVENT_FLOW_AGED, NULL);
|
2021-04-29 09:55:41 +00:00
|
|
|
}
|
2020-11-01 17:57:49 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-05-05 12:23:15 +00:00
|
|
|
/*
|
|
|
|
* Initialize the ASO connection tracking structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
|
|
|
* Pointer to mlx5_dev_ctx_shared object.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on success, a negative errno value otherwise and rte_errno is set.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
mlx5_flow_aso_ct_mng_init(struct mlx5_dev_ctx_shared *sh)
|
|
|
|
{
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (sh->ct_mng)
|
|
|
|
return 0;
|
|
|
|
sh->ct_mng = mlx5_malloc(MLX5_MEM_ZERO, sizeof(*sh->ct_mng),
|
|
|
|
RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
|
|
|
|
if (!sh->ct_mng) {
|
|
|
|
DRV_LOG(ERR, "ASO CT management allocation failed.");
|
|
|
|
rte_errno = ENOMEM;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
|
|
|
err = mlx5_aso_queue_init(sh, ASO_OPC_MOD_CONNECTION_TRACKING);
|
|
|
|
if (err) {
|
|
|
|
mlx5_free(sh->ct_mng);
|
|
|
|
/* rte_errno should be extracted from the failure. */
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
|
|
|
rte_spinlock_init(&sh->ct_mng->ct_sl);
|
|
|
|
rte_rwlock_init(&sh->ct_mng->resize_rwl);
|
|
|
|
LIST_INIT(&sh->ct_mng->free_cts);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2021-05-05 12:23:19 +00:00
|
|
|
/*
|
|
|
|
* Close and release all the resources of the
|
|
|
|
* ASO connection tracking management structure.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
mlx5_flow_aso_ct_mng_close(struct mlx5_dev_ctx_shared *sh)
|
|
|
|
{
|
|
|
|
struct mlx5_aso_ct_pools_mng *mng = sh->ct_mng;
|
|
|
|
struct mlx5_aso_ct_pool *ct_pool;
|
|
|
|
struct mlx5_aso_ct_action *ct;
|
|
|
|
uint32_t idx;
|
|
|
|
uint32_t val;
|
|
|
|
uint32_t cnt;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
mlx5_aso_queue_uninit(sh, ASO_OPC_MOD_CONNECTION_TRACKING);
|
|
|
|
idx = mng->next;
|
|
|
|
while (idx--) {
|
|
|
|
cnt = 0;
|
|
|
|
ct_pool = mng->pools[idx];
|
|
|
|
for (i = 0; i < MLX5_ASO_CT_ACTIONS_PER_POOL; i++) {
|
|
|
|
ct = &ct_pool->actions[i];
|
|
|
|
val = __atomic_fetch_sub(&ct->refcnt, 1,
|
|
|
|
__ATOMIC_RELAXED);
|
|
|
|
MLX5_ASSERT(val == 1);
|
|
|
|
if (val > 1)
|
|
|
|
cnt++;
|
|
|
|
#ifdef HAVE_MLX5_DR_ACTION_ASO_CT
|
|
|
|
if (ct->dr_action_orig)
|
|
|
|
claim_zero(mlx5_glue->destroy_flow_action
|
|
|
|
(ct->dr_action_orig));
|
|
|
|
if (ct->dr_action_rply)
|
|
|
|
claim_zero(mlx5_glue->destroy_flow_action
|
|
|
|
(ct->dr_action_rply));
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy(ct_pool->devx_obj));
|
|
|
|
if (cnt) {
|
|
|
|
DRV_LOG(DEBUG, "%u ASO CT objects are being used in the pool %u",
|
|
|
|
cnt, i);
|
|
|
|
}
|
|
|
|
mlx5_free(ct_pool);
|
|
|
|
/* in case of failure. */
|
|
|
|
mng->next--;
|
|
|
|
}
|
|
|
|
mlx5_free(mng->pools);
|
|
|
|
mlx5_free(mng);
|
|
|
|
/* Management structure must be cleared to 0s during allocation. */
|
|
|
|
sh->ct_mng = NULL;
|
|
|
|
}
|
|
|
|
|
2020-04-16 02:42:02 +00:00
|
|
|
/**
|
|
|
|
* Initialize the flow resources' indexed mempool.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object.
|
2021-04-29 09:55:41 +00:00
|
|
|
* @param[in] config
|
2020-04-16 02:42:08 +00:00
|
|
|
* Pointer to user dev config.
|
2020-04-16 02:42:02 +00:00
|
|
|
*/
|
|
|
|
static void
|
2020-06-03 15:05:55 +00:00
|
|
|
mlx5_flow_ipool_create(struct mlx5_dev_ctx_shared *sh,
|
2020-06-08 16:01:56 +00:00
|
|
|
const struct mlx5_dev_config *config)
|
2020-04-16 02:42:02 +00:00
|
|
|
{
|
|
|
|
uint8_t i;
|
2020-06-08 16:01:56 +00:00
|
|
|
struct mlx5_indexed_pool_config cfg;
|
2020-04-16 02:42:02 +00:00
|
|
|
|
net/mlx5: add reclaim memory mode
Currently, when flow destroyed, some memory resources may still be kept
as cached to help next time create flow more efficiently.
Some system may need the resources to be more flexible with flow create
and destroy. After peak time, with millions of flows destroyed, the
system would prefer the resources to be reclaimed completely, no cache
is needed. Then the resources can be allocated and used by other
components. The system is not so sensitive about the flow insertion
rate, but more care about the resources.
Both DPDK mlx5 PMD driver and the low level component rdma-core have
provided the flow resources to be configured cached or not, but there is
no APIs or parameters exposed to user to configure the flow resources
cache mode. In this case, introduce a new PMD devarg to let user
configure the flow resources cache mode will be helpful.
This commit is to add a new "reclaim_mem_mode" to help user configure if
the destroyed flows' cache resources should be kept or not.
Their will be three mode can be chosen:
1. 0(none). It means the flow resources will be cached as usual. The
resources will be cached, helpful with flow insertion rate.
2. 1(light). It will only enable the DPDK PMD level resources reclaim.
3. 2(aggressive). Both DPDK PMD level and rdma-core low level will be
configured as reclaimed mode.
With these three mode, user can configure the resources cache mode with
different levels.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
2020-06-01 06:09:43 +00:00
|
|
|
for (i = 0; i < MLX5_IPOOL_MAX; ++i) {
|
2020-06-08 16:01:56 +00:00
|
|
|
cfg = mlx5_ipool_cfg[i];
|
|
|
|
switch (i) {
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
/*
|
|
|
|
* Set MLX5_IPOOL_MLX5_FLOW ipool size
|
|
|
|
* according to PCI function flow configuration.
|
|
|
|
*/
|
|
|
|
case MLX5_IPOOL_MLX5_FLOW:
|
|
|
|
cfg.size = config->dv_flow_en ?
|
|
|
|
sizeof(struct mlx5_flow_handle) :
|
|
|
|
MLX5_FLOW_HANDLE_VERBS_SIZE;
|
|
|
|
break;
|
|
|
|
}
|
2021-07-13 08:44:39 +00:00
|
|
|
if (config->reclaim_mode) {
|
2020-06-08 16:01:56 +00:00
|
|
|
cfg.release_mem_en = 1;
|
2021-07-13 08:44:39 +00:00
|
|
|
cfg.per_core_cache = 0;
|
|
|
|
}
|
2020-06-08 16:01:56 +00:00
|
|
|
sh->ipool[i] = mlx5_ipool_create(&cfg);
|
net/mlx5: add reclaim memory mode
Currently, when flow destroyed, some memory resources may still be kept
as cached to help next time create flow more efficiently.
Some system may need the resources to be more flexible with flow create
and destroy. After peak time, with millions of flows destroyed, the
system would prefer the resources to be reclaimed completely, no cache
is needed. Then the resources can be allocated and used by other
components. The system is not so sensitive about the flow insertion
rate, but more care about the resources.
Both DPDK mlx5 PMD driver and the low level component rdma-core have
provided the flow resources to be configured cached or not, but there is
no APIs or parameters exposed to user to configure the flow resources
cache mode. In this case, introduce a new PMD devarg to let user
configure the flow resources cache mode will be helpful.
This commit is to add a new "reclaim_mem_mode" to help user configure if
the destroyed flows' cache resources should be kept or not.
Their will be three mode can be chosen:
1. 0(none). It means the flow resources will be cached as usual. The
resources will be cached, helpful with flow insertion rate.
2. 1(light). It will only enable the DPDK PMD level resources reclaim.
3. 2(aggressive). Both DPDK PMD level and rdma-core low level will be
configured as reclaimed mode.
With these three mode, user can configure the resources cache mode with
different levels.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
2020-06-01 06:09:43 +00:00
|
|
|
}
|
2020-04-16 02:42:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Release the flow resources' indexed mempool.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object.
|
2020-04-16 02:42:02 +00:00
|
|
|
*/
|
|
|
|
static void
|
2020-06-03 15:05:55 +00:00
|
|
|
mlx5_flow_ipool_destroy(struct mlx5_dev_ctx_shared *sh)
|
2020-04-16 02:42:02 +00:00
|
|
|
{
|
|
|
|
uint8_t i;
|
|
|
|
|
|
|
|
for (i = 0; i < MLX5_IPOOL_MAX; ++i)
|
|
|
|
mlx5_ipool_destroy(sh->ipool[i]);
|
|
|
|
}
|
|
|
|
|
2020-07-17 07:11:46 +00:00
|
|
|
/*
|
|
|
|
* Check if dynamic flex parser for eCPRI already exists.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* true on exists, false on not.
|
|
|
|
*/
|
|
|
|
bool
|
|
|
|
mlx5_flex_parser_ecpri_exist(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
|
|
|
struct mlx5_flex_parser_profiles *prf =
|
|
|
|
&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
|
|
|
|
|
|
|
|
return !!prf->obj;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Allocation of a flex parser for eCPRI. Once created, this parser related
|
|
|
|
* resources will be held until the device is closed.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on success, a negative errno value otherwise and rte_errno is set.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
mlx5_flex_parser_ecpri_alloc(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
|
|
|
struct mlx5_flex_parser_profiles *prf =
|
|
|
|
&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
|
2020-07-17 07:11:49 +00:00
|
|
|
struct mlx5_devx_graph_node_attr node = {
|
|
|
|
.modify_field_select = 0,
|
|
|
|
};
|
|
|
|
uint32_t ids[8];
|
|
|
|
int ret;
|
2020-07-17 07:11:46 +00:00
|
|
|
|
2020-07-17 07:11:50 +00:00
|
|
|
if (!priv->config.hca_attr.parse_graph_flex_node) {
|
|
|
|
DRV_LOG(ERR, "Dynamic flex parser is not supported "
|
|
|
|
"for device %s.", priv->dev_data->name);
|
|
|
|
return -ENOTSUP;
|
|
|
|
}
|
2020-07-17 07:11:49 +00:00
|
|
|
node.header_length_mode = MLX5_GRAPH_NODE_LEN_FIXED;
|
|
|
|
/* 8 bytes now: 4B common header + 4B message body header. */
|
|
|
|
node.header_length_base_value = 0x8;
|
|
|
|
/* After MAC layer: Ether / VLAN. */
|
|
|
|
node.in[0].arc_parse_graph_node = MLX5_GRAPH_ARC_NODE_MAC;
|
|
|
|
/* Type of compared condition should be 0xAEFE in the L2 layer. */
|
|
|
|
node.in[0].compare_condition_value = RTE_ETHER_TYPE_ECPRI;
|
|
|
|
/* Sample #0: type in common header. */
|
|
|
|
node.sample[0].flow_match_sample_en = 1;
|
|
|
|
/* Fixed offset. */
|
|
|
|
node.sample[0].flow_match_sample_offset_mode = 0x0;
|
|
|
|
/* Only the 2nd byte will be used. */
|
|
|
|
node.sample[0].flow_match_sample_field_base_offset = 0x0;
|
|
|
|
/* Sample #1: message payload. */
|
|
|
|
node.sample[1].flow_match_sample_en = 1;
|
|
|
|
/* Fixed offset. */
|
|
|
|
node.sample[1].flow_match_sample_offset_mode = 0x0;
|
|
|
|
/*
|
|
|
|
* Only the first two bytes will be used right now, and its offset will
|
|
|
|
* start after the common header that with the length of a DW(u32).
|
|
|
|
*/
|
|
|
|
node.sample[1].flow_match_sample_field_base_offset = sizeof(uint32_t);
|
|
|
|
prf->obj = mlx5_devx_cmd_create_flex_parser(priv->sh->ctx, &node);
|
|
|
|
if (!prf->obj) {
|
|
|
|
DRV_LOG(ERR, "Failed to create flex parser node object.");
|
|
|
|
return (rte_errno == 0) ? -ENODEV : -rte_errno;
|
|
|
|
}
|
|
|
|
prf->num = 2;
|
|
|
|
ret = mlx5_devx_cmd_query_parse_samples(prf->obj, ids, prf->num);
|
|
|
|
if (ret) {
|
|
|
|
DRV_LOG(ERR, "Failed to query sample IDs.");
|
|
|
|
return (rte_errno == 0) ? -ENODEV : -rte_errno;
|
|
|
|
}
|
|
|
|
prf->offset[0] = 0x0;
|
|
|
|
prf->offset[1] = sizeof(uint32_t);
|
|
|
|
prf->ids[0] = ids[0];
|
|
|
|
prf->ids[1] = ids[1];
|
2020-07-17 07:11:46 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-07-17 07:11:49 +00:00
|
|
|
/*
|
|
|
|
* Destroy the flex parser node, including the parser itself, input / output
|
|
|
|
* arcs and DW samples. Resources could be reused then.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
mlx5_flex_parser_ecpri_release(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
|
|
|
struct mlx5_flex_parser_profiles *prf =
|
|
|
|
&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
|
|
|
|
|
|
|
|
if (prf->obj)
|
|
|
|
mlx5_devx_cmd_destroy(prf->obj);
|
|
|
|
prf->obj = NULL;
|
|
|
|
}
|
|
|
|
|
2020-07-22 14:59:08 +00:00
|
|
|
/*
|
|
|
|
* Allocate Rx and Tx UARs in robust fashion.
|
|
|
|
* This routine handles the following UAR allocation issues:
|
|
|
|
*
|
|
|
|
* - tries to allocate the UAR with the most appropriate memory
|
|
|
|
* mapping type from the ones supported by the host
|
|
|
|
*
|
|
|
|
* - tries to allocate the UAR with non-NULL base address
|
|
|
|
* OFED 5.0.x and Upstream rdma_core before v29 returned the NULL as
|
|
|
|
* UAR base address if UAR was not the first object in the UAR page.
|
|
|
|
* It caused the PMD failure and we should try to get another UAR
|
|
|
|
* till we get the first one with non-NULL base address returned.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
mlx5_alloc_rxtx_uars(struct mlx5_dev_ctx_shared *sh,
|
|
|
|
const struct mlx5_dev_config *config)
|
|
|
|
{
|
|
|
|
uint32_t uar_mapping, retry;
|
|
|
|
int err = 0;
|
2020-08-25 09:31:13 +00:00
|
|
|
void *base_addr;
|
2020-07-22 14:59:08 +00:00
|
|
|
|
|
|
|
for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
|
|
|
|
#ifdef MLX5DV_UAR_ALLOC_TYPE_NC
|
|
|
|
/* Control the mapping type according to the settings. */
|
|
|
|
uar_mapping = (config->dbnc == MLX5_TXDB_NCACHED) ?
|
|
|
|
MLX5DV_UAR_ALLOC_TYPE_NC :
|
|
|
|
MLX5DV_UAR_ALLOC_TYPE_BF;
|
|
|
|
#else
|
|
|
|
RTE_SET_USED(config);
|
|
|
|
/*
|
|
|
|
* It seems we have no way to control the memory mapping type
|
|
|
|
* for the UAR, the default "Write-Combining" type is supposed.
|
|
|
|
* The UAR initialization on queue creation queries the
|
|
|
|
* actual mapping type done by Verbs/kernel and setups the
|
|
|
|
* PMD datapath accordingly.
|
|
|
|
*/
|
|
|
|
uar_mapping = 0;
|
|
|
|
#endif
|
|
|
|
sh->tx_uar = mlx5_glue->devx_alloc_uar(sh->ctx, uar_mapping);
|
|
|
|
#ifdef MLX5DV_UAR_ALLOC_TYPE_NC
|
|
|
|
if (!sh->tx_uar &&
|
|
|
|
uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
|
|
|
|
if (config->dbnc == MLX5_TXDB_CACHED ||
|
|
|
|
config->dbnc == MLX5_TXDB_HEURISTIC)
|
|
|
|
DRV_LOG(WARNING, "Devarg tx_db_nc setting "
|
|
|
|
"is not supported by DevX");
|
|
|
|
/*
|
|
|
|
* In some environments like virtual machine
|
|
|
|
* the Write Combining mapped might be not supported
|
|
|
|
* and UAR allocation fails. We try "Non-Cached"
|
|
|
|
* mapping for the case. The tx_burst routines take
|
|
|
|
* the UAR mapping type into account on UAR setup
|
|
|
|
* on queue creation.
|
|
|
|
*/
|
2021-02-24 08:17:35 +00:00
|
|
|
DRV_LOG(DEBUG, "Failed to allocate Tx DevX UAR (BF)");
|
2020-07-22 14:59:08 +00:00
|
|
|
uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
|
|
|
|
sh->tx_uar = mlx5_glue->devx_alloc_uar
|
|
|
|
(sh->ctx, uar_mapping);
|
|
|
|
} else if (!sh->tx_uar &&
|
|
|
|
uar_mapping == MLX5DV_UAR_ALLOC_TYPE_NC) {
|
|
|
|
if (config->dbnc == MLX5_TXDB_NCACHED)
|
|
|
|
DRV_LOG(WARNING, "Devarg tx_db_nc settings "
|
|
|
|
"is not supported by DevX");
|
|
|
|
/*
|
|
|
|
* If Verbs/kernel does not support "Non-Cached"
|
|
|
|
* try the "Write-Combining".
|
|
|
|
*/
|
2021-02-24 08:17:35 +00:00
|
|
|
DRV_LOG(DEBUG, "Failed to allocate Tx DevX UAR (NC)");
|
2020-07-22 14:59:08 +00:00
|
|
|
uar_mapping = MLX5DV_UAR_ALLOC_TYPE_BF;
|
|
|
|
sh->tx_uar = mlx5_glue->devx_alloc_uar
|
|
|
|
(sh->ctx, uar_mapping);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
if (!sh->tx_uar) {
|
|
|
|
DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (BF/NC)");
|
|
|
|
err = ENOMEM;
|
|
|
|
goto exit;
|
|
|
|
}
|
2020-08-25 09:31:13 +00:00
|
|
|
base_addr = mlx5_os_get_devx_uar_base_addr(sh->tx_uar);
|
|
|
|
if (base_addr)
|
2020-07-22 14:59:08 +00:00
|
|
|
break;
|
|
|
|
/*
|
|
|
|
* The UARs are allocated by rdma_core within the
|
|
|
|
* IB device context, on context closure all UARs
|
|
|
|
* will be freed, should be no memory/object leakage.
|
|
|
|
*/
|
2021-02-24 08:17:35 +00:00
|
|
|
DRV_LOG(DEBUG, "Retrying to allocate Tx DevX UAR");
|
2020-07-22 14:59:08 +00:00
|
|
|
sh->tx_uar = NULL;
|
|
|
|
}
|
|
|
|
/* Check whether we finally succeeded with valid UAR allocation. */
|
|
|
|
if (!sh->tx_uar) {
|
|
|
|
DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (NULL base)");
|
|
|
|
err = ENOMEM;
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
|
|
|
|
uar_mapping = 0;
|
|
|
|
sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
|
|
|
|
(sh->ctx, uar_mapping);
|
|
|
|
#ifdef MLX5DV_UAR_ALLOC_TYPE_NC
|
|
|
|
if (!sh->devx_rx_uar &&
|
|
|
|
uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
|
|
|
|
/*
|
|
|
|
* Rx UAR is used to control interrupts only,
|
|
|
|
* should be no datapath noticeable impact,
|
|
|
|
* can try "Non-Cached" mapping safely.
|
|
|
|
*/
|
2021-02-24 08:17:35 +00:00
|
|
|
DRV_LOG(DEBUG, "Failed to allocate Rx DevX UAR (BF)");
|
2020-07-22 14:59:08 +00:00
|
|
|
uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
|
|
|
|
sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
|
|
|
|
(sh->ctx, uar_mapping);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
if (!sh->devx_rx_uar) {
|
|
|
|
DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (BF/NC)");
|
|
|
|
err = ENOMEM;
|
|
|
|
goto exit;
|
|
|
|
}
|
2020-08-25 09:31:13 +00:00
|
|
|
base_addr = mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar);
|
|
|
|
if (base_addr)
|
2020-07-22 14:59:08 +00:00
|
|
|
break;
|
|
|
|
/*
|
|
|
|
* The UARs are allocated by rdma_core within the
|
|
|
|
* IB device context, on context closure all UARs
|
|
|
|
* will be freed, should be no memory/object leakage.
|
|
|
|
*/
|
2021-02-24 08:17:35 +00:00
|
|
|
DRV_LOG(DEBUG, "Retrying to allocate Rx DevX UAR");
|
2020-07-22 14:59:08 +00:00
|
|
|
sh->devx_rx_uar = NULL;
|
|
|
|
}
|
|
|
|
/* Check whether we finally succeeded with valid UAR allocation. */
|
|
|
|
if (!sh->devx_rx_uar) {
|
|
|
|
DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (NULL base)");
|
|
|
|
err = ENOMEM;
|
|
|
|
}
|
|
|
|
exit:
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2019-03-27 13:15:39 +00:00
|
|
|
/**
|
2020-06-10 09:32:27 +00:00
|
|
|
* Allocate shared device context. If there is multiport device the
|
2019-03-27 13:15:39 +00:00
|
|
|
* master and representors will share this context, if there is single
|
2020-06-10 09:32:27 +00:00
|
|
|
* port dedicated device, the context will be used by only given
|
2019-03-27 13:15:39 +00:00
|
|
|
* port due to unification.
|
|
|
|
*
|
2020-06-10 09:32:27 +00:00
|
|
|
* Routine first searches the context for the specified device name,
|
2019-03-27 13:15:39 +00:00
|
|
|
* if found the shared context assumed and reference counter is incremented.
|
|
|
|
* If no context found the new one is created and initialized with specified
|
2020-06-10 09:32:27 +00:00
|
|
|
* device context and parameters.
|
2019-03-27 13:15:39 +00:00
|
|
|
*
|
|
|
|
* @param[in] spawn
|
2020-06-10 09:32:27 +00:00
|
|
|
* Pointer to the device attributes (name, port, etc).
|
2019-11-08 15:07:50 +00:00
|
|
|
* @param[in] config
|
|
|
|
* Pointer to device configuration structure.
|
2019-03-27 13:15:39 +00:00
|
|
|
*
|
|
|
|
* @return
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object on success,
|
2019-03-27 13:15:39 +00:00
|
|
|
* otherwise NULL and rte_errno is set.
|
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
struct mlx5_dev_ctx_shared *
|
2020-06-10 09:32:27 +00:00
|
|
|
mlx5_alloc_shared_dev_ctx(const struct mlx5_dev_spawn_data *spawn,
|
|
|
|
const struct mlx5_dev_config *config)
|
2019-03-27 13:15:39 +00:00
|
|
|
{
|
2020-06-03 15:05:55 +00:00
|
|
|
struct mlx5_dev_ctx_shared *sh;
|
2019-03-27 13:15:39 +00:00
|
|
|
int err = 0;
|
2019-03-27 13:15:45 +00:00
|
|
|
uint32_t i;
|
2019-10-30 23:53:15 +00:00
|
|
|
struct mlx5_devx_tis_attr tis_attr = { 0 };
|
2019-03-27 13:15:39 +00:00
|
|
|
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(spawn);
|
2019-03-27 13:15:39 +00:00
|
|
|
/* Secondary process should not create the shared context. */
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
|
2020-06-10 09:32:27 +00:00
|
|
|
pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
|
2019-03-27 13:15:39 +00:00
|
|
|
/* Search for IB context by device name. */
|
2020-06-10 09:32:27 +00:00
|
|
|
LIST_FOREACH(sh, &mlx5_dev_ctx_list, next) {
|
2020-06-03 15:06:02 +00:00
|
|
|
if (!strcmp(sh->ibdev_name,
|
|
|
|
mlx5_os_get_dev_device_name(spawn->phys_dev))) {
|
2019-03-27 13:15:39 +00:00
|
|
|
sh->refcnt++;
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
}
|
2019-04-05 08:55:30 +00:00
|
|
|
/* No device found, we have to create new shared context. */
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(spawn->max_port);
|
2020-06-28 09:02:44 +00:00
|
|
|
sh = mlx5_malloc(MLX5_MEM_ZERO | MLX5_MEM_RTE,
|
2020-06-03 15:05:55 +00:00
|
|
|
sizeof(struct mlx5_dev_ctx_shared) +
|
2019-03-27 13:15:39 +00:00
|
|
|
spawn->max_port *
|
2020-06-10 09:32:27 +00:00
|
|
|
sizeof(struct mlx5_dev_shared_port),
|
2020-06-28 09:02:44 +00:00
|
|
|
RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (!sh) {
|
|
|
|
DRV_LOG(ERR, "shared context allocation failure");
|
|
|
|
rte_errno = ENOMEM;
|
|
|
|
goto exit;
|
|
|
|
}
|
2021-03-28 13:48:12 +00:00
|
|
|
if (spawn->bond_info)
|
|
|
|
sh->bond = *spawn->bond_info;
|
2020-06-03 15:06:00 +00:00
|
|
|
err = mlx5_os_open_device(spawn, config, sh);
|
|
|
|
if (!sh->ctx)
|
|
|
|
goto error;
|
2020-06-03 15:05:58 +00:00
|
|
|
err = mlx5_os_get_dev_attr(sh->ctx, &sh->device_attr);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (err) {
|
2020-06-03 15:05:58 +00:00
|
|
|
DRV_LOG(DEBUG, "mlx5_os_get_dev_attr() failed");
|
2019-03-27 13:15:39 +00:00
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
sh->refcnt = 1;
|
|
|
|
sh->max_port = spawn->max_port;
|
2020-06-03 15:05:56 +00:00
|
|
|
strncpy(sh->ibdev_name, mlx5_os_get_ctx_device_name(sh->ctx),
|
|
|
|
sizeof(sh->ibdev_name) - 1);
|
|
|
|
strncpy(sh->ibdev_path, mlx5_os_get_ctx_device_path(sh->ctx),
|
|
|
|
sizeof(sh->ibdev_path) - 1);
|
2019-03-27 13:15:45 +00:00
|
|
|
/*
|
|
|
|
* Setting port_id to max unallowed value means
|
|
|
|
* there is no interrupt subhandler installed for
|
|
|
|
* the given port index i.
|
|
|
|
*/
|
2019-10-22 07:33:35 +00:00
|
|
|
for (i = 0; i < sh->max_port; i++) {
|
2019-03-27 13:15:45 +00:00
|
|
|
sh->port[i].ih_port_id = RTE_MAX_ETHPORTS;
|
2019-10-22 07:33:35 +00:00
|
|
|
sh->port[i].devx_ih_port_id = RTE_MAX_ETHPORTS;
|
|
|
|
}
|
2020-12-28 09:54:13 +00:00
|
|
|
sh->pd = mlx5_os_alloc_pd(sh->ctx);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (sh->pd == NULL) {
|
|
|
|
DRV_LOG(ERR, "PD allocation failure");
|
|
|
|
err = ENOMEM;
|
|
|
|
goto error;
|
|
|
|
}
|
2019-10-30 23:53:15 +00:00
|
|
|
if (sh->devx) {
|
2020-06-03 15:06:00 +00:00
|
|
|
err = mlx5_os_get_pdn(sh->pd, &sh->pdn);
|
2019-10-30 23:53:15 +00:00
|
|
|
if (err) {
|
|
|
|
DRV_LOG(ERR, "Fail to extract pdn from PD");
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
sh->td = mlx5_devx_cmd_create_td(sh->ctx);
|
|
|
|
if (!sh->td) {
|
|
|
|
DRV_LOG(ERR, "TD allocation failure");
|
|
|
|
err = ENOMEM;
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
tis_attr.transport_domain = sh->td->id;
|
|
|
|
sh->tis = mlx5_devx_cmd_create_tis(sh->ctx, &tis_attr);
|
|
|
|
if (!sh->tis) {
|
|
|
|
DRV_LOG(ERR, "TIS allocation failure");
|
|
|
|
err = ENOMEM;
|
|
|
|
goto error;
|
|
|
|
}
|
2020-07-22 14:59:08 +00:00
|
|
|
err = mlx5_alloc_rxtx_uars(sh, config);
|
|
|
|
if (err)
|
2020-07-19 11:13:06 +00:00
|
|
|
goto error;
|
2020-08-25 09:31:13 +00:00
|
|
|
MLX5_ASSERT(sh->tx_uar);
|
|
|
|
MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->tx_uar));
|
|
|
|
|
|
|
|
MLX5_ASSERT(sh->devx_rx_uar);
|
|
|
|
MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar));
|
2019-07-22 14:52:15 +00:00
|
|
|
}
|
2020-07-16 08:23:06 +00:00
|
|
|
#ifndef RTE_ARCH_64
|
|
|
|
/* Initialize UAR access locks for 32bit implementations. */
|
|
|
|
rte_spinlock_init(&sh->uar_lock_cq);
|
|
|
|
for (i = 0; i < MLX5_UAR_PAGE_NUM_MAX; i++)
|
|
|
|
rte_spinlock_init(&sh->uar_lock[i]);
|
|
|
|
#endif
|
2019-04-27 04:32:56 +00:00
|
|
|
/*
|
|
|
|
* Once the device is added to the list of memory event
|
|
|
|
* callback, its global MR cache table cannot be expanded
|
|
|
|
* on the fly because of deadlock. If it overflows, lookup
|
|
|
|
* should be done by searching MR list linearly, which is slow.
|
|
|
|
*
|
|
|
|
* At this point the device is not added to the memory
|
|
|
|
* event list yet, context is just being created.
|
|
|
|
*/
|
2020-04-13 21:17:48 +00:00
|
|
|
err = mlx5_mr_btree_init(&sh->share_cache.cache,
|
2019-04-27 04:32:56 +00:00
|
|
|
MLX5_MR_BTREE_CACHE_N * 2,
|
2019-09-25 07:53:24 +00:00
|
|
|
spawn->pci_dev->device.numa_node);
|
2019-04-27 04:32:56 +00:00
|
|
|
if (err) {
|
|
|
|
err = rte_errno;
|
|
|
|
goto error;
|
|
|
|
}
|
2020-06-16 09:44:45 +00:00
|
|
|
mlx5_os_set_reg_mr_cb(&sh->share_cache.reg_mr_cb,
|
|
|
|
&sh->share_cache.dereg_mr_cb);
|
2020-06-03 15:06:00 +00:00
|
|
|
mlx5_os_dev_shared_handler_install(sh);
|
2020-06-18 07:24:43 +00:00
|
|
|
sh->cnt_id_tbl = mlx5_l3t_create(MLX5_L3T_TYPE_DWORD);
|
|
|
|
if (!sh->cnt_id_tbl) {
|
|
|
|
err = rte_errno;
|
|
|
|
goto error;
|
|
|
|
}
|
2021-01-07 13:08:27 +00:00
|
|
|
if (LIST_EMPTY(&mlx5_dev_ctx_list)) {
|
|
|
|
err = mlx5_flow_os_init_workspace_once();
|
|
|
|
if (err)
|
|
|
|
goto error;
|
|
|
|
}
|
2020-04-29 02:25:09 +00:00
|
|
|
mlx5_flow_aging_init(sh);
|
2019-07-16 14:34:53 +00:00
|
|
|
mlx5_flow_counters_mng_init(sh);
|
2020-04-16 02:42:08 +00:00
|
|
|
mlx5_flow_ipool_create(sh, config);
|
2019-08-06 15:00:33 +00:00
|
|
|
/* Add device to memory callback list. */
|
|
|
|
rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
|
|
|
|
LIST_INSERT_HEAD(&mlx5_shared_data->mem_event_cb_list,
|
|
|
|
sh, mem_event_cb);
|
|
|
|
rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
|
|
|
|
/* Add context to the global device list. */
|
2020-06-10 09:32:27 +00:00
|
|
|
LIST_INSERT_HEAD(&mlx5_dev_ctx_list, sh, next);
|
2021-01-17 10:21:20 +00:00
|
|
|
rte_spinlock_init(&sh->geneve_tlv_opt_sl);
|
2019-03-27 13:15:39 +00:00
|
|
|
exit:
|
2020-06-10 09:32:27 +00:00
|
|
|
pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
|
2019-03-27 13:15:39 +00:00
|
|
|
return sh;
|
|
|
|
error:
|
2020-07-16 08:23:08 +00:00
|
|
|
pthread_mutex_destroy(&sh->txpp.mutex);
|
2020-06-10 09:32:27 +00:00
|
|
|
pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(sh);
|
2020-07-22 14:59:08 +00:00
|
|
|
if (sh->cnt_id_tbl)
|
2020-06-18 07:24:43 +00:00
|
|
|
mlx5_l3t_destroy(sh->cnt_id_tbl);
|
2019-10-30 23:53:15 +00:00
|
|
|
if (sh->tis)
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy(sh->tis));
|
|
|
|
if (sh->td)
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy(sh->td));
|
2020-07-19 11:13:06 +00:00
|
|
|
if (sh->devx_rx_uar)
|
|
|
|
mlx5_glue->devx_free_uar(sh->devx_rx_uar);
|
2020-07-22 14:59:08 +00:00
|
|
|
if (sh->tx_uar)
|
|
|
|
mlx5_glue->devx_free_uar(sh->tx_uar);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (sh->pd)
|
2020-12-28 09:54:13 +00:00
|
|
|
claim_zero(mlx5_os_dealloc_pd(sh->pd));
|
2019-03-27 13:15:39 +00:00
|
|
|
if (sh->ctx)
|
|
|
|
claim_zero(mlx5_glue->close_device(sh->ctx));
|
2020-06-28 09:02:44 +00:00
|
|
|
mlx5_free(sh);
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(err > 0);
|
2019-03-27 13:15:39 +00:00
|
|
|
rte_errno = err;
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Free shared IB device context. Decrement counter and if zero free
|
|
|
|
* all allocated resources and close handles.
|
|
|
|
*
|
|
|
|
* @param[in] sh
|
2020-06-03 15:05:55 +00:00
|
|
|
* Pointer to mlx5_dev_ctx_shared object to free
|
2019-03-27 13:15:39 +00:00
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
void
|
2020-06-10 09:32:27 +00:00
|
|
|
mlx5_free_shared_dev_ctx(struct mlx5_dev_ctx_shared *sh)
|
2019-03-27 13:15:39 +00:00
|
|
|
{
|
2020-06-10 09:32:27 +00:00
|
|
|
pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
|
2020-01-30 16:14:39 +00:00
|
|
|
#ifdef RTE_LIBRTE_MLX5_DEBUG
|
2019-03-27 13:15:39 +00:00
|
|
|
/* Check the object presence in the list. */
|
2020-06-03 15:05:55 +00:00
|
|
|
struct mlx5_dev_ctx_shared *lctx;
|
2019-03-27 13:15:39 +00:00
|
|
|
|
2020-06-10 09:32:27 +00:00
|
|
|
LIST_FOREACH(lctx, &mlx5_dev_ctx_list, next)
|
2019-03-27 13:15:39 +00:00
|
|
|
if (lctx == sh)
|
|
|
|
break;
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(lctx);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (lctx != sh) {
|
|
|
|
DRV_LOG(ERR, "Freeing non-existing shared IB context");
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
#endif
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(sh);
|
|
|
|
MLX5_ASSERT(sh->refcnt);
|
2019-03-27 13:15:39 +00:00
|
|
|
/* Secondary process should not free the shared context. */
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (--sh->refcnt)
|
|
|
|
goto exit;
|
2019-08-06 15:00:33 +00:00
|
|
|
/* Remove from memory callback device list. */
|
|
|
|
rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
|
|
|
|
LIST_REMOVE(sh, mem_event_cb);
|
|
|
|
rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
|
2020-02-04 13:36:09 +00:00
|
|
|
/* Release created Memory Regions. */
|
2020-04-13 21:17:48 +00:00
|
|
|
mlx5_mr_release_cache(&sh->share_cache);
|
2019-08-06 15:00:33 +00:00
|
|
|
/* Remove context from the global device list. */
|
2019-03-27 13:15:39 +00:00
|
|
|
LIST_REMOVE(sh, next);
|
2021-01-07 13:08:27 +00:00
|
|
|
/* Release flow workspaces objects on the last device. */
|
|
|
|
if (LIST_EMPTY(&mlx5_dev_ctx_list))
|
|
|
|
mlx5_flow_os_release_workspace();
|
2020-07-21 12:03:38 +00:00
|
|
|
pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
|
2019-03-27 13:15:45 +00:00
|
|
|
/*
|
|
|
|
* Ensure there is no async event handler installed.
|
|
|
|
* Only primary process handles async device events.
|
|
|
|
**/
|
2019-07-16 14:34:53 +00:00
|
|
|
mlx5_flow_counters_mng_close(sh);
|
2020-11-01 17:57:49 +00:00
|
|
|
if (sh->aso_age_mng) {
|
|
|
|
mlx5_flow_aso_age_mng_close(sh);
|
|
|
|
sh->aso_age_mng = NULL;
|
|
|
|
}
|
2021-04-20 10:55:17 +00:00
|
|
|
if (sh->mtrmng)
|
|
|
|
mlx5_aso_flow_mtrs_mng_close(sh);
|
2020-04-16 02:42:02 +00:00
|
|
|
mlx5_flow_ipool_destroy(sh);
|
2020-06-03 15:06:00 +00:00
|
|
|
mlx5_os_dev_shared_handler_uninstall(sh);
|
2020-06-18 07:24:43 +00:00
|
|
|
if (sh->cnt_id_tbl) {
|
|
|
|
mlx5_l3t_destroy(sh->cnt_id_tbl);
|
|
|
|
sh->cnt_id_tbl = NULL;
|
|
|
|
}
|
2020-07-16 08:23:07 +00:00
|
|
|
if (sh->tx_uar) {
|
|
|
|
mlx5_glue->devx_free_uar(sh->tx_uar);
|
|
|
|
sh->tx_uar = NULL;
|
|
|
|
}
|
2019-03-27 13:15:39 +00:00
|
|
|
if (sh->pd)
|
2020-12-28 09:54:13 +00:00
|
|
|
claim_zero(mlx5_os_dealloc_pd(sh->pd));
|
2019-10-30 23:53:15 +00:00
|
|
|
if (sh->tis)
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy(sh->tis));
|
|
|
|
if (sh->td)
|
|
|
|
claim_zero(mlx5_devx_cmd_destroy(sh->td));
|
2020-07-19 11:13:06 +00:00
|
|
|
if (sh->devx_rx_uar)
|
|
|
|
mlx5_glue->devx_free_uar(sh->devx_rx_uar);
|
2019-03-27 13:15:39 +00:00
|
|
|
if (sh->ctx)
|
|
|
|
claim_zero(mlx5_glue->close_device(sh->ctx));
|
2021-01-17 10:21:20 +00:00
|
|
|
MLX5_ASSERT(sh->geneve_tlv_option_resource == NULL);
|
2020-07-16 08:23:08 +00:00
|
|
|
pthread_mutex_destroy(&sh->txpp.mutex);
|
2020-06-28 09:02:44 +00:00
|
|
|
mlx5_free(sh);
|
2020-07-21 12:03:38 +00:00
|
|
|
return;
|
2019-03-27 13:15:39 +00:00
|
|
|
exit:
|
2020-06-10 09:32:27 +00:00
|
|
|
pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
|
2019-03-27 13:15:39 +00:00
|
|
|
}
|
|
|
|
|
2019-11-17 12:14:54 +00:00
|
|
|
/**
|
2020-10-28 09:33:33 +00:00
|
|
|
* Destroy table hash list.
|
2019-11-17 12:14:54 +00:00
|
|
|
*
|
|
|
|
* @param[in] priv
|
|
|
|
* Pointer to the private device data structure.
|
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
void
|
2019-11-17 12:14:54 +00:00
|
|
|
mlx5_free_table_hash_list(struct mlx5_priv *priv)
|
|
|
|
{
|
2020-06-03 15:05:55 +00:00
|
|
|
struct mlx5_dev_ctx_shared *sh = priv->sh;
|
2019-11-17 12:14:54 +00:00
|
|
|
|
|
|
|
if (!sh->flow_tbls)
|
|
|
|
return;
|
2020-10-28 09:33:31 +00:00
|
|
|
mlx5_hlist_destroy(sh->flow_tbls);
|
2019-11-17 12:14:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Initialize flow table hash list and create the root tables entry
|
|
|
|
* for each domain.
|
|
|
|
*
|
|
|
|
* @param[in] priv
|
|
|
|
* Pointer to the private device data structure.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* Zero on success, positive error code otherwise.
|
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
int
|
2020-10-28 09:33:33 +00:00
|
|
|
mlx5_alloc_table_hash_list(struct mlx5_priv *priv __rte_unused)
|
2019-11-17 12:14:54 +00:00
|
|
|
{
|
2020-10-28 09:33:33 +00:00
|
|
|
int err = 0;
|
|
|
|
/* Tables are only used in DV and DR modes. */
|
2020-12-28 12:32:55 +00:00
|
|
|
#if defined(HAVE_IBV_FLOW_DV_SUPPORT) || !defined(HAVE_INFINIBAND_VERBS_H)
|
2020-06-03 15:05:55 +00:00
|
|
|
struct mlx5_dev_ctx_shared *sh = priv->sh;
|
2019-11-17 12:14:54 +00:00
|
|
|
char s[MLX5_HLIST_NAMESIZE];
|
|
|
|
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(sh);
|
2019-11-17 12:14:54 +00:00
|
|
|
snprintf(s, sizeof(s), "%s_flow_table", priv->sh->ibdev_name);
|
2020-10-28 09:33:31 +00:00
|
|
|
sh->flow_tbls = mlx5_hlist_create(s, MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE,
|
2020-12-03 02:18:52 +00:00
|
|
|
0, 0, flow_dv_tbl_create_cb,
|
|
|
|
flow_dv_tbl_match_cb,
|
2020-10-28 09:33:33 +00:00
|
|
|
flow_dv_tbl_remove_cb);
|
2019-11-17 12:14:54 +00:00
|
|
|
if (!sh->flow_tbls) {
|
2020-06-17 13:53:24 +00:00
|
|
|
DRV_LOG(ERR, "flow tables with hash creation failed.");
|
2019-11-17 12:14:54 +00:00
|
|
|
err = ENOMEM;
|
|
|
|
return err;
|
|
|
|
}
|
2020-10-28 09:33:33 +00:00
|
|
|
sh->flow_tbls->ctx = sh;
|
2019-11-17 12:14:54 +00:00
|
|
|
#ifndef HAVE_MLX5DV_DR
|
2020-10-28 09:33:33 +00:00
|
|
|
struct rte_flow_error error;
|
|
|
|
struct rte_eth_dev *dev = &rte_eth_devices[priv->dev_data->port_id];
|
|
|
|
|
2019-11-17 12:14:54 +00:00
|
|
|
/*
|
|
|
|
* In case we have not DR support, the zero tables should be created
|
|
|
|
* because DV expect to see them even if they cannot be created by
|
|
|
|
* RDMA-CORE.
|
|
|
|
*/
|
2021-04-20 10:55:21 +00:00
|
|
|
if (!flow_dv_tbl_resource_get(dev, 0, 0, 0, 0,
|
|
|
|
NULL, 0, 1, 0, &error) ||
|
|
|
|
!flow_dv_tbl_resource_get(dev, 0, 1, 0, 0,
|
|
|
|
NULL, 0, 1, 0, &error) ||
|
|
|
|
!flow_dv_tbl_resource_get(dev, 0, 0, 1, 0,
|
|
|
|
NULL, 0, 1, 0, &error)) {
|
2019-11-17 12:14:54 +00:00
|
|
|
err = ENOMEM;
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
return err;
|
|
|
|
error:
|
|
|
|
mlx5_free_table_hash_list(priv);
|
|
|
|
#endif /* HAVE_MLX5DV_DR */
|
2020-10-28 09:33:33 +00:00
|
|
|
#endif
|
2019-11-17 12:14:54 +00:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2016-03-17 15:38:57 +00:00
|
|
|
#include <limits.h> /* INT_MIN / INT_MAX for mlx5_getenv_int() clamping. */

/**
 * Retrieve integer value from environment variable.
 *
 * The value is parsed as a base-10 integer with optional leading
 * whitespace and sign; parsing stops at the first non-digit character.
 * Values that do not fit into an int are saturated to INT_MIN / INT_MAX
 * rather than triggering the undefined behavior atoi() has on overflow.
 * The caller's errno is left untouched.
 *
 * @param[in] name
 *   Environment variable name.
 *
 * @return
 *   Integer value, 0 if the variable is not set or holds no number.
 */
int
mlx5_getenv_int(const char *name)
{
	const char *val = getenv(name);
	int saved_errno;
	long parsed;

	if (val == NULL)
		return 0;
	/* strtol() reports overflow through errno, keep the caller's value. */
	saved_errno = errno;
	parsed = strtol(val, NULL, 10);
	errno = saved_errno;
	/* strtol() saturates to the long range, narrow it to int here. */
	if (parsed > INT_MAX)
		return INT_MAX;
	if (parsed < INT_MIN)
		return INT_MIN;
	return (int)parsed;
}
|
|
|
|
|
2019-08-22 10:15:52 +00:00
|
|
|
/**
|
|
|
|
* DPDK callback to add udp tunnel port
|
|
|
|
*
|
|
|
|
* @param[in] dev
|
|
|
|
* A pointer to eth_dev
|
|
|
|
* @param[in] udp_tunnel
|
|
|
|
* A pointer to udp tunnel
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on valid udp ports and tunnels, -ENOTSUP otherwise.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
mlx5_udp_tunnel_port_add(struct rte_eth_dev *dev __rte_unused,
|
|
|
|
struct rte_eth_udp_tunnel *udp_tunnel)
|
|
|
|
{
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(udp_tunnel != NULL);
|
2019-08-22 10:15:52 +00:00
|
|
|
if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN &&
|
|
|
|
udp_tunnel->udp_port == 4789)
|
|
|
|
return 0;
|
|
|
|
if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN_GPE &&
|
|
|
|
udp_tunnel->udp_port == 4790)
|
|
|
|
return 0;
|
|
|
|
return -ENOTSUP;
|
|
|
|
}
|
|
|
|
|
2019-04-10 18:41:17 +00:00
|
|
|
/**
|
|
|
|
* Initialize process private data structure.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on success, a negative errno value otherwise and rte_errno is set.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
mlx5_proc_priv_init(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
|
|
|
struct mlx5_proc_priv *ppriv;
|
|
|
|
size_t ppriv_size;
|
|
|
|
|
2021-05-13 03:39:54 +00:00
|
|
|
mlx5_proc_priv_uninit(dev);
|
2019-04-10 18:41:17 +00:00
|
|
|
/*
|
|
|
|
* UAR register table follows the process private structure. BlueFlame
|
|
|
|
* registers for Tx queues are stored in the table.
|
|
|
|
*/
|
|
|
|
ppriv_size =
|
|
|
|
sizeof(struct mlx5_proc_priv) + priv->txqs_n * sizeof(void *);
|
2021-01-24 11:02:04 +00:00
|
|
|
ppriv = mlx5_malloc(MLX5_MEM_RTE | MLX5_MEM_ZERO, ppriv_size,
|
|
|
|
RTE_CACHE_LINE_SIZE, dev->device->numa_node);
|
2019-04-10 18:41:17 +00:00
|
|
|
if (!ppriv) {
|
|
|
|
rte_errno = ENOMEM;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
2021-01-24 11:02:04 +00:00
|
|
|
ppriv->uar_table_sz = priv->txqs_n;
|
2019-04-10 18:41:17 +00:00
|
|
|
dev->process_private = ppriv;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Un-initialize process private data structure.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*/
|
2021-01-24 11:02:05 +00:00
|
|
|
void
|
2019-04-10 18:41:17 +00:00
|
|
|
mlx5_proc_priv_uninit(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
if (!dev->process_private)
|
|
|
|
return;
|
2020-06-28 09:02:44 +00:00
|
|
|
mlx5_free(dev->process_private);
|
2019-04-10 18:41:17 +00:00
|
|
|
dev->process_private = NULL;
|
|
|
|
}
|
|
|
|
|
2015-10-30 18:52:30 +00:00
|
|
|
/**
|
|
|
|
* DPDK callback to close the device.
|
|
|
|
*
|
|
|
|
* Destroy all queues and objects, free memory.
|
|
|
|
*
|
|
|
|
* @param dev
|
|
|
|
* Pointer to Ethernet device structure.
|
|
|
|
*/
|
2020-09-28 23:14:10 +00:00
|
|
|
int
|
2015-10-30 18:52:30 +00:00
|
|
|
mlx5_dev_close(struct rte_eth_dev *dev)
|
|
|
|
{
|
2019-02-21 09:29:14 +00:00
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
2015-10-30 18:52:31 +00:00
|
|
|
unsigned int i;
|
2017-10-09 14:44:42 +00:00
|
|
|
int ret;
|
2015-10-30 18:52:30 +00:00
|
|
|
|
2020-05-28 06:59:49 +00:00
|
|
|
if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
|
|
|
|
/* Check if process_private released. */
|
|
|
|
if (!dev->process_private)
|
2020-09-28 23:14:10 +00:00
|
|
|
return 0;
|
2020-05-28 06:59:49 +00:00
|
|
|
mlx5_tx_uar_uninit_secondary(dev);
|
|
|
|
mlx5_proc_priv_uninit(dev);
|
|
|
|
rte_eth_dev_release_port(dev);
|
2020-09-28 23:14:10 +00:00
|
|
|
return 0;
|
2020-05-28 06:59:49 +00:00
|
|
|
}
|
|
|
|
if (!priv->sh)
|
2020-09-28 23:14:10 +00:00
|
|
|
return 0;
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(DEBUG, "port %u closing device \"%s\"",
|
|
|
|
dev->data->port_id,
|
2020-06-03 15:05:56 +00:00
|
|
|
((priv->sh->ctx != NULL) ?
|
|
|
|
mlx5_os_get_ctx_device_name(priv->sh->ctx) : ""));
|
2020-03-24 15:33:57 +00:00
|
|
|
/*
|
|
|
|
* If default mreg copy action is removed at the stop stage,
|
|
|
|
* the search will return none and nothing will be done anymore.
|
|
|
|
*/
|
|
|
|
mlx5_flow_stop_default(dev);
|
2018-03-05 12:21:04 +00:00
|
|
|
mlx5_traffic_disable(dev);
|
2020-03-24 15:33:57 +00:00
|
|
|
/*
|
|
|
|
* If all the flows are already flushed in the device stop stage,
|
|
|
|
* then this will return directly without any action.
|
|
|
|
*/
|
2021-07-13 08:44:39 +00:00
|
|
|
mlx5_flow_list_flush(dev, MLX5_FLOW_TYPE_GEN, true);
|
ethdev: introduce indirect flow action
Right now, rte_flow_shared_action_* APIs are used for some shared
actions, like RSS, count. The shared action should be created before
using it inside a flow. These shared actions sometimes are not
really shared but just some indirect actions decoupled from a flow.
The new functions rte_flow_action_handle_* are added to replace
the current shared functions rte_flow_shared_action_*.
There are two types of flow actions:
1. the direct (normal) actions that could be created and stored
within a flow rule. Such action is tied to its flow rule and
cannot be reused.
2. the indirect action, in the past, named shared_action. It is
created from a direct actioni, like count or rss, and then used
in the flow rules with an object handle. The PMD will take care
of the retrieve from indirect action to the direct action
when it is referenced.
The indirect action is accessed (update / query) w/o any flow rule,
just via the action object handle. For example, when querying or
resetting a counter, it could be done out of any flow using this
counter, but only the handle of the counter action object is
required.
The indirect action object could be shared by different flows or
used by a single flow, depending on the direct action type and
the real-life requirements.
The handle of an indirect action object is opaque and defined in
each driver and possibly different per direct action type.
The old name "shared" is improper in a sense and should be replaced.
Since the APIs are changed from "rte_flow_shared_action*" to the new
"rte_flow_action_handle*", the testpmd application code and command
line interfaces also need to be updated to do the adaption.
The testpmd application user guide is also updated. All the "shared
action" related parts are replaced with "indirect action" to have a
correct explanation.
The parameter of "update" interface is also changed. A general
pointer will replace the rte_flow_action struct pointer due to the
facts:
1. Some action may not support fields updating. In the example of a
counter, the only "update" supported should be the reset. So
passing a rte_flow_action struct pointer is meaningless and
there is even no such corresponding action struct. What's more,
if more than one operations should be supported, for some other
action, such pointer parameter may not meet the need.
2. Some action may need conditional or partial update, the current
parameter will not provide the ability to indicate which part(s)
to update.
For different types of indirect action objects, the pointer could
either be the same of rte_flow_action* struct - in order not to
break the current driver implementation, or some wrapper
structures with bits as masks to indicate which part to be
updated, depending on real needs of the corresponding direct
action. For different direct actions, the structures of indirect
action objects updating will be different.
All the underlayer PMD callbacks will be moved to these new APIs.
The RTE_FLOW_ACTION_TYPE_SHARED is kept for now in order not to
break the ABI. All the implementations are changed by using
RTE_FLOW_ACTION_TYPE_INDIRECT.
Since the APIs are changed from "rte_flow_shared_action*" to the new
"rte_flow_action_handle*" and the "update" interface's 3rd input
parameter is changed to generic pointer, the mlx5 PMD that uses these
APIs needs to do the adaption to the new APIs as well.
Signed-off-by: Bing Zhao <bingz@nvidia.com>
Acked-by: Andrey Vesnovaty <andreyv@nvidia.com>
Acked-by: Ori Kam <orika@nvidia.com>
Acked-by: Ajit Khaparde <ajit.khaparde@broadcom.com>
Acked-by: Thomas Monjalon <thomas@monjalon.net>
2021-04-19 14:38:29 +00:00
|
|
|
mlx5_action_handle_flush(dev);
|
2019-11-08 03:49:25 +00:00
|
|
|
mlx5_flow_meter_flush(dev, NULL);
|
2015-10-30 18:52:31 +00:00
|
|
|
/* Prevent crashes when queues are still in use. */
|
|
|
|
dev->rx_pkt_burst = removed_rx_burst;
|
|
|
|
dev->tx_pkt_burst = removed_tx_burst;
|
2019-04-01 21:12:56 +00:00
|
|
|
rte_wmb();
|
|
|
|
/* Disable datapath on secondary process. */
|
2020-07-19 10:18:15 +00:00
|
|
|
mlx5_mp_os_req_stop_rxtx(dev);
|
2020-07-17 07:11:49 +00:00
|
|
|
/* Free the eCPRI flex parser resource. */
|
|
|
|
mlx5_flex_parser_ecpri_release(dev);
|
2015-10-30 18:52:31 +00:00
|
|
|
if (priv->rxqs != NULL) {
|
|
|
|
/* XXX race condition if mlx5_rx_burst() is still running. */
|
2020-12-28 09:54:09 +00:00
|
|
|
rte_delay_us_sleep(1000);
|
2017-10-09 14:44:49 +00:00
|
|
|
for (i = 0; (i != priv->rxqs_n); ++i)
|
2018-03-05 12:21:04 +00:00
|
|
|
mlx5_rxq_release(dev, i);
|
2015-10-30 18:52:31 +00:00
|
|
|
priv->rxqs_n = 0;
|
|
|
|
priv->rxqs = NULL;
|
|
|
|
}
|
|
|
|
if (priv->txqs != NULL) {
|
|
|
|
/* XXX race condition if mlx5_tx_burst() is still running. */
|
2020-12-28 09:54:09 +00:00
|
|
|
rte_delay_us_sleep(1000);
|
2017-10-09 14:44:48 +00:00
|
|
|
for (i = 0; (i != priv->txqs_n); ++i)
|
2018-03-05 12:21:04 +00:00
|
|
|
mlx5_txq_release(dev, i);
|
2015-10-30 18:52:31 +00:00
|
|
|
priv->txqs_n = 0;
|
|
|
|
priv->txqs = NULL;
|
|
|
|
}
|
2019-04-10 18:41:17 +00:00
|
|
|
mlx5_proc_priv_uninit(dev);
|
2021-02-25 10:45:01 +00:00
|
|
|
if (priv->q_counters) {
|
|
|
|
mlx5_devx_cmd_destroy(priv->q_counters);
|
|
|
|
priv->q_counters = NULL;
|
|
|
|
}
|
2020-10-28 09:33:30 +00:00
|
|
|
if (priv->drop_queue.hrxq)
|
|
|
|
mlx5_drop_action_destroy(dev);
|
2019-11-07 17:10:04 +00:00
|
|
|
if (priv->mreg_cp_tbl)
|
2020-10-28 09:33:31 +00:00
|
|
|
mlx5_hlist_destroy(priv->mreg_cp_tbl);
|
2018-05-09 11:13:50 +00:00
|
|
|
mlx5_mprq_free_mp(dev);
|
2021-05-05 12:23:19 +00:00
|
|
|
if (priv->sh->ct_mng)
|
|
|
|
mlx5_flow_aso_ct_mng_close(priv->sh);
|
2020-06-03 15:06:00 +00:00
|
|
|
mlx5_os_free_shared_dr(priv);
|
2017-10-09 14:44:56 +00:00
|
|
|
if (priv->rss_conf.rss_key != NULL)
|
2020-06-28 07:35:26 +00:00
|
|
|
mlx5_free(priv->rss_conf.rss_key);
|
2015-11-02 18:11:57 +00:00
|
|
|
if (priv->reta_idx != NULL)
|
2020-06-28 07:35:26 +00:00
|
|
|
mlx5_free(priv->reta_idx);
|
2018-04-05 15:07:19 +00:00
|
|
|
if (priv->config.vf)
|
2020-08-25 09:31:09 +00:00
|
|
|
mlx5_os_mac_addr_flush(dev);
|
2018-07-10 16:04:52 +00:00
|
|
|
if (priv->nl_socket_route >= 0)
|
|
|
|
close(priv->nl_socket_route);
|
|
|
|
if (priv->nl_socket_rdma >= 0)
|
|
|
|
close(priv->nl_socket_rdma);
|
2019-07-30 09:20:24 +00:00
|
|
|
if (priv->vmwa_context)
|
|
|
|
mlx5_vlan_vmwa_exit(priv->vmwa_context);
|
2019-07-22 14:52:13 +00:00
|
|
|
ret = mlx5_hrxq_verify(dev);
|
2017-10-09 14:44:51 +00:00
|
|
|
if (ret)
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some hash Rx queue still remain",
|
|
|
|
dev->data->port_id);
|
2019-07-22 14:52:12 +00:00
|
|
|
ret = mlx5_ind_table_obj_verify(dev);
|
2017-10-09 14:44:50 +00:00
|
|
|
if (ret)
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some indirection table still remain",
|
|
|
|
dev->data->port_id);
|
2019-07-22 14:52:11 +00:00
|
|
|
ret = mlx5_rxq_obj_verify(dev);
|
2017-10-09 14:44:46 +00:00
|
|
|
if (ret)
|
2019-07-22 14:52:11 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some Rx queue objects still remain",
|
2018-03-13 09:23:56 +00:00
|
|
|
dev->data->port_id);
|
2018-03-05 12:21:04 +00:00
|
|
|
ret = mlx5_rxq_verify(dev);
|
2017-10-09 14:44:49 +00:00
|
|
|
if (ret)
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some Rx queues still remain",
|
|
|
|
dev->data->port_id);
|
2019-10-30 23:53:14 +00:00
|
|
|
ret = mlx5_txq_obj_verify(dev);
|
2017-10-09 14:44:47 +00:00
|
|
|
if (ret)
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some Verbs Tx queue still remain",
|
|
|
|
dev->data->port_id);
|
2018-03-05 12:21:04 +00:00
|
|
|
ret = mlx5_txq_verify(dev);
|
2017-10-09 14:44:48 +00:00
|
|
|
if (ret)
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some Tx queues still remain",
|
|
|
|
dev->data->port_id);
|
2018-03-05 12:21:04 +00:00
|
|
|
ret = mlx5_flow_verify(dev);
|
2017-10-09 14:44:42 +00:00
|
|
|
if (ret)
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "port %u some flows still remain",
|
|
|
|
dev->data->port_id);
|
2021-07-13 08:44:41 +00:00
|
|
|
mlx5_list_destroy(&priv->hrxqs);
|
2020-05-28 06:59:49 +00:00
|
|
|
/*
|
|
|
|
* Free the shared context in last turn, because the cleanup
|
|
|
|
* routines above may use some shared fields, like
|
2020-08-25 09:31:09 +00:00
|
|
|
* mlx5_os_mac_addr_flush() uses ibdev_path for retrieveing
|
2020-05-28 06:59:49 +00:00
|
|
|
* ifindex if Netlink fails.
|
|
|
|
*/
|
2020-06-10 09:32:27 +00:00
|
|
|
mlx5_free_shared_dev_ctx(priv->sh);
|
2018-07-10 16:04:54 +00:00
|
|
|
if (priv->domain_id != RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) {
|
|
|
|
unsigned int c = 0;
|
2019-04-01 02:26:59 +00:00
|
|
|
uint16_t port_id;
|
2018-07-10 16:04:54 +00:00
|
|
|
|
2019-10-07 13:56:19 +00:00
|
|
|
MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
|
2019-02-21 09:29:14 +00:00
|
|
|
struct mlx5_priv *opriv =
|
2019-04-01 02:26:59 +00:00
|
|
|
rte_eth_devices[port_id].data->dev_private;
|
2018-07-10 16:04:54 +00:00
|
|
|
|
|
|
|
if (!opriv ||
|
|
|
|
opriv->domain_id != priv->domain_id ||
|
2019-04-01 02:26:59 +00:00
|
|
|
&rte_eth_devices[port_id] == dev)
|
2018-07-10 16:04:54 +00:00
|
|
|
continue;
|
|
|
|
++c;
|
2019-09-25 07:53:33 +00:00
|
|
|
break;
|
2018-07-10 16:04:54 +00:00
|
|
|
}
|
|
|
|
if (!c)
|
|
|
|
claim_zero(rte_eth_switch_domain_free(priv->domain_id));
|
|
|
|
}
|
2015-10-30 18:52:30 +00:00
|
|
|
memset(priv, 0, sizeof(*priv));
|
2018-07-10 16:04:54 +00:00
|
|
|
priv->domain_id = RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID;
|
2018-10-23 18:26:04 +00:00
|
|
|
/*
|
|
|
|
* Reset mac_addrs to NULL such that it is not freed as part of
|
|
|
|
* rte_eth_dev_release_port(). mac_addrs is part of dev_private so
|
|
|
|
* it is freed when dev_private is freed.
|
|
|
|
*/
|
|
|
|
dev->data->mac_addrs = NULL;
|
2020-09-28 23:14:10 +00:00
|
|
|
return 0;
|
2015-10-30 18:52:30 +00:00
|
|
|
}
|
|
|
|
|
2020-12-28 12:32:56 +00:00
|
|
|
const struct eth_dev_ops mlx5_dev_ops = {
|
|
|
|
.dev_configure = mlx5_dev_configure,
|
|
|
|
.dev_start = mlx5_dev_start,
|
|
|
|
.dev_stop = mlx5_dev_stop,
|
|
|
|
.dev_set_link_down = mlx5_set_link_down,
|
|
|
|
.dev_set_link_up = mlx5_set_link_up,
|
|
|
|
.dev_close = mlx5_dev_close,
|
|
|
|
.promiscuous_enable = mlx5_promiscuous_enable,
|
|
|
|
.promiscuous_disable = mlx5_promiscuous_disable,
|
|
|
|
.allmulticast_enable = mlx5_allmulticast_enable,
|
|
|
|
.allmulticast_disable = mlx5_allmulticast_disable,
|
|
|
|
.link_update = mlx5_link_update,
|
|
|
|
.stats_get = mlx5_stats_get,
|
|
|
|
.stats_reset = mlx5_stats_reset,
|
|
|
|
.xstats_get = mlx5_xstats_get,
|
|
|
|
.xstats_reset = mlx5_xstats_reset,
|
|
|
|
.xstats_get_names = mlx5_xstats_get_names,
|
|
|
|
.fw_version_get = mlx5_fw_version_get,
|
|
|
|
.dev_infos_get = mlx5_dev_infos_get,
|
2021-03-28 13:48:08 +00:00
|
|
|
.representor_info_get = mlx5_representor_info_get,
|
2020-12-28 12:32:56 +00:00
|
|
|
.read_clock = mlx5_txpp_read_clock,
|
|
|
|
.dev_supported_ptypes_get = mlx5_dev_supported_ptypes_get,
|
|
|
|
.vlan_filter_set = mlx5_vlan_filter_set,
|
|
|
|
.rx_queue_setup = mlx5_rx_queue_setup,
|
|
|
|
.rx_hairpin_queue_setup = mlx5_rx_hairpin_queue_setup,
|
|
|
|
.tx_queue_setup = mlx5_tx_queue_setup,
|
|
|
|
.tx_hairpin_queue_setup = mlx5_tx_hairpin_queue_setup,
|
|
|
|
.rx_queue_release = mlx5_rx_queue_release,
|
|
|
|
.tx_queue_release = mlx5_tx_queue_release,
|
|
|
|
.rx_queue_start = mlx5_rx_queue_start,
|
|
|
|
.rx_queue_stop = mlx5_rx_queue_stop,
|
|
|
|
.tx_queue_start = mlx5_tx_queue_start,
|
|
|
|
.tx_queue_stop = mlx5_tx_queue_stop,
|
|
|
|
.flow_ctrl_get = mlx5_dev_get_flow_ctrl,
|
|
|
|
.flow_ctrl_set = mlx5_dev_set_flow_ctrl,
|
|
|
|
.mac_addr_remove = mlx5_mac_addr_remove,
|
|
|
|
.mac_addr_add = mlx5_mac_addr_add,
|
|
|
|
.mac_addr_set = mlx5_mac_addr_set,
|
|
|
|
.set_mc_addr_list = mlx5_set_mc_addr_list,
|
|
|
|
.mtu_set = mlx5_dev_set_mtu,
|
|
|
|
.vlan_strip_queue_set = mlx5_vlan_strip_queue_set,
|
|
|
|
.vlan_offload_set = mlx5_vlan_offload_set,
|
|
|
|
.reta_update = mlx5_dev_rss_reta_update,
|
|
|
|
.reta_query = mlx5_dev_rss_reta_query,
|
|
|
|
.rss_hash_update = mlx5_rss_hash_update,
|
|
|
|
.rss_hash_conf_get = mlx5_rss_hash_conf_get,
|
2021-03-21 09:00:00 +00:00
|
|
|
.flow_ops_get = mlx5_flow_ops_get,
|
2020-12-28 12:32:56 +00:00
|
|
|
.rxq_info_get = mlx5_rxq_info_get,
|
|
|
|
.txq_info_get = mlx5_txq_info_get,
|
|
|
|
.rx_burst_mode_get = mlx5_rx_burst_mode_get,
|
|
|
|
.tx_burst_mode_get = mlx5_tx_burst_mode_get,
|
|
|
|
.rx_queue_intr_enable = mlx5_rx_intr_enable,
|
|
|
|
.rx_queue_intr_disable = mlx5_rx_intr_disable,
|
|
|
|
.is_removed = mlx5_is_removed,
|
|
|
|
.udp_tunnel_port_add = mlx5_udp_tunnel_port_add,
|
|
|
|
.get_module_info = mlx5_get_module_info,
|
|
|
|
.get_module_eeprom = mlx5_get_module_eeprom,
|
|
|
|
.hairpin_cap_get = mlx5_hairpin_cap_get,
|
|
|
|
.mtr_ops_get = mlx5_flow_meter_ops_get,
|
|
|
|
.hairpin_bind = mlx5_hairpin_bind,
|
|
|
|
.hairpin_unbind = mlx5_hairpin_unbind,
|
|
|
|
.hairpin_get_peer_ports = mlx5_hairpin_get_peer_ports,
|
|
|
|
.hairpin_queue_peer_update = mlx5_hairpin_queue_peer_update,
|
|
|
|
.hairpin_queue_peer_bind = mlx5_hairpin_queue_peer_bind,
|
|
|
|
.hairpin_queue_peer_unbind = mlx5_hairpin_queue_peer_unbind,
|
2021-04-29 14:55:18 +00:00
|
|
|
.get_monitor_addr = mlx5_get_monitor_addr,
|
2020-12-28 12:32:56 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Available operations from secondary process. */
|
|
|
|
const struct eth_dev_ops mlx5_dev_sec_ops = {
|
|
|
|
.stats_get = mlx5_stats_get,
|
|
|
|
.stats_reset = mlx5_stats_reset,
|
|
|
|
.xstats_get = mlx5_xstats_get,
|
|
|
|
.xstats_reset = mlx5_xstats_reset,
|
|
|
|
.xstats_get_names = mlx5_xstats_get_names,
|
|
|
|
.fw_version_get = mlx5_fw_version_get,
|
|
|
|
.dev_infos_get = mlx5_dev_infos_get,
|
|
|
|
.read_clock = mlx5_txpp_read_clock,
|
|
|
|
.rx_queue_start = mlx5_rx_queue_start,
|
|
|
|
.rx_queue_stop = mlx5_rx_queue_stop,
|
|
|
|
.tx_queue_start = mlx5_tx_queue_start,
|
|
|
|
.tx_queue_stop = mlx5_tx_queue_stop,
|
|
|
|
.rxq_info_get = mlx5_rxq_info_get,
|
|
|
|
.txq_info_get = mlx5_txq_info_get,
|
|
|
|
.rx_burst_mode_get = mlx5_rx_burst_mode_get,
|
|
|
|
.tx_burst_mode_get = mlx5_tx_burst_mode_get,
|
|
|
|
.get_module_info = mlx5_get_module_info,
|
|
|
|
.get_module_eeprom = mlx5_get_module_eeprom,
|
|
|
|
};
|
|
|
|
|
|
|
|
/* Available operations in flow isolated mode. */
|
|
|
|
const struct eth_dev_ops mlx5_dev_ops_isolate = {
|
|
|
|
.dev_configure = mlx5_dev_configure,
|
|
|
|
.dev_start = mlx5_dev_start,
|
|
|
|
.dev_stop = mlx5_dev_stop,
|
|
|
|
.dev_set_link_down = mlx5_set_link_down,
|
|
|
|
.dev_set_link_up = mlx5_set_link_up,
|
|
|
|
.dev_close = mlx5_dev_close,
|
|
|
|
.promiscuous_enable = mlx5_promiscuous_enable,
|
|
|
|
.promiscuous_disable = mlx5_promiscuous_disable,
|
|
|
|
.allmulticast_enable = mlx5_allmulticast_enable,
|
|
|
|
.allmulticast_disable = mlx5_allmulticast_disable,
|
|
|
|
.link_update = mlx5_link_update,
|
|
|
|
.stats_get = mlx5_stats_get,
|
|
|
|
.stats_reset = mlx5_stats_reset,
|
|
|
|
.xstats_get = mlx5_xstats_get,
|
|
|
|
.xstats_reset = mlx5_xstats_reset,
|
|
|
|
.xstats_get_names = mlx5_xstats_get_names,
|
|
|
|
.fw_version_get = mlx5_fw_version_get,
|
|
|
|
.dev_infos_get = mlx5_dev_infos_get,
|
|
|
|
.read_clock = mlx5_txpp_read_clock,
|
|
|
|
.dev_supported_ptypes_get = mlx5_dev_supported_ptypes_get,
|
|
|
|
.vlan_filter_set = mlx5_vlan_filter_set,
|
|
|
|
.rx_queue_setup = mlx5_rx_queue_setup,
|
|
|
|
.rx_hairpin_queue_setup = mlx5_rx_hairpin_queue_setup,
|
|
|
|
.tx_queue_setup = mlx5_tx_queue_setup,
|
|
|
|
.tx_hairpin_queue_setup = mlx5_tx_hairpin_queue_setup,
|
|
|
|
.rx_queue_release = mlx5_rx_queue_release,
|
|
|
|
.tx_queue_release = mlx5_tx_queue_release,
|
|
|
|
.rx_queue_start = mlx5_rx_queue_start,
|
|
|
|
.rx_queue_stop = mlx5_rx_queue_stop,
|
|
|
|
.tx_queue_start = mlx5_tx_queue_start,
|
|
|
|
.tx_queue_stop = mlx5_tx_queue_stop,
|
|
|
|
.flow_ctrl_get = mlx5_dev_get_flow_ctrl,
|
|
|
|
.flow_ctrl_set = mlx5_dev_set_flow_ctrl,
|
|
|
|
.mac_addr_remove = mlx5_mac_addr_remove,
|
|
|
|
.mac_addr_add = mlx5_mac_addr_add,
|
|
|
|
.mac_addr_set = mlx5_mac_addr_set,
|
|
|
|
.set_mc_addr_list = mlx5_set_mc_addr_list,
|
|
|
|
.mtu_set = mlx5_dev_set_mtu,
|
|
|
|
.vlan_strip_queue_set = mlx5_vlan_strip_queue_set,
|
|
|
|
.vlan_offload_set = mlx5_vlan_offload_set,
|
2021-03-21 09:00:00 +00:00
|
|
|
.flow_ops_get = mlx5_flow_ops_get,
|
2020-12-28 12:32:56 +00:00
|
|
|
.rxq_info_get = mlx5_rxq_info_get,
|
|
|
|
.txq_info_get = mlx5_txq_info_get,
|
|
|
|
.rx_burst_mode_get = mlx5_rx_burst_mode_get,
|
|
|
|
.tx_burst_mode_get = mlx5_tx_burst_mode_get,
|
|
|
|
.rx_queue_intr_enable = mlx5_rx_intr_enable,
|
|
|
|
.rx_queue_intr_disable = mlx5_rx_intr_disable,
|
|
|
|
.is_removed = mlx5_is_removed,
|
|
|
|
.get_module_info = mlx5_get_module_info,
|
|
|
|
.get_module_eeprom = mlx5_get_module_eeprom,
|
|
|
|
.hairpin_cap_get = mlx5_hairpin_cap_get,
|
|
|
|
.mtr_ops_get = mlx5_flow_meter_ops_get,
|
|
|
|
.hairpin_bind = mlx5_hairpin_bind,
|
|
|
|
.hairpin_unbind = mlx5_hairpin_unbind,
|
|
|
|
.hairpin_get_peer_ports = mlx5_hairpin_get_peer_ports,
|
|
|
|
.hairpin_queue_peer_update = mlx5_hairpin_queue_peer_update,
|
|
|
|
.hairpin_queue_peer_bind = mlx5_hairpin_queue_peer_bind,
|
|
|
|
.hairpin_queue_peer_unbind = mlx5_hairpin_queue_peer_unbind,
|
2021-04-29 14:55:18 +00:00
|
|
|
.get_monitor_addr = mlx5_get_monitor_addr,
|
2020-12-28 12:32:56 +00:00
|
|
|
};
|
|
|
|
|
2016-06-24 13:17:50 +00:00
|
|
|
/**
|
|
|
|
* Verify and store value for device argument.
|
|
|
|
*
|
|
|
|
* @param[in] key
|
|
|
|
* Key argument to verify.
|
|
|
|
* @param[in] val
|
|
|
|
* Value associated with key.
|
|
|
|
* @param opaque
|
|
|
|
* User data.
|
|
|
|
*
|
|
|
|
* @return
|
2018-03-05 12:21:06 +00:00
|
|
|
* 0 on success, a negative errno value otherwise and rte_errno is set.
|
2016-06-24 13:17:50 +00:00
|
|
|
*/
|
|
|
|
static int
|
|
|
|
mlx5_args_check(const char *key, const char *val, void *opaque)
|
|
|
|
{
|
2018-01-10 09:16:58 +00:00
|
|
|
struct mlx5_dev_config *config = opaque;
|
2020-07-16 08:23:05 +00:00
|
|
|
unsigned long mod;
|
|
|
|
signed long tmp;
|
2016-06-24 13:17:50 +00:00
|
|
|
|
2018-07-10 16:04:58 +00:00
|
|
|
/* No-op, port representors are processed in mlx5_dev_spawn(). */
|
|
|
|
if (!strcmp(MLX5_REPRESENTOR, key))
|
|
|
|
return 0;
|
2016-06-24 13:17:54 +00:00
|
|
|
errno = 0;
|
2020-07-16 08:23:05 +00:00
|
|
|
tmp = strtol(val, NULL, 0);
|
2016-06-24 13:17:54 +00:00
|
|
|
if (errno) {
|
2018-03-05 12:21:06 +00:00
|
|
|
rte_errno = errno;
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "%s: \"%s\" is not a valid integer", key, val);
|
2018-03-05 12:21:06 +00:00
|
|
|
return -rte_errno;
|
2016-06-24 13:17:54 +00:00
|
|
|
}
|
2020-07-16 08:23:05 +00:00
|
|
|
if (tmp < 0 && strcmp(MLX5_TX_PP, key) && strcmp(MLX5_TX_SKEW, key)) {
|
|
|
|
/* Negative values are acceptable for some keys only. */
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
DRV_LOG(WARNING, "%s: invalid negative value \"%s\"", key, val);
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
|
|
|
mod = tmp >= 0 ? tmp : -tmp;
|
2016-06-24 13:17:54 +00:00
|
|
|
if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) {
|
2020-11-01 16:27:39 +00:00
|
|
|
if (tmp > MLX5_CQE_RESP_FORMAT_L34H_STRIDX) {
|
|
|
|
DRV_LOG(ERR, "invalid CQE compression "
|
|
|
|
"format parameter");
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
2018-01-10 09:16:58 +00:00
|
|
|
config->cqe_comp = !!tmp;
|
2020-11-01 16:27:39 +00:00
|
|
|
config->cqe_comp_fmt = tmp;
|
2019-01-15 17:38:58 +00:00
|
|
|
} else if (strcmp(MLX5_RXQ_PKT_PAD_EN, key) == 0) {
|
|
|
|
config->hw_padding = !!tmp;
|
2018-05-09 11:13:50 +00:00
|
|
|
} else if (strcmp(MLX5_RX_MPRQ_EN, key) == 0) {
|
|
|
|
config->mprq.enabled = !!tmp;
|
|
|
|
} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_NUM, key) == 0) {
|
|
|
|
config->mprq.stride_num_n = tmp;
|
2020-04-09 22:23:51 +00:00
|
|
|
} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_SIZE, key) == 0) {
|
|
|
|
config->mprq.stride_size_n = tmp;
|
2018-05-09 11:13:50 +00:00
|
|
|
} else if (strcmp(MLX5_RX_MPRQ_MAX_MEMCPY_LEN, key) == 0) {
|
|
|
|
config->mprq.max_memcpy_len = tmp;
|
|
|
|
} else if (strcmp(MLX5_RXQS_MIN_MPRQ, key) == 0) {
|
|
|
|
config->mprq.min_rxqs_num = tmp;
|
2016-06-24 13:17:56 +00:00
|
|
|
} else if (strcmp(MLX5_TXQ_INLINE, key) == 0) {
|
2019-07-21 14:24:54 +00:00
|
|
|
DRV_LOG(WARNING, "%s: deprecated parameter,"
|
|
|
|
" converted to txq_inline_max", key);
|
|
|
|
config->txq_inline_max = tmp;
|
|
|
|
} else if (strcmp(MLX5_TXQ_INLINE_MAX, key) == 0) {
|
|
|
|
config->txq_inline_max = tmp;
|
|
|
|
} else if (strcmp(MLX5_TXQ_INLINE_MIN, key) == 0) {
|
|
|
|
config->txq_inline_min = tmp;
|
|
|
|
} else if (strcmp(MLX5_TXQ_INLINE_MPW, key) == 0) {
|
|
|
|
config->txq_inline_mpw = tmp;
|
2016-06-24 13:17:56 +00:00
|
|
|
} else if (strcmp(MLX5_TXQS_MIN_INLINE, key) == 0) {
|
2018-01-10 09:16:58 +00:00
|
|
|
config->txqs_inline = tmp;
|
2018-11-01 17:20:32 +00:00
|
|
|
} else if (strcmp(MLX5_TXQS_MAX_VEC, key) == 0) {
|
2019-07-21 14:24:53 +00:00
|
|
|
DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
|
2016-06-24 13:17:57 +00:00
|
|
|
} else if (strcmp(MLX5_TXQ_MPW_EN, key) == 0) {
|
2018-08-13 06:47:57 +00:00
|
|
|
config->mps = !!tmp;
|
2019-11-08 15:07:50 +00:00
|
|
|
} else if (strcmp(MLX5_TX_DB_NC, key) == 0) {
|
2019-11-15 11:35:06 +00:00
|
|
|
if (tmp != MLX5_TXDB_CACHED &&
|
|
|
|
tmp != MLX5_TXDB_NCACHED &&
|
|
|
|
tmp != MLX5_TXDB_HEURISTIC) {
|
|
|
|
DRV_LOG(ERR, "invalid Tx doorbell "
|
|
|
|
"mapping parameter");
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
|
|
|
config->dbnc = tmp;
|
2017-03-15 23:55:44 +00:00
|
|
|
} else if (strcmp(MLX5_TXQ_MPW_HDR_DSEG_EN, key) == 0) {
|
2019-07-21 14:24:53 +00:00
|
|
|
DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
|
2017-03-15 23:55:44 +00:00
|
|
|
} else if (strcmp(MLX5_TXQ_MAX_INLINE_LEN, key) == 0) {
|
2019-07-21 14:24:54 +00:00
|
|
|
DRV_LOG(WARNING, "%s: deprecated parameter,"
|
|
|
|
" converted to txq_inline_mpw", key);
|
|
|
|
config->txq_inline_mpw = tmp;
|
2017-08-02 15:32:56 +00:00
|
|
|
} else if (strcmp(MLX5_TX_VEC_EN, key) == 0) {
|
2019-07-21 14:24:53 +00:00
|
|
|
DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
|
2020-07-16 08:23:05 +00:00
|
|
|
} else if (strcmp(MLX5_TX_PP, key) == 0) {
|
|
|
|
if (!mod) {
|
|
|
|
DRV_LOG(ERR, "Zero Tx packet pacing parameter");
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
|
|
|
config->tx_pp = tmp;
|
|
|
|
} else if (strcmp(MLX5_TX_SKEW, key) == 0) {
|
|
|
|
config->tx_skew = tmp;
|
2017-08-02 15:32:56 +00:00
|
|
|
} else if (strcmp(MLX5_RX_VEC_EN, key) == 0) {
|
2018-01-10 09:16:58 +00:00
|
|
|
config->rx_vec_en = !!tmp;
|
2018-04-23 12:33:02 +00:00
|
|
|
} else if (strcmp(MLX5_L3_VXLAN_EN, key) == 0) {
|
|
|
|
config->l3_vxlan_en = !!tmp;
|
2018-04-05 15:07:21 +00:00
|
|
|
} else if (strcmp(MLX5_VF_NL_EN, key) == 0) {
|
|
|
|
config->vf_nl_en = !!tmp;
|
2019-04-18 13:16:01 +00:00
|
|
|
} else if (strcmp(MLX5_DV_ESW_EN, key) == 0) {
|
|
|
|
config->dv_esw_en = !!tmp;
|
2018-09-24 23:17:54 +00:00
|
|
|
} else if (strcmp(MLX5_DV_FLOW_EN, key) == 0) {
|
|
|
|
config->dv_flow_en = !!tmp;
|
net/mlx5: add devarg for extensive metadata support
The PMD parameter dv_xmeta_en is added to control extensive
metadata support. A nonzero value enables extensive flow
metadata support if device is capable and driver supports it.
This can enable extensive support of MARK and META item of
rte_flow. The newly introduced SET_TAG and SET_META actions
do not depend on dv_xmeta_en parameter, because there is
no compatibility issue for new entities. The dv_xmeta_en is
disabled by default.
There are some possible configurations, depending on parameter
value:
- 0, this is default value, defines the legacy mode, the MARK
and META related actions and items operate only within NIC Tx
and NIC Rx steering domains, no MARK and META information
crosses the domain boundaries. The MARK item is 24 bits wide,
the META item is 32 bits wide.
- 1, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The ``MARK`` item is 24 bits wide, the
META item width depends on kernel and firmware configurations
and might be 0, 16 or 32 bits. Within NIC Tx domain META data
width is 32 bits for compatibility, the actual width of data
transferred to the FDB domain depends on kernel configuration
and may be vary. The actual supported width can be retrieved
in runtime by series of rte_flow_validate() trials.
- 2, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The META item is 32 bits wide, the MARK
item width depends on kernel and firmware configurations and
might be 0, 16 or 24 bits. The actual supported width can be
retrieved in runtime by series of rte_flow_validate() trials.
If there is no E-Switch configuration the ``dv_xmeta_en`` parameter is
ignored and the device is configured to operate in legacy mode (0).
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2019-11-07 17:09:54 +00:00
|
|
|
} else if (strcmp(MLX5_DV_XMETA_EN, key) == 0) {
|
|
|
|
if (tmp != MLX5_XMETA_MODE_LEGACY &&
|
|
|
|
tmp != MLX5_XMETA_MODE_META16 &&
|
2020-10-25 14:08:09 +00:00
|
|
|
tmp != MLX5_XMETA_MODE_META32 &&
|
|
|
|
tmp != MLX5_XMETA_MODE_MISS_INFO) {
|
2019-11-15 11:35:06 +00:00
|
|
|
DRV_LOG(ERR, "invalid extensive "
|
|
|
|
"metadata parameter");
|
net/mlx5: add devarg for extensive metadata support
The PMD parameter dv_xmeta_en is added to control extensive
metadata support. A nonzero value enables extensive flow
metadata support if device is capable and driver supports it.
This can enable extensive support of MARK and META item of
rte_flow. The newly introduced SET_TAG and SET_META actions
do not depend on dv_xmeta_en parameter, because there is
no compatibility issue for new entities. The dv_xmeta_en is
disabled by default.
There are some possible configurations, depending on parameter
value:
- 0, this is default value, defines the legacy mode, the MARK
and META related actions and items operate only within NIC Tx
and NIC Rx steering domains, no MARK and META information
crosses the domain boundaries. The MARK item is 24 bits wide,
the META item is 32 bits wide.
- 1, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The ``MARK`` item is 24 bits wide, the
META item width depends on kernel and firmware configurations
and might be 0, 16 or 32 bits. Within NIC Tx domain META data
width is 32 bits for compatibility, the actual width of data
transferred to the FDB domain depends on kernel configuration
and may be vary. The actual supported width can be retrieved
in runtime by series of rte_flow_validate() trials.
- 2, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The META item is 32 bits wide, the MARK
item width depends on kernel and firmware configurations and
might be 0, 16 or 24 bits. The actual supported width can be
retrieved in runtime by series of rte_flow_validate() trials.
If there is no E-Switch configuration the ``dv_xmeta_en`` parameter is
ignored and the device is configured to operate in legacy mode (0).
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2019-11-07 17:09:54 +00:00
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
2020-10-25 14:08:09 +00:00
|
|
|
if (tmp != MLX5_XMETA_MODE_MISS_INFO)
|
|
|
|
config->dv_xmeta_en = tmp;
|
|
|
|
else
|
|
|
|
config->dv_miss_info = 1;
|
2020-06-23 08:41:07 +00:00
|
|
|
} else if (strcmp(MLX5_LACP_BY_USER, key) == 0) {
|
|
|
|
config->lacp_by_user = !!tmp;
|
2019-04-01 21:17:54 +00:00
|
|
|
} else if (strcmp(MLX5_MR_EXT_MEMSEG_EN, key) == 0) {
|
|
|
|
config->mr_ext_memseg_en = !!tmp;
|
2019-05-30 10:20:32 +00:00
|
|
|
} else if (strcmp(MLX5_MAX_DUMP_FILES_NUM, key) == 0) {
|
|
|
|
config->max_dump_files_num = tmp;
|
2019-07-22 14:51:59 +00:00
|
|
|
} else if (strcmp(MLX5_LRO_TIMEOUT_USEC, key) == 0) {
|
|
|
|
config->lro.timeout = tmp;
|
2021-07-05 06:45:11 +00:00
|
|
|
} else if (strcmp(RTE_DEVARGS_KEY_CLASS, key) == 0) {
|
2020-01-29 12:38:46 +00:00
|
|
|
DRV_LOG(DEBUG, "class argument is %s.", val);
|
2020-03-24 12:59:01 +00:00
|
|
|
} else if (strcmp(MLX5_HP_BUF_SIZE, key) == 0) {
|
|
|
|
config->log_hp_size = tmp;
|
net/mlx5: add reclaim memory mode
Currently, when flow destroyed, some memory resources may still be kept
as cached to help next time create flow more efficiently.
Some system may need the resources to be more flexible with flow create
and destroy. After peak time, with millions of flows destroyed, the
system would prefer the resources to be reclaimed completely, no cache
is needed. Then the resources can be allocated and used by other
components. The system is not so sensitive about the flow insertion
rate, but more care about the resources.
Both DPDK mlx5 PMD driver and the low level component rdma-core have
provided the flow resources to be configured cached or not, but there is
no APIs or parameters exposed to user to configure the flow resources
cache mode. In this case, introduce a new PMD devarg to let user
configure the flow resources cache mode will be helpful.
This commit is to add a new "reclaim_mem_mode" to help user configure if
the destroyed flows' cache resources should be kept or not.
Their will be three mode can be chosen:
1. 0(none). It means the flow resources will be cached as usual. The
resources will be cached, helpful with flow insertion rate.
2. 1(light). It will only enable the DPDK PMD level resources reclaim.
3. 2(aggressive). Both DPDK PMD level and rdma-core low level will be
configured as reclaimed mode.
With these three mode, user can configure the resources cache mode with
different levels.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
2020-06-01 06:09:43 +00:00
|
|
|
} else if (strcmp(MLX5_RECLAIM_MEM, key) == 0) {
|
|
|
|
if (tmp != MLX5_RCM_NONE &&
|
|
|
|
tmp != MLX5_RCM_LIGHT &&
|
|
|
|
tmp != MLX5_RCM_AGGR) {
|
|
|
|
DRV_LOG(ERR, "Unrecognize %s: \"%s\"", key, val);
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
|
|
|
config->reclaim_mode = tmp;
|
net/mlx5: add option to allocate memory from system
Currently, for MLX5 PMD, once millions of flows created, the memory
consumption of the flows are also very huge. For the system with limited
memory, it means the system need to reserve most of the memory as huge
page memory to serve the flows in advance. And other normal applications
will have no chance to use this reserved memory any more. While most of
the time, the system will not have lots of flows, the reserved huge
page memory becomes a bit waste of memory at most of the time.
By the new sys_mem_en devarg, once set it to be true, it allows the PMD
allocate the memory from system by default with the new add mlx5 memory
management functions. Only once the MLX5_MEM_RTE flag is set, the memory
will be allocate from rte, otherwise, it allocates memory from system.
So in this case, the system with limited memory no need to reserve most
of the memory for hugepage. Only some needed memory for datapath objects
will be enough to allocated with explicitly flag. Other memory will be
allocated from system. For system with enough memory, no need to care
about the devarg, the memory will always be from rte hugepage.
One restriction is that for DPDK application with multiple PCI devices,
if the sys_mem_en devargs are different between the devices, the
sys_mem_en only gets the value from the first device devargs, and print
out a message to warn that.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2020-06-28 03:41:57 +00:00
|
|
|
} else if (strcmp(MLX5_SYS_MEM_EN, key) == 0) {
|
|
|
|
config->sys_mem_en = !!tmp;
|
2020-07-15 13:10:21 +00:00
|
|
|
} else if (strcmp(MLX5_DECAP_EN, key) == 0) {
|
|
|
|
config->decap_en = !!tmp;
|
2021-07-06 08:12:27 +00:00
|
|
|
} else if (strcmp(MLX5_ALLOW_DUPLICATE_PATTERN, key) == 0) {
|
|
|
|
config->allow_duplicate_pattern = !!tmp;
|
2016-06-24 13:17:54 +00:00
|
|
|
} else {
|
2018-03-13 09:23:56 +00:00
|
|
|
DRV_LOG(WARNING, "%s: unknown parameter", key);
|
2018-03-05 12:21:06 +00:00
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
2016-06-24 13:17:54 +00:00
|
|
|
}
|
|
|
|
return 0;
|
2016-06-24 13:17:50 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Parse device parameters.
|
|
|
|
*
|
2018-01-10 09:16:58 +00:00
|
|
|
* @param config
|
|
|
|
* Pointer to device configuration structure.
|
2016-06-24 13:17:50 +00:00
|
|
|
* @param devargs
|
|
|
|
* Device arguments structure.
|
|
|
|
*
|
|
|
|
* @return
|
2018-03-05 12:21:06 +00:00
|
|
|
* 0 on success, a negative errno value otherwise and rte_errno is set.
|
2016-06-24 13:17:50 +00:00
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
int
|
2018-01-10 09:16:58 +00:00
|
|
|
mlx5_args(struct mlx5_dev_config *config, struct rte_devargs *devargs)
|
2016-06-24 13:17:50 +00:00
|
|
|
{
|
|
|
|
const char **params = (const char *[]){
|
2016-06-24 13:17:54 +00:00
|
|
|
MLX5_RXQ_CQE_COMP_EN,
|
2019-01-15 17:38:58 +00:00
|
|
|
MLX5_RXQ_PKT_PAD_EN,
|
2018-05-09 11:13:50 +00:00
|
|
|
MLX5_RX_MPRQ_EN,
|
|
|
|
MLX5_RX_MPRQ_LOG_STRIDE_NUM,
|
2020-04-09 22:23:51 +00:00
|
|
|
MLX5_RX_MPRQ_LOG_STRIDE_SIZE,
|
2018-05-09 11:13:50 +00:00
|
|
|
MLX5_RX_MPRQ_MAX_MEMCPY_LEN,
|
|
|
|
MLX5_RXQS_MIN_MPRQ,
|
2016-06-24 13:17:56 +00:00
|
|
|
MLX5_TXQ_INLINE,
|
2019-07-21 14:24:54 +00:00
|
|
|
MLX5_TXQ_INLINE_MIN,
|
|
|
|
MLX5_TXQ_INLINE_MAX,
|
|
|
|
MLX5_TXQ_INLINE_MPW,
|
2016-06-24 13:17:56 +00:00
|
|
|
MLX5_TXQS_MIN_INLINE,
|
2018-11-01 17:20:32 +00:00
|
|
|
MLX5_TXQS_MAX_VEC,
|
2016-06-24 13:17:57 +00:00
|
|
|
MLX5_TXQ_MPW_EN,
|
2017-03-15 23:55:44 +00:00
|
|
|
MLX5_TXQ_MPW_HDR_DSEG_EN,
|
|
|
|
MLX5_TXQ_MAX_INLINE_LEN,
|
2019-11-08 15:07:50 +00:00
|
|
|
MLX5_TX_DB_NC,
|
2020-07-16 08:23:05 +00:00
|
|
|
MLX5_TX_PP,
|
|
|
|
MLX5_TX_SKEW,
|
2017-08-02 15:32:56 +00:00
|
|
|
MLX5_TX_VEC_EN,
|
|
|
|
MLX5_RX_VEC_EN,
|
2018-04-23 12:33:02 +00:00
|
|
|
MLX5_L3_VXLAN_EN,
|
2018-04-05 15:07:21 +00:00
|
|
|
MLX5_VF_NL_EN,
|
2019-04-18 13:16:01 +00:00
|
|
|
MLX5_DV_ESW_EN,
|
2018-09-24 23:17:54 +00:00
|
|
|
MLX5_DV_FLOW_EN,
|
net/mlx5: add devarg for extensive metadata support
The PMD parameter dv_xmeta_en is added to control extensive
metadata support. A nonzero value enables extensive flow
metadata support if device is capable and driver supports it.
This can enable extensive support of MARK and META item of
rte_flow. The newly introduced SET_TAG and SET_META actions
do not depend on dv_xmeta_en parameter, because there is
no compatibility issue for new entities. The dv_xmeta_en is
disabled by default.
There are some possible configurations, depending on parameter
value:
- 0, this is default value, defines the legacy mode, the MARK
and META related actions and items operate only within NIC Tx
and NIC Rx steering domains, no MARK and META information
crosses the domain boundaries. The MARK item is 24 bits wide,
the META item is 32 bits wide.
- 1, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The ``MARK`` item is 24 bits wide, the
META item width depends on kernel and firmware configurations
and might be 0, 16 or 32 bits. Within NIC Tx domain META data
width is 32 bits for compatibility, the actual width of data
transferred to the FDB domain depends on kernel configuration
and may be vary. The actual supported width can be retrieved
in runtime by series of rte_flow_validate() trials.
- 2, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The META item is 32 bits wide, the MARK
item width depends on kernel and firmware configurations and
might be 0, 16 or 24 bits. The actual supported width can be
retrieved in runtime by series of rte_flow_validate() trials.
If there is no E-Switch configuration the ``dv_xmeta_en`` parameter is
ignored and the device is configured to operate in legacy mode (0).
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2019-11-07 17:09:54 +00:00
|
|
|
MLX5_DV_XMETA_EN,
|
2020-06-23 08:41:07 +00:00
|
|
|
MLX5_LACP_BY_USER,
|
2019-04-01 21:17:54 +00:00
|
|
|
MLX5_MR_EXT_MEMSEG_EN,
|
2018-07-10 16:04:58 +00:00
|
|
|
MLX5_REPRESENTOR,
|
2019-05-30 10:20:32 +00:00
|
|
|
MLX5_MAX_DUMP_FILES_NUM,
|
2019-07-22 14:51:59 +00:00
|
|
|
MLX5_LRO_TIMEOUT_USEC,
|
2021-07-05 06:45:11 +00:00
|
|
|
RTE_DEVARGS_KEY_CLASS,
|
2020-03-24 12:59:01 +00:00
|
|
|
MLX5_HP_BUF_SIZE,
|
net/mlx5: add reclaim memory mode
Currently, when flow destroyed, some memory resources may still be kept
as cached to help next time create flow more efficiently.
Some system may need the resources to be more flexible with flow create
and destroy. After peak time, with millions of flows destroyed, the
system would prefer the resources to be reclaimed completely, no cache
is needed. Then the resources can be allocated and used by other
components. The system is not so sensitive about the flow insertion
rate, but more care about the resources.
Both DPDK mlx5 PMD driver and the low level component rdma-core have
provided the flow resources to be configured cached or not, but there is
no APIs or parameters exposed to user to configure the flow resources
cache mode. In this case, introduce a new PMD devarg to let user
configure the flow resources cache mode will be helpful.
This commit is to add a new "reclaim_mem_mode" to help user configure if
the destroyed flows' cache resources should be kept or not.
Their will be three mode can be chosen:
1. 0(none). It means the flow resources will be cached as usual. The
resources will be cached, helpful with flow insertion rate.
2. 1(light). It will only enable the DPDK PMD level resources reclaim.
3. 2(aggressive). Both DPDK PMD level and rdma-core low level will be
configured as reclaimed mode.
With these three mode, user can configure the resources cache mode with
different levels.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
2020-06-01 06:09:43 +00:00
|
|
|
MLX5_RECLAIM_MEM,
|
net/mlx5: add option to allocate memory from system
Currently, for MLX5 PMD, once millions of flows created, the memory
consumption of the flows are also very huge. For the system with limited
memory, it means the system need to reserve most of the memory as huge
page memory to serve the flows in advance. And other normal applications
will have no chance to use this reserved memory any more. While most of
the time, the system will not have lots of flows, the reserved huge
page memory becomes a bit waste of memory at most of the time.
By the new sys_mem_en devarg, once set it to be true, it allows the PMD
allocate the memory from system by default with the new add mlx5 memory
management functions. Only once the MLX5_MEM_RTE flag is set, the memory
will be allocate from rte, otherwise, it allocates memory from system.
So in this case, the system with limited memory no need to reserve most
of the memory for hugepage. Only some needed memory for datapath objects
will be enough to allocated with explicitly flag. Other memory will be
allocated from system. For system with enough memory, no need to care
about the devarg, the memory will always be from rte hugepage.
One restriction is that for DPDK application with multiple PCI devices,
if the sys_mem_en devargs are different between the devices, the
sys_mem_en only gets the value from the first device devargs, and print
out a message to warn that.
Signed-off-by: Suanming Mou <suanmingm@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2020-06-28 03:41:57 +00:00
|
|
|
MLX5_SYS_MEM_EN,
|
2020-07-15 13:10:21 +00:00
|
|
|
MLX5_DECAP_EN,
|
2021-07-06 08:12:27 +00:00
|
|
|
MLX5_ALLOW_DUPLICATE_PATTERN,
|
2016-06-24 13:17:50 +00:00
|
|
|
NULL,
|
|
|
|
};
|
|
|
|
struct rte_kvargs *kvlist;
|
|
|
|
int ret = 0;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
if (devargs == NULL)
|
|
|
|
return 0;
|
|
|
|
/* Following UGLY cast is done to pass checkpatch. */
|
|
|
|
kvlist = rte_kvargs_parse(devargs->args, params);
|
2019-05-30 10:20:33 +00:00
|
|
|
if (kvlist == NULL) {
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return -rte_errno;
|
|
|
|
}
|
2016-06-24 13:17:50 +00:00
|
|
|
/* Process parameters. */
|
|
|
|
for (i = 0; (params[i] != NULL); ++i) {
|
|
|
|
if (rte_kvargs_count(kvlist, params[i])) {
|
|
|
|
ret = rte_kvargs_process(kvlist, params[i],
|
2018-01-10 09:16:58 +00:00
|
|
|
mlx5_args_check, config);
|
2018-03-05 12:21:06 +00:00
|
|
|
if (ret) {
|
|
|
|
rte_errno = EINVAL;
|
2017-01-22 08:24:47 +00:00
|
|
|
rte_kvargs_free(kvlist);
|
2018-03-05 12:21:06 +00:00
|
|
|
return -rte_errno;
|
2017-01-22 08:24:47 +00:00
|
|
|
}
|
2016-06-24 13:17:50 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
rte_kvargs_free(kvlist);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2019-07-21 14:24:57 +00:00
|
|
|
/**
|
|
|
|
* Configures the minimal amount of data to inline into WQE
|
|
|
|
* while sending packets.
|
|
|
|
*
|
|
|
|
* - the txq_inline_min has the maximal priority, if this
|
|
|
|
* key is specified in devargs
|
|
|
|
* - if DevX is enabled the inline mode is queried from the
|
|
|
|
* device (HCA attributes and NIC vport context if needed).
|
2020-02-24 19:52:14 +00:00
|
|
|
* - otherwise L2 mode (18 bytes) is assumed for ConnectX-4/4 Lx
|
2019-07-21 14:24:57 +00:00
|
|
|
* and none (0 bytes) for other NICs
|
|
|
|
*
|
|
|
|
* @param spawn
|
|
|
|
* Verbs device parameters (name, port, switch_info) to spawn.
|
|
|
|
* @param config
|
|
|
|
* Device configuration parameters.
|
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
void
|
2019-07-21 14:24:57 +00:00
|
|
|
mlx5_set_min_inline(struct mlx5_dev_spawn_data *spawn,
|
|
|
|
struct mlx5_dev_config *config)
|
|
|
|
{
|
|
|
|
if (config->txq_inline_min != MLX5_ARG_UNSET) {
|
|
|
|
/* Application defines size of inlined data explicitly. */
|
|
|
|
switch (spawn->pci_dev->id.device_id) {
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
|
|
|
|
if (config->txq_inline_min <
|
|
|
|
(int)MLX5_INLINE_HSIZE_L2) {
|
|
|
|
DRV_LOG(DEBUG,
|
|
|
|
"txq_inline_mix aligned to minimal"
|
|
|
|
" ConnectX-4 required value %d",
|
|
|
|
(int)MLX5_INLINE_HSIZE_L2);
|
|
|
|
config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
if (config->hca_attr.eth_net_offloads) {
|
|
|
|
/* We have DevX enabled, inline mode queried successfully. */
|
|
|
|
switch (config->hca_attr.wqe_inline_mode) {
|
|
|
|
case MLX5_CAP_INLINE_MODE_L2:
|
|
|
|
/* outer L2 header must be inlined. */
|
|
|
|
config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_CAP_INLINE_MODE_NOT_REQUIRED:
|
|
|
|
/* No inline data are required by NIC. */
|
|
|
|
config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
|
|
|
|
config->hw_vlan_insert =
|
|
|
|
config->hca_attr.wqe_vlan_insert;
|
|
|
|
DRV_LOG(DEBUG, "Tx VLAN insertion is supported");
|
|
|
|
goto exit;
|
|
|
|
case MLX5_CAP_INLINE_MODE_VPORT_CONTEXT:
|
|
|
|
/* inline mode is defined by NIC vport context. */
|
|
|
|
if (!config->hca_attr.eth_virt)
|
|
|
|
break;
|
|
|
|
switch (config->hca_attr.vport_inline_mode) {
|
|
|
|
case MLX5_INLINE_MODE_NONE:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_NONE;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_INLINE_MODE_L2:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_L2;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_INLINE_MODE_IP:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_L3;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_INLINE_MODE_TCP_UDP:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_L4;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_INLINE_MODE_INNER_L2:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_INNER_L2;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_INLINE_MODE_INNER_IP:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_INNER_L3;
|
|
|
|
goto exit;
|
|
|
|
case MLX5_INLINE_MODE_INNER_TCP_UDP:
|
|
|
|
config->txq_inline_min =
|
|
|
|
MLX5_INLINE_HSIZE_INNER_L4;
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* We get here if we are unable to deduce
|
|
|
|
* inline data size with DevX. Try PCI ID
|
|
|
|
* to determine old NICs.
|
|
|
|
*/
|
|
|
|
switch (spawn->pci_dev->id.device_id) {
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX4LX:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF:
|
2019-08-05 13:03:49 +00:00
|
|
|
config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
|
2019-07-21 14:24:57 +00:00
|
|
|
config->hw_vlan_insert = 0;
|
|
|
|
break;
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX5:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX5VF:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX5EX:
|
|
|
|
case PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF:
|
|
|
|
/*
|
|
|
|
* These NICs support VLAN insertion from WQE and
|
|
|
|
* report the wqe_vlan_insert flag. But there is the bug
|
|
|
|
* and PFC control may be broken, so disable feature.
|
|
|
|
*/
|
|
|
|
config->hw_vlan_insert = 0;
|
2019-07-31 22:41:11 +00:00
|
|
|
config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
|
2019-07-21 14:24:57 +00:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
exit:
|
|
|
|
DRV_LOG(DEBUG, "min tx inline configured: %d", config->txq_inline_min);
|
|
|
|
}
|
|
|
|
|
2019-11-07 17:09:55 +00:00
|
|
|
/**
|
|
|
|
* Configures the metadata mask fields in the shared context.
|
|
|
|
*
|
|
|
|
* @param [in] dev
|
|
|
|
* Pointer to Ethernet device.
|
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
void
|
2019-11-07 17:09:55 +00:00
|
|
|
mlx5_set_metadata_mask(struct rte_eth_dev *dev)
|
|
|
|
{
|
|
|
|
struct mlx5_priv *priv = dev->data->dev_private;
|
2020-06-03 15:05:55 +00:00
|
|
|
struct mlx5_dev_ctx_shared *sh = priv->sh;
|
2019-11-07 17:09:55 +00:00
|
|
|
uint32_t meta, mark, reg_c0;
|
|
|
|
|
|
|
|
reg_c0 = ~priv->vport_meta_mask;
|
|
|
|
switch (priv->config.dv_xmeta_en) {
|
|
|
|
case MLX5_XMETA_MODE_LEGACY:
|
|
|
|
meta = UINT32_MAX;
|
|
|
|
mark = MLX5_FLOW_MARK_MASK;
|
|
|
|
break;
|
|
|
|
case MLX5_XMETA_MODE_META16:
|
|
|
|
meta = reg_c0 >> rte_bsf32(reg_c0);
|
|
|
|
mark = MLX5_FLOW_MARK_MASK;
|
|
|
|
break;
|
|
|
|
case MLX5_XMETA_MODE_META32:
|
|
|
|
meta = UINT32_MAX;
|
|
|
|
mark = (reg_c0 >> rte_bsf32(reg_c0)) & MLX5_FLOW_MARK_MASK;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
meta = 0;
|
|
|
|
mark = 0;
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(false);
|
2019-11-07 17:09:55 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (sh->dv_mark_mask && sh->dv_mark_mask != mark)
|
|
|
|
DRV_LOG(WARNING, "metadata MARK mask mismatche %08X:%08X",
|
|
|
|
sh->dv_mark_mask, mark);
|
|
|
|
else
|
|
|
|
sh->dv_mark_mask = mark;
|
|
|
|
if (sh->dv_meta_mask && sh->dv_meta_mask != meta)
|
|
|
|
DRV_LOG(WARNING, "metadata META mask mismatche %08X:%08X",
|
|
|
|
sh->dv_meta_mask, meta);
|
|
|
|
else
|
|
|
|
sh->dv_meta_mask = meta;
|
|
|
|
if (sh->dv_regc0_mask && sh->dv_regc0_mask != reg_c0)
|
|
|
|
DRV_LOG(WARNING, "metadata reg_c0 mask mismatche %08X:%08X",
|
|
|
|
sh->dv_meta_mask, reg_c0);
|
|
|
|
else
|
|
|
|
sh->dv_regc0_mask = reg_c0;
|
|
|
|
DRV_LOG(DEBUG, "metadata mode %u", priv->config.dv_xmeta_en);
|
|
|
|
DRV_LOG(DEBUG, "metadata MARK mask %08X", sh->dv_mark_mask);
|
|
|
|
DRV_LOG(DEBUG, "metadata META mask %08X", sh->dv_meta_mask);
|
|
|
|
DRV_LOG(DEBUG, "metadata reg_c0 mask %08X", sh->dv_regc0_mask);
|
|
|
|
}
|
|
|
|
|
2020-01-29 12:21:06 +00:00
|
|
|
int
|
|
|
|
rte_pmd_mlx5_get_dyn_flag_names(char *names[], unsigned int n)
|
|
|
|
{
|
|
|
|
static const char *const dynf_names[] = {
|
|
|
|
RTE_PMD_MLX5_FINE_GRANULARITY_INLINE,
|
2020-07-16 08:23:05 +00:00
|
|
|
RTE_MBUF_DYNFLAG_METADATA_NAME,
|
|
|
|
RTE_MBUF_DYNFLAG_TX_TIMESTAMP_NAME
|
2020-01-29 12:21:06 +00:00
|
|
|
};
|
|
|
|
unsigned int i;
|
|
|
|
|
|
|
|
if (n < RTE_DIM(dynf_names))
|
|
|
|
return -ENOMEM;
|
|
|
|
for (i = 0; i < RTE_DIM(dynf_names); i++) {
|
|
|
|
if (names[i] == NULL)
|
|
|
|
return -EINVAL;
|
|
|
|
strcpy(names[i], dynf_names[i]);
|
|
|
|
}
|
|
|
|
return RTE_DIM(dynf_names);
|
|
|
|
}
|
|
|
|
|
2019-09-25 07:53:35 +00:00
|
|
|
/**
|
2020-06-03 15:06:00 +00:00
|
|
|
* Comparison callback to sort device data.
|
2019-09-25 07:53:35 +00:00
|
|
|
*
|
2020-06-03 15:06:00 +00:00
|
|
|
* This is meant to be used with qsort().
|
2019-09-25 07:53:35 +00:00
|
|
|
*
|
2020-06-03 15:06:00 +00:00
|
|
|
* @param a[in]
|
|
|
|
* Pointer to pointer to first data object.
|
|
|
|
* @param b[in]
|
|
|
|
* Pointer to pointer to second data object.
|
2019-09-25 07:53:35 +00:00
|
|
|
*
|
|
|
|
* @return
|
2020-06-03 15:06:00 +00:00
|
|
|
* 0 if both objects are equal, less than 0 if the first argument is less
|
|
|
|
* than the second, greater than 0 otherwise.
|
2019-09-25 07:53:35 +00:00
|
|
|
*/
|
2020-06-03 15:06:00 +00:00
|
|
|
int
|
2019-09-25 07:53:35 +00:00
|
|
|
mlx5_dev_check_sibling_config(struct mlx5_priv *priv,
|
|
|
|
struct mlx5_dev_config *config)
|
|
|
|
{
|
2020-06-03 15:05:55 +00:00
|
|
|
struct mlx5_dev_ctx_shared *sh = priv->sh;
|
2019-09-25 07:53:35 +00:00
|
|
|
struct mlx5_dev_config *sh_conf = NULL;
|
|
|
|
uint16_t port_id;
|
|
|
|
|
2020-01-30 16:14:40 +00:00
|
|
|
MLX5_ASSERT(sh);
|
2019-09-25 07:53:35 +00:00
|
|
|
/* Nothing to compare for the single/first device. */
|
|
|
|
if (sh->refcnt == 1)
|
|
|
|
return 0;
|
|
|
|
/* Find the device with shared context. */
|
2019-10-07 13:56:19 +00:00
|
|
|
MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
|
2019-09-25 07:53:35 +00:00
|
|
|
struct mlx5_priv *opriv =
|
|
|
|
rte_eth_devices[port_id].data->dev_private;
|
|
|
|
|
|
|
|
if (opriv && opriv != priv && opriv->sh == sh) {
|
|
|
|
sh_conf = &opriv->config;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (!sh_conf)
|
|
|
|
return 0;
|
|
|
|
if (sh_conf->dv_flow_en ^ config->dv_flow_en) {
|
|
|
|
DRV_LOG(ERR, "\"dv_flow_en\" configuration mismatch"
|
|
|
|
" for shared %s context", sh->ibdev_name);
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return rte_errno;
|
|
|
|
}
|
net/mlx5: add devarg for extensive metadata support
The PMD parameter dv_xmeta_en is added to control extensive
metadata support. A nonzero value enables extensive flow
metadata support if device is capable and driver supports it.
This can enable extensive support of MARK and META item of
rte_flow. The newly introduced SET_TAG and SET_META actions
do not depend on dv_xmeta_en parameter, because there is
no compatibility issue for new entities. The dv_xmeta_en is
disabled by default.
There are some possible configurations, depending on parameter
value:
- 0, this is default value, defines the legacy mode, the MARK
and META related actions and items operate only within NIC Tx
and NIC Rx steering domains, no MARK and META information
crosses the domain boundaries. The MARK item is 24 bits wide,
the META item is 32 bits wide.
- 1, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The ``MARK`` item is 24 bits wide, the
META item width depends on kernel and firmware configurations
and might be 0, 16 or 32 bits. Within NIC Tx domain META data
width is 32 bits for compatibility, the actual width of data
transferred to the FDB domain depends on kernel configuration
and may be vary. The actual supported width can be retrieved
in runtime by series of rte_flow_validate() trials.
- 2, this engages extensive metadata mode, the MARK and META
related actions and items operate within all supported steering
domains, including FDB, MARK and META information may cross
the domain boundaries. The META item is 32 bits wide, the MARK
item width depends on kernel and firmware configurations and
might be 0, 16 or 24 bits. The actual supported width can be
retrieved in runtime by series of rte_flow_validate() trials.
If there is no E-Switch configuration the ``dv_xmeta_en`` parameter is
ignored and the device is configured to operate in legacy mode (0).
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Matan Azrad <matan@mellanox.com>
2019-11-07 17:09:54 +00:00
|
|
|
if (sh_conf->dv_xmeta_en ^ config->dv_xmeta_en) {
|
|
|
|
DRV_LOG(ERR, "\"dv_xmeta_en\" configuration mismatch"
|
|
|
|
" for shared %s context", sh->ibdev_name);
|
|
|
|
rte_errno = EINVAL;
|
|
|
|
return rte_errno;
|
|
|
|
}
|
2019-09-25 07:53:35 +00:00
|
|
|
return 0;
|
|
|
|
}
|
2015-10-30 18:52:30 +00:00
|
|
|
|
2019-10-07 13:56:19 +00:00
|
|
|
/**
|
|
|
|
* Look for the ethernet device belonging to mlx5 driver.
|
|
|
|
*
|
|
|
|
* @param[in] port_id
|
|
|
|
* port_id to start looking for device.
|
|
|
|
* @param[in] pci_dev
|
|
|
|
* Pointer to the hint PCI device. When device is being probed
|
|
|
|
* the its siblings (master and preceding representors might
|
2020-06-03 15:06:00 +00:00
|
|
|
* not have assigned driver yet (because the mlx5_os_pci_probe()
|
2019-10-07 13:56:19 +00:00
|
|
|
* is not completed yet, for this case match on hint PCI
|
|
|
|
* device may be used to detect sibling device.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* port_id of found device, RTE_MAX_ETHPORT if not found.
|
|
|
|
*/
|
2019-09-25 07:53:33 +00:00
|
|
|
uint16_t
|
2019-10-07 13:56:19 +00:00
|
|
|
mlx5_eth_find_next(uint16_t port_id, struct rte_pci_device *pci_dev)
|
2019-09-25 07:53:33 +00:00
|
|
|
{
|
|
|
|
while (port_id < RTE_MAX_ETHPORTS) {
|
|
|
|
struct rte_eth_dev *dev = &rte_eth_devices[port_id];
|
|
|
|
|
|
|
|
if (dev->state != RTE_ETH_DEV_UNUSED &&
|
|
|
|
dev->device &&
|
2019-10-07 13:56:19 +00:00
|
|
|
(dev->device == &pci_dev->device ||
|
|
|
|
(dev->device->driver &&
|
|
|
|
dev->device->driver->name &&
|
2021-03-15 21:05:55 +00:00
|
|
|
!strcmp(dev->device->driver->name, MLX5_PCI_DRIVER_NAME))))
|
2019-09-25 07:53:33 +00:00
|
|
|
break;
|
|
|
|
port_id++;
|
|
|
|
}
|
|
|
|
if (port_id >= RTE_MAX_ETHPORTS)
|
|
|
|
return RTE_MAX_ETHPORTS;
|
|
|
|
return port_id;
|
|
|
|
}
|
|
|
|
|
2018-10-23 18:26:05 +00:00
|
|
|
/**
|
|
|
|
* DPDK callback to remove a PCI device.
|
|
|
|
*
|
|
|
|
* This function removes all Ethernet devices belong to a given PCI device.
|
|
|
|
*
|
|
|
|
* @param[in] pci_dev
|
|
|
|
* Pointer to the PCI device.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* 0 on success, the function cannot fail.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
mlx5_pci_remove(struct rte_pci_device *pci_dev)
|
|
|
|
{
|
|
|
|
uint16_t port_id;
|
2020-10-16 13:32:59 +00:00
|
|
|
int ret = 0;
|
2018-10-23 18:26:05 +00:00
|
|
|
|
2020-05-28 06:59:49 +00:00
|
|
|
RTE_ETH_FOREACH_DEV_OF(port_id, &pci_dev->device) {
|
|
|
|
/*
|
|
|
|
* mlx5_dev_close() is not registered to secondary process,
|
|
|
|
* call the close function explicitly for secondary process.
|
|
|
|
*/
|
|
|
|
if (rte_eal_process_type() == RTE_PROC_SECONDARY)
|
2020-10-16 13:32:59 +00:00
|
|
|
ret |= mlx5_dev_close(&rte_eth_devices[port_id]);
|
2020-05-28 06:59:49 +00:00
|
|
|
else
|
2020-10-16 13:32:59 +00:00
|
|
|
ret |= rte_eth_dev_close(port_id);
|
2020-05-28 06:59:49 +00:00
|
|
|
}
|
2020-10-16 13:32:59 +00:00
|
|
|
return ret == 0 ? 0 : -EIO;
|
2018-10-23 18:26:05 +00:00
|
|
|
}
|
|
|
|
|
2015-10-30 18:52:30 +00:00
|
|
|
static const struct rte_pci_id mlx5_pci_id_map[] = {
|
|
|
|
{
|
2016-06-24 13:17:40 +00:00
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4)
|
2015-10-30 18:52:30 +00:00
|
|
|
},
|
|
|
|
{
|
2016-06-24 13:17:40 +00:00
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4VF)
|
2015-10-30 18:52:30 +00:00
|
|
|
},
|
|
|
|
{
|
2016-06-24 13:17:40 +00:00
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4LX)
|
2015-10-30 18:52:30 +00:00
|
|
|
},
|
|
|
|
{
|
2016-06-24 13:17:40 +00:00
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF)
|
2015-10-30 18:52:30 +00:00
|
|
|
},
|
2017-01-06 00:49:31 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5)
|
|
|
|
},
|
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5VF)
|
|
|
|
},
|
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5EX)
|
|
|
|
},
|
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF)
|
|
|
|
},
|
2018-05-15 06:12:50 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5BF)
|
|
|
|
},
|
2018-09-02 13:55:59 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5BFVF)
|
|
|
|
},
|
2018-12-31 12:43:48 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6)
|
|
|
|
},
|
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6VF)
|
|
|
|
},
|
2019-11-07 09:36:09 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6DX)
|
|
|
|
},
|
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
2020-11-19 08:06:10 +00:00
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTXVF)
|
2019-11-07 09:36:09 +00:00
|
|
|
},
|
2020-02-13 16:11:42 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6DXBF)
|
|
|
|
},
|
2020-07-08 09:14:04 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6LX)
|
|
|
|
},
|
2020-10-26 11:41:47 +00:00
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX7)
|
|
|
|
},
|
|
|
|
{
|
|
|
|
RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX7BF)
|
|
|
|
},
|
2015-10-30 18:52:30 +00:00
|
|
|
{
|
|
|
|
.vendor_id = 0
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2020-07-27 17:47:14 +00:00
|
|
|
static struct mlx5_pci_driver mlx5_driver = {
|
|
|
|
.driver_class = MLX5_CLASS_NET,
|
|
|
|
.pci_driver = {
|
|
|
|
.driver = {
|
2021-03-15 21:05:55 +00:00
|
|
|
.name = MLX5_PCI_DRIVER_NAME,
|
2020-07-27 17:47:14 +00:00
|
|
|
},
|
|
|
|
.id_table = mlx5_pci_id_map,
|
|
|
|
.probe = mlx5_os_pci_probe,
|
|
|
|
.remove = mlx5_pci_remove,
|
|
|
|
.dma_map = mlx5_dma_map,
|
|
|
|
.dma_unmap = mlx5_dma_unmap,
|
|
|
|
.drv_flags = PCI_DRV_FLAGS,
|
2015-10-30 18:52:30 +00:00
|
|
|
},
|
|
|
|
};
|
|
|
|
|
2020-07-01 12:33:35 +00:00
|
|
|
/* Initialize driver log type. */
|
log: register with standardized names
Let's try to enforce the convention where most drivers use a pmd. logtype
with their class reflected in it, and libraries use a lib. logtype.
Introduce two new macros:
- RTE_LOG_REGISTER_DEFAULT can be used when a single logtype is
used in a component. It is associated to the default name provided
by the build system,
- RTE_LOG_REGISTER_SUFFIX can be used when multiple logtypes are used,
and then the passed name is appended to the default name,
RTE_LOG_REGISTER is left untouched for existing external users
and for components that do not comply with the convention.
There is a new Meson variable log_prefix to adapt the default name
for baseband (pmd.bb.), bus (no pmd.) and mempool (no pmd.) classes.
Note: achieved with below commands + reverted change on net/bonding +
edits on crypto/virtio, compress/mlx5, regex/mlx5
$ git grep -l RTE_LOG_REGISTER drivers/ |
while read file; do
pattern=${file##drivers/};
class=${pattern%%/*};
pattern=${pattern#$class/};
drv=${pattern%%/*};
case "$class" in
baseband) pattern=pmd.bb.$drv;;
bus) pattern=bus.$drv;;
mempool) pattern=mempool.$drv;;
*) pattern=pmd.$class.$drv;;
esac
sed -i -e 's/RTE_LOG_REGISTER(\(.*\), '$pattern',/RTE_LOG_REGISTER_DEFAULT(\1,/' $file;
sed -i -e 's/RTE_LOG_REGISTER(\(.*\), '$pattern'\.\(.*\),/RTE_LOG_REGISTER_SUFFIX(\1, \2,/' $file;
done
$ git grep -l RTE_LOG_REGISTER lib/ |
while read file; do
pattern=${file##lib/};
pattern=lib.${pattern%%/*};
sed -i -e 's/RTE_LOG_REGISTER(\(.*\), '$pattern',/RTE_LOG_REGISTER_DEFAULT(\1,/' $file;
sed -i -e 's/RTE_LOG_REGISTER(\(.*\), '$pattern'\.\(.*\),/RTE_LOG_REGISTER_SUFFIX(\1, \2,/' $file;
done
Signed-off-by: David Marchand <david.marchand@redhat.com>
Signed-off-by: Thomas Monjalon <thomas@monjalon.net>
Acked-by: Bruce Richardson <bruce.richardson@intel.com>
2021-04-26 12:51:08 +00:00
|
|
|
RTE_LOG_REGISTER_DEFAULT(mlx5_logtype, NOTICE)
|
2020-07-01 12:33:35 +00:00
|
|
|
|
2015-10-30 18:52:30 +00:00
|
|
|
/**
|
|
|
|
* Driver initialization routine.
|
|
|
|
*/
|
2018-06-18 12:32:21 +00:00
|
|
|
RTE_INIT(rte_mlx5_pmd_init)
|
2015-10-30 18:52:30 +00:00
|
|
|
{
|
2020-12-28 12:32:59 +00:00
|
|
|
pthread_mutex_init(&mlx5_dev_ctx_list_mutex, NULL);
|
2020-07-27 17:47:11 +00:00
|
|
|
mlx5_common_init();
|
2018-04-08 12:41:20 +00:00
|
|
|
/* Build the static tables for Verbs conversion. */
|
2017-07-26 19:29:33 +00:00
|
|
|
mlx5_set_ptype_table();
|
2018-04-08 12:41:20 +00:00
|
|
|
mlx5_set_cksum_table();
|
|
|
|
mlx5_set_swp_types_table();
|
2020-01-29 12:38:27 +00:00
|
|
|
if (mlx5_glue)
|
2020-07-27 17:47:14 +00:00
|
|
|
mlx5_pci_driver_register(&mlx5_driver);
|
2015-10-30 18:52:30 +00:00
|
|
|
}
|
|
|
|
|
2016-10-10 05:43:15 +00:00
|
|
|
RTE_PMD_EXPORT_NAME(net_mlx5, __COUNTER__);
|
|
|
|
RTE_PMD_REGISTER_PCI_TABLE(net_mlx5, mlx5_pci_id_map);
|
2016-12-15 13:46:39 +00:00
|
|
|
RTE_PMD_REGISTER_KMOD_DEP(net_mlx5, "* ib_uverbs & mlx5_core & mlx5_ib");
|