2018-01-29 13:11:30 +00:00
|
|
|
/* SPDX-License-Identifier: BSD-3-Clause
|
|
|
|
* Copyright 2015 6WIND S.A.
|
2018-03-20 19:20:35 +00:00
|
|
|
* Copyright 2015 Mellanox Technologies, Ltd
|
2015-10-30 18:52:30 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef RTE_PMD_MLX5_H_
|
|
|
|
#define RTE_PMD_MLX5_H_
|
|
|
|
|
|
|
|
#include <stddef.h>
|
2019-07-05 13:10:30 +00:00
|
|
|
#include <stdbool.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
#include <stdint.h>
|
|
|
|
#include <limits.h>
|
|
|
|
#include <net/if.h>
|
|
|
|
#include <netinet/in.h>
|
2017-10-09 14:44:53 +00:00
|
|
|
#include <sys/queue.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
|
|
|
|
/* Verbs header. */
|
|
|
|
/* ISO C doesn't support unnamed structs/unions, disabling -pedantic. */
|
|
|
|
#ifdef PEDANTIC
|
2016-09-19 14:36:54 +00:00
|
|
|
#pragma GCC diagnostic ignored "-Wpedantic"
|
2015-10-30 18:52:30 +00:00
|
|
|
#endif
|
|
|
|
#include <infiniband/verbs.h>
|
|
|
|
#ifdef PEDANTIC
|
2016-09-19 14:36:54 +00:00
|
|
|
#pragma GCC diagnostic error "-Wpedantic"
|
2015-10-30 18:52:30 +00:00
|
|
|
#endif
|
|
|
|
|
2017-07-07 00:04:20 +00:00
|
|
|
#include <rte_pci.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
#include <rte_ether.h>
|
2018-01-22 00:16:22 +00:00
|
|
|
#include <rte_ethdev_driver.h>
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
#include <rte_rwlock.h>
|
2015-10-30 18:57:23 +00:00
|
|
|
#include <rte_interrupts.h>
|
2016-03-17 15:38:55 +00:00
|
|
|
#include <rte_errno.h>
|
2016-12-29 15:15:17 +00:00
|
|
|
#include <rte_flow.h>
|
2015-10-30 18:52:30 +00:00
|
|
|
|
|
|
|
#include "mlx5_utils.h"
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
#include "mlx5_mr.h"
|
2015-10-30 18:52:30 +00:00
|
|
|
#include "mlx5_autoconf.h"
|
|
|
|
#include "mlx5_defs.h"
|
2019-07-22 14:52:10 +00:00
|
|
|
#include "mlx5_glue.h"
|
2015-10-30 18:52:30 +00:00
|
|
|
|
|
|
|
/* PCI vendor identifier constant for Mellanox. */
enum {
|
|
|
|
PCI_VENDOR_ID_MELLANOX = 0x15b3,
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * PCI device identifiers of the Mellanox adapters named by each enumerator.
 * NOTE(review): the VF suffix presumably marks the virtual function variant
 * and BF the BlueField variant - confirm against the PCI ID table.
 */
enum {
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4 = 0x1013,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4VF = 0x1014,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4LX = 0x1015,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF = 0x1016,
|
2017-01-06 00:49:31 +00:00
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5 = 0x1017,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5VF = 0x1018,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5EX = 0x1019,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF = 0x101a,
|
2018-05-15 06:12:50 +00:00
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5BF = 0xa2d2,
|
2018-09-02 13:55:59 +00:00
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX5BFVF = 0xa2d3,
|
2018-12-31 12:43:48 +00:00
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6 = 0x101b,
|
|
|
|
PCI_DEVICE_ID_MELLANOX_CONNECTX6VF = 0x101c,
|
2015-10-30 18:52:30 +00:00
|
|
|
};
|
|
|
|
|
2019-04-01 21:12:54 +00:00
|
|
|
/*
 * Request types for IPC.
 *
 * Stored in the type field of struct mlx5_mp_param. Numbering starts at 1.
 */
|
|
|
|
enum mlx5_mp_req_type {
|
|
|
|
MLX5_MP_REQ_VERBS_CMD_FD = 1,
|
2019-04-01 21:17:55 +00:00
|
|
|
MLX5_MP_REQ_CREATE_MR, /* Uses args.addr of struct mlx5_mp_param. */
|
2019-04-01 21:12:56 +00:00
|
|
|
MLX5_MP_REQ_START_RXTX,
|
|
|
|
MLX5_MP_REQ_STOP_RXTX,
|
2019-05-30 10:20:38 +00:00
|
|
|
MLX5_MP_REQ_QUEUE_STATE_MODIFY, /* Uses args.state_modify. */
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Arguments of an MLX5_MP_REQ_QUEUE_STATE_MODIFY request; embedded in
 * struct mlx5_mp_param as args.state_modify.
 */
struct mlx5_mp_arg_queue_state_modify {
|
|
|
|
uint8_t is_wq; /* Set if WQ. */
|
|
|
|
uint16_t queue_id; /* DPDK queue ID. */
|
|
|
|
enum ibv_wq_state state; /* WQ requested state. */
|
2019-04-01 21:12:54 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Parameters for IPC.
 *
 * Which member of the args union is meaningful depends on the request type.
 */
|
|
|
|
struct mlx5_mp_param {
|
|
|
|
enum mlx5_mp_req_type type; /* Request type. */
|
|
|
|
int port_id; /* NOTE(review): presumably the port the request targets - confirm. */
|
|
|
|
int result; /* NOTE(review): presumably the outcome of the request - confirm. */
|
2019-04-01 21:17:55 +00:00
|
|
|
RTE_STD_C11
|
|
|
|
union {
|
|
|
|
uintptr_t addr; /* MLX5_MP_REQ_CREATE_MR */
|
2019-05-30 10:20:38 +00:00
|
|
|
struct mlx5_mp_arg_queue_state_modify state_modify;
|
|
|
|
/* MLX5_MP_REQ_QUEUE_STATE_MODIFY */
|
2019-04-01 21:17:55 +00:00
|
|
|
} args; /* Request-specific arguments. */
|
2019-04-01 21:12:54 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/** Request timeout for IPC. */
|
|
|
|
#define MLX5_MP_REQ_TIMEOUT_SEC 5
|
|
|
|
|
|
|
|
/** Key string for IPC. */
|
|
|
|
#define MLX5_MP_NAME "net_mlx5_mp"
|
|
|
|
|
net/mlx5: support PF representor
On BlueField platform we have the new entity - PF representor.
This one represents the PCI PF attached to external host on the
side of ARM. The traffic sent by the external host to the NIC
via PF will be seem by ARM on this PF representor.
This patch refactors port recognizing capability on the base of
physical port name. We have two groups of name formats. Legacy
name formats are supported by kernels before ver 5.0 (being
more precise - before the patch [1]) or before Mellanox OFED 4.6,
and new naming formats added by the patch [1].
Legacy naming formats are supported:
- missing physical port name (no sysfs/netlink key) at all,
master is assumed
- decimal digits (for example "12"), representor is assumed,
the value is the index of attached VF
New naming formats are supported:
- "p" followed by decimal digits, for example "p2", master
is assumed
- "pf" followed by PF index concatenated with "vf" followed by
VF index, for example "pf0vf1", representor is assumed.
If index of VF is "-1" it is a special case of host PF
representor, this representor must be indexed in devargs
as 65535, for example representor=[0-3,65535] will
allow representors for VF0, VF1, VF2, VF3 and for host PF.
Note: do not specify representor=[0-65535], it causes devargs
processing error, because number of ports (rte_eth_dev) is
limited.
Applications should distinguish representors and master devices
exclusively by device flag RTE_ETH_DEV_REPRESENTOR and do not
rely on switch port_id (mlx5 PMD deduces ones from representor_id)
values returned by dev_infos_get() API.
[1] https://www.spinics.net/lists/netdev/msg547007.html
Linux-tree: c12ecc23 (Or Gerlitz 2018-04-25 17:32 +0300)
"net/mlx5e: Move to use common phys port names for vport representors"
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Shahaf Shuler <shahafs@mellanox.com>
2019-04-16 14:10:28 +00:00
|
|
|
/*
 * Recognized Infiniband device physical port name types.
 *
 * Stored in the name_type field of struct mlx5_switch_info.
 */
|
|
|
|
enum mlx5_phys_port_name_type {
|
|
|
|
MLX5_PHYS_PORT_NAME_TYPE_NOTSET = 0, /* Not set. */
|
|
|
|
MLX5_PHYS_PORT_NAME_TYPE_LEGACY, /* Legacy format, kernel ver < 5.0 */
|
|
|
|
MLX5_PHYS_PORT_NAME_TYPE_UPLINK, /* p0, kernel ver >= 5.0 */
|
|
|
|
MLX5_PHYS_PORT_NAME_TYPE_PFVF, /* pf0vf0, kernel ver >= 5.0 */
|
|
|
|
MLX5_PHYS_PORT_NAME_TYPE_UNKNOWN, /* Unrecognized. */
|
|
|
|
};
|
|
|
|
|
2018-07-10 16:04:52 +00:00
|
|
|
/** Switch information returned by mlx5_nl_switch_info(). */
|
|
|
|
struct mlx5_switch_info {
|
|
|
|
uint32_t master:1; /**< Master device. */
|
|
|
|
uint32_t representor:1; /**< Representor device. */
|
net/mlx5: support PF representor
On BlueField platform we have the new entity - PF representor.
This one represents the PCI PF attached to external host on the
side of ARM. The traffic sent by the external host to the NIC
via PF will be seem by ARM on this PF representor.
This patch refactors port recognizing capability on the base of
physical port name. We have two groups of name formats. Legacy
name formats are supported by kernels before ver 5.0 (being
more precise - before the patch [1]) or before Mellanox OFED 4.6,
and new naming formats added by the patch [1].
Legacy naming formats are supported:
- missing physical port name (no sysfs/netlink key) at all,
master is assumed
- decimal digits (for example "12"), representor is assumed,
the value is the index of attached VF
New naming formats are supported:
- "p" followed by decimal digits, for example "p2", master
is assumed
- "pf" followed by PF index concatenated with "vf" followed by
VF index, for example "pf0vf1", representor is assumed.
If index of VF is "-1" it is a special case of host PF
representor, this representor must be indexed in devargs
as 65535, for example representor=[0-3,65535] will
allow representors for VF0, VF1, VF2, VF3 and for host PF.
Note: do not specify representor=[0-65535], it causes devargs
processing error, because number of ports (rte_eth_dev) is
limited.
Applications should distinguish representors and master devices
exclusively by device flag RTE_ETH_DEV_REPRESENTOR and do not
rely on switch port_id (mlx5 PMD deduces ones from representor_id)
values returned by dev_infos_get() API.
[1] https://www.spinics.net/lists/netdev/msg547007.html
Linux-tree: c12ecc23 (Or Gerlitz 2018-04-25 17:32 +0300)
"net/mlx5e: Move to use common phys port names for vport representors"
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Shahaf Shuler <shahafs@mellanox.com>
2019-04-16 14:10:28 +00:00
|
|
|
enum mlx5_phys_port_name_type name_type; /**< Port name type. */
|
|
|
|
int32_t pf_num; /**< PF number (valid for pfxvfx format only). */
|
2018-07-10 16:04:52 +00:00
|
|
|
int32_t port_name; /**< Representor port name. */
|
|
|
|
uint64_t switch_id; /**< Switch identifier. */
|
|
|
|
};
|
|
|
|
|
2019-04-27 04:32:57 +00:00
|
|
|
/* List head type (struct mlx5_dev_list) for struct mlx5_ibv_shared entries. */
LIST_HEAD(mlx5_dev_list, mlx5_ibv_shared);
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
|
2019-04-01 21:12:55 +00:00
|
|
|
/* Shared data between primary and secondary processes. */
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
/*
 * Field overview:
 * - lock, init_done and secondary_cnt are described inline.
 * - mem_event_cb_list is a struct mlx5_dev_list, i.e. a list head of
 *   struct mlx5_ibv_shared entries.
 * - mem_event_rwlock: NOTE(review) presumably protects mem_event_cb_list -
 *   confirm against its users.
 */
struct mlx5_shared_data {
|
2019-04-01 21:12:55 +00:00
|
|
|
rte_spinlock_t lock;
|
|
|
|
/* Global spinlock for primary and secondary processes. */
|
|
|
|
int init_done; /* Whether primary has done initialization. */
|
|
|
|
unsigned int secondary_cnt; /* Number of secondary processes init'd. */
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
struct mlx5_dev_list mem_event_cb_list;
|
|
|
|
rte_rwlock_t mem_event_rwlock;
|
|
|
|
};
|
|
|
|
|
2019-04-01 21:12:55 +00:00
|
|
|
/*
 * Per-process data structure, not visible to other processes.
 *
 * Currently holds a single initialization flag.
 */
|
|
|
|
struct mlx5_local_data {
|
|
|
|
int init_done; /* Whether a secondary has done initialization. */
|
|
|
|
};
|
|
|
|
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
/* Pointer to the struct mlx5_shared_data instance; defined outside this header. */
extern struct mlx5_shared_data *mlx5_shared_data;
|
|
|
|
|
2018-09-17 09:46:34 +00:00
|
|
|
/*
 * Description of one counter: its two names and whether it is an IB counter.
 * Used as the element type of mlx5_xstats_ctrl.info[].
 */
struct mlx5_counter_ctrl {
|
|
|
|
/* Name of the counter. */
|
|
|
|
char dpdk_name[RTE_ETH_XSTATS_NAME_SIZE];
|
|
|
|
/* Name of the counter on the device table. */
|
|
|
|
char ctr_name[RTE_ETH_XSTATS_NAME_SIZE];
|
|
|
|
uint32_t ib:1; /**< Nonzero for IB counters. */
|
|
|
|
};
|
|
|
|
|
2017-01-17 14:37:08 +00:00
|
|
|
/*
 * Extended statistics bookkeeping: two counts plus three arrays, each with
 * MLX5_MAX_XSTATS entries.
 */
struct mlx5_xstats_ctrl {
|
|
|
|
/* Number of device stats. */
|
|
|
|
uint16_t stats_n;
|
2018-09-17 09:46:34 +00:00
|
|
|
/* Number of device stats identified by PMD. */
|
|
|
|
uint16_t mlx5_stats_n;
|
2017-01-17 14:37:08 +00:00
|
|
|
/* Index in the device counters table. */
|
|
|
|
uint16_t dev_table_idx[MLX5_MAX_XSTATS];
|
|
|
|
/* NOTE(review): presumably per-counter baseline values - confirm. */
uint64_t base[MLX5_MAX_XSTATS];
|
2018-09-17 09:46:34 +00:00
|
|
|
/* Per-counter descriptors (names and IB flag). */
struct mlx5_counter_ctrl info[MLX5_MAX_XSTATS];
|
2017-01-17 14:37:08 +00:00
|
|
|
};
|
|
|
|
|
2018-11-23 08:03:37 +00:00
|
|
|
/* Statistics control data; currently only the imissed counter base. */
struct mlx5_stats_ctrl {
|
|
|
|
/* Base for imissed counter. */
|
|
|
|
uint64_t imissed_base;
|
|
|
|
};
|
|
|
|
|
2019-07-16 14:34:53 +00:00
|
|
|
/*
 * DevX creation object: pairs a struct mlx5dv_devx_obj pointer with an
 * integer object ID.
 */
|
|
|
|
struct mlx5_devx_obj {
|
|
|
|
struct mlx5dv_devx_obj *obj; /* The DV object. */
|
|
|
|
int id; /* The object ID. */
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Memory key (mkey) attributes.
 * NOTE(review): presumably the inputs of a DevX mkey creation call - confirm
 * against the function that consumes this structure.
 */
struct mlx5_devx_mkey_attr {
|
|
|
|
uint64_t addr; /* NOTE(review): presumably the region start address - confirm. */
|
|
|
|
uint64_t size; /* NOTE(review): presumably the region length - confirm. */
|
|
|
|
uint32_t umem_id; /* NOTE(review): presumably the user memory object ID - confirm. */
|
|
|
|
uint32_t pd; /* NOTE(review): presumably the protection domain number - confirm. */
|
2019-01-03 15:06:37 +00:00
|
|
|
};
|
|
|
|
|
2019-07-22 14:52:00 +00:00
|
|
|
/* HCA supports this number of time periods for LRO. */
|
|
|
|
#define MLX5_LRO_NUM_SUPP_PERIODS 4
|
|
|
|
|
2019-04-18 13:16:01 +00:00
|
|
|
/*
 * HCA attributes.
 *
 * Mostly narrow bit-fields; embedded in struct mlx5_dev_config as hca_attr.
 */
|
|
|
|
struct mlx5_hca_attr {
|
|
|
|
uint32_t eswitch_manager:1;
|
2019-07-16 14:34:56 +00:00
|
|
|
uint32_t flow_counters_dump:1;
|
2019-07-16 14:34:53 +00:00
|
|
|
uint8_t flow_counter_bulk_alloc_bitmap;
|
2019-07-21 14:24:56 +00:00
|
|
|
uint32_t eth_net_offloads:1;
|
|
|
|
uint32_t eth_virt:1;
|
|
|
|
uint32_t wqe_vlan_insert:1;
|
|
|
|
uint32_t wqe_inline_mode:2;
|
|
|
|
uint32_t vport_inline_mode:3;
|
2019-07-22 14:52:00 +00:00
|
|
|
/* LRO related attributes. */
uint32_t lro_cap:1;
|
|
|
|
uint32_t tunnel_lro_gre:1;
|
|
|
|
uint32_t tunnel_lro_vxlan:1;
|
|
|
|
uint32_t lro_max_msg_sz_mode:2;
|
|
|
|
/* One entry per LRO time period the HCA supports. */
uint32_t lro_timer_supported_periods[MLX5_LRO_NUM_SUPP_PERIODS];
|
2019-04-18 13:16:01 +00:00
|
|
|
};
|
|
|
|
|
2017-10-09 14:44:53 +00:00
|
|
|
/* Flow list: tail queue head type (struct mlx5_flows) of struct rte_flow. */
|
|
|
|
TAILQ_HEAD(mlx5_flows, rte_flow);
|
|
|
|
|
2018-01-10 09:16:58 +00:00
|
|
|
/* Default PMD specific parameter value. */
|
|
|
|
#define MLX5_ARG_UNSET (-1)
|
|
|
|
|
2019-07-22 14:51:59 +00:00
|
|
|
/*
 * Reads the config.lro.supported flag of the struct mlx5_priv reached through
 * (dev)->data->dev_private.
 */
#define MLX5_LRO_SUPPORTED(dev) \
|
|
|
|
(((struct mlx5_priv *)((dev)->data->dev_private))->config.lro.supported)
|
|
|
|
|
|
|
|
/*
 * LRO configuration structure.
 *
 * Embedded in struct mlx5_dev_config as lro; the supported flag is what
 * MLX5_LRO_SUPPORTED() reads.
 */
|
|
|
|
struct mlx5_lro_config {
|
|
|
|
uint32_t supported:1; /* Whether LRO is supported. */
|
|
|
|
uint32_t timeout; /* User configuration. */
|
|
|
|
};
|
|
|
|
|
2018-01-10 09:16:58 +00:00
|
|
|
/*
|
|
|
|
* Device configuration structure.
|
|
|
|
*
|
|
|
|
* Merged configuration from:
|
|
|
|
*
|
|
|
|
* - Device capabilities,
|
|
|
|
* - User device parameters disabled features.
|
|
|
|
*/
|
|
|
|
struct mlx5_dev_config {
|
|
|
|
/* Single-bit feature flags. */
unsigned int hw_csum:1; /* Checksum offload is supported. */
|
|
|
|
unsigned int hw_vlan_strip:1; /* VLAN stripping is supported. */
|
2019-07-21 14:24:57 +00:00
|
|
|
unsigned int hw_vlan_insert:1; /* VLAN insertion in WQE is supported. */
|
2018-01-10 09:16:58 +00:00
|
|
|
unsigned int hw_fcs_strip:1; /* FCS stripping is supported. */
|
|
|
|
unsigned int hw_padding:1; /* End alignment padding is supported. */
|
2018-04-05 15:07:19 +00:00
|
|
|
unsigned int vf:1; /* This is a VF. */
|
2018-02-25 07:28:37 +00:00
|
|
|
unsigned int tunnel_en:1;
|
|
|
|
/* Whether tunnel stateless offloads are supported. */
|
2018-05-15 11:07:14 +00:00
|
|
|
unsigned int mpls_en:1; /* MPLS over GRE/UDP is enabled. */
|
2018-01-10 09:16:58 +00:00
|
|
|
unsigned int cqe_comp:1; /* CQE compression is enabled. */
|
2018-10-25 06:24:00 +00:00
|
|
|
unsigned int cqe_pad:1; /* CQE padding is enabled. */
|
2018-01-10 09:17:00 +00:00
|
|
|
unsigned int tso:1; /* Whether TSO is supported. */
|
2018-01-10 09:16:58 +00:00
|
|
|
unsigned int rx_vec_en:1; /* Rx vector is enabled. */
|
2019-04-01 21:17:54 +00:00
|
|
|
unsigned int mr_ext_memseg_en:1;
|
|
|
|
/* Whether memseg should be extended for MR creation. */
|
2018-04-23 12:33:02 +00:00
|
|
|
unsigned int l3_vxlan_en:1; /* Enable L3 VXLAN flow creation. */
|
2018-04-05 15:07:21 +00:00
|
|
|
unsigned int vf_nl_en:1; /* Enable Netlink requests in VF mode. */
|
2019-04-18 13:16:01 +00:00
|
|
|
unsigned int dv_esw_en:1; /* Enable E-Switch DV flow. */
|
2018-09-24 23:17:54 +00:00
|
|
|
unsigned int dv_flow_en:1; /* Enable DV flow. */
|
2018-04-08 12:41:20 +00:00
|
|
|
unsigned int swp:1; /* Tx generic tunnel checksum and TSO offload. */
|
2019-01-03 15:06:37 +00:00
|
|
|
unsigned int devx:1; /* Whether devx interface is available or not. */
|
2019-07-22 14:52:02 +00:00
|
|
|
unsigned int dest_tir:1; /* Whether advanced DR API is available. */
|
2018-05-09 11:13:50 +00:00
|
|
|
struct {
|
|
|
|
unsigned int enabled:1; /* Whether MPRQ is enabled. */
|
|
|
|
/* NOTE(review): the _n suffix may denote a log2 value - confirm. */
unsigned int stride_num_n; /* Number of strides. */
|
|
|
|
unsigned int min_stride_size_n; /* Min size of a stride. */
|
|
|
|
unsigned int max_stride_size_n; /* Max size of a stride. */
|
|
|
|
unsigned int max_memcpy_len;
|
|
|
|
/* Maximum packet size to memcpy Rx packets. */
|
|
|
|
unsigned int min_rxqs_num;
|
|
|
|
/* Rx queue count threshold to enable MPRQ. */
|
|
|
|
} mprq; /* Configurations for Multi-Packet RQ. */
|
2018-08-13 06:47:57 +00:00
|
|
|
/* Scalar modes, limits and thresholds. */
int mps; /* Multi-packet send supported mode. */
|
2018-07-12 09:30:49 +00:00
|
|
|
unsigned int flow_prio; /* Number of flow priorities. */
|
2018-01-10 09:16:58 +00:00
|
|
|
unsigned int tso_max_payload_sz; /* Maximum TCP payload for TSO. */
|
|
|
|
unsigned int ind_table_max_size; /* Maximum indirection table size. */
|
2019-05-30 10:20:32 +00:00
|
|
|
unsigned int max_dump_files_num; /* Maximum dump files per queue. */
|
2018-01-10 09:16:58 +00:00
|
|
|
int txqs_inline; /* Queue number threshold for inlining. */
|
2019-07-21 14:24:54 +00:00
|
|
|
int txq_inline_min; /* Minimal amount of data bytes to inline. */
|
|
|
|
int txq_inline_max; /* Max packet size for inlining with SEND. */
|
|
|
|
int txq_inline_mpw; /* Max packet size for inlining with eMPW. */
|
2019-04-18 13:16:01 +00:00
|
|
|
/* Embedded sub-structures. */
struct mlx5_hca_attr hca_attr; /* HCA attributes. */
|
2019-07-22 14:51:59 +00:00
|
|
|
struct mlx5_lro_config lro; /* LRO configuration. */
|
2018-01-10 09:16:58 +00:00
|
|
|
};
|
|
|
|
|
2019-07-22 14:52:06 +00:00
|
|
|
/*
 * WQ attributes structure. Embedded by value as the wq_attr member of
 * struct mlx5_devx_create_rq_attr.
 * NOTE(review): per-field semantics are not visible in this header; the
 * names presumably mirror the device WQ context - confirm against the PRM.
 */
struct mlx5_devx_wq_attr {
	uint32_t wq_type:4;
	uint32_t wq_signature:1;
	uint32_t end_padding_mode:2;
	uint32_t cd_slave:1;
	uint32_t hds_skip_first_sge:1;
	uint32_t log2_hds_buf_size:3;
	uint32_t page_offset:5;
	uint32_t lwm:16;
	uint32_t pd:24;
	uint32_t uar_page:24;
	uint64_t dbr_addr;
	uint32_t hw_counter;
	uint32_t sw_counter;
	uint32_t log_wq_stride:4;
	uint32_t log_wq_pg_sz:5;
	uint32_t log_wq_sz:5;
	uint32_t dbr_umem_valid:1;
	uint32_t wq_umem_valid:1;
	uint32_t log_hairpin_num_packets:5;
	uint32_t log_hairpin_data_sz:5;
	uint32_t single_wqe_log_num_of_strides:4;
	uint32_t two_byte_shift_en:1;
	uint32_t single_stride_log_num_of_bytes:3;
	uint32_t dbr_umem_id;
	uint32_t wq_umem_id;
	uint64_t wq_umem_offset;
};
|
|
|
|
|
|
|
|
/* Create RQ attributes structure, used by create RQ operation. */
|
|
|
|
struct mlx5_devx_create_rq_attr {
|
|
|
|
uint32_t rlky:1;
|
|
|
|
uint32_t delay_drop_en:1;
|
|
|
|
uint32_t scatter_fcs:1;
|
|
|
|
uint32_t vsd:1;
|
|
|
|
uint32_t mem_rq_type:4;
|
|
|
|
uint32_t state:4;
|
|
|
|
uint32_t flush_in_error_en:1;
|
|
|
|
uint32_t hairpin:1;
|
|
|
|
uint32_t user_index:24;
|
|
|
|
uint32_t cqn:24;
|
|
|
|
uint32_t counter_set_id:8;
|
|
|
|
uint32_t rmpn:24;
|
|
|
|
struct mlx5_devx_wq_attr wq_attr;
|
|
|
|
};
|
|
|
|
|
2019-07-22 14:52:07 +00:00
|
|
|
/* Modify RQ attributes structure, used by modify RQ operation. */
struct mlx5_devx_modify_rq_attr {
	uint32_t rqn:24;
	uint32_t rq_state:4; /* Current RQ state. */
	uint32_t state:4; /* Required RQ state. */
	uint32_t scatter_fcs:1;
	uint32_t vsd:1;
	uint32_t counter_set_id:8;
	uint32_t hairpin_peer_sq:24;
	uint32_t hairpin_peer_vhca:16;
	/* NOTE(review): bit meanings of the mask are not shown here. */
	uint64_t modify_bitmask;
	uint32_t lwm:16; /* Contained WQ lwm. */
};
|
|
|
|
|
2019-07-22 14:52:08 +00:00
|
|
|
/*
 * Rx hash field selector. Used twice by struct mlx5_devx_tir_attr, as the
 * outer and the inner header selector.
 */
struct mlx5_rx_hash_field_select {
	uint32_t l3_prot_type:1;
	uint32_t l4_prot_type:1;
	uint32_t selected_fields:30;
};
|
|
|
|
|
|
|
|
/* TIR attributes structure, used by TIR operations. */
|
|
|
|
struct mlx5_devx_tir_attr {
|
|
|
|
uint32_t disp_type:4;
|
|
|
|
uint32_t lro_timeout_period_usecs:16;
|
|
|
|
uint32_t lro_enable_mask:4;
|
|
|
|
uint32_t lro_max_msg_sz:8;
|
|
|
|
uint32_t inline_rqn:24;
|
|
|
|
uint32_t rx_hash_symmetric:1;
|
|
|
|
uint32_t tunneled_offload_en:1;
|
|
|
|
uint32_t indirect_table:24;
|
|
|
|
uint32_t rx_hash_fn:4;
|
|
|
|
uint32_t self_lb_block:2;
|
|
|
|
uint32_t transport_domain:24;
|
|
|
|
uint32_t rx_hash_toeplitz_key[10];
|
|
|
|
struct mlx5_rx_hash_field_select rx_hash_field_selector_outer;
|
|
|
|
struct mlx5_rx_hash_field_select rx_hash_field_selector_inner;
|
|
|
|
};
|
|
|
|
|
2019-07-22 14:52:09 +00:00
|
|
|
/*
 * RQT attributes structure, used by RQT operations.
 * rq_list is a flexible array member, so the structure must be allocated
 * with room for the entries that follow the fixed part.
 */
struct mlx5_devx_rqt_attr {
	uint32_t rqt_max_size:16;
	uint32_t rqt_actual_size:16;
	uint32_t rq_list[];
};
|
|
|
|
|
2018-01-22 12:33:38 +00:00
|
|
|
/**
 * Type of object being allocated.
 * Stored in the type member of struct mlx5_verbs_alloc_ctx.
 */
enum mlx5_verbs_alloc_type {
	MLX5_VERBS_ALLOC_TYPE_NONE,
	MLX5_VERBS_ALLOC_TYPE_TX_QUEUE,
	MLX5_VERBS_ALLOC_TYPE_RX_QUEUE,
};
|
|
|
|
|
2019-07-30 09:20:24 +00:00
|
|
|
/* VLAN netdev for VLAN workaround. */
struct mlx5_vlan_dev {
	uint32_t refcnt; /**< NOTE(review): presumably a usage counter. */
	uint32_t ifindex; /**< Own interface index. */
};
|
|
|
|
|
|
|
|
/* Structure for VF VLAN workaround. */
struct mlx5_vf_vlan {
	uint32_t tag:12; /* 12-bit field, values 0..4095. */
	uint32_t created:1;
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Array of VLAN devices created on the base of VF
|
|
|
|
* used for workaround in virtual environments.
|
|
|
|
*/
|
|
|
|
struct mlx5_vlan_vmwa_context {
|
|
|
|
int nl_socket;
|
|
|
|
uint32_t nl_sn;
|
|
|
|
uint32_t vf_ifindex;
|
|
|
|
struct rte_eth_dev *dev;
|
|
|
|
struct mlx5_vlan_dev vlan_dev[4096];
|
|
|
|
};
|
|
|
|
|
2018-01-22 12:33:38 +00:00
|
|
|
/**
|
|
|
|
* Verbs allocator needs a context to know in the callback which kind of
|
|
|
|
* resources it is allocating.
|
|
|
|
*/
|
|
|
|
struct mlx5_verbs_alloc_ctx {
|
|
|
|
enum mlx5_verbs_alloc_type type; /* Kind of object being allocated. */
|
|
|
|
const void *obj; /* Pointer to the DPDK object. */
|
|
|
|
};
|
|
|
|
|
net/mlx5: add new memory region support
This is the new design of Memory Region (MR) for mlx PMD, in order to:
- Accommodate the new memory hotplug model.
- Support non-contiguous Mempool.
There are multiple layers for MR search.
L0 is to look up the last-hit entry which is pointed by mr_ctrl->mru (Most
Recently Used). If L0 misses, L1 is to look up the address in a fixed-sized
array by linear search. L0/L1 is in an inline function -
mlx5_mr_lookup_cache().
If L1 misses, the bottom-half function is called to look up the address
from the bigger local cache of the queue. This is L2 - mlx5_mr_addr2mr_bh()
and it is not an inline function. Data structure for L2 is the Binary Tree.
If L2 misses, the search falls into the slowest path which takes locks in
order to access global device cache (priv->mr.cache) which is also a B-tree
and caches the original MR list (priv->mr.mr_list) of the device. Unless
the global cache is overflowed, it is all-inclusive of the MR list. This is
L3 - mlx5_mr_lookup_dev(). The size of the L3 cache table is limited and
can't be expanded on the fly due to deadlock. Refer to the comments in the
code for the details - mr_lookup_dev(). If L3 is overflowed, the list will
have to be searched directly bypassing the cache although it is slower.
If L3 misses, a new MR for the address should be created -
mlx5_mr_create(). When it creates a new MR, it tries to register adjacent
memsegs as much as possible which are virtually contiguous around the
address. This must take two locks - memory_hotplug_lock and
priv->mr.rwlock. Due to memory_hotplug_lock, there can't be any
allocation/free of memory inside.
In the free callback of the memory hotplug event, freed space is searched
from the MR list and corresponding bits are cleared from the bitmap of MRs.
This can fragment a MR and the MR will have multiple search entries in the
caches. Once there's a change by the event, the global cache must be
rebuilt and all the per-queue caches will be flushed as well. If memory is
frequently freed in run-time, that may cause jitter on dataplane processing
in the worst case by incurring MR cache flush and rebuild. But, it would be
the least probable scenario.
To guarantee the most optimal performance, it is highly recommended to use
an EAL option - '--socket-mem'. Then, the reserved memory will be pinned
and won't be freed dynamically. And it is also recommended to configure
per-lcore cache of Mempool. Even though there're many MRs for a device or
MRs are highly fragmented, the cache of Mempool will be much helpful to
reduce misses on per-queue caches anyway.
'--legacy-mem' is also supported.
Signed-off-by: Yongseok Koh <yskoh@mellanox.com>
2018-05-09 11:09:04 +00:00
|
|
|
/* List head type (struct mlx5_mr_list) for chaining struct mlx5_mr entries. */
LIST_HEAD(mlx5_mr_list, mlx5_mr);
|
|
|
|
|
2018-07-12 09:30:48 +00:00
|
|
|
/* Flow drop context necessary due to Verbs API. */
struct mlx5_drop {
	struct mlx5_hrxq *hrxq; /* Hash Rx queue. */
	struct mlx5_rxq_obj *rxq; /* Rx queue object. */
};
|
|
|
|
|
2019-07-16 14:34:53 +00:00
|
|
|
/* Flow counter sizing constants (their users are outside this view). */
#define MLX5_COUNTERS_PER_POOL 512
#define MLX5_MAX_PENDING_QUERIES 4
|
2019-07-16 14:34:53 +00:00
|
|
|
|
|
|
|
/* Forward declaration; the structure is defined later in this header. */
struct mlx5_flow_counter_pool;
|
|
|
|
|
|
|
|
/*
 * Pair of 64-bit counter statistics values.
 * Referenced through the data pointer of struct mlx5_counter_stats_raw.
 */
struct flow_counter_stats {
	uint64_t hits;
	uint64_t bytes;
};
|
|
|
|
|
|
|
|
/* Counters information. */
struct mlx5_flow_counter {
	TAILQ_ENTRY(mlx5_flow_counter) next;
	/**< Pointer to the next flow counter structure. */
	uint32_t shared:1; /**< Share counter ID with other flow rules. */
	uint32_t batch:1;
	/**< Whether the counter was allocated by batch command. */
	uint32_t ref_cnt:30; /**< Reference counter. */
	uint32_t id; /**< Counter ID. */
	union { /**< Holds the counters for the rule. */
#if defined(HAVE_IBV_DEVICE_COUNTERS_SET_V42)
		struct ibv_counter_set *cs;
#elif defined(HAVE_IBV_DEVICE_COUNTERS_SET_V45)
		struct ibv_counters *cs;
#endif
		struct mlx5_devx_obj *dcs; /**< Counter Devx object. */
		struct mlx5_flow_counter_pool *pool; /**< The counter pool. */
	};
	/* hits and query_gen share the same 64-bit storage. */
	union {
		uint64_t hits; /**< Reset value of hits packets. */
		int64_t query_gen; /**< Generation of the last release. */
	};
	uint64_t bytes; /**< Reset value of bytes. */
	void *action; /**< Pointer to the dv action. */
};
|
|
|
|
|
|
|
|
/* Tail queue head type (struct mlx5_counters) of struct mlx5_flow_counter. */
TAILQ_HEAD(mlx5_counters, mlx5_flow_counter);
|
|
|
|
|
|
|
|
/* Counter pool structure - query is in pool resolution. */
|
|
|
|
struct mlx5_flow_counter_pool {
|
|
|
|
TAILQ_ENTRY(mlx5_flow_counter_pool) next;
|
|
|
|
struct mlx5_counters counters; /* Free counter list. */
|
2019-07-16 14:34:55 +00:00
|
|
|
union {
|
|
|
|
struct mlx5_devx_obj *min_dcs;
|
|
|
|
rte_atomic64_t a64_dcs;
|
|
|
|
};
|
|
|
|
/* The devx object of the minimum counter ID. */
|
|
|
|
rte_atomic64_t query_gen;
|
|
|
|
uint32_t n_counters: 16; /* Number of devx allocated counters. */
|
|
|
|
rte_spinlock_t sl; /* The pool lock. */
|
|
|
|
struct mlx5_counter_stats_raw *raw;
|
|
|
|
struct mlx5_counter_stats_raw *raw_hw; /* The raw on HW working. */
|
|
|
|
struct mlx5_flow_counter counters_raw[]; /* The pool counters memory. */
|
2019-07-16 14:34:53 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Forward declaration; the structure is defined later in this header. */
struct mlx5_counter_stats_raw;
|
|
|
|
|
|
|
|
/* Memory management structure for group of counter statistics raws. */
struct mlx5_counter_stats_mem_mng {
	LIST_ENTRY(mlx5_counter_stats_mem_mng) next;
	struct mlx5_counter_stats_raw *raws;
	struct mlx5_devx_obj *dm;
	struct mlx5dv_devx_umem *umem;
};
|
|
|
|
|
|
|
|
/* Raw memory structure for the counter statistics values of a pool. */
struct mlx5_counter_stats_raw {
	LIST_ENTRY(mlx5_counter_stats_raw) next;
	int min_dcs_id;
	struct mlx5_counter_stats_mem_mng *mem_mng;
	/* Accessed through a volatile-qualified pointer. */
	volatile struct flow_counter_stats *data;
};
|
|
|
|
|
|
|
|
/* Tail queue head type (struct mlx5_counter_pools) of counter pools. */
TAILQ_HEAD(mlx5_counter_pools, mlx5_flow_counter_pool);
|
|
|
|
|
|
|
|
/* Container structure for counter pools. */
|
|
|
|
struct mlx5_pools_container {
|
2019-07-16 14:34:55 +00:00
|
|
|
rte_atomic16_t n_valid; /* Number of valid pools. */
|
2019-07-16 14:34:53 +00:00
|
|
|
uint16_t n; /* Number of pools. */
|
|
|
|
struct mlx5_counter_pools pool_list; /* Counter pool list. */
|
|
|
|
struct mlx5_flow_counter_pool **pools; /* Counter pool array. */
|
|
|
|
struct mlx5_counter_stats_mem_mng *init_mem_mng;
|
|
|
|
/* Hold the memory management for the next allocated pools raws. */
|
|
|
|
};
|
|
|
|
|
|
|
|
/* Counter global management structure. */
|
|
|
|
struct mlx5_flow_counter_mng {
|
2019-07-16 14:34:55 +00:00
|
|
|
uint8_t mhi[2]; /* master \ host container index. */
|
|
|
|
struct mlx5_pools_container ccont[2 * 2];
|
|
|
|
/* 2 containers for single and for batch for double-buffer. */
|
2019-07-16 14:34:53 +00:00
|
|
|
struct mlx5_counters flow_counters; /* Legacy flow counter list. */
|
2019-07-16 14:34:55 +00:00
|
|
|
uint8_t pending_queries;
|
|
|
|
uint8_t batch;
|
|
|
|
uint16_t pool_index;
|
|
|
|
uint8_t query_thread_on;
|
2019-07-16 14:34:53 +00:00
|
|
|
LIST_HEAD(mem_mngs, mlx5_counter_stats_mem_mng) mem_mngs;
|
2019-07-16 14:34:55 +00:00
|
|
|
LIST_HEAD(stat_raws, mlx5_counter_stats_raw) free_stat_raws;
|
2019-07-16 14:34:53 +00:00
|
|
|
};
|
|
|
|
|
2019-03-27 13:15:39 +00:00
|
|
|
/* Per port data of shared IB device. */
struct mlx5_ibv_shared_port {
	uint32_t ih_port_id;
	/*
	 * Interrupt handler port_id. Used by shared interrupt
	 * handler to find the corresponding rte_eth device
	 * by IB port index. If the value is equal to or greater than
	 * RTE_MAX_ETHPORTS it means there is no subhandler
	 * installed for specified IB port index.
	 */
};
|
|
|
|
|
2019-04-04 13:04:25 +00:00
|
|
|
/* Table structure. */
|
|
|
|
struct mlx5_flow_tbl_resource {
|
|
|
|
void *obj; /**< Pointer to DR table object. */
|
|
|
|
rte_atomic32_t refcnt; /**< Reference counter. */
|
|
|
|
};
|
|
|
|
|
2019-09-11 11:03:36 +00:00
|
|
|
/*
 * Sizes of the Direct Rules table arrays in struct mlx5_ibv_shared
 * (rx_tbl/tx_tbl and fdb_tbl respectively).
 * NOTE(review): an array of UINT16_MAX elements has valid indices
 * 0..65534 only; confirm that a table id of 65535 can never be used.
 */
#define MLX5_MAX_TABLES UINT16_MAX
#define MLX5_MAX_TABLES_FDB UINT16_MAX
|
2019-04-04 13:04:25 +00:00
|
|
|
|
2019-07-22 14:52:10 +00:00
|
|
|
/*
 * Door-bell record page geometry. The in-use bitmap keeps one bit per
 * record in 64-bit words, so MLX5_DBR_BITMAP_SIZE works out to
 * MLX5_DBR_PAGE_SIZE / 512; the page size must therefore be at least 512
 * for the bitmap to have any word at all.
 */
#define MLX5_DBR_PAGE_SIZE 4096 /* Must be >= 512. */
#define MLX5_DBR_SIZE 8
#define MLX5_DBR_PER_PAGE (MLX5_DBR_PAGE_SIZE / MLX5_DBR_SIZE)
#define MLX5_DBR_BITMAP_SIZE (MLX5_DBR_PER_PAGE / 64)
|
|
|
|
|
|
|
|
struct mlx5_devx_dbr_page {
|
|
|
|
/* Door-bell records, must be first member in structure. */
|
|
|
|
uint8_t dbrs[MLX5_DBR_PAGE_SIZE];
|
|
|
|
LIST_ENTRY(mlx5_devx_dbr_page) next; /* Pointer to the next element. */
|
|
|
|
struct mlx5dv_devx_umem *umem;
|
|
|
|
uint32_t dbr_count; /* Number of door-bell records in use. */
|
|
|
|
/* 1 bit marks matching door-bell is in use. */
|
|
|
|
uint64_t dbr_bitmap[MLX5_DBR_BITMAP_SIZE];
|
|
|
|
};
|
|
|
|
|
2019-03-27 13:15:39 +00:00
|
|
|
/*
|
|
|
|
* Shared Infiniband device context for Master/Representors
|
|
|
|
* which belong to same IB device with multiple IB ports.
|
|
|
|
**/
|
|
|
|
struct mlx5_ibv_shared {
|
|
|
|
LIST_ENTRY(mlx5_ibv_shared) next;
|
|
|
|
uint32_t refcnt;
|
|
|
|
uint32_t devx:1; /* Opened with DV. */
|
|
|
|
uint32_t max_port; /* Maximal IB device port index. */
|
|
|
|
struct ibv_context *ctx; /* Verbs/DV context. */
|
|
|
|
struct ibv_pd *pd; /* Protection Domain. */
|
2019-07-22 14:52:15 +00:00
|
|
|
uint32_t pdn; /* Protection Domain number. */
|
2019-07-22 14:52:05 +00:00
|
|
|
uint32_t tdn; /* Transport Domain number. */
|
2019-03-27 13:15:39 +00:00
|
|
|
char ibdev_name[IBV_SYSFS_NAME_MAX]; /* IB device name. */
|
|
|
|
char ibdev_path[IBV_SYSFS_PATH_MAX]; /* IB device path for secondary */
|
|
|
|
struct ibv_device_attr_ex device_attr; /* Device properties. */
|
2019-04-27 04:32:57 +00:00
|
|
|
LIST_ENTRY(mlx5_ibv_shared) mem_event_cb;
|
|
|
|
/**< Called by memory event callback. */
|
2019-04-27 04:32:56 +00:00
|
|
|
struct {
|
|
|
|
uint32_t dev_gen; /* Generation number to flush local caches. */
|
|
|
|
rte_rwlock_t rwlock; /* MR Lock. */
|
|
|
|
struct mlx5_mr_btree cache; /* Global MR cache table. */
|
|
|
|
struct mlx5_mr_list mr_list; /* Registered MR list. */
|
|
|
|
struct mlx5_mr_list mr_free_list; /* Freed MR list. */
|
|
|
|
} mr;
|
2019-04-04 13:04:24 +00:00
|
|
|
/* Shared DV/DR flow data section. */
|
2019-04-04 13:04:25 +00:00
|
|
|
pthread_mutex_t dv_mutex; /* DV context mutex. */
|
2019-04-04 13:04:24 +00:00
|
|
|
uint32_t dv_refcnt; /* DV/DR data reference counter. */
|
2019-05-01 20:40:45 +00:00
|
|
|
void *fdb_domain; /* FDB Direct Rules name space handle. */
|
2019-04-18 13:16:01 +00:00
|
|
|
struct mlx5_flow_tbl_resource fdb_tbl[MLX5_MAX_TABLES_FDB];
|
|
|
|
/* FDB Direct Rules tables. */
|
2019-05-01 20:40:45 +00:00
|
|
|
void *rx_domain; /* RX Direct Rules name space handle. */
|
2019-04-04 13:04:25 +00:00
|
|
|
struct mlx5_flow_tbl_resource rx_tbl[MLX5_MAX_TABLES];
|
|
|
|
/* RX Direct Rules tables. */
|
2019-05-01 20:40:45 +00:00
|
|
|
void *tx_domain; /* TX Direct Rules name space handle. */
|
2019-04-04 13:04:25 +00:00
|
|
|
struct mlx5_flow_tbl_resource tx_tbl[MLX5_MAX_TABLES];
|
2019-08-13 14:07:24 +00:00
|
|
|
/* TX Direct Rules tables. */
|
2019-04-18 13:16:07 +00:00
|
|
|
void *esw_drop_action; /* Pointer to DR E-Switch drop action. */
|
2019-09-09 15:56:45 +00:00
|
|
|
void *pop_vlan_action; /* Pointer to DR pop VLAN action. */
|
|
|
|
/* TX Direct Rules tables/ */
|
2019-04-04 13:04:25 +00:00
|
|
|
LIST_HEAD(matchers, mlx5_flow_dv_matcher) matchers;
|
|
|
|
LIST_HEAD(encap_decap, mlx5_flow_dv_encap_decap_resource) encaps_decaps;
|
|
|
|
LIST_HEAD(modify_cmd, mlx5_flow_dv_modify_hdr_resource) modify_cmds;
|
|
|
|
LIST_HEAD(tag, mlx5_flow_dv_tag_resource) tags;
|
|
|
|
LIST_HEAD(jump, mlx5_flow_dv_jump_tbl_resource) jump_tbl;
|
2019-04-18 13:16:05 +00:00
|
|
|
LIST_HEAD(port_id_action_list, mlx5_flow_dv_port_id_action_resource)
|
|
|
|
port_id_action_list; /* List of port ID actions. */
|
2019-09-09 15:56:46 +00:00
|
|
|
LIST_HEAD(push_vlan_action_list, mlx5_flow_dv_push_vlan_action_resource)
|
|
|
|
push_vlan_action_list; /* List of push VLAN actions. */
|
2019-07-16 14:34:53 +00:00
|
|
|
struct mlx5_flow_counter_mng cmng; /* Counters management structure. */
|
2019-04-04 13:04:24 +00:00
|
|
|
/* Shared interrupt handler section. */
|
2019-03-27 13:15:45 +00:00
|
|
|
pthread_mutex_t intr_mutex; /* Interrupt config mutex. */
|
|
|
|
uint32_t intr_cnt; /* Interrupt handler reference counter. */
|
2019-03-27 13:15:39 +00:00
|
|
|
struct rte_intr_handle intr_handle; /* Interrupt handler for device. */
|
2019-07-16 14:34:55 +00:00
|
|
|
struct rte_intr_handle intr_handle_devx; /* DEVX interrupt handler. */
|
|
|
|
struct mlx5dv_devx_cmd_comp *devx_comp; /* DEVX async comp obj. */
|
2019-03-27 13:15:39 +00:00
|
|
|
struct mlx5_ibv_shared_port port[]; /* per device port data array. */
|
|
|
|
};
|
|
|
|
|
2019-04-10 18:41:17 +00:00
|
|
|
/*
 * Per-process private structure.
 * uar_table is a flexible array member, so the structure must be
 * allocated with room for the table entries after the fixed part.
 */
struct mlx5_proc_priv {
	size_t uar_table_sz;
	/* Size of UAR register table. */
	void *uar_table[];
	/* Table of UAR registers for each process. */
};
|
|
|
|
|
|
|
|
/*
 * Per-process private data of a port: the process_private pointer of
 * rte_eth_devices[port_id], cast to struct mlx5_proc_priv.
 */
#define MLX5_PROC_PRIV(port_id) \
	((struct mlx5_proc_priv *)rte_eth_devices[port_id].process_private)
|
|
|
|
|
2019-02-21 09:29:14 +00:00
|
|
|
struct mlx5_priv {
|
2018-05-09 11:04:50 +00:00
|
|
|
struct rte_eth_dev_data *dev_data; /* Pointer to device data. */
|
2019-03-27 13:15:39 +00:00
|
|
|
struct mlx5_ibv_shared *sh; /* Shared IB device context. */
|
|
|
|
uint32_t ibv_port; /* IB device port number. */
|
2019-09-25 07:53:24 +00:00
|
|
|
struct rte_pci_device *pci_dev; /* Backend PCI device. */
|
2019-05-21 16:13:03 +00:00
|
|
|
struct rte_ether_addr mac[MLX5_MAX_MAC_ADDRESSES]; /* MAC addresses. */
|
2018-04-05 15:07:19 +00:00
|
|
|
BITFIELD_DECLARE(mac_own, uint64_t, MLX5_MAX_MAC_ADDRESSES);
|
|
|
|
/* Bit-field of MAC addresses owned by the PMD. */
|
2015-10-30 18:52:40 +00:00
|
|
|
uint16_t vlan_filter[MLX5_MAX_VLAN_IDS]; /* VLAN filters table. */
|
|
|
|
unsigned int vlan_filter_n; /* Number of configured VLAN filters. */
|
2015-10-30 18:52:30 +00:00
|
|
|
/* Device properties. */
|
|
|
|
uint16_t mtu; /* Configured MTU. */
|
2017-05-24 13:44:08 +00:00
|
|
|
unsigned int isolated:1; /* Whether isolated mode is enabled. */
|
2018-07-10 16:04:54 +00:00
|
|
|
unsigned int representor:1; /* Device is a port representor. */
|
2019-03-27 13:15:35 +00:00
|
|
|
unsigned int master:1; /* Device is a E-Switch master. */
|
2019-04-04 13:04:24 +00:00
|
|
|
unsigned int dr_shared:1; /* DV/DR data is shared. */
|
2019-07-16 14:34:56 +00:00
|
|
|
unsigned int counter_fallback:1; /* Use counter fallback management. */
|
2018-07-10 16:04:54 +00:00
|
|
|
uint16_t domain_id; /* Switch domain identifier. */
|
2019-03-27 13:15:35 +00:00
|
|
|
uint16_t vport_id; /* Associated VF vport index (if any). */
|
2019-09-25 07:53:30 +00:00
|
|
|
uint32_t vport_meta_tag; /* Used for vport index match ove VF LAG. */
|
|
|
|
uint32_t vport_meta_mask; /* Used for vport index field match mask. */
|
2018-07-10 16:04:54 +00:00
|
|
|
int32_t representor_id; /* Port representor identifier. */
|
2019-07-21 14:56:40 +00:00
|
|
|
unsigned int if_index; /* Associated kernel network device index. */
|
2015-10-30 18:52:31 +00:00
|
|
|
/* RX/TX queues. */
|
|
|
|
unsigned int rxqs_n; /* RX queues array size. */
|
|
|
|
unsigned int txqs_n; /* TX queues array size. */
|
2017-10-09 14:44:39 +00:00
|
|
|
struct mlx5_rxq_data *(*rxqs)[]; /* RX queues. */
|
2017-10-09 14:44:40 +00:00
|
|
|
struct mlx5_txq_data *(*txqs)[]; /* TX queues. */
|
2018-05-09 11:13:50 +00:00
|
|
|
struct rte_mempool *mprq_mp; /* Mempool for Multi-Packet RQ. */
|
2017-10-09 14:44:56 +00:00
|
|
|
struct rte_eth_rss_conf rss_conf; /* RSS configuration. */
|
2015-11-02 18:11:57 +00:00
|
|
|
unsigned int (*reta_idx)[]; /* RETA index table. */
|
|
|
|
unsigned int reta_idx_n; /* RETA index size. */
|
2018-07-12 09:30:48 +00:00
|
|
|
struct mlx5_drop drop_queue; /* Flow drop queues. */
|
2017-10-09 14:44:53 +00:00
|
|
|
struct mlx5_flows flows; /* RTE Flow rules. */
|
|
|
|
struct mlx5_flows ctrl_flows; /* Control flow rules. */
|
2017-10-09 14:44:49 +00:00
|
|
|
LIST_HEAD(rxq, mlx5_rxq_ctrl) rxqsctrl; /* DPDK Rx queues. */
|
2019-07-22 14:52:11 +00:00
|
|
|
LIST_HEAD(rxqobj, mlx5_rxq_obj) rxqsobj; /* Verbs/DevX Rx queues. */
|
2017-10-09 14:44:51 +00:00
|
|
|
LIST_HEAD(hrxq, mlx5_hrxq) hrxqs; /* Verbs Hash Rx queues. */
|
2017-10-09 14:44:48 +00:00
|
|
|
LIST_HEAD(txq, mlx5_txq_ctrl) txqsctrl; /* DPDK Tx queues. */
|
2017-10-09 14:44:47 +00:00
|
|
|
LIST_HEAD(txqibv, mlx5_txq_ibv) txqsibv; /* Verbs Tx queues. */
|
2019-07-22 14:52:12 +00:00
|
|
|
/* Indirection tables. */
|
|
|
|
LIST_HEAD(ind_tables, mlx5_ind_table_obj) ind_tbls;
|
2019-04-04 09:54:08 +00:00
|
|
|
/* Pointer to next element. */
|
|
|
|
rte_atomic32_t refcnt; /**< Reference counter. */
|
|
|
|
struct ibv_flow_action *verbs_action;
|
|
|
|
/**< Verbs modify header action object. */
|
|
|
|
uint8_t ft_type; /**< Flow table type, Rx or Tx. */
|
2019-07-22 14:52:24 +00:00
|
|
|
uint8_t max_lro_msg_size;
|
2019-04-04 09:54:06 +00:00
|
|
|
/* Tags resources cache. */
|
2016-10-26 09:44:01 +00:00
|
|
|
uint32_t link_speed_capa; /* Link speed capabilities. */
|
2017-01-17 14:37:08 +00:00
|
|
|
struct mlx5_xstats_ctrl xstats_ctrl; /* Extended stats control. */
|
2018-11-23 08:03:37 +00:00
|
|
|
struct mlx5_stats_ctrl stats_ctrl; /* Stats control. */
|
2018-01-10 09:16:58 +00:00
|
|
|
struct mlx5_dev_config config; /* Device configuration. */
|
2018-01-22 12:33:38 +00:00
|
|
|
struct mlx5_verbs_alloc_ctx verbs_alloc_ctx;
|
|
|
|
/* Context for Verbs allocator. */
|
2018-07-10 16:04:52 +00:00
|
|
|
int nl_socket_rdma; /* Netlink socket (NETLINK_RDMA). */
|
|
|
|
int nl_socket_route; /* Netlink socket (NETLINK_ROUTE). */
|
2018-04-05 15:07:19 +00:00
|
|
|
uint32_t nl_sn; /* Netlink message sequence number. */
|
2019-07-22 14:52:10 +00:00
|
|
|
LIST_HEAD(dbrpage, mlx5_devx_dbr_page) dbrpgs; /* Door-bell pages. */
|
2019-07-30 09:20:24 +00:00
|
|
|
struct mlx5_vlan_vmwa_context *vmwa_context; /* VLAN WA context. */
|
2018-07-12 12:01:31 +00:00
|
|
|
#ifndef RTE_ARCH_64
|
|
|
|
rte_spinlock_t uar_lock_cq; /* CQs share a common distinct UAR */
|
|
|
|
rte_spinlock_t uar_lock[MLX5_UAR_PAGE_NUM_MAX];
|
|
|
|
/* UAR same-page access control required in 32bit implementations. */
|
|
|
|
#endif
|
2015-10-30 18:52:30 +00:00
|
|
|
};
|
|
|
|
|
2018-05-09 11:04:50 +00:00
|
|
|
/* Port identifier stored in the device data that priv points to. */
#define PORT_ID(priv) ((priv)->dev_data->port_id)
/* Address of the rte_eth_devices[] entry selected by PORT_ID(priv). */
#define ETH_DEV(priv) (&rte_eth_devices[PORT_ID(priv)])
|
|
|
|
|
2016-03-17 15:38:57 +00:00
|
|
|
/* mlx5.c */

int mlx5_getenv_int(const char *name);
int mlx5_proc_priv_init(struct rte_eth_dev *dev);
int64_t mlx5_get_dbr(struct rte_eth_dev *dev,
		     struct mlx5_devx_dbr_page **dbr_page);
int32_t mlx5_release_dbr(struct rte_eth_dev *dev, uint32_t umem_id,
			 uint64_t offset);
int mlx5_udp_tunnel_port_add(struct rte_eth_dev *dev,
			      struct rte_eth_udp_tunnel *udp_tunnel);
|
2016-03-17 15:38:57 +00:00
|
|
|
|
2015-10-30 18:52:30 +00:00
|
|
|
/* mlx5_ethdev.c */
|
|
|
|
|
2018-03-05 12:21:04 +00:00
|
|
|
int mlx5_get_ifname(const struct rte_eth_dev *dev, char (*ifname)[IF_NAMESIZE]);
|
2019-04-05 13:25:55 +00:00
|
|
|
int mlx5_get_master_ifname(const char *ibdev_path, char (*ifname)[IF_NAMESIZE]);
|
2018-07-25 11:24:33 +00:00
|
|
|
unsigned int mlx5_ifindex(const struct rte_eth_dev *dev);
|
2018-10-08 06:28:17 +00:00
|
|
|
int mlx5_ifreq(const struct rte_eth_dev *dev, int req, struct ifreq *ifr);
|
2018-03-05 12:21:04 +00:00
|
|
|
int mlx5_get_mtu(struct rte_eth_dev *dev, uint16_t *mtu);
|
|
|
|
int mlx5_set_flags(struct rte_eth_dev *dev, unsigned int keep,
|
|
|
|
unsigned int flags);
|
2018-03-05 12:20:58 +00:00
|
|
|
int mlx5_dev_configure(struct rte_eth_dev *dev);
|
2019-09-12 16:42:28 +00:00
|
|
|
int mlx5_dev_infos_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *info);
|
2019-05-02 12:11:34 +00:00
|
|
|
int mlx5_read_clock(struct rte_eth_dev *dev, uint64_t *clock);
|
2019-02-06 22:25:19 +00:00
|
|
|
int mlx5_fw_version_get(struct rte_eth_dev *dev, char *fw_ver, size_t fw_size);
|
2016-03-14 20:50:50 +00:00
|
|
|
const uint32_t *mlx5_dev_supported_ptypes_get(struct rte_eth_dev *dev);
|
2018-03-05 12:20:58 +00:00
|
|
|
int mlx5_link_update(struct rte_eth_dev *dev, int wait_to_complete);
|
2018-03-05 12:21:04 +00:00
|
|
|
int mlx5_force_link_status_change(struct rte_eth_dev *dev, int status);
|
2018-03-05 12:20:58 +00:00
|
|
|
int mlx5_dev_set_mtu(struct rte_eth_dev *dev, uint16_t mtu);
|
|
|
|
int mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev,
|
|
|
|
struct rte_eth_fc_conf *fc_conf);
|
|
|
|
int mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev,
|
|
|
|
struct rte_eth_fc_conf *fc_conf);
|
2019-09-25 07:53:25 +00:00
|
|
|
int mlx5_dev_to_pci_addr(const char *dev_path,
|
|
|
|
struct rte_pci_addr *pci_addr);
|
2018-03-05 12:20:58 +00:00
|
|
|
void mlx5_dev_link_status_handler(void *arg);
|
2018-03-05 12:21:04 +00:00
|
|
|
void mlx5_dev_interrupt_handler(void *arg);
|
2019-07-16 14:34:55 +00:00
|
|
|
void mlx5_dev_interrupt_handler_devx(void *arg);
|
2018-03-05 12:21:04 +00:00
|
|
|
void mlx5_dev_interrupt_handler_uninstall(struct rte_eth_dev *dev);
|
|
|
|
void mlx5_dev_interrupt_handler_install(struct rte_eth_dev *dev);
|
2016-03-17 15:38:54 +00:00
|
|
|
int mlx5_set_link_down(struct rte_eth_dev *dev);
|
|
|
|
int mlx5_set_link_up(struct rte_eth_dev *dev);
|
2018-01-20 21:12:21 +00:00
|
|
|
int mlx5_is_removed(struct rte_eth_dev *dev);
|
2018-03-05 12:21:04 +00:00
|
|
|
eth_tx_burst_t mlx5_select_tx_function(struct rte_eth_dev *dev);
|
|
|
|
eth_rx_burst_t mlx5_select_rx_function(struct rte_eth_dev *dev);
|
2018-07-10 16:04:54 +00:00
|
|
|
unsigned int mlx5_dev_to_port_id(const struct rte_device *dev,
|
|
|
|
uint16_t *port_list,
|
|
|
|
unsigned int port_list_n);
|
2019-09-25 07:53:31 +00:00
|
|
|
struct mlx5_priv *mlx5_port_to_eswitch_info(uint16_t port);
|
|
|
|
struct mlx5_priv *mlx5_dev_to_eswitch_info(struct rte_eth_dev *dev);
|
2018-07-24 08:36:45 +00:00
|
|
|
int mlx5_sysfs_switch_info(unsigned int ifindex,
|
|
|
|
struct mlx5_switch_info *info);
|
net/mlx5: support PF representor
On BlueField platform we have the new entity - PF representor.
This one represents the PCI PF attached to external host on the
side of ARM. The traffic sent by the external host to the NIC
via PF will be seen by ARM on this PF representor.
This patch refactors port recognizing capability on the base of
physical port name. We have two groups of name formats. Legacy
name formats are supported by kernels before ver 5.0 (being
more precise - before the patch [1]) or before Mellanox OFED 4.6,
and new naming formats added by the patch [1].
Legacy naming formats are supported:
- missing physical port name (no sysfs/netlink key) at all,
master is assumed
- decimal digits (for example "12"), representor is assumed,
the value is the index of attached VF
New naming formats are supported:
- "p" followed by decimal digits, for example "p2", master
is assumed
- "pf" followed by PF index concatenated with "vf" followed by
VF index, for example "pf0vf1", representor is assumed.
If index of VF is "-1" it is a special case of host PF
representor, this representor must be indexed in devargs
as 65535, for example representor=[0-3,65535] will
allow representors for VF0, VF1, VF2, VF3 and for host PF.
Note: do not specify representor=[0-65535], it causes devargs
processing error, because number of ports (rte_eth_dev) is
limited.
Applications should distinguish representors and master devices
exclusively by device flag RTE_ETH_DEV_REPRESENTOR and do not
rely on switch port_id (mlx5 PMD deduces ones from representor_id)
values returned by dev_infos_get() API.
[1] https://www.spinics.net/lists/netdev/msg547007.html
Linux-tree: c12ecc23 (Or Gerlitz 2018-04-25 17:32 +0300)
"net/mlx5e: Move to use common phys port names for vport representors"
Signed-off-by: Viacheslav Ovsiienko <viacheslavo@mellanox.com>
Acked-by: Shahaf Shuler <shahafs@mellanox.com>
2019-04-16 14:10:28 +00:00
|
|
|
void mlx5_sysfs_check_switch_info(bool device_dir,
|
|
|
|
struct mlx5_switch_info *switch_info);
|
|
|
|
void mlx5_nl_check_switch_info(bool nun_vf_set,
|
|
|
|
struct mlx5_switch_info *switch_info);
|
|
|
|
void mlx5_translate_port_name(const char *port_name_in,
|
2019-03-17 06:23:03 +00:00
|
|
|
struct mlx5_switch_info *port_info_out);
|
2019-05-27 04:58:32 +00:00
|
|
|
void mlx5_intr_callback_unregister(const struct rte_intr_handle *handle,
|
|
|
|
rte_intr_callback_fn cb_fn, void *cb_arg);
|
2019-09-09 11:04:35 +00:00
|
|
|
int mlx5_get_module_info(struct rte_eth_dev *dev,
|
|
|
|
struct rte_eth_dev_module_info *modinfo);
|
|
|
|
int mlx5_get_module_eeprom(struct rte_eth_dev *dev,
|
|
|
|
struct rte_dev_eeprom_info *info);
|
2015-10-30 18:52:30 +00:00
|
|
|
|
|
|
|
/* mlx5_mac.c */
|
|
|
|
|
2019-05-21 16:13:05 +00:00
|
|
|
int mlx5_get_mac(struct rte_eth_dev *dev, uint8_t (*mac)[RTE_ETHER_ADDR_LEN]);
|
2018-03-05 12:20:58 +00:00
|
|
|
void mlx5_mac_addr_remove(struct rte_eth_dev *dev, uint32_t index);
|
2019-05-21 16:13:03 +00:00
|
|
|
int mlx5_mac_addr_add(struct rte_eth_dev *dev, struct rte_ether_addr *mac,
|
2018-03-05 12:20:58 +00:00
|
|
|
uint32_t index, uint32_t vmdq);
|
2019-05-21 16:13:03 +00:00
|
|
|
int mlx5_mac_addr_set(struct rte_eth_dev *dev, struct rte_ether_addr *mac_addr);
|
2018-04-23 11:09:28 +00:00
|
|
|
int mlx5_set_mc_addr_list(struct rte_eth_dev *dev,
|
2019-05-21 16:13:03 +00:00
|
|
|
struct rte_ether_addr *mc_addr_set,
|
|
|
|
uint32_t nb_mc_addr);
|
2015-10-30 18:52:30 +00:00
|
|
|
|
2015-10-30 18:55:11 +00:00
|
|
|
/* mlx5_rss.c */

int mlx5_rss_hash_update(struct rte_eth_dev *dev,
			 struct rte_eth_rss_conf *rss_conf);
int mlx5_rss_hash_conf_get(struct rte_eth_dev *dev,
			   struct rte_eth_rss_conf *rss_conf);
int mlx5_rss_reta_index_resize(struct rte_eth_dev *dev, unsigned int reta_size);
int mlx5_dev_rss_reta_query(struct rte_eth_dev *dev,
			    struct rte_eth_rss_reta_entry64 *reta_conf,
			    uint16_t reta_size);
int mlx5_dev_rss_reta_update(struct rte_eth_dev *dev,
			     struct rte_eth_rss_reta_entry64 *reta_conf,
			     uint16_t reta_size);
|
2015-10-30 18:55:11 +00:00
|
|
|
|
2015-10-30 18:52:37 +00:00
|
|
|
/* mlx5_rxmode.c */

int mlx5_promiscuous_enable(struct rte_eth_dev *dev);
int mlx5_promiscuous_disable(struct rte_eth_dev *dev);
int mlx5_allmulticast_enable(struct rte_eth_dev *dev);
int mlx5_allmulticast_disable(struct rte_eth_dev *dev);
|
2015-10-30 18:52:37 +00:00
|
|
|
|
2015-10-30 18:52:36 +00:00
|
|
|
/* mlx5_stats.c */
|
|
|
|
|
2018-11-23 08:03:37 +00:00
|
|
|
void mlx5_stats_init(struct rte_eth_dev *dev);
|
2018-03-05 12:20:58 +00:00
|
|
|
int mlx5_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *stats);
|
2019-09-06 14:34:54 +00:00
|
|
|
int mlx5_stats_reset(struct rte_eth_dev *dev);
|
2018-03-05 12:21:04 +00:00
|
|
|
int mlx5_xstats_get(struct rte_eth_dev *dev, struct rte_eth_xstat *stats,
|
|
|
|
unsigned int n);
|
2019-09-06 14:34:54 +00:00
|
|
|
int mlx5_xstats_reset(struct rte_eth_dev *dev);
|
2018-03-05 12:21:04 +00:00
|
|
|
int mlx5_xstats_get_names(struct rte_eth_dev *dev __rte_unused,
|
2018-03-05 12:20:58 +00:00
|
|
|
struct rte_eth_xstat_name *xstats_names,
|
|
|
|
unsigned int n);
|
2015-10-30 18:52:36 +00:00
|
|
|
|
2015-10-30 18:52:40 +00:00
|
|
|
/* mlx5_vlan.c */

/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers and parameter types; confirm behaviour
 * and return-value conventions against the definitions in mlx5_vlan.c.
 */

/* Presumably enables (@p on != 0) or disables filtering of @p vlan_id. */
int mlx5_vlan_filter_set(struct rte_eth_dev *dev, uint16_t vlan_id, int on);

/* Presumably toggles VLAN stripping on Rx queue @p queue according to @p on. */
void mlx5_vlan_strip_queue_set(struct rte_eth_dev *dev, uint16_t queue, int on);

/* Presumably applies the VLAN offload changes selected by @p mask. */
int mlx5_vlan_offload_set(struct rte_eth_dev *dev, int mask);

/* mlx5_trigger.c */

/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers alone; confirm behaviour and
 * return-value conventions against the definitions in mlx5_trigger.c.
 */

/* Presumably starts @p dev. */
int mlx5_dev_start(struct rte_eth_dev *dev);

/* Presumably stops @p dev. */
void mlx5_dev_stop(struct rte_eth_dev *dev);

/* Presumably enables traffic reception on @p dev. */
int mlx5_traffic_enable(struct rte_eth_dev *dev);

/* Presumably disables traffic reception on @p dev. */
void mlx5_traffic_disable(struct rte_eth_dev *dev);

/* Presumably re-applies the traffic configuration of @p dev. */
int mlx5_traffic_restart(struct rte_eth_dev *dev);

/* mlx5_flow.c */
|
2016-03-03 14:26:43 +00:00
|
|
|
|
2018-07-12 09:30:49 +00:00
|
|
|
int mlx5_flow_discover_priorities(struct rte_eth_dev *dev);
|
2018-07-12 09:30:48 +00:00
|
|
|
void mlx5_flow_print(struct rte_flow *flow);
|
2018-03-05 12:20:58 +00:00
|
|
|
int mlx5_flow_validate(struct rte_eth_dev *dev,
|
|
|
|
const struct rte_flow_attr *attr,
|
|
|
|
const struct rte_flow_item items[],
|
|
|
|
const struct rte_flow_action actions[],
|
|
|
|
struct rte_flow_error *error);
|
|
|
|
struct rte_flow *mlx5_flow_create(struct rte_eth_dev *dev,
|
|
|
|
const struct rte_flow_attr *attr,
|
|
|
|
const struct rte_flow_item items[],
|
|
|
|
const struct rte_flow_action actions[],
|
|
|
|
struct rte_flow_error *error);
|
|
|
|
int mlx5_flow_destroy(struct rte_eth_dev *dev, struct rte_flow *flow,
|
|
|
|
struct rte_flow_error *error);
|
2018-03-05 12:21:04 +00:00
|
|
|
void mlx5_flow_list_flush(struct rte_eth_dev *dev, struct mlx5_flows *list);
|
2018-03-05 12:20:58 +00:00
|
|
|
int mlx5_flow_flush(struct rte_eth_dev *dev, struct rte_flow_error *error);
|
|
|
|
int mlx5_flow_query(struct rte_eth_dev *dev, struct rte_flow *flow,
|
2018-04-26 17:29:19 +00:00
|
|
|
const struct rte_flow_action *action, void *data,
|
2018-03-05 12:20:58 +00:00
|
|
|
struct rte_flow_error *error);
|
|
|
|
int mlx5_flow_isolate(struct rte_eth_dev *dev, int enable,
|
|
|
|
struct rte_flow_error *error);
|
|
|
|
int mlx5_dev_filter_ctrl(struct rte_eth_dev *dev,
|
|
|
|
enum rte_filter_type filter_type,
|
|
|
|
enum rte_filter_op filter_op,
|
|
|
|
void *arg);
|
2018-03-05 12:21:04 +00:00
|
|
|
/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers and parameter types; confirm behaviour
 * and return-value conventions against the definitions.
 */

/* Presumably applies every flow of @p list to @p dev. */
int mlx5_flow_start(struct rte_eth_dev *dev, struct mlx5_flows *list);

/* Presumably removes every flow of @p list from @p dev without freeing it. */
void mlx5_flow_stop(struct rte_eth_dev *dev, struct mlx5_flows *list);

/* Presumably checks @p dev for flows that were not released. */
int mlx5_flow_verify(struct rte_eth_dev *dev);

/*
 * Presumably installs a control flow matching the given Ethernet and VLAN
 * spec/mask pairs.
 */
int mlx5_ctrl_flow_vlan(struct rte_eth_dev *dev,
			struct rte_flow_item_eth *eth_spec,
			struct rte_flow_item_eth *eth_mask,
			struct rte_flow_item_vlan *vlan_spec,
			struct rte_flow_item_vlan *vlan_mask);

/* Presumably installs a control flow matching @p eth_spec under @p eth_mask. */
int mlx5_ctrl_flow(struct rte_eth_dev *dev,
		   struct rte_flow_item_eth *eth_spec,
		   struct rte_flow_item_eth *eth_mask);

/* Presumably creates a flow for E-Switch table zero and returns its handle. */
struct rte_flow *mlx5_flow_create_esw_table_zero_flow(struct rte_eth_dev *dev);

/* Presumably creates the drop queue of @p dev. */
int mlx5_flow_create_drop_queue(struct rte_eth_dev *dev);

/* Presumably releases the drop queue of @p dev. */
void mlx5_flow_delete_drop_queue(struct rte_eth_dev *dev);

/*
 * Presumably handles completion @p status of the asynchronous counter pool
 * query identified by @p async_id.
 */
void mlx5_flow_async_pool_query_handle(struct mlx5_ibv_shared *sh,
				       uint64_t async_id, int status);

/* Presumably arms the counter query alarm for @p sh. */
void mlx5_set_query_alarm(struct mlx5_ibv_shared *sh);

/* Presumably the alarm handler; the type behind @p arg is not visible here. */
void mlx5_flow_query_alarm(void *arg);

/* mlx5_mp.c */

/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers and parameter types; confirm behaviour
 * and return-value conventions against the definitions in mlx5_mp.c.
 */

/* Presumably requests that Rx/Tx be started for @p dev. */
void mlx5_mp_req_start_rxtx(struct rte_eth_dev *dev);

/* Presumably requests that Rx/Tx be stopped for @p dev. */
void mlx5_mp_req_stop_rxtx(struct rte_eth_dev *dev);

/* Presumably requests creation of a memory region covering @p addr. */
int mlx5_mp_req_mr_create(struct rte_eth_dev *dev, uintptr_t addr);

/* Presumably requests the Verbs command file descriptor for @p dev. */
int mlx5_mp_req_verbs_cmd_fd(struct rte_eth_dev *dev);

/* Presumably requests the queue state change described by @p sm. */
int mlx5_mp_req_queue_state_modify(struct rte_eth_dev *dev,
				   struct mlx5_mp_arg_queue_state_modify *sm);

/* Presumably sets up multi-process support in the primary process. */
int mlx5_mp_init_primary(void);

/* Presumably tears down multi-process support in the primary process. */
void mlx5_mp_uninit_primary(void);

/* Presumably sets up multi-process support in a secondary process. */
int mlx5_mp_init_secondary(void);

/* Presumably tears down multi-process support in a secondary process. */
void mlx5_mp_uninit_secondary(void);

/* mlx5_nl.c */

/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers and parameter types; confirm behaviour
 * and return-value conventions against the definitions in mlx5_nl.c.
 */

/* Presumably opens a Netlink socket for @p protocol. */
int mlx5_nl_init(int protocol);

/* Presumably registers @p mac at @p index through Netlink. */
int mlx5_nl_mac_addr_add(struct rte_eth_dev *dev, struct rte_ether_addr *mac,
			 uint32_t index);

/* Presumably unregisters @p mac at @p index through Netlink. */
int mlx5_nl_mac_addr_remove(struct rte_eth_dev *dev, struct rte_ether_addr *mac,
			    uint32_t index);

/* Presumably synchronizes the MAC address list of @p dev through Netlink. */
void mlx5_nl_mac_addr_sync(struct rte_eth_dev *dev);

/* Presumably removes the MAC addresses of @p dev through Netlink. */
void mlx5_nl_mac_addr_flush(struct rte_eth_dev *dev);

/* Presumably switches promiscuous mode according to @p enable. */
int mlx5_nl_promisc(struct rte_eth_dev *dev, int enable);

/* Presumably switches all-multicast mode according to @p enable. */
int mlx5_nl_allmulti(struct rte_eth_dev *dev, int enable);

/* Presumably returns the port count of device @p name using socket @p nl. */
unsigned int mlx5_nl_portnum(int nl, const char *name);

/* Presumably returns the interface index of port @p pindex of @p name. */
unsigned int mlx5_nl_ifindex(int nl, const char *name, uint32_t pindex);

/* Presumably fills @p info with switch data of interface @p ifindex. */
int mlx5_nl_switch_info(int nl, unsigned int ifindex,
			struct mlx5_switch_info *info);

/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers and parameter types; confirm behaviour
 * and ownership rules against the definitions.
 */

/* Presumably creates a VLAN workaround context bound to @p ifindex. */
struct mlx5_vlan_vmwa_context *mlx5_vlan_vmwa_init(struct rte_eth_dev *dev,
						   uint32_t ifindex);

/* Presumably destroys context @p ctx. */
void mlx5_vlan_vmwa_exit(struct mlx5_vlan_vmwa_context *ctx);

/* Presumably drops the reference described by @p vf_vlan. */
void mlx5_vlan_vmwa_release(struct rte_eth_dev *dev,
			    struct mlx5_vf_vlan *vf_vlan);

/* Presumably takes the reference described by @p vf_vlan. */
void mlx5_vlan_vmwa_acquire(struct rte_eth_dev *dev,
			    struct mlx5_vf_vlan *vf_vlan);

/* mlx5_devx_cmds.c */

/*
 * NOTE(review): only prototypes are visible in this header. The summaries
 * below are inferred from identifiers and parameter types; confirm behaviour,
 * ownership of returned objects and return-value conventions against the
 * definitions in mlx5_devx_cmds.c.
 */

/* Presumably allocates flow counters; role of @p bulk_sz not visible here. */
struct mlx5_devx_obj *mlx5_devx_cmd_flow_counter_alloc(struct ibv_context *ctx,
						       uint32_t bulk_sz);

/* Presumably releases DevX object @p obj. */
int mlx5_devx_cmd_destroy(struct mlx5_devx_obj *obj);

/*
 * Presumably queries @p n_counters counters of @p dcs, reporting through
 * @p pkts and @p bytes. The roles of @p clear, @p mkey, @p addr, @p cmd_comp
 * and @p async_id are not visible here.
 */
int mlx5_devx_cmd_flow_counter_query(struct mlx5_devx_obj *dcs,
				     int clear, uint32_t n_counters,
				     uint64_t *pkts, uint64_t *bytes,
				     uint32_t mkey, void *addr,
				     struct mlx5dv_devx_cmd_comp *cmd_comp,
				     uint64_t async_id);

/* Presumably fills @p attr with the HCA attributes behind @p ctx. */
int mlx5_devx_cmd_query_hca_attr(struct ibv_context *ctx,
				 struct mlx5_hca_attr *attr);

/* Presumably creates a memory key from @p attr. */
struct mlx5_devx_obj *mlx5_devx_cmd_mkey_create(struct ibv_context *ctx,
					struct mlx5_devx_mkey_attr *attr);

/* Presumably extracts a status value from command output buffer @p out. */
int mlx5_devx_get_out_command_status(void *out);

/* Presumably stores in @p tis_td a value looked up for @p tis_num of @p qp. */
int mlx5_devx_cmd_qp_query_tis_td(struct ibv_qp *qp, uint32_t tis_num,
				  uint32_t *tis_td);

/* Presumably creates a receive queue from @p rq_attr; @p socket role unclear. */
struct mlx5_devx_obj *mlx5_devx_cmd_create_rq(struct ibv_context *ctx,
				struct mlx5_devx_create_rq_attr *rq_attr,
				int socket);

/* Presumably modifies receive queue @p rq according to @p rq_attr. */
int mlx5_devx_cmd_modify_rq(struct mlx5_devx_obj *rq,
			    struct mlx5_devx_modify_rq_attr *rq_attr);

/* Presumably creates a TIR object from @p tir_attr. */
struct mlx5_devx_obj *mlx5_devx_cmd_create_tir(struct ibv_context *ctx,
					struct mlx5_devx_tir_attr *tir_attr);

/* Presumably creates an RQT object from @p rqt_attr. */
struct mlx5_devx_obj *mlx5_devx_cmd_create_rqt(struct ibv_context *ctx,
					struct mlx5_devx_rqt_attr *rqt_attr);

2015-10-30 18:52:30 +00:00
|
|
|
#endif /* RTE_PMD_MLX5_H_ */
|