2017-12-19 15:49:03 +00:00
|
|
|
/* SPDX-License-Identifier: BSD-3-Clause
|
eal: add channel for multi-process communication
Previouly, there are three channels for multi-process
(i.e., primary/secondary) communication.
1. Config-file based channel, in which, the primary process writes
info into a pre-defined config file, and the secondary process
reads the info out.
2. vfio submodule has its own channel based on unix socket for the
secondary process to get container fd and group fd from the
primary process.
3. pdump submodule also has its own channel based on unix socket for
packet dump.
It'd be good to have a generic communication channel for multi-process
communication to accommodate the requirements including:
a. Secondary wants to send info to primary, for example, secondary
would like to send request (about some specific vdev to primary).
b. Sending info at any time, instead of just initialization time.
c. Share FDs with the other side, for vdev like vhost, related FDs
(memory region, kick) should be shared.
d. A send message request needs the other side to response immediately.
This patch proposes to create a communication channel, based on datagram
unix socket, for above requirements. Each process will block on a unix
socket waiting for messages from the peers.
Three new APIs are added:
1. rte_eal_mp_action_register() is used to register an action,
indexed by a string, when a component at receiver side would like
to response the messages from the peer processe.
2. rte_eal_mp_action_unregister() is used to unregister the action
if the calling component does not want to response the messages.
3. rte_eal_mp_sendmsg() is used to send a message, and returns
immediately. If there are n secondary processes, the primary
process will send n messages.
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:08 +00:00
|
|
|
* Copyright(c) 2010-2018 Intel Corporation
|
2012-09-04 13:54:00 +01:00
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _RTE_EAL_H_
|
|
|
|
#define _RTE_EAL_H_
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @file
|
|
|
|
*
|
|
|
|
* EAL Configuration API
|
|
|
|
*/
|
|
|
|
|
2012-12-20 00:00:00 +01:00
|
|
|
#include <stdint.h>
|
2015-02-17 10:08:06 +08:00
|
|
|
#include <sched.h>
|
eal: add synchronous multi-process communication
We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.
We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The caller
can specify the timeout. And the response messages will be collected
and returned so that the caller can decide how to translate them.
The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.
sender-process receiver-process
---------------------- ----------------
thread-n
|_rte_eal_mp_request() ----------> mp-thread
|_timedwait() |_process_msg()
|_action()
|_rte_eal_mp_reply()
mp_thread <---------------------|
|_process_msg()
|_signal(send_thread)
thread-m <----------|
|_collect-reply
* A secondary process is only allowed to talk to the primary process.
* If there are multiple secondary processes for the primary process,
it will send request to peer1, collect response from peer1; then
send request to peer2, collect response from peer2, and so on.
* When thread-n is sending request, thread-m of that process can send
request at the same time.
* For pair <action_name, peer>, we guarantee that only one such request
is on the fly.
Suggested-by: Anatoly Burakov <anatoly.burakov@intel.com>
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:09 +00:00
|
|
|
#include <time.h>
|
2015-02-17 10:08:06 +08:00
|
|
|
|
2017-12-21 14:00:04 +01:00
|
|
|
#include <rte_config.h>
|
2018-01-21 20:48:06 -05:00
|
|
|
#include <rte_compat.h>
|
2015-02-17 10:08:06 +08:00
|
|
|
#include <rte_per_lcore.h>
|
2017-10-06 16:33:42 +05:30
|
|
|
#include <rte_bus.h>
|
2012-09-04 13:54:00 +01:00
|
|
|
|
2017-10-26 12:05:51 +02:00
|
|
|
#include <rte_pci_dev_feature_defs.h>
|
|
|
|
|
2012-09-04 13:54:00 +01:00
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#define RTE_MAGIC 19820526 /**< Magic number written by the main partition when ready. */
|
|
|
|
|
2015-07-28 17:51:44 -07:00
|
|
|
/* Maximum thread_name length. */
|
|
|
|
#define RTE_MAX_THREAD_NAME_LEN 16
|
|
|
|
|
2012-09-04 13:54:00 +01:00
|
|
|
/**
|
|
|
|
* The lcore role (used in RTE or not).
|
|
|
|
*/
|
|
|
|
enum rte_lcore_role_t {
|
|
|
|
ROLE_RTE, /**< Presumably: the lcore is used by RTE -- TODO confirm. */
|
|
|
|
ROLE_OFF, /**< Presumably: the lcore is not used by RTE -- TODO confirm. */
|
2017-07-11 15:19:27 +01:00
|
|
|
ROLE_SERVICE, /**< Presumably: the lcore is a service core -- TODO confirm. */
|
2012-09-04 13:54:00 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
/**
|
|
|
|
* The type of process in a linuxapp, multi-process setup
|
|
|
|
*/
|
|
|
|
enum rte_proc_type_t {
|
|
|
|
RTE_PROC_AUTO = -1, /* allow auto-detection of primary/secondary */
|
|
|
|
RTE_PROC_PRIMARY = 0, /* set to zero, so primary is the default */
|
|
|
|
RTE_PROC_SECONDARY, /* implicitly 1 (follows RTE_PROC_PRIMARY) */
|
|
|
|
|
|
|
|
RTE_PROC_INVALID /* implicitly 2; presumably a "no valid type" sentinel -- TODO confirm */
|
|
|
|
};
|
|
|
|
|
|
|
|
/**
|
|
|
|
* The global RTE configuration structure.
|
|
|
|
*/
|
|
|
|
struct rte_config {
|
|
|
|
uint32_t master_lcore; /**< Id of the master lcore */
|
|
|
|
uint32_t lcore_count; /**< Number of available logical cores. */
|
2018-03-31 18:08:13 +01:00
|
|
|
uint32_t numa_node_count; /**< Number of detected NUMA nodes. */
|
|
|
|
uint32_t numa_nodes[RTE_MAX_NUMA_NODES]; /**< List of detected NUMA nodes. */
|
2017-07-11 15:19:27 +01:00
|
|
|
uint32_t service_lcore_count;/**< Number of available service cores. */
|
2012-09-04 13:54:00 +01:00
|
|
|
enum rte_lcore_role_t lcore_role[RTE_MAX_LCORE]; /**< Role of each lcore (RTE_MAX_LCORE entries). */
|
|
|
|
|
|
|
|
/** Primary or secondary configuration */
|
|
|
|
enum rte_proc_type_t process_type;
|
|
|
|
|
2017-10-06 16:33:42 +05:30
|
|
|
/** IOVA mapping mode (PA or VA) */
|
|
|
|
enum rte_iova_mode iova_mode;
|
|
|
|
|
2012-09-04 13:54:00 +01:00
|
|
|
/**
|
|
|
|
* Pointer to memory configuration, which may be shared across multiple
|
2016-02-08 11:30:07 +01:00
|
|
|
* DPDK instances
|
2012-09-04 13:54:00 +01:00
|
|
|
*/
|
|
|
|
struct rte_mem_config *mem_config;
|
|
|
|
/* Declared packed: the compiler inserts no padding between the members. */
} __attribute__((__packed__));
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Get the global configuration structure.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* A pointer to the global configuration structure.
|
|
|
|
*/
|
|
|
|
struct rte_config *rte_eal_get_configuration(void);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Get a lcore's role.
|
|
|
|
*
|
|
|
|
* @param lcore_id
|
|
|
|
* The identifier of the lcore.
|
|
|
|
* @return
|
|
|
|
* The role of the lcore.
|
|
|
|
*/
|
|
|
|
enum rte_lcore_role_t rte_eal_lcore_role(unsigned lcore_id);
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Get the process type in a multi-process setup
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* The process type
|
|
|
|
*/
|
|
|
|
enum rte_proc_type_t rte_eal_process_type(void);
|
|
|
|
|
2014-08-26 16:11:39 +02:00
|
|
|
/**
|
|
|
|
* Request iopl privilege for all RPL.
|
|
|
|
*
|
|
|
|
* This function should be called by pmds which need access to ioports.
|
|
|
|
|
|
|
|
* @return
|
|
|
|
* - On success, returns 0.
|
|
|
|
* - On failure, returns -1.
|
|
|
|
*/
|
|
|
|
int rte_eal_iopl_init(void);
|
|
|
|
|
2012-09-04 13:54:00 +01:00
|
|
|
/**
|
|
|
|
* Initialize the Environment Abstraction Layer (EAL).
|
|
|
|
*
|
|
|
|
* This function is to be executed on the MASTER lcore only, as soon
|
|
|
|
* as possible in the application's main() function.
|
|
|
|
*
|
2014-09-26 16:04:00 +02:00
|
|
|
* The function finishes the initialization process before main() is called.
|
|
|
|
* It puts the SLAVE lcores in the WAIT state.
|
2012-09-04 13:54:00 +01:00
|
|
|
*
|
|
|
|
* When the multi-partition feature is supported, depending on the
|
|
|
|
* configuration (if CONFIG_RTE_EAL_MAIN_PARTITION is disabled), this
|
|
|
|
* function waits to ensure that the magic number is set before
|
|
|
|
* returning. See also the rte_eal_get_configuration() function. Note:
|
|
|
|
* This behavior may change in the future.
|
|
|
|
*
|
|
|
|
* @param argc
|
2016-12-08 10:56:45 -05:00
|
|
|
* A non-negative value. If it is greater than 0, the array members
|
|
|
|
* for argv[0] through argv[argc] (non-inclusive) shall contain pointers
|
|
|
|
* to strings.
|
2012-09-04 13:54:00 +01:00
|
|
|
* @param argv
|
2016-12-08 10:56:45 -05:00
|
|
|
* An array of strings. The contents of the array, as well as the strings
|
|
|
|
* which are pointed to by the array, may be modified by this function.
|
2012-09-04 13:54:00 +01:00
|
|
|
* @return
|
|
|
|
* - On success, the number of parsed arguments, which is greater or
|
|
|
|
* equal to zero. After the call to rte_eal_init(),
|
2016-12-08 10:56:45 -05:00
|
|
|
* all arguments argv[x] with x < ret may have been modified by this
|
|
|
|
* function call and should not be further interpreted by the
|
|
|
|
* application. The EAL does not take any ownership of the memory used
|
|
|
|
* for either the argv array, or its members.
|
2017-03-22 16:19:40 -04:00
|
|
|
* - On failure, -1 and rte_errno is set to a value indicating the cause
|
|
|
|
* for failure. In some instances, the application will need to be
|
|
|
|
* restarted as part of clearing the issue.
|
|
|
|
*
|
|
|
|
* Error codes returned via rte_errno:
|
|
|
|
* EACCES indicates a permissions issue.
|
|
|
|
*
|
|
|
|
* EAGAIN indicates either a bus or system resource was not available,
|
|
|
|
* setup may be attempted again.
|
|
|
|
*
|
|
|
|
* EALREADY indicates that the rte_eal_init function has already been
|
|
|
|
* called, and cannot be called again.
|
|
|
|
*
|
|
|
|
* EFAULT indicates the tailq configuration name was not found in
|
|
|
|
* memory configuration.
|
|
|
|
*
|
|
|
|
* EINVAL indicates invalid parameters were passed as argv/argc.
|
|
|
|
*
|
|
|
|
* ENOMEM indicates failure likely caused by an out-of-memory condition.
|
|
|
|
*
|
|
|
|
* ENODEV indicates memory setup issues.
|
|
|
|
*
|
|
|
|
* ENOTSUP indicates that the EAL cannot initialize on this system.
|
|
|
|
*
|
|
|
|
* EPROTO indicates that the PCI bus is either not present, or is not
|
|
|
|
* readable by the eal.
|
2017-07-11 15:19:27 +01:00
|
|
|
*
|
|
|
|
* ENOEXEC indicates that a service core failed to launch successfully.
|
2012-09-04 13:54:00 +01:00
|
|
|
*/
|
|
|
|
int rte_eal_init(int argc, char **argv);
|
2016-03-09 13:37:25 +00:00
|
|
|
|
2018-01-29 16:37:30 +00:00
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Clean up the Environment Abstraction Layer (EAL)
|
|
|
|
*
|
|
|
|
* This function must be called to release any internal resources that EAL has
|
|
|
|
* allocated during rte_eal_init(). After this call, no DPDK function calls may
|
|
|
|
* be made. It is expected that common usage of this function is to call it
|
|
|
|
* just before terminating the process.
|
|
|
|
*
|
|
|
|
* @return 0 Successfully released all internal EAL resources
|
|
|
|
* @return -EFAULT There was an error in releasing all resources.
|
|
|
|
*/
|
2018-01-21 20:48:06 -05:00
|
|
|
int __rte_experimental rte_eal_cleanup(void);
|
2018-01-29 16:37:30 +00:00
|
|
|
|
2016-03-09 13:37:25 +00:00
|
|
|
/**
|
|
|
|
* Check if a primary process is currently alive
|
|
|
|
*
|
|
|
|
* This function returns true when a primary process is currently
|
|
|
|
* active.
|
|
|
|
*
|
|
|
|
* @param config_file_path
|
|
|
|
* The config_file_path argument provided should point at the location
|
|
|
|
* that the primary process will create its config file. If NULL, the default
|
|
|
|
* config file path is used.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* - If alive, returns 1.
|
|
|
|
* - If dead, returns 0.
|
|
|
|
*/
|
|
|
|
int rte_eal_primary_proc_alive(const char *config_file_path);
|
|
|
|
|
eal: add channel for multi-process communication
Previouly, there are three channels for multi-process
(i.e., primary/secondary) communication.
1. Config-file based channel, in which, the primary process writes
info into a pre-defined config file, and the secondary process
reads the info out.
2. vfio submodule has its own channel based on unix socket for the
secondary process to get container fd and group fd from the
primary process.
3. pdump submodule also has its own channel based on unix socket for
packet dump.
It'd be good to have a generic communication channel for multi-process
communication to accommodate the requirements including:
a. Secondary wants to send info to primary, for example, secondary
would like to send request (about some specific vdev to primary).
b. Sending info at any time, instead of just initialization time.
c. Share FDs with the other side, for vdev like vhost, related FDs
(memory region, kick) should be shared.
d. A send message request needs the other side to response immediately.
This patch proposes to create a communication channel, based on datagram
unix socket, for above requirements. Each process will block on a unix
socket waiting for messages from the peers.
Three new APIs are added:
1. rte_eal_mp_action_register() is used to register an action,
indexed by a string, when a component at receiver side would like
to response the messages from the peer processe.
2. rte_eal_mp_action_unregister() is used to unregister the action
if the calling component does not want to response the messages.
3. rte_eal_mp_sendmsg() is used to send a message, and returns
immediately. If there are n secondary processes, the primary
process will send n messages.
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:08 +00:00
|
|
|
#define RTE_MP_MAX_FD_NUM 8 /* Max number of fds in one message (size of rte_mp_msg.fds) */
|
|
|
|
#define RTE_MP_MAX_NAME_LEN 64 /* Max length of an action name (size of rte_mp_msg.name) */
|
|
|
|
#define RTE_MP_MAX_PARAM_LEN 256 /* Max length of the param payload (size of rte_mp_msg.param) */
|
|
|
|
/**
 * Message exchanged between processes by the rte_mp_* functions.
 *
 * The buffers are fixed-size; len_param and num_fds presumably give the
 * number of valid entries in param[] and fds[] -- TODO confirm against the
 * implementation.
 */
struct rte_mp_msg {
|
|
|
|
char name[RTE_MP_MAX_NAME_LEN]; /**< Name of the action this message is addressed to. */
|
|
|
|
int len_param; /**< Presumably: number of bytes used in param[]. */
|
|
|
|
int num_fds; /**< Presumably: number of entries used in fds[]. */
|
|
|
|
uint8_t param[RTE_MP_MAX_PARAM_LEN]; /**< Customized payload bytes. */
|
|
|
|
int fds[RTE_MP_MAX_FD_NUM]; /**< File descriptors carried with the message. */
|
|
|
|
};
|
|
|
|
|
eal: add synchronous multi-process communication
We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.
We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The caller
can specify the timeout. And the response messages will be collected
and returned so that the caller can decide how to translate them.
The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.
sender-process receiver-process
---------------------- ----------------
thread-n
|_rte_eal_mp_request() ----------> mp-thread
|_timedwait() |_process_msg()
|_action()
|_rte_eal_mp_reply()
mp_thread <---------------------|
|_process_msg()
|_signal(send_thread)
thread-m <----------|
|_collect-reply
* A secondary process is only allowed to talk to the primary process.
* If there are multiple secondary processes for the primary process,
it will send request to peer1, collect response from peer1; then
send request to peer2, collect response from peer2, and so on.
* When thread-n is sending request, thread-m of that process can send
request at the same time.
* For pair <action_name, peer>, we guarantee that only one such request
is on the fly.
Suggested-by: Anatoly Burakov <anatoly.burakov@intel.com>
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:09 +00:00
|
|
|
/**
 * Collected replies to a request; used as the reply argument of
 * rte_mp_request_sync() and passed to rte_mp_async_reply_t callbacks.
 */
struct rte_mp_reply {
|
|
|
|
int nb_sent; /**< Presumably: number of requests sent to peers -- TODO confirm. */
|
|
|
|
int nb_received; /**< Presumably: number of replies stored in msgs -- TODO confirm. */
|
|
|
|
struct rte_mp_msg *msgs; /* caller to free */
|
|
|
|
};
|
|
|
|
|
eal: add channel for multi-process communication
Previouly, there are three channels for multi-process
(i.e., primary/secondary) communication.
1. Config-file based channel, in which, the primary process writes
info into a pre-defined config file, and the secondary process
reads the info out.
2. vfio submodule has its own channel based on unix socket for the
secondary process to get container fd and group fd from the
primary process.
3. pdump submodule also has its own channel based on unix socket for
packet dump.
It'd be good to have a generic communication channel for multi-process
communication to accommodate the requirements including:
a. Secondary wants to send info to primary, for example, secondary
would like to send request (about some specific vdev to primary).
b. Sending info at any time, instead of just initialization time.
c. Share FDs with the other side, for vdev like vhost, related FDs
(memory region, kick) should be shared.
d. A send message request needs the other side to response immediately.
This patch proposes to create a communication channel, based on datagram
unix socket, for above requirements. Each process will block on a unix
socket waiting for messages from the peers.
Three new APIs are added:
1. rte_eal_mp_action_register() is used to register an action,
indexed by a string, when a component at receiver side would like
to response the messages from the peer processe.
2. rte_eal_mp_action_unregister() is used to unregister the action
if the calling component does not want to response the messages.
3. rte_eal_mp_sendmsg() is used to send a message, and returns
immediately. If there are n secondary processes, the primary
process will send n messages.
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:08 +00:00
|
|
|
/**
|
|
|
|
* Action function typedef used by other components.
|
|
|
|
*
|
|
|
|
* As we create socket channel for primary/secondary communication, use
|
|
|
|
* this function typedef to register action for incoming messages.
|
|
|
|
*/
|
eal: add synchronous multi-process communication
We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.
We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The caller
can specify the timeout. And the response messages will be collected
and returned so that the caller can decide how to translate them.
The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.
sender-process receiver-process
---------------------- ----------------
thread-n
|_rte_eal_mp_request() ----------> mp-thread
|_timedwait() |_process_msg()
|_action()
|_rte_eal_mp_reply()
mp_thread <---------------------|
|_process_msg()
|_signal(send_thread)
thread-m <----------|
|_collect-reply
* A secondary process is only allowed to talk to the primary process.
* If there are multiple secondary processes for the primary process,
it will send request to peer1, collect response from peer1; then
send request to peer2, collect response from peer2, and so on.
* When thread-n is sending request, thread-m of that process can send
request at the same time.
* For pair <action_name, peer>, we guarantee that only one such request
is on the fly.
Suggested-by: Anatoly Burakov <anatoly.burakov@intel.com>
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:09 +00:00
|
|
|
/* msg: the received message; peer: opaque handle for the sender, presumably the address to reply to -- TODO confirm. */
typedef int (*rte_mp_t)(const struct rte_mp_msg *msg, const void *peer);
|
eal: add channel for multi-process communication
Previouly, there are three channels for multi-process
(i.e., primary/secondary) communication.
1. Config-file based channel, in which, the primary process writes
info into a pre-defined config file, and the secondary process
reads the info out.
2. vfio submodule has its own channel based on unix socket for the
secondary process to get container fd and group fd from the
primary process.
3. pdump submodule also has its own channel based on unix socket for
packet dump.
It'd be good to have a generic communication channel for multi-process
communication to accommodate the requirements including:
a. Secondary wants to send info to primary, for example, secondary
would like to send request (about some specific vdev to primary).
b. Sending info at any time, instead of just initialization time.
c. Share FDs with the other side, for vdev like vhost, related FDs
(memory region, kick) should be shared.
d. A send message request needs the other side to response immediately.
This patch proposes to create a communication channel, based on datagram
unix socket, for above requirements. Each process will block on a unix
socket waiting for messages from the peers.
Three new APIs are added:
1. rte_eal_mp_action_register() is used to register an action,
indexed by a string, when a component at receiver side would like
to response the messages from the peer processe.
2. rte_eal_mp_action_unregister() is used to unregister the action
if the calling component does not want to response the messages.
3. rte_eal_mp_sendmsg() is used to send a message, and returns
immediately. If there are n secondary processes, the primary
process will send n messages.
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:08 +00:00
|
|
|
|
2018-03-31 18:06:16 +01:00
|
|
|
/**
|
|
|
|
* Asynchronous reply function typedef used by other components.
|
|
|
|
*
|
|
|
|
* As we create socket channel for primary/secondary communication, use
|
|
|
|
* this function typedef to register action for incoming responses to asynchronous
|
|
|
|
* requests.
|
|
|
|
*/
|
|
|
|
/* request: presumably the request originally sent; reply: the responses collected for it -- TODO confirm. */
typedef int (*rte_mp_async_reply_t)(const struct rte_mp_msg *request,
|
|
|
|
const struct rte_mp_reply *reply);
|
|
|
|
|
eal: add channel for multi-process communication
Previouly, there are three channels for multi-process
(i.e., primary/secondary) communication.
1. Config-file based channel, in which, the primary process writes
info into a pre-defined config file, and the secondary process
reads the info out.
2. vfio submodule has its own channel based on unix socket for the
secondary process to get container fd and group fd from the
primary process.
3. pdump submodule also has its own channel based on unix socket for
packet dump.
It'd be good to have a generic communication channel for multi-process
communication to accommodate the requirements including:
a. Secondary wants to send info to primary, for example, secondary
would like to send request (about some specific vdev to primary).
b. Sending info at any time, instead of just initialization time.
c. Share FDs with the other side, for vdev like vhost, related FDs
(memory region, kick) should be shared.
d. A send message request needs the other side to response immediately.
This patch proposes to create a communication channel, based on datagram
unix socket, for above requirements. Each process will block on a unix
socket waiting for messages from the peers.
Three new APIs are added:
1. rte_eal_mp_action_register() is used to register an action,
indexed by a string, when a component at receiver side would like
to response the messages from the peer processe.
2. rte_eal_mp_action_unregister() is used to unregister the action
if the calling component does not want to response the messages.
3. rte_eal_mp_sendmsg() is used to send a message, and returns
immediately. If there are n secondary processes, the primary
process will send n messages.
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:08 +00:00
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Register an action function for primary/secondary communication.
|
|
|
|
*
|
|
|
|
* Call this function to register an action, if the calling component wants
|
|
|
|
* to respond to the messages from the corresponding component in its primary
|
|
|
|
* process or secondary processes.
|
|
|
|
*
|
|
|
|
* @param name
|
|
|
|
* The name argument serves as the unique key used to find the action.
|
|
|
|
*
|
|
|
|
* @param action
|
|
|
|
* The action argument is the function pointer to the action function.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* - 0 on success.
|
|
|
|
* - (<0) on failure.
|
|
|
|
*/
|
|
|
|
int __rte_experimental
|
|
|
|
rte_mp_action_register(const char *name, rte_mp_t action);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Unregister an action function for primary/secondary communication.
|
|
|
|
*
|
|
|
|
* Call this function to unregister an action if the calling component does
|
|
|
|
* not want to respond to the messages from the corresponding component in its
|
|
|
|
* primary process or secondary processes.
|
|
|
|
*
|
|
|
|
* @param name
|
|
|
|
* The name argument serves as the unique key used to find the action.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
void __rte_experimental
|
|
|
|
rte_mp_action_unregister(const char *name);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Send a message to the peer process.
|
|
|
|
*
|
|
|
|
* This function will send a message which will be handled by the action
|
|
|
|
* identified by name in the peer process.
|
|
|
|
*
|
|
|
|
* @param msg
|
|
|
|
* The msg argument contains the customized message.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* - On success, return 0.
|
|
|
|
* - On failure, return -1, and the reason will be stored in rte_errno.
|
|
|
|
*/
|
|
|
|
int __rte_experimental
|
|
|
|
rte_mp_sendmsg(struct rte_mp_msg *msg);
|
|
|
|
|
eal: add synchronous multi-process communication
We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.
We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The caller
can specify the timeout. And the response messages will be collected
and returned so that the caller can decide how to translate them.
The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.
sender-process receiver-process
---------------------- ----------------
thread-n
|_rte_eal_mp_request() ----------> mp-thread
|_timedwait() |_process_msg()
|_action()
|_rte_eal_mp_reply()
mp_thread <---------------------|
|_process_msg()
|_signal(send_thread)
thread-m <----------|
|_collect-reply
* A secondary process is only allowed to talk to the primary process.
* If there are multiple secondary processes for the primary process,
it will send request to peer1, collect response from peer1; then
send request to peer2, collect response from peer2, and so on.
* When thread-n is sending request, thread-m of that process can send
request at the same time.
* For pair <action_name, peer>, we guarantee that only one such request
is on the fly.
Suggested-by: Anatoly Burakov <anatoly.burakov@intel.com>
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:09 +00:00
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Send a request to the peer process and expect a reply.
|
|
|
|
*
|
|
|
|
* This function sends a request message to the peer process, and will
|
|
|
|
* block until receiving reply message from the peer process.
|
|
|
|
*
|
|
|
|
* @note The caller is responsible for freeing reply->msgs.
|
|
|
|
*
|
|
|
|
* @param req
|
|
|
|
* The req argument contains the customized request message.
|
|
|
|
*
|
|
|
|
* @param reply
|
|
|
|
* The reply argument will be for storing all the replied messages;
|
|
|
|
* the caller is responsible for freeing reply->msgs.
|
|
|
|
*
|
|
|
|
* @param ts
|
|
|
|
* The ts argument specifies how long we can wait for the peer(s) to reply.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* - On success, return 0.
|
|
|
|
* - On failure, return -1, and the reason will be stored in rte_errno.
|
|
|
|
*/
|
|
|
|
int __rte_experimental
|
2018-03-31 18:06:15 +01:00
|
|
|
rte_mp_request_sync(struct rte_mp_msg *req, struct rte_mp_reply *reply,
|
eal: add synchronous multi-process communication
We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.
We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The caller
can specify the timeout. And the response messages will be collected
and returned so that the caller can decide how to translate them.
The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.
sender-process receiver-process
---------------------- ----------------
thread-n
|_rte_eal_mp_request() ----------> mp-thread
|_timedwait() |_process_msg()
|_action()
|_rte_eal_mp_reply()
mp_thread <---------------------|
|_process_msg()
|_signal(send_thread)
thread-m <----------|
|_collect-reply
* A secondary process is only allowed to talk to the primary process.
* If there are multiple secondary processes for the primary process,
it will send request to peer1, collect response from peer1; then
send request to peer2, collect response from peer2, and so on.
* When thread-n is sending request, thread-m of that process can send
request at the same time.
* For pair <action_name, peer>, we guarantee that only one such request
is on the fly.
Suggested-by: Anatoly Burakov <anatoly.burakov@intel.com>
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:09 +00:00
|
|
|
const struct timespec *ts);
|
|
|
|
|
2018-03-31 18:06:16 +01:00
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Send a request to the peer process and expect a reply in a separate callback.
|
|
|
|
*
|
|
|
|
* This function sends a request message to the peer process, and will not
|
|
|
|
* block. Instead, reply will be received in a separate callback.
|
|
|
|
*
|
|
|
|
* @param req
|
|
|
|
* The req argument contains the customized request message.
|
|
|
|
*
|
|
|
|
* @param ts
|
|
|
|
* The ts argument specifies how long we can wait for the peer(s) to reply.
|
|
|
|
*
|
|
|
|
* @param clb
|
|
|
|
* The callback to trigger when all responses for this request have arrived.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* - On success, return 0.
|
|
|
|
* - On failure, return -1, and the reason will be stored in rte_errno.
|
|
|
|
*/
|
|
|
|
int __rte_experimental
|
|
|
|
rte_mp_request_async(struct rte_mp_msg *req, const struct timespec *ts,
|
|
|
|
rte_mp_async_reply_t clb);
|
|
|
|
|
eal: add synchronous multi-process communication
We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.
We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The caller
can specify the timeout. And the response messages will be collected
and returned so that the caller can decide how to translate them.
The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.
sender-process receiver-process
---------------------- ----------------
thread-n
|_rte_eal_mp_request() ----------> mp-thread
|_timedwait() |_process_msg()
|_action()
|_rte_eal_mp_reply()
mp_thread <---------------------|
|_process_msg()
|_signal(send_thread)
thread-m <----------|
|_collect-reply
* A secondary process is only allowed to talk to the primary process.
* If there are multiple secondary processes for the primary process,
it will send request to peer1, collect response from peer1; then
send request to peer2, collect response from peer2, and so on.
* When thread-n is sending request, thread-m of that process can send
request at the same time.
* For pair <action_name, peer>, we guarantee that only one such request
is on the fly.
Suggested-by: Anatoly Burakov <anatoly.burakov@intel.com>
Suggested-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng.tan@intel.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
Acked-by: Konstantin Ananyev <konstantin.ananyev@intel.com>
2018-01-30 06:58:09 +00:00
|
|
|
/**
|
|
|
|
* @warning
|
|
|
|
* @b EXPERIMENTAL: this API may change without prior notice
|
|
|
|
*
|
|
|
|
* Send a reply to the peer process.
|
|
|
|
*
|
|
|
|
* This function will send a reply message in response to a request message
|
|
|
|
* received previously.
|
|
|
|
*
|
|
|
|
* @param msg
|
|
|
|
* The msg argument contains the customized message.
|
|
|
|
*
|
|
|
|
* @param peer
|
|
|
|
* The peer argument is the pointer to the peer socket path.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* - On success, return 0.
|
|
|
|
* - On failure, return -1, and the reason will be stored in rte_errno.
|
|
|
|
*/
|
|
|
|
int __rte_experimental
|
|
|
|
rte_mp_reply(struct rte_mp_msg *msg, const char *peer);
|
|
|
|
|
2013-06-03 00:00:00 +00:00
|
|
|
/**
|
|
|
|
* Usage function typedef used by the application usage function.
|
|
|
|
*
|
2017-11-10 00:24:23 -08:00
|
|
|
* Use this function typedef to define and call rte_set_application_usage_hook()
|
2013-06-03 00:00:00 +00:00
|
|
|
* routine.
|
|
|
|
*/
|
|
|
|
typedef void (*rte_usage_hook_t)(const char * prgname);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Add application usage routine callout from the eal_usage() routine.
|
|
|
|
*
|
|
|
|
* This function allows the application to include its usage message
|
|
|
|
* in the EAL system usage message. The routine rte_set_application_usage_hook()
|
|
|
|
* needs to be called before the rte_eal_init() routine in the application.
|
|
|
|
*
|
|
|
|
* This routine is optional for the application and will behave as if the set
|
|
|
|
* routine was never called as the default behavior.
|
|
|
|
*
|
2015-06-18 23:43:06 +02:00
|
|
|
* @param usage_func
|
2013-06-03 00:00:00 +00:00
|
|
|
* The usage_func argument is a function pointer to the application usage routine.
|
|
|
|
* Called function is defined using rte_usage_hook_t typedef, which is of
|
|
|
|
* the form void rte_usage_func(const char * prgname).
|
|
|
|
*
|
|
|
|
* Calling this routine with a NULL value will reset the usage hook routine and
|
|
|
|
* return the current value, which could be NULL.
|
|
|
|
* @return
|
|
|
|
* - Returns the current value of the rte_application_usage pointer to allow
|
|
|
|
* the caller to daisy chain the usage routines if needing more than one.
|
|
|
|
*/
|
|
|
|
rte_usage_hook_t
|
2015-06-18 23:43:06 +02:00
|
|
|
rte_set_application_usage_hook(rte_usage_hook_t usage_func);
|
2012-09-04 13:54:00 +01:00
|
|
|
|
2012-12-20 00:00:00 +01:00
|
|
|
/**
|
2014-06-04 00:42:50 +01:00
|
|
|
* macro to get the lock of tailq in mem_config
|
2012-12-20 00:00:00 +01:00
|
|
|
*/
|
|
|
|
#define RTE_EAL_TAILQ_RWLOCK (&rte_eal_get_configuration()->mem_config->qlock)
|
|
|
|
|
|
|
|
/**
|
|
|
|
* macro to get the multiple lock of mempool shared by multiple instances
|
|
|
|
*/
|
|
|
|
#define RTE_EAL_MEMPOOL_RWLOCK (&rte_eal_get_configuration()->mem_config->mplock)
|
|
|
|
|
2013-03-29 11:34:00 +01:00
|
|
|
/**
|
|
|
|
* Whether EAL is using huge pages (disabled by --no-huge option).
|
|
|
|
* The no-huge mode cannot be used with UIO poll-mode drivers like igb/ixgbe.
|
|
|
|
* It is useful for NIC drivers (e.g. librte_pmd_mlx4, librte_pmd_vmxnet3) or
|
|
|
|
* crypto drivers (e.g. librte_crypto_nitrox) provided by third-parties such
|
|
|
|
* as 6WIND.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* Nonzero if hugepages are enabled.
|
|
|
|
*/
|
|
|
|
int rte_eal_has_hugepages(void);
|
|
|
|
|
2017-10-26 12:05:51 +02:00
|
|
|
/**
|
|
|
|
* Whether EAL is using PCI bus.
|
|
|
|
* Disabled by --no-pci option.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* Nonzero if the PCI bus is enabled.
|
|
|
|
*/
|
|
|
|
int rte_eal_has_pci(void);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Whether the EAL was asked to create UIO device.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* Nonzero if true.
|
|
|
|
*/
|
|
|
|
int rte_eal_create_uio_dev(void);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* The user-configured vfio interrupt mode.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* Interrupt mode configured with the command line,
|
|
|
|
* RTE_INTR_MODE_NONE by default.
|
|
|
|
*/
|
|
|
|
enum rte_intr_mode rte_eal_vfio_intr_mode(void);
|
|
|
|
|
2015-02-17 10:08:06 +08:00
|
|
|
/**
|
|
|
|
* A wrap API for syscall gettid.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* On success, returns the thread ID of the calling thread.
|
|
|
|
* It is always successful.
|
|
|
|
*/
|
|
|
|
int rte_sys_gettid(void);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Get system unique thread id.
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* On success, returns the thread ID of the calling thread.
|
|
|
|
* It is always successful.
|
|
|
|
*/
|
|
|
|
static inline int rte_gettid(void)
|
|
|
|
{
|
|
|
|
static RTE_DEFINE_PER_LCORE(int, _thread_id) = -1;
|
|
|
|
if (RTE_PER_LCORE(_thread_id) == -1)
|
|
|
|
RTE_PER_LCORE(_thread_id) = rte_sys_gettid();
|
|
|
|
return RTE_PER_LCORE(_thread_id);
|
|
|
|
}
|
|
|
|
|
2017-10-06 16:33:42 +05:30
|
|
|
/**
|
|
|
|
* Get the iova mode
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* enum rte_iova_mode value.
|
|
|
|
*/
|
|
|
|
enum rte_iova_mode rte_eal_iova_mode(void);
|
|
|
|
|
2018-02-02 13:33:01 +05:30
|
|
|
/**
|
|
|
|
* Get user provided pool ops name for mbuf
|
|
|
|
*
|
|
|
|
* @return
|
|
|
|
* returns user provided pool ops name.
|
|
|
|
*/
|
2018-08-07 23:34:43 +02:00
|
|
|
const char *
|
2018-02-02 13:33:01 +05:30
|
|
|
rte_eal_mbuf_user_pool_ops(void);
|
|
|
|
|
2012-09-04 13:54:00 +01:00
|
|
|
#ifdef __cplusplus
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#endif /* _RTE_EAL_H_ */
|