numam-spdk/include/spdk/sock.h
Ben Walker 7ef33c86b8 sock/posix: Zero copy send
If available, automatically use MSG_ZEROCOPY when sending on sockets.
Storage workloads contain sufficient data transfer sizes that this is
always a performance improvement, regardless of workload.

Change-Id: I14429d78c22ad3bc036aec13c9fce6453e899c92
Signed-off-by: Ben Walker <benjamin.walker@intel.com>
Reviewed-on: https://review.gerrithub.io/c/spdk/spdk/+/471752
Tested-by: SPDK CI Jenkins <sys_sgci@intel.com>
Reviewed-by: Shuhei Matsumoto <shuhei.matsumoto.xt@hitachi.com>
Reviewed-by: Jim Harris <james.r.harris@intel.com>
Reviewed-by: Or Gerlitz <gerlitz.or@gmail.com>
2020-01-27 17:42:24 +00:00

359 lines
11 KiB
C

/*-
* BSD LICENSE
*
* Copyright (c) Intel Corporation.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
* * Neither the name of Intel Corporation nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
/** \file
* TCP socket abstraction layer
*/
#ifndef SPDK_SOCK_H
#define SPDK_SOCK_H
#include "spdk/stdinc.h"
#include "spdk/queue.h"
#ifdef __cplusplus
extern "C" {
#endif
/* Socket handle. Only declared in this header, so callers hold it by pointer. */
struct spdk_sock;
/* Socket group handle used by the spdk_sock_group_*() functions. Only declared in this header. */
struct spdk_sock_group;
/**
 * A write request submitted through spdk_sock_writev_async().
 *
 * Anywhere this struct is used, an iovec array is assumed to
 * immediately follow it in memory: the first element starts
 * sizeof(struct spdk_sock_request) bytes after the start of the
 * request. Use SPDK_SOCK_REQUEST_IOV() to reach an element.
 *
 * A simpler implementation would be to place a 0-length array
 * of struct iovec at the end of this request. However, embedding
 * a structure that ends with a variable length array inside of
 * another structure is a GNU C extension and not standard.
 */
struct spdk_sock_request {
	/* When the request is completed, this callback will be called.
	 * err will be 0 on success or a negated errno value on failure. */
	void	(*cb_fn)(void *cb_arg, int err);

	/* Caller-supplied context for cb_fn. */
	void	*cb_arg;

	/**
	 * These fields are used by the socket layer and should not be modified
	 */
	struct __sock_request_internal {
		TAILQ_ENTRY(spdk_sock_request)	link;
		uint32_t			offset;
	} internal;

	/* Number of struct iovec elements that follow this request. */
	int	iovcnt;
	/* struct iovec iov[]; */
};

/**
 * Get a pointer to the i-th struct iovec stored after a request.
 *
 * Both arguments are parenthesized in the expansion, so expressions such as
 * `base + n` or `idx + 1` may be passed directly. Each argument is evaluated
 * exactly once. No bounds check against req->iovcnt is performed.
 *
 * \param req Pointer to a struct spdk_sock_request that is followed by its iovec array.
 * \param i Zero-based index into that array.
 *
 * \return a struct iovec pointer to element i.
 */
#define SPDK_SOCK_REQUEST_IOV(req, i) \
	((struct iovec *)(((uint8_t *)(req) + sizeof(struct spdk_sock_request)) + \
			  (sizeof(struct iovec) * (i))))
/**
* Get client and server addresses of the given socket.
*
* \param sock Socket to get address.
* \param saddr A pointer to the buffer to hold the address of server.
* \param slen Length of the buffer 'saddr'.
* \param sport A pointer (may be NULL) to the buffer to hold the port info of server.
* \param caddr A pointer to the buffer to hold the address of client.
* \param clen Length of the buffer 'caddr'.
* \param cport A pointer (may be NULL) to the buffer to hold the port info of client.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_getaddr(struct spdk_sock *sock, char *saddr, int slen, uint16_t *sport,
char *caddr, int clen, uint16_t *cport);
/**
* Create a socket using the specific sock implementation, connect the socket
* to the specified address and port (of the server), and then return the socket.
* This function is used by client.
*
* \param ip IP address of the server.
* \param port Port number of the server.
* \param impl_name The sock_implementation to use, such as "posix". If impl_name is
* specified, it will *only* try to connect using that impl. If it is NULL, it will try
* all the sock implementations in order and use the first sock implementation which
* can connect. For example, it will try vpp, then posix.
*
* \return a pointer to the connected socket on success, or NULL on failure.
*/
struct spdk_sock *spdk_sock_connect(const char *ip, int port, char *impl_name);
/**
* Create a socket using the specific sock implementation, bind the socket to
* the specified address and port and listen on the socket, and then return the socket.
* This function is used by server.
*
* \param ip IP address to listen on.
* \param port Port number.
* \param impl_name The sock_implementation to use, such as "posix". If impl_name is
* specified, it will *only* try to listen on that impl. If it is NULL, it will try
* all the sock implementations in order and use the first sock implementation which
* can listen. For example, it will try vpp, then posix.
*
* \return a pointer to the listening socket on success, or NULL on failure.
*/
struct spdk_sock *spdk_sock_listen(const char *ip, int port, char *impl_name);
/**
* Accept a new connection from a client on the specified socket and return a
* socket structure which holds the connection.
*
* \param sock Listening socket on which to accept the connection.
*
* \return a pointer to the accepted socket on success, or NULL on failure.
*/
struct spdk_sock *spdk_sock_accept(struct spdk_sock *sock);
/**
* Close a socket.
*
* \param sock Pointer to the socket pointer identifying the socket to close.
* NOTE(review): the double pointer suggests *sock is cleared once the socket is
* closed - confirm against the implementation.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_close(struct spdk_sock **sock);
/**
* Flush the data gathered on a socket by previous spdk_sock_writev_async() calls.
*
* \param sock Socket to flush.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_flush(struct spdk_sock *sock);
/**
* Receive a message from the given socket.
*
* \param sock Socket to receive the message from.
* \param buf Pointer to a buffer to hold the data.
* \param len Length of the buffer 'buf'.
*
* \return the length of the received message on success, -1 on failure.
*/
ssize_t spdk_sock_recv(struct spdk_sock *sock, void *buf, size_t len);
/**
* Write a message to the given socket from the I/O vector array.
*
* \param sock Socket to write to.
* \param iov I/O vector array holding the data to write.
* \param iovcnt Number of I/O vectors in the array.
*
* \return the length of the written message on success, -1 on failure.
*/
ssize_t spdk_sock_writev(struct spdk_sock *sock, struct iovec *iov, int iovcnt);
/**
* Write data to the given socket asynchronously, calling
* the provided callback when the data has been written.
*
* This function returns nothing; the result is delivered through req->cb_fn,
* whose err argument is 0 on success or a negated errno value on failure
* (see struct spdk_sock_request).
*
* \param sock Socket to write to.
* \param req The write request to submit. Its iovec array is assumed to follow
* the request in memory, as described for struct spdk_sock_request.
*/
void spdk_sock_writev_async(struct spdk_sock *sock, struct spdk_sock_request *req);
/**
* Read a message from the given socket into the I/O vector array.
*
* \param sock Socket to receive the message from.
* \param iov I/O vector array to read into.
* \param iovcnt Number of I/O vectors in the array.
*
* \return the length of the received message on success, -1 on failure.
*/
ssize_t spdk_sock_readv(struct spdk_sock *sock, struct iovec *iov, int iovcnt);
/**
* Set the receive low water mark (in bytes) for this socket.
*
* \param sock Socket to set the low water mark for.
* \param nbytes Value for recvlowat, in bytes.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_set_recvlowat(struct spdk_sock *sock, int nbytes);
/**
* Set the receive buffer size for the given socket.
*
* \param sock Socket to set the buffer size for.
* \param sz Buffer size in bytes.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_set_recvbuf(struct spdk_sock *sock, int sz);
/**
* Set the priority for the given socket.
*
* \param sock Socket to set the priority for.
* \param priority Priority given by the user.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_set_priority(struct spdk_sock *sock, int priority);
/**
* Set the send buffer size for the given socket.
*
* \param sock Socket to set the buffer size for.
* \param sz Buffer size in bytes.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_set_sendbuf(struct spdk_sock *sock, int sz);
/**
* Check whether the address of the socket is IPv6.
*
* \param sock Socket to check.
*
* \return true if the address of the socket is IPv6, or false otherwise.
*/
bool spdk_sock_is_ipv6(struct spdk_sock *sock);
/**
* Check whether the address of the socket is IPv4.
*
* \param sock Socket to check.
*
* \return true if the address of the socket is IPv4, or false otherwise.
*/
bool spdk_sock_is_ipv4(struct spdk_sock *sock);
/**
* Check whether the socket is currently connected.
*
* \param sock Socket to check.
*
* \return true if the socket is connected, or false otherwise.
*/
bool spdk_sock_is_connected(struct spdk_sock *sock);
/**
* Callback function type registered through spdk_sock_group_add_sock().
*
* \param arg Argument for the callback function (the cb_arg given to
* spdk_sock_group_add_sock()).
* \param group Socket group.
* \param sock Socket.
*/
typedef void (*spdk_sock_cb)(void *arg, struct spdk_sock_group *group, struct spdk_sock *sock);
/**
* Create a new socket group with a user-provided context pointer.
*
* \param ctx The context provided by the user; it can be read back with
* spdk_sock_group_get_ctx().
*
* \return a pointer to the created group on success, or NULL on failure.
*/
struct spdk_sock_group *spdk_sock_group_create(void *ctx);
/**
* Get the context pointer of the sock group.
*
* \param sock_group Socket group.
*
* \return the ctx pointer of the sock_group.
*/
void *spdk_sock_group_get_ctx(struct spdk_sock_group *sock_group);
/**
* Add a socket to the group.
*
* \param group Socket group.
* \param sock Socket to add.
* \param cb_fn Called when the operation completes.
* NOTE(review): "the operation" is not defined here - confirm whether cb_fn fires
* once when the add finishes or for socket events reported while polling the group.
* \param cb_arg Argument passed to the callback function.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_group_add_sock(struct spdk_sock_group *group, struct spdk_sock *sock,
spdk_sock_cb cb_fn, void *cb_arg);
/**
* Remove a socket from the group.
*
* \param group Socket group to remove the socket from.
* \param sock Socket to remove.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_group_remove_sock(struct spdk_sock_group *group, struct spdk_sock *sock);
/**
* Poll incoming events for each socket registered in the group.
*
* \param group Group to poll.
*
* \return the number of events on success, -1 on failure.
*/
int spdk_sock_group_poll(struct spdk_sock_group *group);
/**
* Poll incoming events up to max_events for each registered socket.
*
* \param group Group to poll.
* \param max_events Maximum number of events to poll for each socket.
*
* \return the number of events on success, -1 on failure.
*/
int spdk_sock_group_poll_count(struct spdk_sock_group *group, int max_events);
/**
* Close all registered sockets of the group and then remove the group.
*
* \param group Pointer to the group pointer identifying the group to close.
* NOTE(review): the double pointer suggests *group is cleared once the group is
* removed - confirm against the implementation.
*
* \return 0 on success, -1 on failure.
*/
int spdk_sock_group_close(struct spdk_sock_group **group);
/**
* Get the optimal sock group for this sock.
*
* \param sock The socket.
* \param group Output parameter: receives the optimal sock group, or NULL if
* there is no optimal sock group.
*
* \return 0 on success. Negated errno on failure.
*/
int spdk_sock_get_optimal_sock_group(struct spdk_sock *sock, struct spdk_sock_group **group);
#ifdef __cplusplus
}
#endif
#endif /* SPDK_SOCK_H */