751 lines
16 KiB
C

/*
* Copyright (c) 2005-2006 Intel Corporation. All rights reserved.
*
* This software is available to you under a choice of one of two
* licenses. You may choose to be licensed under the terms of the GNU
* General Public License (GPL) Version 2, available from the file
* COPYING in the main directory of this source tree, or the
* OpenIB.org BSD license below:
*
* Redistribution and use in source and binary forms, with or
* without modification, are permitted provided that the following
* conditions are met:
*
* - Redistributions of source code must retain the above
* copyright notice, this list of conditions and the following
* disclaimer.
*
* - Redistributions in binary form must reproduce the above
* copyright notice, this list of conditions and the following
* disclaimer in the documentation and/or other materials
* provided with the distribution.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*
* $Id$
*/
#include <stdlib.h>
#include <string.h>
#include <stdio.h>
#include <errno.h>
#include <sys/types.h>
#include <netinet/in.h>
#include <sys/socket.h>
#include <netdb.h>
#include <byteswap.h>
#include <getopt.h>
#include <rdma/rdma_cma.h>
#if __BYTE_ORDER == __BIG_ENDIAN
static inline uint64_t cpu_to_be64(uint64_t x) { return x; }
static inline uint32_t cpu_to_be32(uint32_t x) { return x; }
#else
static inline uint64_t cpu_to_be64(uint64_t x) { return bswap_64(x); }
static inline uint32_t cpu_to_be32(uint32_t x) { return bswap_32(x); }
#endif
struct cmatest_node {
int id;
struct rdma_cm_id *cma_id;
int connected;
struct ibv_pd *pd;
struct ibv_cq *cq[2];
struct ibv_mr *mr;
void *mem;
};
enum CQ_INDEX {
SEND_CQ_INDEX,
RECV_CQ_INDEX
};
struct cmatest {
struct rdma_event_channel *channel;
struct cmatest_node *nodes;
int conn_index;
int connects_left;
int disconnects_left;
struct rdma_addr addr;
};
static struct cmatest test;
static int connections = 1;
static int message_size = 100;
static int message_count = 10;
static uint16_t port = 7471;
static uint8_t set_tos = 0;
static uint8_t tos;
static uint8_t migrate = 0;
static char *dst_addr;
static char *src_addr;
static int create_message(struct cmatest_node *node)
{
if (!message_size)
message_count = 0;
if (!message_count)
return 0;
node->mem = malloc(message_size);
if (!node->mem) {
printf("failed message allocation\n");
return -1;
}
node->mr = ibv_reg_mr(node->pd, node->mem, message_size,
IBV_ACCESS_LOCAL_WRITE);
if (!node->mr) {
printf("failed to reg MR\n");
goto err;
}
return 0;
err:
free(node->mem);
return -1;
}
static int init_node(struct cmatest_node *node)
{
struct ibv_qp_init_attr init_qp_attr;
int cqe, ret;
node->pd = ibv_alloc_pd(node->cma_id->verbs);
if (!node->pd) {
ret = -ENOMEM;
printf("cmatose: unable to allocate PD\n");
goto out;
}
cqe = message_count ? message_count : 1;
node->cq[SEND_CQ_INDEX] = ibv_create_cq(node->cma_id->verbs, cqe, node, 0, 0);
node->cq[RECV_CQ_INDEX] = ibv_create_cq(node->cma_id->verbs, cqe, node, 0, 0);
if (!node->cq[SEND_CQ_INDEX] || !node->cq[RECV_CQ_INDEX]) {
ret = -ENOMEM;
printf("cmatose: unable to create CQ\n");
goto out;
}
memset(&init_qp_attr, 0, sizeof init_qp_attr);
init_qp_attr.cap.max_send_wr = cqe;
init_qp_attr.cap.max_recv_wr = cqe;
init_qp_attr.cap.max_send_sge = 1;
init_qp_attr.cap.max_recv_sge = 1;
init_qp_attr.qp_context = node;
init_qp_attr.sq_sig_all = 1;
init_qp_attr.qp_type = IBV_QPT_RC;
init_qp_attr.send_cq = node->cq[SEND_CQ_INDEX];
init_qp_attr.recv_cq = node->cq[RECV_CQ_INDEX];
ret = rdma_create_qp(node->cma_id, node->pd, &init_qp_attr);
if (ret) {
perror("cmatose: unable to create QP");
goto out;
}
ret = create_message(node);
if (ret) {
printf("cmatose: failed to create messages: %d\n", ret);
goto out;
}
out:
return ret;
}
static int post_recvs(struct cmatest_node *node)
{
struct ibv_recv_wr recv_wr, *recv_failure;
struct ibv_sge sge;
int i, ret = 0;
if (!message_count)
return 0;
recv_wr.next = NULL;
recv_wr.sg_list = &sge;
recv_wr.num_sge = 1;
recv_wr.wr_id = (uintptr_t) node;
sge.length = message_size;
sge.lkey = node->mr->lkey;
sge.addr = (uintptr_t) node->mem;
for (i = 0; i < message_count && !ret; i++ ) {
ret = ibv_post_recv(node->cma_id->qp, &recv_wr, &recv_failure);
if (ret) {
printf("failed to post receives: %d\n", ret);
break;
}
}
return ret;
}
static int post_sends(struct cmatest_node *node)
{
struct ibv_send_wr send_wr, *bad_send_wr;
struct ibv_sge sge;
int i, ret = 0;
if (!node->connected || !message_count)
return 0;
send_wr.next = NULL;
send_wr.sg_list = &sge;
send_wr.num_sge = 1;
send_wr.opcode = IBV_WR_SEND;
send_wr.send_flags = 0;
send_wr.wr_id = (unsigned long)node;
sge.length = message_size;
sge.lkey = node->mr->lkey;
sge.addr = (uintptr_t) node->mem;
for (i = 0; i < message_count && !ret; i++) {
ret = ibv_post_send(node->cma_id->qp, &send_wr, &bad_send_wr);
if (ret)
printf("failed to post sends: %d\n", ret);
}
return ret;
}
static void connect_error(void)
{
test.disconnects_left--;
test.connects_left--;
}
static int addr_handler(struct cmatest_node *node)
{
int ret;
if (set_tos) {
ret = rdma_set_option(node->cma_id, RDMA_OPTION_ID,
RDMA_OPTION_ID_TOS, &tos, sizeof tos);
if (ret)
perror("cmatose: set TOS option failed");
}
ret = rdma_resolve_route(node->cma_id, 2000);
if (ret) {
perror("cmatose: resolve route failed");
connect_error();
}
return ret;
}
static int route_handler(struct cmatest_node *node)
{
struct rdma_conn_param conn_param;
int ret;
ret = init_node(node);
if (ret)
goto err;
ret = post_recvs(node);
if (ret)
goto err;
memset(&conn_param, 0, sizeof conn_param);
conn_param.responder_resources = 1;
conn_param.initiator_depth = 1;
conn_param.retry_count = 5;
ret = rdma_connect(node->cma_id, &conn_param);
if (ret) {
perror("cmatose: failure connecting");
goto err;
}
return 0;
err:
connect_error();
return ret;
}
static int connect_handler(struct rdma_cm_id *cma_id)
{
struct cmatest_node *node;
struct rdma_conn_param conn_param;
int ret;
if (test.conn_index == connections) {
ret = -ENOMEM;
goto err1;
}
node = &test.nodes[test.conn_index++];
node->cma_id = cma_id;
cma_id->context = node;
ret = init_node(node);
if (ret)
goto err2;
ret = post_recvs(node);
if (ret)
goto err2;
memset(&conn_param, 0, sizeof conn_param);
conn_param.responder_resources = 1;
conn_param.initiator_depth = 1;
ret = rdma_accept(node->cma_id, &conn_param);
if (ret) {
perror("cmatose: failure accepting");
goto err2;
}
return 0;
err2:
node->cma_id = NULL;
connect_error();
err1:
printf("cmatose: failing connection request\n");
rdma_reject(cma_id, NULL, 0);
return ret;
}
static int cma_handler(struct rdma_cm_id *cma_id, struct rdma_cm_event *event)
{
int ret = 0;
switch (event->event) {
case RDMA_CM_EVENT_ADDR_RESOLVED:
ret = addr_handler(cma_id->context);
break;
case RDMA_CM_EVENT_ROUTE_RESOLVED:
ret = route_handler(cma_id->context);
break;
case RDMA_CM_EVENT_CONNECT_REQUEST:
ret = connect_handler(cma_id);
break;
case RDMA_CM_EVENT_ESTABLISHED:
((struct cmatest_node *) cma_id->context)->connected = 1;
test.connects_left--;
break;
case RDMA_CM_EVENT_ADDR_ERROR:
case RDMA_CM_EVENT_ROUTE_ERROR:
case RDMA_CM_EVENT_CONNECT_ERROR:
case RDMA_CM_EVENT_UNREACHABLE:
case RDMA_CM_EVENT_REJECTED:
printf("cmatose: event: %s, error: %d\n",
rdma_event_str(event->event), event->status);
connect_error();
break;
case RDMA_CM_EVENT_DISCONNECTED:
rdma_disconnect(cma_id);
test.disconnects_left--;
break;
case RDMA_CM_EVENT_DEVICE_REMOVAL:
/* Cleanup will occur after test completes. */
break;
default:
break;
}
return ret;
}
static void destroy_node(struct cmatest_node *node)
{
if (!node->cma_id)
return;
if (node->cma_id->qp)
rdma_destroy_qp(node->cma_id);
if (node->cq[SEND_CQ_INDEX])
ibv_destroy_cq(node->cq[SEND_CQ_INDEX]);
if (node->cq[RECV_CQ_INDEX])
ibv_destroy_cq(node->cq[RECV_CQ_INDEX]);
if (node->mem) {
ibv_dereg_mr(node->mr);
free(node->mem);
}
if (node->pd)
ibv_dealloc_pd(node->pd);
/* Destroy the RDMA ID after all device resources */
rdma_destroy_id(node->cma_id);
}
static int alloc_nodes(void)
{
int ret, i;
test.nodes = malloc(sizeof *test.nodes * connections);
if (!test.nodes) {
printf("cmatose: unable to allocate memory for test nodes\n");
return -ENOMEM;
}
memset(test.nodes, 0, sizeof *test.nodes * connections);
for (i = 0; i < connections; i++) {
test.nodes[i].id = i;
if (dst_addr) {
ret = rdma_create_id(test.channel,
&test.nodes[i].cma_id,
&test.nodes[i], RDMA_PS_TCP);
if (ret)
goto err;
}
}
return 0;
err:
while (--i >= 0)
rdma_destroy_id(test.nodes[i].cma_id);
free(test.nodes);
return ret;
}
static void destroy_nodes(void)
{
int i;
for (i = 0; i < connections; i++)
destroy_node(&test.nodes[i]);
free(test.nodes);
}
static int poll_cqs(enum CQ_INDEX index)
{
struct ibv_wc wc[8];
int done, i, ret;
for (i = 0; i < connections; i++) {
if (!test.nodes[i].connected)
continue;
for (done = 0; done < message_count; done += ret) {
ret = ibv_poll_cq(test.nodes[i].cq[index], 8, wc);
if (ret < 0) {
printf("cmatose: failed polling CQ: %d\n", ret);
return ret;
}
}
}
return 0;
}
static int connect_events(void)
{
struct rdma_cm_event *event;
int err = 0, ret = 0;
while (test.connects_left && !err) {
err = rdma_get_cm_event(test.channel, &event);
if (!err) {
cma_handler(event->id, event);
rdma_ack_cm_event(event);
} else {
perror("cmatose: failure in rdma_get_cm_event in connect events");
ret = errno;
}
}
return ret;
}
static int disconnect_events(void)
{
struct rdma_cm_event *event;
int err = 0, ret = 0;
while (test.disconnects_left && !err) {
err = rdma_get_cm_event(test.channel, &event);
if (!err) {
cma_handler(event->id, event);
rdma_ack_cm_event(event);
} else {
perror("cmatose: failure in rdma_get_cm_event in disconnect events");
ret = errno;
}
}
return ret;
}
static int migrate_channel(struct rdma_cm_id *listen_id)
{
struct rdma_event_channel *channel;
int i, ret;
printf("migrating to new event channel\n");
channel = rdma_create_event_channel();
if (!channel) {
perror("cmatose: failed to create event channel");
return -1;
}
ret = 0;
if (listen_id)
ret = rdma_migrate_id(listen_id, channel);
for (i = 0; i < connections && !ret; i++)
ret = rdma_migrate_id(test.nodes[i].cma_id, channel);
if (!ret) {
rdma_destroy_event_channel(test.channel);
test.channel = channel;
} else
perror("cmatose: failure migrating to channel");
return ret;
}
static int get_addr(char *dst, struct sockaddr *addr)
{
struct addrinfo *res;
int ret;
ret = getaddrinfo(dst, NULL, NULL, &res);
if (ret) {
printf("getaddrinfo failed - invalid hostname or IP address\n");
return ret;
}
if (res->ai_family == PF_INET)
memcpy(addr, res->ai_addr, sizeof(struct sockaddr_in));
else if (res->ai_family == PF_INET6)
memcpy(addr, res->ai_addr, sizeof(struct sockaddr_in6));
else
ret = -1;
freeaddrinfo(res);
return ret;
}
static int run_server(void)
{
struct rdma_cm_id *listen_id;
int i, ret;
printf("cmatose: starting server\n");
ret = rdma_create_id(test.channel, &listen_id, &test, RDMA_PS_TCP);
if (ret) {
perror("cmatose: listen request failed");
return ret;
}
if (src_addr) {
ret = get_addr(src_addr, &test.addr.src_addr);
if (ret)
goto out;
if (test.addr.src_addr.sa_family == AF_INET)
((struct sockaddr_in *) &test.addr.src_addr)->sin_port = port;
else
((struct sockaddr_in6 *) &test.addr.src_addr)->sin6_port = port;
} else {
test.addr.src_addr.sa_family = PF_INET;
((struct sockaddr_in *) &test.addr.src_addr)->sin_port = port;
}
ret = rdma_bind_addr(listen_id, &test.addr.src_addr);
if (ret) {
perror("cmatose: bind address failed");
goto out;
}
ret = rdma_listen(listen_id, 0);
if (ret) {
perror("cmatose: failure trying to listen");
goto out;
}
ret = connect_events();
if (ret)
goto out;
if (message_count) {
printf("initiating data transfers\n");
for (i = 0; i < connections; i++) {
ret = post_sends(&test.nodes[i]);
if (ret)
goto out;
}
printf("completing sends\n");
ret = poll_cqs(SEND_CQ_INDEX);
if (ret)
goto out;
printf("receiving data transfers\n");
ret = poll_cqs(RECV_CQ_INDEX);
if (ret)
goto out;
printf("data transfers complete\n");
}
if (migrate) {
ret = migrate_channel(listen_id);
if (ret)
goto out;
}
printf("cmatose: disconnecting\n");
for (i = 0; i < connections; i++) {
if (!test.nodes[i].connected)
continue;
test.nodes[i].connected = 0;
rdma_disconnect(test.nodes[i].cma_id);
}
ret = disconnect_events();
printf("disconnected\n");
out:
rdma_destroy_id(listen_id);
return ret;
}
static int run_client(void)
{
int i, ret, ret2;
printf("cmatose: starting client\n");
if (src_addr) {
ret = get_addr(src_addr, &test.addr.src_addr);
if (ret)
return ret;
}
ret = get_addr(dst_addr, &test.addr.dst_addr);
if (ret)
return ret;
if (test.addr.dst_addr.sa_family == AF_INET)
((struct sockaddr_in *) &test.addr.dst_addr)->sin_port = port;
else
((struct sockaddr_in6 *) &test.addr.dst_addr)->sin6_port = port;
printf("cmatose: connecting\n");
for (i = 0; i < connections; i++) {
ret = rdma_resolve_addr(test.nodes[i].cma_id,
src_addr ? &test.addr.src_addr : NULL,
&test.addr.dst_addr, 2000);
if (ret) {
perror("cmatose: failure getting addr");
connect_error();
return ret;
}
}
ret = connect_events();
if (ret)
goto disc;
if (message_count) {
printf("receiving data transfers\n");
ret = poll_cqs(RECV_CQ_INDEX);
if (ret)
goto disc;
printf("sending replies\n");
for (i = 0; i < connections; i++) {
ret = post_sends(&test.nodes[i]);
if (ret)
goto disc;
}
printf("data transfers complete\n");
}
ret = 0;
if (migrate) {
ret = migrate_channel(NULL);
if (ret)
goto out;
}
disc:
ret2 = disconnect_events();
if (ret2)
ret = ret2;
out:
return ret;
}
int main(int argc, char **argv)
{
int op, ret;
while ((op = getopt(argc, argv, "s:b:c:C:S:t:p:m")) != -1) {
switch (op) {
case 's':
dst_addr = optarg;
break;
case 'b':
src_addr = optarg;
break;
case 'c':
connections = atoi(optarg);
break;
case 'C':
message_count = atoi(optarg);
break;
case 'S':
message_size = atoi(optarg);
break;
case 't':
set_tos = 1;
tos = (uint8_t) atoi(optarg);
break;
case 'p':
port = atoi(optarg);
break;
case 'm':
migrate = 1;
break;
default:
printf("usage: %s\n", argv[0]);
printf("\t[-s server_address]\n");
printf("\t[-b bind_address]\n");
printf("\t[-c connections]\n");
printf("\t[-C message_count]\n");
printf("\t[-S message_size]\n");
printf("\t[-t type_of_service]\n");
printf("\t[-p port_number]\n");
printf("\t[-m(igrate)]\n");
exit(1);
}
}
test.connects_left = connections;
test.disconnects_left = connections;
test.channel = rdma_create_event_channel();
if (!test.channel) {
printf("failed to create event channel\n");
exit(1);
}
if (alloc_nodes())
exit(1);
if (dst_addr)
ret = run_client();
else
ret = run_server();
printf("test complete\n");
destroy_nodes();
rdma_destroy_event_channel(test.channel);
printf("return status %d\n", ret);
return ret;
}