1 /*
2 * Copyright (c) 2005-2007 Intel Corporation. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 *
32 * $Id$
33 */
34
35 #include <stdlib.h>
36 #include <string.h>
37 #include <stdio.h>
38 #include <errno.h>
39 #include <sys/types.h>
40 #include <arpa/inet.h>
41 #include <sys/socket.h>
42 #include <netdb.h>
43 #include <unistd.h>
44 #include <getopt.h>
45
46 #include <rdma/rdma_cma.h>
47 #include <infiniband/ib.h>
48
/*
 * Per-node test state: one RDMA CM identifier plus the verbs objects and
 * the message buffer created for it.
 */
struct cmatest_node {
	int			id;		/* index of this node in test.nodes */
	struct rdma_cm_id	*cma_id;
	int			connected;	/* set to 1 by join_handler() */
	struct ibv_pd		*pd;
	struct ibv_cq		*cq;		/* used as both send and receive CQ */
	struct ibv_mr		*mr;		/* registration covering mem */
	struct ibv_ah		*ah;		/* built from the join event's ah_attr */
	uint32_t		remote_qpn;	/* QP number reported by the join event */
	uint32_t		remote_qkey;	/* Q_Key reported by the join event */
	void			*mem;		/* message_size + sizeof(struct ibv_grh) bytes */
};
61
/* State shared by the whole test run. */
struct cmatest {
	struct rdma_event_channel *channel;	/* event channel of every CM id */
	pthread_t		cmathread;	/* thread running cma_thread() */
	struct cmatest_node	*nodes;		/* array with 'connections' entries */
	int			conn_index;
	int			connects_left;	/* nodes that have neither joined nor failed */

	/* Address storage and the sockaddr views passed to the CM calls. */
	struct sockaddr_storage	dst_in;
	struct sockaddr		*dst_addr;
	struct sockaddr_storage	src_in;
	struct sockaddr		*src_addr;
};
74
75 static struct cmatest test;
76 static int connections = 1;
77 static int message_size = 100;
78 static int message_count = 10;
79 static int is_sender;
80 static int unmapped_addr;
81 static char *dst_addr;
82 static char *src_addr;
83 static enum rdma_port_space port_space = RDMA_PS_UDP;
84
create_message(struct cmatest_node * node)85 static int create_message(struct cmatest_node *node)
86 {
87 if (!message_size)
88 message_count = 0;
89
90 if (!message_count)
91 return 0;
92
93 node->mem = malloc(message_size + sizeof(struct ibv_grh));
94 if (!node->mem) {
95 printf("failed message allocation\n");
96 return -1;
97 }
98 node->mr = ibv_reg_mr(node->pd, node->mem,
99 message_size + sizeof(struct ibv_grh),
100 IBV_ACCESS_LOCAL_WRITE);
101 if (!node->mr) {
102 printf("failed to reg MR\n");
103 goto err;
104 }
105 return 0;
106 err:
107 free(node->mem);
108 return -1;
109 }
110
verify_test_params(struct cmatest_node * node)111 static int verify_test_params(struct cmatest_node *node)
112 {
113 struct ibv_port_attr port_attr;
114 int ret;
115
116 ret = ibv_query_port(node->cma_id->verbs, node->cma_id->port_num,
117 &port_attr);
118 if (ret)
119 return ret;
120
121 if (message_count && message_size > (1 << (port_attr.active_mtu + 7))) {
122 printf("mckey: message_size %d is larger than active mtu %d\n",
123 message_size, 1 << (port_attr.active_mtu + 7));
124 return -EINVAL;
125 }
126
127 return 0;
128 }
129
init_node(struct cmatest_node * node)130 static int init_node(struct cmatest_node *node)
131 {
132 struct ibv_qp_init_attr init_qp_attr;
133 int cqe, ret;
134
135 node->pd = ibv_alloc_pd(node->cma_id->verbs);
136 if (!node->pd) {
137 ret = -ENOMEM;
138 printf("mckey: unable to allocate PD\n");
139 goto out;
140 }
141
142 cqe = message_count ? message_count * 2 : 2;
143 node->cq = ibv_create_cq(node->cma_id->verbs, cqe, node, NULL, 0);
144 if (!node->cq) {
145 ret = -ENOMEM;
146 printf("mckey: unable to create CQ\n");
147 goto out;
148 }
149
150 memset(&init_qp_attr, 0, sizeof init_qp_attr);
151 init_qp_attr.cap.max_send_wr = message_count ? message_count : 1;
152 init_qp_attr.cap.max_recv_wr = message_count ? message_count : 1;
153 init_qp_attr.cap.max_send_sge = 1;
154 init_qp_attr.cap.max_recv_sge = 1;
155 init_qp_attr.qp_context = node;
156 init_qp_attr.sq_sig_all = 0;
157 init_qp_attr.qp_type = IBV_QPT_UD;
158 init_qp_attr.send_cq = node->cq;
159 init_qp_attr.recv_cq = node->cq;
160 ret = rdma_create_qp(node->cma_id, node->pd, &init_qp_attr);
161 if (ret) {
162 perror("mckey: unable to create QP");
163 goto out;
164 }
165
166 ret = create_message(node);
167 if (ret) {
168 printf("mckey: failed to create messages: %d\n", ret);
169 goto out;
170 }
171 out:
172 return ret;
173 }
174
post_recvs(struct cmatest_node * node)175 static int post_recvs(struct cmatest_node *node)
176 {
177 struct ibv_recv_wr recv_wr, *recv_failure;
178 struct ibv_sge sge;
179 int i, ret = 0;
180
181 if (!message_count)
182 return 0;
183
184 recv_wr.next = NULL;
185 recv_wr.sg_list = &sge;
186 recv_wr.num_sge = 1;
187 recv_wr.wr_id = (uintptr_t) node;
188
189 sge.length = message_size + sizeof(struct ibv_grh);
190 sge.lkey = node->mr->lkey;
191 sge.addr = (uintptr_t) node->mem;
192
193 for (i = 0; i < message_count && !ret; i++ ) {
194 ret = ibv_post_recv(node->cma_id->qp, &recv_wr, &recv_failure);
195 if (ret) {
196 printf("failed to post receives: %d\n", ret);
197 break;
198 }
199 }
200 return ret;
201 }
202
post_sends(struct cmatest_node * node,int signal_flag)203 static int post_sends(struct cmatest_node *node, int signal_flag)
204 {
205 struct ibv_send_wr send_wr, *bad_send_wr;
206 struct ibv_sge sge;
207 int i, ret = 0;
208
209 if (!node->connected || !message_count)
210 return 0;
211
212 send_wr.next = NULL;
213 send_wr.sg_list = &sge;
214 send_wr.num_sge = 1;
215 send_wr.opcode = IBV_WR_SEND_WITH_IMM;
216 send_wr.send_flags = signal_flag;
217 send_wr.wr_id = (unsigned long)node;
218 send_wr.imm_data = htobe32(node->cma_id->qp->qp_num);
219
220 send_wr.wr.ud.ah = node->ah;
221 send_wr.wr.ud.remote_qpn = node->remote_qpn;
222 send_wr.wr.ud.remote_qkey = node->remote_qkey;
223
224 sge.length = message_size;
225 sge.lkey = node->mr->lkey;
226 sge.addr = (uintptr_t) node->mem;
227
228 for (i = 0; i < message_count && !ret; i++) {
229 ret = ibv_post_send(node->cma_id->qp, &send_wr, &bad_send_wr);
230 if (ret)
231 printf("failed to post sends: %d\n", ret);
232 }
233 return ret;
234 }
235
connect_error(void)236 static void connect_error(void)
237 {
238 test.connects_left--;
239 }
240
addr_handler(struct cmatest_node * node)241 static int addr_handler(struct cmatest_node *node)
242 {
243 int ret;
244
245 ret = verify_test_params(node);
246 if (ret)
247 goto err;
248
249 ret = init_node(node);
250 if (ret)
251 goto err;
252
253 if (!is_sender) {
254 ret = post_recvs(node);
255 if (ret)
256 goto err;
257 }
258
259 ret = rdma_join_multicast(node->cma_id, test.dst_addr, node);
260 if (ret) {
261 perror("mckey: failure joining");
262 goto err;
263 }
264 return 0;
265 err:
266 connect_error();
267 return ret;
268 }
269
join_handler(struct cmatest_node * node,struct rdma_ud_param * param)270 static int join_handler(struct cmatest_node *node,
271 struct rdma_ud_param *param)
272 {
273 char buf[40];
274
275 inet_ntop(AF_INET6, param->ah_attr.grh.dgid.raw, buf, 40);
276 printf("mckey: joined dgid: %s mlid 0x%x sl %d\n", buf,
277 param->ah_attr.dlid, param->ah_attr.sl);
278
279 node->remote_qpn = param->qp_num;
280 node->remote_qkey = param->qkey;
281 node->ah = ibv_create_ah(node->pd, ¶m->ah_attr);
282 if (!node->ah) {
283 printf("mckey: failure creating address handle\n");
284 goto err;
285 }
286
287 node->connected = 1;
288 test.connects_left--;
289 return 0;
290 err:
291 connect_error();
292 return -1;
293 }
294
cma_handler(struct rdma_cm_id * cma_id,struct rdma_cm_event * event)295 static int cma_handler(struct rdma_cm_id *cma_id, struct rdma_cm_event *event)
296 {
297 int ret = 0;
298
299 switch (event->event) {
300 case RDMA_CM_EVENT_ADDR_RESOLVED:
301 ret = addr_handler(cma_id->context);
302 break;
303 case RDMA_CM_EVENT_MULTICAST_JOIN:
304 ret = join_handler(cma_id->context, &event->param.ud);
305 break;
306 case RDMA_CM_EVENT_ADDR_ERROR:
307 case RDMA_CM_EVENT_ROUTE_ERROR:
308 case RDMA_CM_EVENT_MULTICAST_ERROR:
309 printf("mckey: event: %s, error: %d\n",
310 rdma_event_str(event->event), event->status);
311 connect_error();
312 ret = event->status;
313 break;
314 case RDMA_CM_EVENT_DEVICE_REMOVAL:
315 /* Cleanup will occur after test completes. */
316 break;
317 default:
318 break;
319 }
320 return ret;
321 }
322
cma_thread(void * arg)323 static void *cma_thread(void *arg)
324 {
325 struct rdma_cm_event *event;
326 int ret;
327
328 while (1) {
329 ret = rdma_get_cm_event(test.channel, &event);
330 if (ret) {
331 perror("rdma_get_cm_event");
332 break;
333 }
334
335 switch (event->event) {
336 case RDMA_CM_EVENT_MULTICAST_ERROR:
337 case RDMA_CM_EVENT_ADDR_CHANGE:
338 printf("mckey: event: %s, status: %d\n",
339 rdma_event_str(event->event), event->status);
340 break;
341 default:
342 break;
343 }
344
345 rdma_ack_cm_event(event);
346 }
347 return NULL;
348 }
349
destroy_node(struct cmatest_node * node)350 static void destroy_node(struct cmatest_node *node)
351 {
352 if (!node->cma_id)
353 return;
354
355 if (node->ah)
356 ibv_destroy_ah(node->ah);
357
358 if (node->cma_id->qp)
359 rdma_destroy_qp(node->cma_id);
360
361 if (node->cq)
362 ibv_destroy_cq(node->cq);
363
364 if (node->mem) {
365 ibv_dereg_mr(node->mr);
366 free(node->mem);
367 }
368
369 if (node->pd)
370 ibv_dealloc_pd(node->pd);
371
372 /* Destroy the RDMA ID after all device resources */
373 rdma_destroy_id(node->cma_id);
374 }
375
alloc_nodes(void)376 static int alloc_nodes(void)
377 {
378 int ret, i;
379
380 test.nodes = malloc(sizeof *test.nodes * connections);
381 if (!test.nodes) {
382 printf("mckey: unable to allocate memory for test nodes\n");
383 return -ENOMEM;
384 }
385 memset(test.nodes, 0, sizeof *test.nodes * connections);
386
387 for (i = 0; i < connections; i++) {
388 test.nodes[i].id = i;
389 ret = rdma_create_id(test.channel, &test.nodes[i].cma_id,
390 &test.nodes[i], port_space);
391 if (ret)
392 goto err;
393 }
394 return 0;
395 err:
396 while (--i >= 0)
397 rdma_destroy_id(test.nodes[i].cma_id);
398 free(test.nodes);
399 return ret;
400 }
401
destroy_nodes(void)402 static void destroy_nodes(void)
403 {
404 int i;
405
406 for (i = 0; i < connections; i++)
407 destroy_node(&test.nodes[i]);
408 free(test.nodes);
409 }
410
poll_cqs(void)411 static int poll_cqs(void)
412 {
413 struct ibv_wc wc[8];
414 int done, i, ret;
415
416 for (i = 0; i < connections; i++) {
417 if (!test.nodes[i].connected)
418 continue;
419
420 for (done = 0; done < message_count; done += ret) {
421 ret = ibv_poll_cq(test.nodes[i].cq, 8, wc);
422 if (ret < 0) {
423 printf("mckey: failed polling CQ: %d\n", ret);
424 return ret;
425 }
426 }
427 }
428 return 0;
429 }
430
connect_events(void)431 static int connect_events(void)
432 {
433 struct rdma_cm_event *event;
434 int ret = 0;
435
436 while (test.connects_left && !ret) {
437 ret = rdma_get_cm_event(test.channel, &event);
438 if (!ret) {
439 ret = cma_handler(event->id, event);
440 rdma_ack_cm_event(event);
441 }
442 }
443 return ret;
444 }
445
/*
 * Resolve a host name or address string with getaddrinfo() and copy the
 * first result into addr.  The caller must supply storage large enough
 * for the resolved address.
 *
 * Returns 0 on success or the getaddrinfo() error code, after printing a
 * diagnostic.
 */
static int get_addr(char *dst, struct sockaddr *addr)
{
	struct addrinfo *info;
	int rc = getaddrinfo(dst, NULL, NULL, &info);

	if (rc != 0) {
		printf("getaddrinfo failed (%s) - invalid hostname or IP address\n", gai_strerror(rc));
		return rc;
	}

	memcpy(addr, info->ai_addr, info->ai_addrlen);
	freeaddrinfo(info);
	return 0;
}
461
get_dst_addr(char * dst,struct sockaddr * addr)462 static int get_dst_addr(char *dst, struct sockaddr *addr)
463 {
464 struct sockaddr_ib *sib;
465
466 if (!unmapped_addr)
467 return get_addr(dst, addr);
468
469 sib = (struct sockaddr_ib *) addr;
470 memset(sib, 0, sizeof *sib);
471 sib->sib_family = AF_IB;
472 return inet_pton(AF_INET6, dst, &sib->sib_addr) != 1;
473 }
474
run(void)475 static int run(void)
476 {
477 int i, ret, err;
478
479 printf("mckey: starting %s\n", is_sender ? "client" : "server");
480 if (src_addr) {
481 ret = get_addr(src_addr, (struct sockaddr *) &test.src_in);
482 if (ret)
483 return ret;
484 }
485
486 ret = get_dst_addr(dst_addr, (struct sockaddr *) &test.dst_in);
487 if (ret)
488 return ret;
489
490 printf("mckey: joining\n");
491 for (i = 0; i < connections; i++) {
492 if (src_addr) {
493 ret = rdma_bind_addr(test.nodes[i].cma_id,
494 test.src_addr);
495 if (ret) {
496 perror("mckey: addr bind failure");
497 connect_error();
498 return ret;
499 }
500 }
501
502 if (unmapped_addr)
503 ret = addr_handler(&test.nodes[i]);
504 else
505 ret = rdma_resolve_addr(test.nodes[i].cma_id,
506 test.src_addr, test.dst_addr,
507 2000);
508 if (ret) {
509 perror("mckey: resolve addr failure");
510 connect_error();
511 return ret;
512 }
513 }
514
515 ret = connect_events();
516 if (ret)
517 goto out;
518
519 pthread_create(&test.cmathread, NULL, cma_thread, NULL);
520
521 /*
522 * Pause to give SM chance to configure switches. We don't want to
523 * handle reliability issue in this simple test program.
524 */
525 sleep(3);
526
527 if (message_count) {
528 if (is_sender) {
529 printf("initiating data transfers\n");
530 for (i = 0; i < connections; i++) {
531 ret = post_sends(&test.nodes[i], 0);
532 if (ret)
533 goto out;
534 }
535 } else {
536 printf("receiving data transfers\n");
537 ret = poll_cqs();
538 if (ret)
539 goto out;
540 }
541 printf("data transfers complete\n");
542 }
543 out:
544 for (i = 0; i < connections; i++) {
545 err = rdma_leave_multicast(test.nodes[i].cma_id,
546 test.dst_addr);
547 if (err) {
548 perror("mckey: failure leaving");
549 ret = err;
550 }
551 }
552 return ret;
553 }
554
main(int argc,char ** argv)555 int main(int argc, char **argv)
556 {
557 int op, ret;
558
559
560 while ((op = getopt(argc, argv, "m:M:sb:c:C:S:p:")) != -1) {
561 switch (op) {
562 case 'm':
563 dst_addr = optarg;
564 break;
565 case 'M':
566 unmapped_addr = 1;
567 dst_addr = optarg;
568 break;
569 case 's':
570 is_sender = 1;
571 break;
572 case 'b':
573 src_addr = optarg;
574 test.src_addr = (struct sockaddr *) &test.src_in;
575 break;
576 case 'c':
577 connections = atoi(optarg);
578 break;
579 case 'C':
580 message_count = atoi(optarg);
581 break;
582 case 'S':
583 message_size = atoi(optarg);
584 break;
585 case 'p':
586 port_space = strtol(optarg, NULL, 0);
587 break;
588 default:
589 printf("usage: %s\n", argv[0]);
590 printf("\t-m multicast_address\n");
591 printf("\t[-M unmapped_multicast_address]\n"
592 "\t replaces -m and requires -b\n");
593 printf("\t[-s(ender)]\n");
594 printf("\t[-b bind_address]\n");
595 printf("\t[-c connections]\n");
596 printf("\t[-C message_count]\n");
597 printf("\t[-S message_size]\n");
598 printf("\t[-p port_space - %#x for UDP (default), "
599 "%#x for IPOIB]\n", RDMA_PS_UDP, RDMA_PS_IPOIB);
600 exit(1);
601 }
602 }
603
604 if (unmapped_addr && !src_addr) {
605 printf("unmapped multicast address requires binding "
606 "to source address\n");
607 exit(1);
608 }
609
610 test.dst_addr = (struct sockaddr *) &test.dst_in;
611 test.connects_left = connections;
612
613 test.channel = rdma_create_event_channel();
614 if (!test.channel) {
615 perror("failed to create event channel");
616 exit(1);
617 }
618
619 if (alloc_nodes())
620 exit(1);
621
622 ret = run();
623
624 printf("test complete\n");
625 destroy_nodes();
626 rdma_destroy_event_channel(test.channel);
627
628 printf("return status %d\n", ret);
629 return ret;
630 }
631