xref: /freebsd/contrib/ofed/librdmacm/examples/mckey.c (revision fed1ca4b719c56c930f2259d80663cd34be812bb)
1 /*
2  * Copyright (c) 2005-2007 Intel Corporation.  All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  *
32  * $Id$
33  */
34 
35 #include <stdlib.h>
36 #include <string.h>
37 #include <stdio.h>
38 #include <errno.h>
39 #include <sys/types.h>
40 #include <netinet/in.h>
41 #include <arpa/inet.h>
42 #include <sys/socket.h>
43 #include <netdb.h>
44 #include <byteswap.h>
45 #include <unistd.h>
46 #include <getopt.h>
47 
48 #include <rdma/rdma_cma.h>
49 
50 struct cmatest_node {
51 	int			id;
52 	struct rdma_cm_id	*cma_id;
53 	int			connected;
54 	struct ibv_pd		*pd;
55 	struct ibv_cq		*cq;
56 	struct ibv_mr		*mr;
57 	struct ibv_ah		*ah;
58 	uint32_t		remote_qpn;
59 	uint32_t		remote_qkey;
60 	void			*mem;
61 };
62 
63 struct cmatest {
64 	struct rdma_event_channel *channel;
65 	pthread_t 		cmathread;
66 	struct cmatest_node	*nodes;
67 	int			conn_index;
68 	int			connects_left;
69 
70 	struct sockaddr_in6	dst_in;
71 	struct sockaddr		*dst_addr;
72 	struct sockaddr_in6	src_in;
73 	struct sockaddr		*src_addr;
74 };
75 
76 static struct cmatest test;
77 static int connections = 1;
78 static int message_size = 100;
79 static int message_count = 10;
80 static int is_sender;
81 static int unmapped_addr;
82 static char *dst_addr;
83 static char *src_addr;
84 static enum rdma_port_space port_space = RDMA_PS_UDP;
85 
86 static int create_message(struct cmatest_node *node)
87 {
88 	if (!message_size)
89 		message_count = 0;
90 
91 	if (!message_count)
92 		return 0;
93 
94 	node->mem = malloc(message_size + sizeof(struct ibv_grh));
95 	if (!node->mem) {
96 		printf("failed message allocation\n");
97 		return -1;
98 	}
99 	node->mr = ibv_reg_mr(node->pd, node->mem,
100 			      message_size + sizeof(struct ibv_grh),
101 			      IBV_ACCESS_LOCAL_WRITE);
102 	if (!node->mr) {
103 		printf("failed to reg MR\n");
104 		goto err;
105 	}
106 	return 0;
107 err:
108 	free(node->mem);
109 	return -1;
110 }
111 
112 static int verify_test_params(struct cmatest_node *node)
113 {
114 	struct ibv_port_attr port_attr;
115 	int ret;
116 
117 	ret = ibv_query_port(node->cma_id->verbs, node->cma_id->port_num,
118 			     &port_attr);
119 	if (ret)
120 		return ret;
121 
122 	if (message_count && message_size > (1 << (port_attr.active_mtu + 7))) {
123 		printf("mckey: message_size %d is larger than active mtu %d\n",
124 		       message_size, 1 << (port_attr.active_mtu + 7));
125 		return -EINVAL;
126 	}
127 
128 	return 0;
129 }
130 
131 static int init_node(struct cmatest_node *node)
132 {
133 	struct ibv_qp_init_attr init_qp_attr;
134 	int cqe, ret;
135 
136 	node->pd = ibv_alloc_pd(node->cma_id->verbs);
137 	if (!node->pd) {
138 		ret = -ENOMEM;
139 		printf("mckey: unable to allocate PD\n");
140 		goto out;
141 	}
142 
143 	cqe = message_count ? message_count * 2 : 2;
144 	node->cq = ibv_create_cq(node->cma_id->verbs, cqe, node, 0, 0);
145 	if (!node->cq) {
146 		ret = -ENOMEM;
147 		printf("mckey: unable to create CQ\n");
148 		goto out;
149 	}
150 
151 	memset(&init_qp_attr, 0, sizeof init_qp_attr);
152 	init_qp_attr.cap.max_send_wr = message_count ? message_count : 1;
153 	init_qp_attr.cap.max_recv_wr = message_count ? message_count : 1;
154 	init_qp_attr.cap.max_send_sge = 1;
155 	init_qp_attr.cap.max_recv_sge = 1;
156 	init_qp_attr.qp_context = node;
157 	init_qp_attr.sq_sig_all = 0;
158 	init_qp_attr.qp_type = IBV_QPT_UD;
159 	init_qp_attr.send_cq = node->cq;
160 	init_qp_attr.recv_cq = node->cq;
161 	ret = rdma_create_qp(node->cma_id, node->pd, &init_qp_attr);
162 	if (ret) {
163 		perror("mckey: unable to create QP");
164 		goto out;
165 	}
166 
167 	ret = create_message(node);
168 	if (ret) {
169 		printf("mckey: failed to create messages: %d\n", ret);
170 		goto out;
171 	}
172 out:
173 	return ret;
174 }
175 
176 static int post_recvs(struct cmatest_node *node)
177 {
178 	struct ibv_recv_wr recv_wr, *recv_failure;
179 	struct ibv_sge sge;
180 	int i, ret = 0;
181 
182 	if (!message_count)
183 		return 0;
184 
185 	recv_wr.next = NULL;
186 	recv_wr.sg_list = &sge;
187 	recv_wr.num_sge = 1;
188 	recv_wr.wr_id = (uintptr_t) node;
189 
190 	sge.length = message_size + sizeof(struct ibv_grh);
191 	sge.lkey = node->mr->lkey;
192 	sge.addr = (uintptr_t) node->mem;
193 
194 	for (i = 0; i < message_count && !ret; i++ ) {
195 		ret = ibv_post_recv(node->cma_id->qp, &recv_wr, &recv_failure);
196 		if (ret) {
197 			printf("failed to post receives: %d\n", ret);
198 			break;
199 		}
200 	}
201 	return ret;
202 }
203 
204 static int post_sends(struct cmatest_node *node, int signal_flag)
205 {
206 	struct ibv_send_wr send_wr, *bad_send_wr;
207 	struct ibv_sge sge;
208 	int i, ret = 0;
209 
210 	if (!node->connected || !message_count)
211 		return 0;
212 
213 	send_wr.next = NULL;
214 	send_wr.sg_list = &sge;
215 	send_wr.num_sge = 1;
216 	send_wr.opcode = IBV_WR_SEND_WITH_IMM;
217 	send_wr.send_flags = signal_flag;
218 	send_wr.wr_id = (unsigned long)node;
219 	send_wr.imm_data = htonl(node->cma_id->qp->qp_num);
220 
221 	send_wr.wr.ud.ah = node->ah;
222 	send_wr.wr.ud.remote_qpn = node->remote_qpn;
223 	send_wr.wr.ud.remote_qkey = node->remote_qkey;
224 
225 	sge.length = message_size;
226 	sge.lkey = node->mr->lkey;
227 	sge.addr = (uintptr_t) node->mem;
228 
229 	for (i = 0; i < message_count && !ret; i++) {
230 		ret = ibv_post_send(node->cma_id->qp, &send_wr, &bad_send_wr);
231 		if (ret)
232 			printf("failed to post sends: %d\n", ret);
233 	}
234 	return ret;
235 }
236 
237 static void connect_error(void)
238 {
239 	test.connects_left--;
240 }
241 
242 static int addr_handler(struct cmatest_node *node)
243 {
244 	int ret;
245 
246 	ret = verify_test_params(node);
247 	if (ret)
248 		goto err;
249 
250 	ret = init_node(node);
251 	if (ret)
252 		goto err;
253 
254 	if (!is_sender) {
255 		ret = post_recvs(node);
256 		if (ret)
257 			goto err;
258 	}
259 
260 	ret = rdma_join_multicast(node->cma_id, test.dst_addr, node);
261 	if (ret) {
262 		perror("mckey: failure joining");
263 		goto err;
264 	}
265 	return 0;
266 err:
267 	connect_error();
268 	return ret;
269 }
270 
271 static int join_handler(struct cmatest_node *node,
272 			struct rdma_ud_param *param)
273 {
274 	char buf[40];
275 
276 	inet_ntop(AF_INET6, param->ah_attr.grh.dgid.raw, buf, 40);
277 	printf("mckey: joined dgid: %s mlid 0x%x sl %d\n", buf,
278 		param->ah_attr.dlid, param->ah_attr.sl);
279 
280 	node->remote_qpn = param->qp_num;
281 	node->remote_qkey = param->qkey;
282 	node->ah = ibv_create_ah(node->pd, &param->ah_attr);
283 	if (!node->ah) {
284 		printf("mckey: failure creating address handle\n");
285 		goto err;
286 	}
287 
288 	node->connected = 1;
289 	test.connects_left--;
290 	return 0;
291 err:
292 	connect_error();
293 	return -1;
294 }
295 
296 static int cma_handler(struct rdma_cm_id *cma_id, struct rdma_cm_event *event)
297 {
298 	int ret = 0;
299 
300 	switch (event->event) {
301 	case RDMA_CM_EVENT_ADDR_RESOLVED:
302 		ret = addr_handler(cma_id->context);
303 		break;
304 	case RDMA_CM_EVENT_MULTICAST_JOIN:
305 		ret = join_handler(cma_id->context, &event->param.ud);
306 		break;
307 	case RDMA_CM_EVENT_ADDR_ERROR:
308 	case RDMA_CM_EVENT_ROUTE_ERROR:
309 	case RDMA_CM_EVENT_MULTICAST_ERROR:
310 		printf("mckey: event: %s, error: %d\n",
311 		       rdma_event_str(event->event), event->status);
312 		connect_error();
313 		ret = event->status;
314 		break;
315 	case RDMA_CM_EVENT_DEVICE_REMOVAL:
316 		/* Cleanup will occur after test completes. */
317 		break;
318 	default:
319 		break;
320 	}
321 	return ret;
322 }
323 
324 static void *cma_thread(void *arg)
325 {
326 	struct rdma_cm_event *event;
327 	int ret;
328 
329 	while (1) {
330 		ret = rdma_get_cm_event(test.channel, &event);
331 		if (ret) {
332 			perror("rdma_get_cm_event");
333 			break;
334 		}
335 
336 		switch (event->event) {
337 		case RDMA_CM_EVENT_MULTICAST_ERROR:
338 		case RDMA_CM_EVENT_ADDR_CHANGE:
339 			printf("mckey: event: %s, status: %d\n",
340 			       rdma_event_str(event->event), event->status);
341 			break;
342 		default:
343 			break;
344 		}
345 
346 		rdma_ack_cm_event(event);
347 	}
348 	return NULL;
349 }
350 
351 static void destroy_node(struct cmatest_node *node)
352 {
353 	if (!node->cma_id)
354 		return;
355 
356 	if (node->ah)
357 		ibv_destroy_ah(node->ah);
358 
359 	if (node->cma_id->qp)
360 		rdma_destroy_qp(node->cma_id);
361 
362 	if (node->cq)
363 		ibv_destroy_cq(node->cq);
364 
365 	if (node->mem) {
366 		ibv_dereg_mr(node->mr);
367 		free(node->mem);
368 	}
369 
370 	if (node->pd)
371 		ibv_dealloc_pd(node->pd);
372 
373 	/* Destroy the RDMA ID after all device resources */
374 	rdma_destroy_id(node->cma_id);
375 }
376 
377 static int alloc_nodes(void)
378 {
379 	int ret, i;
380 
381 	test.nodes = malloc(sizeof *test.nodes * connections);
382 	if (!test.nodes) {
383 		printf("mckey: unable to allocate memory for test nodes\n");
384 		return -ENOMEM;
385 	}
386 	memset(test.nodes, 0, sizeof *test.nodes * connections);
387 
388 	for (i = 0; i < connections; i++) {
389 		test.nodes[i].id = i;
390 		ret = rdma_create_id(test.channel, &test.nodes[i].cma_id,
391 				     &test.nodes[i], port_space);
392 		if (ret)
393 			goto err;
394 	}
395 	return 0;
396 err:
397 	while (--i >= 0)
398 		rdma_destroy_id(test.nodes[i].cma_id);
399 	free(test.nodes);
400 	return ret;
401 }
402 
403 static void destroy_nodes(void)
404 {
405 	int i;
406 
407 	for (i = 0; i < connections; i++)
408 		destroy_node(&test.nodes[i]);
409 	free(test.nodes);
410 }
411 
412 static int poll_cqs(void)
413 {
414 	struct ibv_wc wc[8];
415 	int done, i, ret;
416 
417 	for (i = 0; i < connections; i++) {
418 		if (!test.nodes[i].connected)
419 			continue;
420 
421 		for (done = 0; done < message_count; done += ret) {
422 			ret = ibv_poll_cq(test.nodes[i].cq, 8, wc);
423 			if (ret < 0) {
424 				printf("mckey: failed polling CQ: %d\n", ret);
425 				return ret;
426 			}
427 		}
428 	}
429 	return 0;
430 }
431 
432 static int connect_events(void)
433 {
434 	struct rdma_cm_event *event;
435 	int ret = 0;
436 
437 	while (test.connects_left && !ret) {
438 		ret = rdma_get_cm_event(test.channel, &event);
439 		if (!ret) {
440 			ret = cma_handler(event->id, event);
441 			rdma_ack_cm_event(event);
442 		}
443 	}
444 	return ret;
445 }
446 
447 static int get_addr(char *dst, struct sockaddr *addr)
448 {
449 	struct addrinfo *res;
450 	int ret;
451 
452 	ret = getaddrinfo(dst, NULL, NULL, &res);
453 	if (ret) {
454 		printf("getaddrinfo failed - invalid hostname or IP address\n");
455 		return ret;
456 	}
457 
458 	memcpy(addr, res->ai_addr, res->ai_addrlen);
459 	freeaddrinfo(res);
460 	return ret;
461 }
462 
463 static int run(void)
464 {
465 	int i, ret;
466 
467 	printf("mckey: starting %s\n", is_sender ? "client" : "server");
468 	if (src_addr) {
469 		ret = get_addr(src_addr, (struct sockaddr *) &test.src_in);
470 		if (ret)
471 			return ret;
472 	}
473 
474 	ret = get_addr(dst_addr, (struct sockaddr *) &test.dst_in);
475 	if (ret)
476 		return ret;
477 
478 	printf("mckey: joining\n");
479 	for (i = 0; i < connections; i++) {
480 		if (src_addr) {
481 			ret = rdma_bind_addr(test.nodes[i].cma_id,
482 					     test.src_addr);
483 			if (ret) {
484 				perror("mckey: addr bind failure");
485 				connect_error();
486 				return ret;
487 			}
488 		}
489 
490 		if (unmapped_addr)
491 			ret = addr_handler(&test.nodes[i]);
492 		else
493 			ret = rdma_resolve_addr(test.nodes[i].cma_id,
494 						test.src_addr, test.dst_addr,
495 						2000);
496 		if (ret) {
497 			perror("mckey: resolve addr failure");
498 			connect_error();
499 			return ret;
500 		}
501 	}
502 
503 	ret = connect_events();
504 	if (ret)
505 		goto out;
506 
507 	pthread_create(&test.cmathread, NULL, cma_thread, NULL);
508 
509 	/*
510 	 * Pause to give SM chance to configure switches.  We don't want to
511 	 * handle reliability issue in this simple test program.
512 	 */
513 	sleep(3);
514 
515 	if (message_count) {
516 		if (is_sender) {
517 			printf("initiating data transfers\n");
518 			for (i = 0; i < connections; i++) {
519 				ret = post_sends(&test.nodes[i], 0);
520 				if (ret)
521 					goto out;
522 			}
523 		} else {
524 			printf("receiving data transfers\n");
525 			ret = poll_cqs();
526 			if (ret)
527 				goto out;
528 		}
529 		printf("data transfers complete\n");
530 	}
531 out:
532 	for (i = 0; i < connections; i++) {
533 		ret = rdma_leave_multicast(test.nodes[i].cma_id,
534 					   test.dst_addr);
535 		if (ret)
536 			perror("mckey: failure leaving");
537 	}
538 	return ret;
539 }
540 
541 int main(int argc, char **argv)
542 {
543 	int op, ret;
544 
545 
546 	while ((op = getopt(argc, argv, "m:M:sb:c:C:S:p:")) != -1) {
547 		switch (op) {
548 		case 'm':
549 			dst_addr = optarg;
550 			break;
551 		case 'M':
552 			unmapped_addr = 1;
553 			dst_addr = optarg;
554 			break;
555 		case 's':
556 			is_sender = 1;
557 			break;
558 		case 'b':
559 			src_addr = optarg;
560 			test.src_addr = (struct sockaddr *) &test.src_in;
561 			break;
562 		case 'c':
563 			connections = atoi(optarg);
564 			break;
565 		case 'C':
566 			message_count = atoi(optarg);
567 			break;
568 		case 'S':
569 			message_size = atoi(optarg);
570 			break;
571 		case 'p':
572 			port_space = strtol(optarg, NULL, 0);
573 			break;
574 		default:
575 			printf("usage: %s\n", argv[0]);
576 			printf("\t-m multicast_address\n");
577 			printf("\t[-M unmapped_multicast_address]\n"
578 			       "\t replaces -m and requires -b\n");
579 			printf("\t[-s(ender)]\n");
580 			printf("\t[-b bind_address]\n");
581 			printf("\t[-c connections]\n");
582 			printf("\t[-C message_count]\n");
583 			printf("\t[-S message_size]\n");
584 			printf("\t[-p port_space - %#x for UDP (default), "
585 			       "%#x for IPOIB]\n", RDMA_PS_UDP, RDMA_PS_IPOIB);
586 			exit(1);
587 		}
588 	}
589 
590 	if (unmapped_addr && !src_addr) {
591 		printf("unmapped multicast address requires binding "
592 			"to source address\n");
593 		exit(1);
594 	}
595 
596 	test.dst_addr = (struct sockaddr *) &test.dst_in;
597 	test.connects_left = connections;
598 
599 	test.channel = rdma_create_event_channel();
600 	if (!test.channel) {
601 		perror("failed to create event channel");
602 		exit(1);
603 	}
604 
605 	if (alloc_nodes())
606 		exit(1);
607 
608 	ret = run();
609 
610 	printf("test complete\n");
611 	destroy_nodes();
612 	rdma_destroy_event_channel(test.channel);
613 
614 	printf("return status %d\n", ret);
615 	return ret;
616 }
617