1 /* 2 * Copyright (c) 2005 Topspin Communications. All rights reserved. 3 * Copyright (c) 2005, 2006, 2007 Cisco Systems. All rights reserved. 4 * Copyright (c) 2005 PathScale, Inc. All rights reserved. 5 * Copyright (c) 2006 Mellanox Technologies. All rights reserved. 6 * 7 * This software is available to you under a choice of one of two 8 * licenses. You may choose to be licensed under the terms of the GNU 9 * General Public License (GPL) Version 2, available from the file 10 * COPYING in the main directory of this source tree, or the 11 * OpenIB.org BSD license below: 12 * 13 * Redistribution and use in source and binary forms, with or 14 * without modification, are permitted provided that the following 15 * conditions are met: 16 * 17 * - Redistributions of source code must retain the above 18 * copyright notice, this list of conditions and the following 19 * disclaimer. 20 * 21 * - Redistributions in binary form must reproduce the above 22 * copyright notice, this list of conditions and the following 23 * disclaimer in the documentation and/or other materials 24 * provided with the distribution. 25 * 26 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 27 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 28 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 29 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 30 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 31 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 32 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 33 * SOFTWARE. 
34 */ 35 36 #include <linux/file.h> 37 #include <linux/fs.h> 38 #include <linux/slab.h> 39 #include <linux/sched.h> 40 41 #include <linux/uaccess.h> 42 43 #include <rdma/uverbs_types.h> 44 #include <rdma/uverbs_std_types.h> 45 #include <rdma/ib_ucaps.h> 46 #include "rdma_core.h" 47 48 #include "uverbs.h" 49 #include "core_priv.h" 50 51 /* 52 * Copy a response to userspace. If the provided 'resp' is larger than the 53 * user buffer it is silently truncated. If the user provided a larger buffer 54 * then the trailing portion is zero filled. 55 * 56 * These semantics are intended to support future extension of the output 57 * structures. 58 */ 59 static int uverbs_response(struct uverbs_attr_bundle *attrs, const void *resp, 60 size_t resp_len) 61 { 62 int ret; 63 64 if (uverbs_attr_is_valid(attrs, UVERBS_ATTR_CORE_OUT)) 65 return uverbs_copy_to_struct_or_zero( 66 attrs, UVERBS_ATTR_CORE_OUT, resp, resp_len); 67 68 if (copy_to_user(attrs->ucore.outbuf, resp, 69 min(attrs->ucore.outlen, resp_len))) 70 return -EFAULT; 71 72 if (resp_len < attrs->ucore.outlen) { 73 /* 74 * Zero fill any extra memory that user 75 * space might have provided. 76 */ 77 ret = clear_user(attrs->ucore.outbuf + resp_len, 78 attrs->ucore.outlen - resp_len); 79 if (ret) 80 return -EFAULT; 81 } 82 83 return 0; 84 } 85 86 static int uverbs_request(struct uverbs_attr_bundle *attrs, void *req, 87 size_t req_len) 88 { 89 int ret; 90 91 ret = copy_struct_from_user(req, req_len, attrs->ucore.inbuf, 92 attrs->ucore.inlen); 93 if (ret == -E2BIG) 94 ret = -EOPNOTSUPP; 95 return ret; 96 } 97 98 /* 99 * Generate the value for the 'response_length' protocol used by write_ex. 100 * This is the number of bytes the kernel actually wrote. Userspace can use 101 * this to detect what structure members in the response the kernel 102 * understood. 
103 */ 104 static u32 uverbs_response_length(struct uverbs_attr_bundle *attrs, 105 size_t resp_len) 106 { 107 return min_t(size_t, attrs->ucore.outlen, resp_len); 108 } 109 110 /* 111 * The iterator version of the request interface is for handlers that need to 112 * step over a flex array at the end of a command header. 113 */ 114 struct uverbs_req_iter { 115 const void __user *cur; 116 const void __user *end; 117 }; 118 119 static int uverbs_request_start(struct uverbs_attr_bundle *attrs, 120 struct uverbs_req_iter *iter, 121 void *req, 122 size_t req_len) 123 { 124 if (attrs->ucore.inlen < req_len) 125 return -ENOSPC; 126 127 if (copy_from_user(req, attrs->ucore.inbuf, req_len)) 128 return -EFAULT; 129 130 iter->cur = attrs->ucore.inbuf + req_len; 131 iter->end = attrs->ucore.inbuf + attrs->ucore.inlen; 132 return 0; 133 } 134 135 static int uverbs_request_next(struct uverbs_req_iter *iter, void *val, 136 size_t len) 137 { 138 if (iter->cur + len > iter->end) 139 return -ENOSPC; 140 141 if (copy_from_user(val, iter->cur, len)) 142 return -EFAULT; 143 144 iter->cur += len; 145 return 0; 146 } 147 148 static const void __user *uverbs_request_next_ptr(struct uverbs_req_iter *iter, 149 size_t len) 150 { 151 const void __user *res = iter->cur; 152 153 if (len > iter->end - iter->cur) 154 return (void __force __user *)ERR_PTR(-ENOSPC); 155 iter->cur += len; 156 return res; 157 } 158 159 static int uverbs_request_finish(struct uverbs_req_iter *iter) 160 { 161 if (!ib_is_buffer_cleared(iter->cur, iter->end - iter->cur)) 162 return -EOPNOTSUPP; 163 return 0; 164 } 165 166 /* 167 * When calling a destroy function during an error unwind we need to pass in 168 * the udata that is sanitized of all user arguments. Ie from the driver 169 * perspective it looks like no udata was passed. 
170 */ 171 struct ib_udata *uverbs_get_cleared_udata(struct uverbs_attr_bundle *attrs) 172 { 173 attrs->driver_udata = (struct ib_udata){}; 174 return &attrs->driver_udata; 175 } 176 177 static struct ib_uverbs_completion_event_file * 178 _ib_uverbs_lookup_comp_file(s32 fd, struct uverbs_attr_bundle *attrs) 179 { 180 struct ib_uobject *uobj = ufd_get_read(UVERBS_OBJECT_COMP_CHANNEL, 181 fd, attrs); 182 183 if (IS_ERR(uobj)) 184 return ERR_CAST(uobj); 185 186 uverbs_uobject_get(uobj); 187 uobj_put_read(uobj); 188 189 return container_of(uobj, struct ib_uverbs_completion_event_file, 190 uobj); 191 } 192 #define ib_uverbs_lookup_comp_file(_fd, _ufile) \ 193 _ib_uverbs_lookup_comp_file((_fd)*typecheck(s32, _fd), _ufile) 194 195 int ib_alloc_ucontext(struct uverbs_attr_bundle *attrs) 196 { 197 struct ib_uverbs_file *ufile = attrs->ufile; 198 struct ib_ucontext *ucontext; 199 struct ib_device *ib_dev; 200 201 ib_dev = srcu_dereference(ufile->device->ib_dev, 202 &ufile->device->disassociate_srcu); 203 if (!ib_dev) 204 return -EIO; 205 206 ucontext = rdma_zalloc_drv_obj(ib_dev, ib_ucontext); 207 if (!ucontext) 208 return -ENOMEM; 209 210 ucontext->device = ib_dev; 211 ucontext->ufile = ufile; 212 xa_init_flags(&ucontext->mmap_xa, XA_FLAGS_ALLOC); 213 214 rdma_restrack_new(&ucontext->res, RDMA_RESTRACK_CTX); 215 rdma_restrack_set_name(&ucontext->res, NULL); 216 attrs->context = ucontext; 217 return 0; 218 } 219 220 int ib_init_ucontext(struct uverbs_attr_bundle *attrs) 221 { 222 struct ib_ucontext *ucontext = attrs->context; 223 struct ib_uverbs_file *file = attrs->ufile; 224 int *fd_array; 225 int fd_count; 226 int ret; 227 228 if (!down_read_trylock(&file->hw_destroy_rwsem)) 229 return -EIO; 230 mutex_lock(&file->ucontext_lock); 231 if (file->ucontext) { 232 ret = -EINVAL; 233 goto err; 234 } 235 236 ret = ib_rdmacg_try_charge(&ucontext->cg_obj, ucontext->device, 237 RDMACG_RESOURCE_HCA_HANDLE); 238 if (ret) 239 goto err; 240 241 if (uverbs_attr_is_valid(attrs, 
UVERBS_ATTR_GET_CONTEXT_FD_ARR)) { 242 fd_count = uverbs_attr_ptr_get_array_size(attrs, 243 UVERBS_ATTR_GET_CONTEXT_FD_ARR, 244 sizeof(int)); 245 if (fd_count < 0) { 246 ret = fd_count; 247 goto err_uncharge; 248 } 249 250 fd_array = uverbs_attr_get_alloced_ptr(attrs, 251 UVERBS_ATTR_GET_CONTEXT_FD_ARR); 252 ret = ib_get_ucaps(fd_array, fd_count, &ucontext->enabled_caps); 253 if (ret) 254 goto err_uncharge; 255 } 256 257 ret = ucontext->device->ops.alloc_ucontext(ucontext, 258 &attrs->driver_udata); 259 if (ret) 260 goto err_uncharge; 261 262 rdma_restrack_add(&ucontext->res); 263 264 /* 265 * Make sure that ib_uverbs_get_ucontext() sees the pointer update 266 * only after all writes to setup the ucontext have completed 267 */ 268 smp_store_release(&file->ucontext, ucontext); 269 270 mutex_unlock(&file->ucontext_lock); 271 up_read(&file->hw_destroy_rwsem); 272 return 0; 273 274 err_uncharge: 275 ib_rdmacg_uncharge(&ucontext->cg_obj, ucontext->device, 276 RDMACG_RESOURCE_HCA_HANDLE); 277 err: 278 mutex_unlock(&file->ucontext_lock); 279 up_read(&file->hw_destroy_rwsem); 280 return ret; 281 } 282 283 static int ib_uverbs_get_context(struct uverbs_attr_bundle *attrs) 284 { 285 struct ib_uverbs_get_context_resp resp; 286 struct ib_uverbs_get_context cmd; 287 struct ib_device *ib_dev; 288 struct ib_uobject *uobj; 289 int ret; 290 291 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 292 if (ret) 293 return ret; 294 295 ret = ib_alloc_ucontext(attrs); 296 if (ret) 297 return ret; 298 299 uobj = uobj_alloc(UVERBS_OBJECT_ASYNC_EVENT, attrs, &ib_dev); 300 if (IS_ERR(uobj)) { 301 ret = PTR_ERR(uobj); 302 goto err_ucontext; 303 } 304 305 resp = (struct ib_uverbs_get_context_resp){ 306 .num_comp_vectors = attrs->ufile->device->num_comp_vectors, 307 .async_fd = uobj->id, 308 }; 309 ret = uverbs_response(attrs, &resp, sizeof(resp)); 310 if (ret) 311 goto err_uobj; 312 313 ret = ib_init_ucontext(attrs); 314 if (ret) 315 goto err_uobj; 316 317 ib_uverbs_init_async_event_file( 318 
container_of(uobj, struct ib_uverbs_async_event_file, uobj)); 319 rdma_alloc_commit_uobject(uobj, attrs); 320 return 0; 321 322 err_uobj: 323 rdma_alloc_abort_uobject(uobj, attrs, false); 324 err_ucontext: 325 rdma_restrack_put(&attrs->context->res); 326 kfree(attrs->context); 327 attrs->context = NULL; 328 return ret; 329 } 330 331 static void copy_query_dev_fields(struct ib_ucontext *ucontext, 332 struct ib_uverbs_query_device_resp *resp, 333 struct ib_device_attr *attr) 334 { 335 struct ib_device *ib_dev = ucontext->device; 336 337 resp->fw_ver = attr->fw_ver; 338 resp->node_guid = ib_dev->node_guid; 339 resp->sys_image_guid = attr->sys_image_guid; 340 resp->max_mr_size = attr->max_mr_size; 341 resp->page_size_cap = attr->page_size_cap; 342 resp->vendor_id = attr->vendor_id; 343 resp->vendor_part_id = attr->vendor_part_id; 344 resp->hw_ver = attr->hw_ver; 345 resp->max_qp = attr->max_qp; 346 resp->max_qp_wr = attr->max_qp_wr; 347 resp->device_cap_flags = lower_32_bits(attr->device_cap_flags); 348 resp->max_sge = min(attr->max_send_sge, attr->max_recv_sge); 349 resp->max_sge_rd = attr->max_sge_rd; 350 resp->max_cq = attr->max_cq; 351 resp->max_cqe = attr->max_cqe; 352 resp->max_mr = attr->max_mr; 353 resp->max_pd = attr->max_pd; 354 resp->max_qp_rd_atom = attr->max_qp_rd_atom; 355 resp->max_ee_rd_atom = attr->max_ee_rd_atom; 356 resp->max_res_rd_atom = attr->max_res_rd_atom; 357 resp->max_qp_init_rd_atom = attr->max_qp_init_rd_atom; 358 resp->max_ee_init_rd_atom = attr->max_ee_init_rd_atom; 359 resp->atomic_cap = attr->atomic_cap; 360 resp->max_ee = attr->max_ee; 361 resp->max_rdd = attr->max_rdd; 362 resp->max_mw = attr->max_mw; 363 resp->max_raw_ipv6_qp = attr->max_raw_ipv6_qp; 364 resp->max_raw_ethy_qp = attr->max_raw_ethy_qp; 365 resp->max_mcast_grp = attr->max_mcast_grp; 366 resp->max_mcast_qp_attach = attr->max_mcast_qp_attach; 367 resp->max_total_mcast_qp_attach = attr->max_total_mcast_qp_attach; 368 resp->max_ah = attr->max_ah; 369 resp->max_srq = 
attr->max_srq; 370 resp->max_srq_wr = attr->max_srq_wr; 371 resp->max_srq_sge = attr->max_srq_sge; 372 resp->max_pkeys = attr->max_pkeys; 373 resp->local_ca_ack_delay = attr->local_ca_ack_delay; 374 resp->phys_port_cnt = min_t(u32, ib_dev->phys_port_cnt, U8_MAX); 375 } 376 377 static int ib_uverbs_query_device(struct uverbs_attr_bundle *attrs) 378 { 379 struct ib_uverbs_query_device cmd; 380 struct ib_uverbs_query_device_resp resp; 381 struct ib_ucontext *ucontext; 382 int ret; 383 384 ucontext = ib_uverbs_get_ucontext(attrs); 385 if (IS_ERR(ucontext)) 386 return PTR_ERR(ucontext); 387 388 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 389 if (ret) 390 return ret; 391 392 memset(&resp, 0, sizeof resp); 393 copy_query_dev_fields(ucontext, &resp, &ucontext->device->attrs); 394 395 return uverbs_response(attrs, &resp, sizeof(resp)); 396 } 397 398 static int ib_uverbs_query_port(struct uverbs_attr_bundle *attrs) 399 { 400 struct ib_uverbs_query_port cmd; 401 struct ib_uverbs_query_port_resp resp; 402 struct ib_port_attr attr; 403 int ret; 404 struct ib_ucontext *ucontext; 405 struct ib_device *ib_dev; 406 407 ucontext = ib_uverbs_get_ucontext(attrs); 408 if (IS_ERR(ucontext)) 409 return PTR_ERR(ucontext); 410 ib_dev = ucontext->device; 411 412 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 413 if (ret) 414 return ret; 415 416 ret = ib_query_port(ib_dev, cmd.port_num, &attr); 417 if (ret) 418 return ret; 419 420 memset(&resp, 0, sizeof resp); 421 copy_port_attr_to_resp(&attr, &resp, ib_dev, cmd.port_num); 422 423 return uverbs_response(attrs, &resp, sizeof(resp)); 424 } 425 426 static int ib_uverbs_alloc_pd(struct uverbs_attr_bundle *attrs) 427 { 428 struct ib_uverbs_alloc_pd_resp resp = {}; 429 struct ib_uverbs_alloc_pd cmd; 430 struct ib_uobject *uobj; 431 struct ib_pd *pd; 432 int ret; 433 struct ib_device *ib_dev; 434 435 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 436 if (ret) 437 return ret; 438 439 uobj = uobj_alloc(UVERBS_OBJECT_PD, attrs, &ib_dev); 440 if 
(IS_ERR(uobj)) 441 return PTR_ERR(uobj); 442 443 pd = rdma_zalloc_drv_obj(ib_dev, ib_pd); 444 if (!pd) { 445 ret = -ENOMEM; 446 goto err; 447 } 448 449 pd->device = ib_dev; 450 pd->uobject = uobj; 451 atomic_set(&pd->usecnt, 0); 452 453 rdma_restrack_new(&pd->res, RDMA_RESTRACK_PD); 454 rdma_restrack_set_name(&pd->res, NULL); 455 456 ret = ib_dev->ops.alloc_pd(pd, &attrs->driver_udata); 457 if (ret) 458 goto err_alloc; 459 rdma_restrack_add(&pd->res); 460 461 uobj->object = pd; 462 uobj_finalize_uobj_create(uobj, attrs); 463 464 resp.pd_handle = uobj->id; 465 return uverbs_response(attrs, &resp, sizeof(resp)); 466 467 err_alloc: 468 rdma_restrack_put(&pd->res); 469 kfree(pd); 470 err: 471 uobj_alloc_abort(uobj, attrs); 472 return ret; 473 } 474 475 static int ib_uverbs_dealloc_pd(struct uverbs_attr_bundle *attrs) 476 { 477 struct ib_uverbs_dealloc_pd cmd; 478 int ret; 479 480 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 481 if (ret) 482 return ret; 483 484 return uobj_perform_destroy(UVERBS_OBJECT_PD, cmd.pd_handle, attrs); 485 } 486 487 struct xrcd_table_entry { 488 struct rb_node node; 489 struct ib_xrcd *xrcd; 490 struct inode *inode; 491 }; 492 493 static int xrcd_table_insert(struct ib_uverbs_device *dev, 494 struct inode *inode, 495 struct ib_xrcd *xrcd) 496 { 497 struct xrcd_table_entry *entry, *scan; 498 struct rb_node **p = &dev->xrcd_tree.rb_node; 499 struct rb_node *parent = NULL; 500 501 entry = kmalloc_obj(*entry); 502 if (!entry) 503 return -ENOMEM; 504 505 entry->xrcd = xrcd; 506 entry->inode = inode; 507 508 while (*p) { 509 parent = *p; 510 scan = rb_entry(parent, struct xrcd_table_entry, node); 511 512 if (inode < scan->inode) { 513 p = &(*p)->rb_left; 514 } else if (inode > scan->inode) { 515 p = &(*p)->rb_right; 516 } else { 517 kfree(entry); 518 return -EEXIST; 519 } 520 } 521 522 rb_link_node(&entry->node, parent, p); 523 rb_insert_color(&entry->node, &dev->xrcd_tree); 524 igrab(inode); 525 return 0; 526 } 527 528 static struct 
xrcd_table_entry *xrcd_table_search(struct ib_uverbs_device *dev, 529 struct inode *inode) 530 { 531 struct xrcd_table_entry *entry; 532 struct rb_node *p = dev->xrcd_tree.rb_node; 533 534 while (p) { 535 entry = rb_entry(p, struct xrcd_table_entry, node); 536 537 if (inode < entry->inode) 538 p = p->rb_left; 539 else if (inode > entry->inode) 540 p = p->rb_right; 541 else 542 return entry; 543 } 544 545 return NULL; 546 } 547 548 static struct ib_xrcd *find_xrcd(struct ib_uverbs_device *dev, struct inode *inode) 549 { 550 struct xrcd_table_entry *entry; 551 552 entry = xrcd_table_search(dev, inode); 553 if (!entry) 554 return NULL; 555 556 return entry->xrcd; 557 } 558 559 static void xrcd_table_delete(struct ib_uverbs_device *dev, 560 struct inode *inode) 561 { 562 struct xrcd_table_entry *entry; 563 564 entry = xrcd_table_search(dev, inode); 565 if (entry) { 566 iput(inode); 567 rb_erase(&entry->node, &dev->xrcd_tree); 568 kfree(entry); 569 } 570 } 571 572 static int ib_uverbs_open_xrcd(struct uverbs_attr_bundle *attrs) 573 { 574 struct ib_uverbs_device *ibudev = attrs->ufile->device; 575 struct ib_uverbs_open_xrcd_resp resp = {}; 576 struct ib_uverbs_open_xrcd cmd; 577 struct ib_uxrcd_object *obj; 578 struct ib_xrcd *xrcd = NULL; 579 struct inode *inode = NULL; 580 int new_xrcd = 0; 581 struct ib_device *ib_dev; 582 struct fd f = EMPTY_FD; 583 int ret; 584 585 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 586 if (ret) 587 return ret; 588 589 mutex_lock(&ibudev->xrcd_tree_mutex); 590 591 if (cmd.fd != -1) { 592 /* search for file descriptor */ 593 f = fdget(cmd.fd); 594 if (fd_empty(f)) { 595 ret = -EBADF; 596 goto err_tree_mutex_unlock; 597 } 598 599 inode = file_inode(fd_file(f)); 600 xrcd = find_xrcd(ibudev, inode); 601 if (!xrcd && !(cmd.oflags & O_CREAT)) { 602 /* no file descriptor. 
Need CREATE flag */ 603 ret = -EAGAIN; 604 goto err_tree_mutex_unlock; 605 } 606 607 if (xrcd && cmd.oflags & O_EXCL) { 608 ret = -EINVAL; 609 goto err_tree_mutex_unlock; 610 } 611 } 612 613 obj = (struct ib_uxrcd_object *)uobj_alloc(UVERBS_OBJECT_XRCD, attrs, 614 &ib_dev); 615 if (IS_ERR(obj)) { 616 ret = PTR_ERR(obj); 617 goto err_tree_mutex_unlock; 618 } 619 620 if (!xrcd) { 621 xrcd = ib_alloc_xrcd_user(ib_dev, inode, &attrs->driver_udata); 622 if (IS_ERR(xrcd)) { 623 ret = PTR_ERR(xrcd); 624 goto err; 625 } 626 new_xrcd = 1; 627 } 628 629 atomic_set(&obj->refcnt, 0); 630 obj->uobject.object = xrcd; 631 632 if (inode) { 633 if (new_xrcd) { 634 /* create new inode/xrcd table entry */ 635 ret = xrcd_table_insert(ibudev, inode, xrcd); 636 if (ret) 637 goto err_dealloc_xrcd; 638 } 639 atomic_inc(&xrcd->usecnt); 640 } 641 642 fdput(f); 643 644 mutex_unlock(&ibudev->xrcd_tree_mutex); 645 uobj_finalize_uobj_create(&obj->uobject, attrs); 646 647 resp.xrcd_handle = obj->uobject.id; 648 return uverbs_response(attrs, &resp, sizeof(resp)); 649 650 err_dealloc_xrcd: 651 ib_dealloc_xrcd_user(xrcd, uverbs_get_cleared_udata(attrs)); 652 653 err: 654 uobj_alloc_abort(&obj->uobject, attrs); 655 656 err_tree_mutex_unlock: 657 fdput(f); 658 659 mutex_unlock(&ibudev->xrcd_tree_mutex); 660 661 return ret; 662 } 663 664 static int ib_uverbs_close_xrcd(struct uverbs_attr_bundle *attrs) 665 { 666 struct ib_uverbs_close_xrcd cmd; 667 int ret; 668 669 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 670 if (ret) 671 return ret; 672 673 return uobj_perform_destroy(UVERBS_OBJECT_XRCD, cmd.xrcd_handle, attrs); 674 } 675 676 int ib_uverbs_dealloc_xrcd(struct ib_uobject *uobject, struct ib_xrcd *xrcd, 677 enum rdma_remove_reason why, 678 struct uverbs_attr_bundle *attrs) 679 { 680 struct inode *inode; 681 int ret; 682 struct ib_uverbs_device *dev = attrs->ufile->device; 683 684 inode = xrcd->inode; 685 if (inode && !atomic_dec_and_test(&xrcd->usecnt)) 686 return 0; 687 688 ret = 
ib_dealloc_xrcd_user(xrcd, &attrs->driver_udata); 689 if (ret) { 690 atomic_inc(&xrcd->usecnt); 691 return ret; 692 } 693 694 if (inode) 695 xrcd_table_delete(dev, inode); 696 697 return 0; 698 } 699 700 static int ib_uverbs_reg_mr(struct uverbs_attr_bundle *attrs) 701 { 702 struct ib_uverbs_reg_mr_resp resp = {}; 703 struct ib_uverbs_reg_mr cmd; 704 struct ib_uobject *uobj; 705 struct ib_pd *pd; 706 struct ib_mr *mr; 707 int ret; 708 struct ib_device *ib_dev; 709 710 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 711 if (ret) 712 return ret; 713 714 if ((cmd.start & ~PAGE_MASK) != (cmd.hca_va & ~PAGE_MASK)) 715 return -EINVAL; 716 717 uobj = uobj_alloc(UVERBS_OBJECT_MR, attrs, &ib_dev); 718 if (IS_ERR(uobj)) 719 return PTR_ERR(uobj); 720 721 ret = ib_check_mr_access(ib_dev, cmd.access_flags); 722 if (ret) 723 goto err_free; 724 725 pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs); 726 if (IS_ERR(pd)) { 727 ret = PTR_ERR(pd); 728 goto err_free; 729 } 730 731 mr = pd->device->ops.reg_user_mr(pd, cmd.start, cmd.length, cmd.hca_va, 732 cmd.access_flags, NULL, 733 &attrs->driver_udata); 734 if (IS_ERR(mr)) { 735 ret = PTR_ERR(mr); 736 goto err_put; 737 } 738 739 mr->device = pd->device; 740 mr->pd = pd; 741 mr->type = IB_MR_TYPE_USER; 742 mr->dm = NULL; 743 mr->sig_attrs = NULL; 744 mr->uobject = uobj; 745 atomic_inc(&pd->usecnt); 746 mr->iova = cmd.hca_va; 747 mr->length = cmd.length; 748 749 rdma_restrack_new(&mr->res, RDMA_RESTRACK_MR); 750 rdma_restrack_set_name(&mr->res, NULL); 751 rdma_restrack_add(&mr->res); 752 753 uobj->object = mr; 754 uobj_put_obj_read(pd); 755 uobj_finalize_uobj_create(uobj, attrs); 756 757 resp.lkey = mr->lkey; 758 resp.rkey = mr->rkey; 759 resp.mr_handle = uobj->id; 760 return uverbs_response(attrs, &resp, sizeof(resp)); 761 762 err_put: 763 uobj_put_obj_read(pd); 764 err_free: 765 uobj_alloc_abort(uobj, attrs); 766 return ret; 767 } 768 769 static int ib_uverbs_rereg_mr(struct uverbs_attr_bundle *attrs) 770 { 771 
struct ib_uverbs_rereg_mr cmd; 772 struct ib_uverbs_rereg_mr_resp resp; 773 struct ib_mr *mr; 774 int ret; 775 struct ib_uobject *uobj; 776 struct ib_uobject *new_uobj; 777 struct ib_device *ib_dev; 778 struct ib_pd *orig_pd; 779 struct ib_pd *new_pd; 780 struct ib_mr *new_mr; 781 u32 lkey, rkey; 782 783 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 784 if (ret) 785 return ret; 786 787 if (!cmd.flags) 788 return -EINVAL; 789 790 if (cmd.flags & ~IB_MR_REREG_SUPPORTED) 791 return -EOPNOTSUPP; 792 793 if ((cmd.flags & IB_MR_REREG_TRANS) && 794 (cmd.start & ~PAGE_MASK) != (cmd.hca_va & ~PAGE_MASK)) 795 return -EINVAL; 796 797 uobj = uobj_get_write(UVERBS_OBJECT_MR, cmd.mr_handle, attrs); 798 if (IS_ERR(uobj)) 799 return PTR_ERR(uobj); 800 801 mr = uobj->object; 802 803 if (mr->dm) { 804 ret = -EINVAL; 805 goto put_uobjs; 806 } 807 808 if (cmd.flags & IB_MR_REREG_ACCESS) { 809 ret = ib_check_mr_access(mr->device, cmd.access_flags); 810 if (ret) 811 goto put_uobjs; 812 } 813 814 orig_pd = mr->pd; 815 if (cmd.flags & IB_MR_REREG_PD) { 816 new_pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, 817 attrs); 818 if (IS_ERR(new_pd)) { 819 ret = PTR_ERR(new_pd); 820 goto put_uobjs; 821 } 822 } else { 823 new_pd = mr->pd; 824 } 825 826 /* 827 * The driver might create a new HW object as part of the rereg, we need 828 * to have a uobject ready to hold it. 
829 */ 830 new_uobj = uobj_alloc(UVERBS_OBJECT_MR, attrs, &ib_dev); 831 if (IS_ERR(new_uobj)) { 832 ret = PTR_ERR(new_uobj); 833 goto put_uobj_pd; 834 } 835 836 new_mr = ib_dev->ops.rereg_user_mr(mr, cmd.flags, cmd.start, cmd.length, 837 cmd.hca_va, cmd.access_flags, new_pd, 838 &attrs->driver_udata); 839 if (IS_ERR(new_mr)) { 840 ret = PTR_ERR(new_mr); 841 goto put_new_uobj; 842 } 843 if (new_mr) { 844 new_mr->device = new_pd->device; 845 new_mr->pd = new_pd; 846 new_mr->type = IB_MR_TYPE_USER; 847 new_mr->uobject = uobj; 848 atomic_inc(&new_pd->usecnt); 849 new_uobj->object = new_mr; 850 lkey = new_mr->lkey; 851 rkey = new_mr->rkey; 852 853 rdma_restrack_new(&new_mr->res, RDMA_RESTRACK_MR); 854 rdma_restrack_set_name(&new_mr->res, NULL); 855 rdma_restrack_add(&new_mr->res); 856 857 /* 858 * The new uobj for the new HW object is put into the same spot 859 * in the IDR and the old uobj & HW object is deleted. 860 */ 861 rdma_assign_uobject(uobj, new_uobj, attrs); 862 rdma_alloc_commit_uobject(new_uobj, attrs); 863 uobj_put_destroy(uobj); 864 new_uobj = NULL; 865 uobj = NULL; 866 mr = new_mr; 867 } else { 868 if (cmd.flags & IB_MR_REREG_PD) { 869 atomic_dec(&orig_pd->usecnt); 870 mr->pd = new_pd; 871 atomic_inc(&new_pd->usecnt); 872 } 873 if (cmd.flags & IB_MR_REREG_TRANS) { 874 mr->iova = cmd.hca_va; 875 mr->length = cmd.length; 876 } 877 lkey = mr->lkey; 878 rkey = mr->rkey; 879 } 880 881 memset(&resp, 0, sizeof(resp)); 882 resp.lkey = lkey; 883 resp.rkey = rkey; 884 885 ret = uverbs_response(attrs, &resp, sizeof(resp)); 886 887 put_new_uobj: 888 if (new_uobj) 889 uobj_alloc_abort(new_uobj, attrs); 890 put_uobj_pd: 891 if (cmd.flags & IB_MR_REREG_PD) 892 uobj_put_obj_read(new_pd); 893 894 put_uobjs: 895 if (uobj) 896 uobj_put_write(uobj); 897 898 return ret; 899 } 900 901 static int ib_uverbs_dereg_mr(struct uverbs_attr_bundle *attrs) 902 { 903 struct ib_uverbs_dereg_mr cmd; 904 int ret; 905 906 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 907 if (ret) 908 
return ret; 909 910 return uobj_perform_destroy(UVERBS_OBJECT_MR, cmd.mr_handle, attrs); 911 } 912 913 static int ib_uverbs_alloc_mw(struct uverbs_attr_bundle *attrs) 914 { 915 struct ib_uverbs_alloc_mw cmd; 916 struct ib_uverbs_alloc_mw_resp resp = {}; 917 struct ib_uobject *uobj; 918 struct ib_pd *pd; 919 struct ib_mw *mw; 920 int ret; 921 struct ib_device *ib_dev; 922 923 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 924 if (ret) 925 return ret; 926 927 uobj = uobj_alloc(UVERBS_OBJECT_MW, attrs, &ib_dev); 928 if (IS_ERR(uobj)) 929 return PTR_ERR(uobj); 930 931 pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs); 932 if (IS_ERR(pd)) { 933 ret = PTR_ERR(pd); 934 goto err_free; 935 } 936 937 if (cmd.mw_type != IB_MW_TYPE_1 && cmd.mw_type != IB_MW_TYPE_2) { 938 ret = -EINVAL; 939 goto err_put; 940 } 941 942 mw = rdma_zalloc_drv_obj(ib_dev, ib_mw); 943 if (!mw) { 944 ret = -ENOMEM; 945 goto err_put; 946 } 947 948 mw->device = ib_dev; 949 mw->pd = pd; 950 mw->uobject = uobj; 951 mw->type = cmd.mw_type; 952 953 ret = pd->device->ops.alloc_mw(mw, &attrs->driver_udata); 954 if (ret) 955 goto err_alloc; 956 957 atomic_inc(&pd->usecnt); 958 959 uobj->object = mw; 960 uobj_put_obj_read(pd); 961 uobj_finalize_uobj_create(uobj, attrs); 962 963 resp.rkey = mw->rkey; 964 resp.mw_handle = uobj->id; 965 return uverbs_response(attrs, &resp, sizeof(resp)); 966 967 err_alloc: 968 kfree(mw); 969 err_put: 970 uobj_put_obj_read(pd); 971 err_free: 972 uobj_alloc_abort(uobj, attrs); 973 return ret; 974 } 975 976 static int ib_uverbs_dealloc_mw(struct uverbs_attr_bundle *attrs) 977 { 978 struct ib_uverbs_dealloc_mw cmd; 979 int ret; 980 981 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 982 if (ret) 983 return ret; 984 985 return uobj_perform_destroy(UVERBS_OBJECT_MW, cmd.mw_handle, attrs); 986 } 987 988 static int ib_uverbs_create_comp_channel(struct uverbs_attr_bundle *attrs) 989 { 990 struct ib_uverbs_create_comp_channel cmd; 991 struct 
ib_uverbs_create_comp_channel_resp resp; 992 struct ib_uobject *uobj; 993 struct ib_uverbs_completion_event_file *ev_file; 994 struct ib_device *ib_dev; 995 int ret; 996 997 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 998 if (ret) 999 return ret; 1000 1001 uobj = uobj_alloc(UVERBS_OBJECT_COMP_CHANNEL, attrs, &ib_dev); 1002 if (IS_ERR(uobj)) 1003 return PTR_ERR(uobj); 1004 1005 ev_file = container_of(uobj, struct ib_uverbs_completion_event_file, 1006 uobj); 1007 ib_uverbs_init_event_queue(&ev_file->ev_queue); 1008 uobj_finalize_uobj_create(uobj, attrs); 1009 1010 resp.fd = uobj->id; 1011 return uverbs_response(attrs, &resp, sizeof(resp)); 1012 } 1013 1014 static int create_cq(struct uverbs_attr_bundle *attrs, 1015 struct ib_uverbs_ex_create_cq *cmd) 1016 { 1017 struct ib_ucq_object *obj; 1018 struct ib_uverbs_completion_event_file *ev_file = NULL; 1019 struct ib_cq *cq; 1020 int ret; 1021 struct ib_uverbs_ex_create_cq_resp resp = {}; 1022 struct ib_cq_init_attr attr = {}; 1023 struct ib_device *ib_dev; 1024 1025 if (cmd->comp_vector >= attrs->ufile->device->num_comp_vectors) 1026 return -EINVAL; 1027 1028 if (!cmd->cqe) 1029 return -EINVAL; 1030 1031 obj = (struct ib_ucq_object *)uobj_alloc(UVERBS_OBJECT_CQ, attrs, 1032 &ib_dev); 1033 if (IS_ERR(obj)) 1034 return PTR_ERR(obj); 1035 1036 if (cmd->comp_channel >= 0) { 1037 ev_file = ib_uverbs_lookup_comp_file(cmd->comp_channel, attrs); 1038 if (IS_ERR(ev_file)) { 1039 ret = PTR_ERR(ev_file); 1040 goto err; 1041 } 1042 } 1043 1044 obj->uevent.uobject.user_handle = cmd->user_handle; 1045 INIT_LIST_HEAD(&obj->comp_list); 1046 INIT_LIST_HEAD(&obj->uevent.event_list); 1047 1048 attr.cqe = cmd->cqe; 1049 attr.comp_vector = cmd->comp_vector; 1050 attr.flags = cmd->flags; 1051 1052 cq = rdma_zalloc_drv_obj(ib_dev, ib_cq); 1053 if (!cq) { 1054 ret = -ENOMEM; 1055 goto err_file; 1056 } 1057 cq->device = ib_dev; 1058 cq->uobject = obj; 1059 cq->comp_handler = ib_uverbs_comp_handler; 1060 cq->event_handler = 
ib_uverbs_cq_event_handler; 1061 cq->cq_context = ev_file ? &ev_file->ev_queue : NULL; 1062 atomic_set(&cq->usecnt, 0); 1063 1064 rdma_restrack_new(&cq->res, RDMA_RESTRACK_CQ); 1065 rdma_restrack_set_name(&cq->res, NULL); 1066 1067 if (ib_dev->ops.create_user_cq) 1068 ret = ib_dev->ops.create_user_cq(cq, &attr, attrs); 1069 else 1070 ret = ib_dev->ops.create_cq(cq, &attr, attrs); 1071 if (ret) 1072 goto err_free; 1073 rdma_restrack_add(&cq->res); 1074 1075 obj->uevent.uobject.object = cq; 1076 obj->uevent.event_file = READ_ONCE(attrs->ufile->default_async_file); 1077 if (obj->uevent.event_file) 1078 uverbs_uobject_get(&obj->uevent.event_file->uobj); 1079 uobj_finalize_uobj_create(&obj->uevent.uobject, attrs); 1080 1081 resp.base.cq_handle = obj->uevent.uobject.id; 1082 resp.base.cqe = cq->cqe; 1083 resp.response_length = uverbs_response_length(attrs, sizeof(resp)); 1084 return uverbs_response(attrs, &resp, sizeof(resp)); 1085 1086 err_free: 1087 ib_umem_release(cq->umem); 1088 rdma_restrack_put(&cq->res); 1089 kfree(cq); 1090 err_file: 1091 if (ev_file) 1092 ib_uverbs_release_ucq(ev_file, obj); 1093 err: 1094 uobj_alloc_abort(&obj->uevent.uobject, attrs); 1095 return ret; 1096 } 1097 1098 static int ib_uverbs_create_cq(struct uverbs_attr_bundle *attrs) 1099 { 1100 struct ib_uverbs_create_cq cmd; 1101 struct ib_uverbs_ex_create_cq cmd_ex; 1102 int ret; 1103 1104 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1105 if (ret) 1106 return ret; 1107 1108 memset(&cmd_ex, 0, sizeof(cmd_ex)); 1109 cmd_ex.user_handle = cmd.user_handle; 1110 cmd_ex.cqe = cmd.cqe; 1111 cmd_ex.comp_vector = cmd.comp_vector; 1112 cmd_ex.comp_channel = cmd.comp_channel; 1113 1114 return create_cq(attrs, &cmd_ex); 1115 } 1116 1117 static int ib_uverbs_ex_create_cq(struct uverbs_attr_bundle *attrs) 1118 { 1119 struct ib_uverbs_ex_create_cq cmd; 1120 int ret; 1121 1122 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1123 if (ret) 1124 return ret; 1125 1126 if (cmd.comp_mask) 1127 return -EINVAL; 
1128 1129 if (cmd.reserved) 1130 return -EINVAL; 1131 1132 return create_cq(attrs, &cmd); 1133 } 1134 1135 static int ib_uverbs_resize_cq(struct uverbs_attr_bundle *attrs) 1136 { 1137 struct ib_uverbs_resize_cq cmd; 1138 struct ib_uverbs_resize_cq_resp resp = {}; 1139 struct ib_cq *cq; 1140 int ret; 1141 1142 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1143 if (ret) 1144 return ret; 1145 1146 if (!cmd.cqe) 1147 return -EINVAL; 1148 1149 cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs); 1150 if (IS_ERR(cq)) 1151 return PTR_ERR(cq); 1152 1153 ret = cq->device->ops.resize_user_cq(cq, cmd.cqe, &attrs->driver_udata); 1154 if (ret) 1155 goto out; 1156 1157 resp.cqe = cq->cqe; 1158 1159 ret = uverbs_response(attrs, &resp, sizeof(resp)); 1160 out: 1161 rdma_lookup_put_uobject(&cq->uobject->uevent.uobject, 1162 UVERBS_LOOKUP_READ); 1163 1164 return ret; 1165 } 1166 1167 static int copy_wc_to_user(struct ib_device *ib_dev, void __user *dest, 1168 struct ib_wc *wc) 1169 { 1170 struct ib_uverbs_wc tmp; 1171 1172 tmp.wr_id = wc->wr_id; 1173 tmp.status = wc->status; 1174 tmp.opcode = wc->opcode; 1175 tmp.vendor_err = wc->vendor_err; 1176 tmp.byte_len = wc->byte_len; 1177 tmp.ex.imm_data = wc->ex.imm_data; 1178 tmp.qp_num = wc->qp->qp_num; 1179 tmp.src_qp = wc->src_qp; 1180 tmp.wc_flags = wc->wc_flags; 1181 tmp.pkey_index = wc->pkey_index; 1182 if (rdma_cap_opa_ah(ib_dev, wc->port_num)) 1183 tmp.slid = OPA_TO_IB_UCAST_LID(wc->slid); 1184 else 1185 tmp.slid = ib_lid_cpu16(wc->slid); 1186 tmp.sl = wc->sl; 1187 tmp.dlid_path_bits = wc->dlid_path_bits; 1188 tmp.port_num = wc->port_num; 1189 tmp.reserved = 0; 1190 1191 if (copy_to_user(dest, &tmp, sizeof tmp)) 1192 return -EFAULT; 1193 1194 return 0; 1195 } 1196 1197 static int ib_uverbs_poll_cq(struct uverbs_attr_bundle *attrs) 1198 { 1199 struct ib_uverbs_poll_cq cmd; 1200 struct ib_uverbs_poll_cq_resp resp; 1201 u8 __user *header_ptr; 1202 u8 __user *data_ptr; 1203 struct ib_cq *cq; 1204 struct ib_wc wc; 1205 
int ret; 1206 1207 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1208 if (ret) 1209 return ret; 1210 1211 cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs); 1212 if (IS_ERR(cq)) 1213 return PTR_ERR(cq); 1214 1215 /* we copy a struct ib_uverbs_poll_cq_resp to user space */ 1216 header_ptr = attrs->ucore.outbuf; 1217 data_ptr = header_ptr + sizeof resp; 1218 1219 memset(&resp, 0, sizeof resp); 1220 while (resp.count < cmd.ne) { 1221 ret = ib_poll_cq(cq, 1, &wc); 1222 if (ret < 0) 1223 goto out_put; 1224 if (!ret) 1225 break; 1226 1227 ret = copy_wc_to_user(cq->device, data_ptr, &wc); 1228 if (ret) 1229 goto out_put; 1230 1231 data_ptr += sizeof(struct ib_uverbs_wc); 1232 ++resp.count; 1233 } 1234 1235 if (copy_to_user(header_ptr, &resp, sizeof resp)) { 1236 ret = -EFAULT; 1237 goto out_put; 1238 } 1239 ret = 0; 1240 1241 if (uverbs_attr_is_valid(attrs, UVERBS_ATTR_CORE_OUT)) 1242 ret = uverbs_output_written(attrs, UVERBS_ATTR_CORE_OUT); 1243 1244 out_put: 1245 rdma_lookup_put_uobject(&cq->uobject->uevent.uobject, 1246 UVERBS_LOOKUP_READ); 1247 return ret; 1248 } 1249 1250 static int ib_uverbs_req_notify_cq(struct uverbs_attr_bundle *attrs) 1251 { 1252 struct ib_uverbs_req_notify_cq cmd; 1253 struct ib_cq *cq; 1254 int ret; 1255 1256 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1257 if (ret) 1258 return ret; 1259 1260 cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs); 1261 if (IS_ERR(cq)) 1262 return PTR_ERR(cq); 1263 1264 ib_req_notify_cq(cq, cmd.solicited_only ? 
1265 IB_CQ_SOLICITED : IB_CQ_NEXT_COMP); 1266 1267 rdma_lookup_put_uobject(&cq->uobject->uevent.uobject, 1268 UVERBS_LOOKUP_READ); 1269 return 0; 1270 } 1271 1272 static int ib_uverbs_destroy_cq(struct uverbs_attr_bundle *attrs) 1273 { 1274 struct ib_uverbs_destroy_cq cmd; 1275 struct ib_uverbs_destroy_cq_resp resp; 1276 struct ib_uobject *uobj; 1277 struct ib_ucq_object *obj; 1278 int ret; 1279 1280 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1281 if (ret) 1282 return ret; 1283 1284 uobj = uobj_get_destroy(UVERBS_OBJECT_CQ, cmd.cq_handle, attrs); 1285 if (IS_ERR(uobj)) 1286 return PTR_ERR(uobj); 1287 1288 obj = container_of(uobj, struct ib_ucq_object, uevent.uobject); 1289 memset(&resp, 0, sizeof(resp)); 1290 resp.comp_events_reported = obj->comp_events_reported; 1291 resp.async_events_reported = obj->uevent.events_reported; 1292 1293 uobj_put_destroy(uobj); 1294 1295 return uverbs_response(attrs, &resp, sizeof(resp)); 1296 } 1297 1298 static int create_qp(struct uverbs_attr_bundle *attrs, 1299 struct ib_uverbs_ex_create_qp *cmd) 1300 { 1301 struct ib_uqp_object *obj; 1302 struct ib_device *device; 1303 struct ib_pd *pd = NULL; 1304 struct ib_xrcd *xrcd = NULL; 1305 struct ib_uobject *xrcd_uobj = ERR_PTR(-ENOENT); 1306 struct ib_cq *scq = NULL, *rcq = NULL; 1307 struct ib_srq *srq = NULL; 1308 struct ib_qp *qp; 1309 struct ib_qp_init_attr attr = {}; 1310 struct ib_uverbs_ex_create_qp_resp resp = {}; 1311 int ret; 1312 struct ib_rwq_ind_table *ind_tbl = NULL; 1313 bool has_sq = true; 1314 struct ib_device *ib_dev; 1315 1316 switch (cmd->qp_type) { 1317 case IB_QPT_RAW_PACKET: 1318 if (!rdma_uattrs_has_raw_cap(attrs)) 1319 return -EPERM; 1320 fallthrough; 1321 case IB_QPT_RC: 1322 case IB_QPT_UC: 1323 case IB_QPT_UD: 1324 case IB_QPT_XRC_INI: 1325 case IB_QPT_XRC_TGT: 1326 case IB_QPT_DRIVER: 1327 break; 1328 default: 1329 return -EINVAL; 1330 } 1331 1332 obj = (struct ib_uqp_object *)uobj_alloc(UVERBS_OBJECT_QP, attrs, 1333 &ib_dev); 1334 if (IS_ERR(obj)) 1335 
return PTR_ERR(obj);
	obj->uxrcd = NULL;
	obj->uevent.uobject.user_handle = cmd->user_handle;
	mutex_init(&obj->mcast_lock);

	/* Optional RWQ indirection table supplied through comp_mask. */
	if (cmd->comp_mask & IB_UVERBS_CREATE_QP_MASK_IND_TABLE) {
		ind_tbl = uobj_get_obj_read(rwq_ind_table,
					    UVERBS_OBJECT_RWQ_IND_TBL,
					    cmd->rwq_ind_tbl_handle, attrs);
		if (IS_ERR(ind_tbl)) {
			ret = PTR_ERR(ind_tbl);
			goto err_put;
		}

		attr.rwq_ind_tbl = ind_tbl;
	}

	/* An indirection table excludes receive queue sizing and an SRQ. */
	if (ind_tbl && (cmd->max_recv_wr || cmd->max_recv_sge || cmd->is_srq)) {
		ret = -EINVAL;
		goto err_put;
	}

	/* With an indirection table and no send WRs there is no send queue. */
	if (ind_tbl && !cmd->max_send_wr)
		has_sq = false;

	if (cmd->qp_type == IB_QPT_XRC_TGT) {
		/* For XRC target QPs pd_handle names an XRCD, not a PD. */
		xrcd_uobj = uobj_get_read(UVERBS_OBJECT_XRCD, cmd->pd_handle,
					  attrs);

		if (IS_ERR(xrcd_uobj)) {
			ret = -EINVAL;
			goto err_put;
		}

		xrcd = (struct ib_xrcd *)xrcd_uobj->object;
		if (!xrcd) {
			ret = -EINVAL;
			goto err_put;
		}
		device = xrcd->device;
	} else {
		if (cmd->qp_type == IB_QPT_XRC_INI) {
			/* Receive sizing from userspace is ignored here. */
			cmd->max_recv_wr = 0;
			cmd->max_recv_sge = 0;
		} else {
			if (cmd->is_srq) {
				srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ,
							cmd->srq_handle, attrs);
				/*
				 * A successfully looked-up XRC SRQ is also
				 * rejected; err_put releases it.
				 */
				if (IS_ERR(srq) ||
				    srq->srq_type == IB_SRQT_XRC) {
					ret = IS_ERR(srq) ? PTR_ERR(srq) :
							    -EINVAL;
					goto err_put;
				}
			}

			if (!ind_tbl) {
				/*
				 * Look up the receive CQ separately only when
				 * it differs from the send CQ.
				 */
				if (cmd->recv_cq_handle != cmd->send_cq_handle) {
					rcq = uobj_get_obj_read(
						cq, UVERBS_OBJECT_CQ,
						cmd->recv_cq_handle, attrs);
					if (IS_ERR(rcq)) {
						ret = PTR_ERR(rcq);
						goto err_put;
					}
				}
			}
		}

		if (has_sq) {
			scq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ,
						cmd->send_cq_handle, attrs);
			if (IS_ERR(scq)) {
				ret = PTR_ERR(scq);
				goto err_put;
			}
		}

		/* Fall back to the send CQ when no distinct receive CQ was taken. */
		if (!ind_tbl && cmd->qp_type != IB_QPT_XRC_INI)
			rcq = rcq ?: scq;
		pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd->pd_handle,
				       attrs);
		if (IS_ERR(pd)) {
			ret = PTR_ERR(pd);
			goto err_put;
		}

		device = pd->device;
	}

	attr.event_handler = ib_uverbs_qp_event_handler;
	attr.send_cq = scq;
	attr.recv_cq = rcq;
	attr.srq = srq;
	attr.xrcd = xrcd;
	attr.sq_sig_type = cmd->sq_sig_all ? IB_SIGNAL_ALL_WR :
					      IB_SIGNAL_REQ_WR;
	attr.qp_type = cmd->qp_type;

	attr.cap.max_send_wr = cmd->max_send_wr;
	attr.cap.max_recv_wr = cmd->max_recv_wr;
	attr.cap.max_send_sge = cmd->max_send_sge;
	attr.cap.max_recv_sge = cmd->max_recv_sge;
	attr.cap.max_inline_data = cmd->max_inline_data;

	INIT_LIST_HEAD(&obj->uevent.event_list);
	INIT_LIST_HEAD(&obj->mcast_list);

	/* Only the creation flags listed below are accepted from userspace. */
	attr.create_flags = cmd->create_flags;
	if (attr.create_flags & ~(IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK |
				  IB_QP_CREATE_CROSS_CHANNEL |
				  IB_QP_CREATE_MANAGED_SEND |
				  IB_QP_CREATE_MANAGED_RECV |
				  IB_QP_CREATE_SCATTER_FCS |
				  IB_QP_CREATE_CVLAN_STRIPPING |
				  IB_QP_CREATE_SOURCE_QPN |
				  IB_QP_CREATE_PCI_WRITE_END_PADDING)) {
		ret = -EINVAL;
		goto err_put;
	}

	/* Choosing a source QPN requires the raw capability. */
	if (attr.create_flags & IB_QP_CREATE_SOURCE_QPN) {
		if (!rdma_uattrs_has_raw_cap(attrs)) {
			ret = -EPERM;
			goto err_put;
		}

		attr.source_qpn = cmd->source_qpn;
	}

	qp = ib_create_qp_user(device, pd, &attr, &attrs->driver_udata, obj,
			       KBUILD_MODNAME);
	if (IS_ERR(qp)) {
		ret = PTR_ERR(qp);
		goto err_put;
	}
	ib_qp_usecnt_inc(qp);

	obj->uevent.uobject.object = qp;
	/* Take a reference on the default async event file, if one is set. */
	obj->uevent.event_file = READ_ONCE(attrs->ufile->default_async_file);
	if (obj->uevent.event_file)
		uverbs_uobject_get(&obj->uevent.event_file->uobj);

	if (xrcd) {
		/* The QP keeps a count on the XRCD object after the lookup is put. */
		obj->uxrcd = container_of(xrcd_uobj, struct ib_uxrcd_object,
					  uobject);
		atomic_inc(&obj->uxrcd->refcnt);
		uobj_put_read(xrcd_uobj);
	}

	/* Success: drop every read lookup taken while building the QP. */
	if (pd)
		uobj_put_obj_read(pd);
	if (scq)
		rdma_lookup_put_uobject(&scq->uobject->uevent.uobject,
					UVERBS_LOOKUP_READ);
	/* rcq may alias scq; put it only when it was looked up separately. */
	if (rcq && rcq != scq)
		rdma_lookup_put_uobject(&rcq->uobject->uevent.uobject,
					UVERBS_LOOKUP_READ);
	if (srq)
		rdma_lookup_put_uobject(&srq->uobject->uevent.uobject,
					UVERBS_LOOKUP_READ);
	if (ind_tbl)
		uobj_put_obj_read(ind_tbl);
	uobj_finalize_uobj_create(&obj->uevent.uobject, attrs);

	/* Report the capabilities as left in attr.cap after creation. */
	resp.base.qpn = qp->qp_num;
	resp.base.qp_handle = obj->uevent.uobject.id;
	resp.base.max_recv_sge = attr.cap.max_recv_sge;
	resp.base.max_send_sge = attr.cap.max_send_sge;
	resp.base.max_recv_wr = attr.cap.max_recv_wr;
	resp.base.max_send_wr = attr.cap.max_send_wr;
	resp.base.max_inline_data = attr.cap.max_inline_data;
	resp.response_length = uverbs_response_length(attrs, sizeof(resp));
	return uverbs_response(attrs, &resp, sizeof(resp));

err_put:
	/*
	 * Each pointer is NULL (or an ERR_PTR) unless its lookup succeeded,
	 * so only references that were actually taken are released.
	 */
	if (!IS_ERR(xrcd_uobj))
		uobj_put_read(xrcd_uobj);
	if (!IS_ERR_OR_NULL(pd))
		uobj_put_obj_read(pd);
	if (!IS_ERR_OR_NULL(scq))
		rdma_lookup_put_uobject(&scq->uobject->uevent.uobject,
					UVERBS_LOOKUP_READ);
	if (!IS_ERR_OR_NULL(rcq) && rcq != scq)
		rdma_lookup_put_uobject(&rcq->uobject->uevent.uobject,
					UVERBS_LOOKUP_READ);
	if (!IS_ERR_OR_NULL(srq))
rdma_lookup_put_uobject(&srq->uobject->uevent.uobject, 1523 UVERBS_LOOKUP_READ); 1524 if (!IS_ERR_OR_NULL(ind_tbl)) 1525 uobj_put_obj_read(ind_tbl); 1526 1527 uobj_alloc_abort(&obj->uevent.uobject, attrs); 1528 return ret; 1529 } 1530 1531 static int ib_uverbs_create_qp(struct uverbs_attr_bundle *attrs) 1532 { 1533 struct ib_uverbs_create_qp cmd; 1534 struct ib_uverbs_ex_create_qp cmd_ex; 1535 int ret; 1536 1537 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1538 if (ret) 1539 return ret; 1540 1541 memset(&cmd_ex, 0, sizeof(cmd_ex)); 1542 cmd_ex.user_handle = cmd.user_handle; 1543 cmd_ex.pd_handle = cmd.pd_handle; 1544 cmd_ex.send_cq_handle = cmd.send_cq_handle; 1545 cmd_ex.recv_cq_handle = cmd.recv_cq_handle; 1546 cmd_ex.srq_handle = cmd.srq_handle; 1547 cmd_ex.max_send_wr = cmd.max_send_wr; 1548 cmd_ex.max_recv_wr = cmd.max_recv_wr; 1549 cmd_ex.max_send_sge = cmd.max_send_sge; 1550 cmd_ex.max_recv_sge = cmd.max_recv_sge; 1551 cmd_ex.max_inline_data = cmd.max_inline_data; 1552 cmd_ex.sq_sig_all = cmd.sq_sig_all; 1553 cmd_ex.qp_type = cmd.qp_type; 1554 cmd_ex.is_srq = cmd.is_srq; 1555 1556 return create_qp(attrs, &cmd_ex); 1557 } 1558 1559 static int ib_uverbs_ex_create_qp(struct uverbs_attr_bundle *attrs) 1560 { 1561 struct ib_uverbs_ex_create_qp cmd; 1562 int ret; 1563 1564 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1565 if (ret) 1566 return ret; 1567 1568 if (cmd.comp_mask & ~IB_UVERBS_CREATE_QP_SUP_COMP_MASK) 1569 return -EINVAL; 1570 1571 if (cmd.reserved) 1572 return -EINVAL; 1573 1574 return create_qp(attrs, &cmd); 1575 } 1576 1577 static int ib_uverbs_open_qp(struct uverbs_attr_bundle *attrs) 1578 { 1579 struct ib_uverbs_create_qp_resp resp = {}; 1580 struct ib_uverbs_open_qp cmd; 1581 struct ib_uqp_object *obj; 1582 struct ib_xrcd *xrcd; 1583 struct ib_qp *qp; 1584 struct ib_qp_open_attr attr = {}; 1585 int ret; 1586 struct ib_uobject *xrcd_uobj; 1587 struct ib_device *ib_dev; 1588 1589 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1590 if (ret) 
1591 return ret; 1592 1593 obj = (struct ib_uqp_object *)uobj_alloc(UVERBS_OBJECT_QP, attrs, 1594 &ib_dev); 1595 if (IS_ERR(obj)) 1596 return PTR_ERR(obj); 1597 1598 xrcd_uobj = uobj_get_read(UVERBS_OBJECT_XRCD, cmd.pd_handle, attrs); 1599 if (IS_ERR(xrcd_uobj)) { 1600 ret = -EINVAL; 1601 goto err_put; 1602 } 1603 1604 xrcd = (struct ib_xrcd *)xrcd_uobj->object; 1605 if (!xrcd) { 1606 ret = -EINVAL; 1607 goto err_xrcd; 1608 } 1609 1610 attr.event_handler = ib_uverbs_qp_event_handler; 1611 attr.qp_num = cmd.qpn; 1612 attr.qp_type = cmd.qp_type; 1613 1614 INIT_LIST_HEAD(&obj->uevent.event_list); 1615 INIT_LIST_HEAD(&obj->mcast_list); 1616 1617 qp = ib_open_qp(xrcd, &attr); 1618 if (IS_ERR(qp)) { 1619 ret = PTR_ERR(qp); 1620 goto err_xrcd; 1621 } 1622 1623 obj->uevent.uobject.object = qp; 1624 obj->uevent.uobject.user_handle = cmd.user_handle; 1625 1626 obj->uxrcd = container_of(xrcd_uobj, struct ib_uxrcd_object, uobject); 1627 atomic_inc(&obj->uxrcd->refcnt); 1628 qp->uobject = obj; 1629 uobj_put_read(xrcd_uobj); 1630 uobj_finalize_uobj_create(&obj->uevent.uobject, attrs); 1631 1632 resp.qpn = qp->qp_num; 1633 resp.qp_handle = obj->uevent.uobject.id; 1634 return uverbs_response(attrs, &resp, sizeof(resp)); 1635 1636 err_xrcd: 1637 uobj_put_read(xrcd_uobj); 1638 err_put: 1639 uobj_alloc_abort(&obj->uevent.uobject, attrs); 1640 return ret; 1641 } 1642 1643 static void copy_ah_attr_to_uverbs(struct ib_uverbs_qp_dest *uverb_attr, 1644 struct rdma_ah_attr *rdma_attr) 1645 { 1646 const struct ib_global_route *grh; 1647 1648 uverb_attr->dlid = rdma_ah_get_dlid(rdma_attr); 1649 uverb_attr->sl = rdma_ah_get_sl(rdma_attr); 1650 uverb_attr->src_path_bits = rdma_ah_get_path_bits(rdma_attr); 1651 uverb_attr->static_rate = rdma_ah_get_static_rate(rdma_attr); 1652 uverb_attr->is_global = !!(rdma_ah_get_ah_flags(rdma_attr) & 1653 IB_AH_GRH); 1654 if (uverb_attr->is_global) { 1655 grh = rdma_ah_read_grh(rdma_attr); 1656 memcpy(uverb_attr->dgid, grh->dgid.raw, 16); 1657 
uverb_attr->flow_label = grh->flow_label; 1658 uverb_attr->sgid_index = grh->sgid_index; 1659 uverb_attr->hop_limit = grh->hop_limit; 1660 uverb_attr->traffic_class = grh->traffic_class; 1661 } 1662 uverb_attr->port_num = rdma_ah_get_port_num(rdma_attr); 1663 } 1664 1665 static int ib_uverbs_query_qp(struct uverbs_attr_bundle *attrs) 1666 { 1667 struct ib_uverbs_query_qp cmd; 1668 struct ib_uverbs_query_qp_resp resp; 1669 struct ib_qp *qp; 1670 struct ib_qp_attr *attr; 1671 struct ib_qp_init_attr *init_attr; 1672 int ret; 1673 1674 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1675 if (ret) 1676 return ret; 1677 1678 attr = kmalloc_obj(*attr); 1679 init_attr = kmalloc_obj(*init_attr); 1680 if (!attr || !init_attr) { 1681 ret = -ENOMEM; 1682 goto out; 1683 } 1684 1685 qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs); 1686 if (IS_ERR(qp)) { 1687 ret = PTR_ERR(qp); 1688 goto out; 1689 } 1690 1691 ret = ib_query_qp(qp, attr, cmd.attr_mask, init_attr); 1692 1693 rdma_lookup_put_uobject(&qp->uobject->uevent.uobject, 1694 UVERBS_LOOKUP_READ); 1695 1696 if (ret) 1697 goto out; 1698 1699 memset(&resp, 0, sizeof resp); 1700 1701 resp.qp_state = attr->qp_state; 1702 resp.cur_qp_state = attr->cur_qp_state; 1703 resp.path_mtu = attr->path_mtu; 1704 resp.path_mig_state = attr->path_mig_state; 1705 resp.qkey = attr->qkey; 1706 resp.rq_psn = attr->rq_psn; 1707 resp.sq_psn = attr->sq_psn; 1708 resp.dest_qp_num = attr->dest_qp_num; 1709 resp.qp_access_flags = attr->qp_access_flags; 1710 resp.pkey_index = attr->pkey_index; 1711 resp.alt_pkey_index = attr->alt_pkey_index; 1712 resp.sq_draining = attr->sq_draining; 1713 resp.max_rd_atomic = attr->max_rd_atomic; 1714 resp.max_dest_rd_atomic = attr->max_dest_rd_atomic; 1715 resp.min_rnr_timer = attr->min_rnr_timer; 1716 resp.port_num = attr->port_num; 1717 resp.timeout = attr->timeout; 1718 resp.retry_cnt = attr->retry_cnt; 1719 resp.rnr_retry = attr->rnr_retry; 1720 resp.alt_port_num = attr->alt_port_num; 1721 
resp.alt_timeout = attr->alt_timeout; 1722 1723 copy_ah_attr_to_uverbs(&resp.dest, &attr->ah_attr); 1724 copy_ah_attr_to_uverbs(&resp.alt_dest, &attr->alt_ah_attr); 1725 1726 resp.max_send_wr = init_attr->cap.max_send_wr; 1727 resp.max_recv_wr = init_attr->cap.max_recv_wr; 1728 resp.max_send_sge = init_attr->cap.max_send_sge; 1729 resp.max_recv_sge = init_attr->cap.max_recv_sge; 1730 resp.max_inline_data = init_attr->cap.max_inline_data; 1731 resp.sq_sig_all = init_attr->sq_sig_type == IB_SIGNAL_ALL_WR; 1732 1733 ret = uverbs_response(attrs, &resp, sizeof(resp)); 1734 1735 out: 1736 kfree(attr); 1737 kfree(init_attr); 1738 1739 return ret; 1740 } 1741 1742 /* Remove ignored fields set in the attribute mask */ 1743 static int modify_qp_mask(enum ib_qp_type qp_type, int mask) 1744 { 1745 switch (qp_type) { 1746 case IB_QPT_XRC_INI: 1747 return mask & ~(IB_QP_MAX_DEST_RD_ATOMIC | IB_QP_MIN_RNR_TIMER); 1748 case IB_QPT_XRC_TGT: 1749 return mask & ~(IB_QP_MAX_QP_RD_ATOMIC | IB_QP_RETRY_CNT | 1750 IB_QP_RNR_RETRY); 1751 default: 1752 return mask; 1753 } 1754 } 1755 1756 static void copy_ah_attr_from_uverbs(struct ib_device *dev, 1757 struct rdma_ah_attr *rdma_attr, 1758 struct ib_uverbs_qp_dest *uverb_attr) 1759 { 1760 rdma_attr->type = rdma_ah_find_type(dev, uverb_attr->port_num); 1761 if (uverb_attr->is_global) { 1762 rdma_ah_set_grh(rdma_attr, NULL, 1763 uverb_attr->flow_label, 1764 uverb_attr->sgid_index, 1765 uverb_attr->hop_limit, 1766 uverb_attr->traffic_class); 1767 rdma_ah_set_dgid_raw(rdma_attr, uverb_attr->dgid); 1768 } else { 1769 rdma_ah_set_ah_flags(rdma_attr, 0); 1770 } 1771 rdma_ah_set_dlid(rdma_attr, uverb_attr->dlid); 1772 rdma_ah_set_sl(rdma_attr, uverb_attr->sl); 1773 rdma_ah_set_path_bits(rdma_attr, uverb_attr->src_path_bits); 1774 rdma_ah_set_static_rate(rdma_attr, uverb_attr->static_rate); 1775 rdma_ah_set_port_num(rdma_attr, uverb_attr->port_num); 1776 rdma_ah_set_make_grd(rdma_attr, false); 1777 } 1778 1779 static int modify_qp(struct 
uverbs_attr_bundle *attrs,
		     struct ib_uverbs_ex_modify_qp *cmd)
{
	struct ib_qp_attr *attr;
	struct ib_qp *qp;
	int ret;

	/* Zeroed so that attributes not selected by attr_mask stay 0. */
	attr = kzalloc_obj(*attr);
	if (!attr)
		return -ENOMEM;

	qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd->base.qp_handle,
			       attrs);
	if (IS_ERR(qp)) {
		ret = PTR_ERR(qp);
		goto out;
	}

	if ((cmd->base.attr_mask & IB_QP_PORT) &&
	    !rdma_is_port_valid(qp->device, cmd->base.port_num)) {
		ret = -EINVAL;
		goto release_qp;
	}

	if ((cmd->base.attr_mask & IB_QP_AV)) {
		if (!rdma_is_port_valid(qp->device, cmd->base.dest.port_num)) {
			ret = -EINVAL;
			goto release_qp;
		}

		if (cmd->base.attr_mask & IB_QP_STATE &&
		    cmd->base.qp_state == IB_QPS_RTR) {
		/* We are in INIT->RTR TRANSITION (if we are not,
		 * this transition will be rejected in subsequent checks).
		 * In the INIT->RTR transition, we cannot have IB_QP_PORT set,
		 * but the IB_QP_STATE flag is required.
		 *
		 * Since kernel 3.14 (commit dbf727de7440), the uverbs driver,
		 * when IB_QP_AV is set, has required inclusion of a valid
		 * port number in the primary AV. (AVs are created and handled
		 * differently for infiniband and ethernet (RoCE) ports).
		 *
		 * Check the port number included in the primary AV against
		 * the port number in the qp struct, which was set (and saved)
		 * in the RST->INIT transition.
		 */
			if (cmd->base.dest.port_num != qp->real_qp->port) {
				ret = -EINVAL;
				goto release_qp;
			}
		} else {
		/* We are in SQD->SQD. (If we are not, this transition will
		 * be rejected later in the verbs layer checks).
		 * Check for both IB_QP_PORT and IB_QP_AV, these can be set
		 * together in the SQD->SQD transition.
		 *
		 * If only IB_QP_AV was set, add in IB_QP_PORT as well (the
		 * verbs layer driver does not track primary port changes
		 * resulting from path migration. Thus, in SQD, if the primary
		 * AV is modified, the primary port should also be modified).
		 *
		 * Note that in this transition, the IB_QP_STATE flag
		 * is not allowed.
		 */
			if (((cmd->base.attr_mask & (IB_QP_AV | IB_QP_PORT))
			     == (IB_QP_AV | IB_QP_PORT)) &&
			    cmd->base.port_num != cmd->base.dest.port_num) {
				ret = -EINVAL;
				goto release_qp;
			}
			if ((cmd->base.attr_mask & (IB_QP_AV | IB_QP_PORT))
			    == IB_QP_AV) {
				cmd->base.attr_mask |= IB_QP_PORT;
				cmd->base.port_num = cmd->base.dest.port_num;
			}
		}
	}

	/*
	 * An alternate path needs valid port numbers in both places, and the
	 * two must agree.
	 */
	if ((cmd->base.attr_mask & IB_QP_ALT_PATH) &&
	    (!rdma_is_port_valid(qp->device, cmd->base.alt_port_num) ||
	    !rdma_is_port_valid(qp->device, cmd->base.alt_dest.port_num) ||
	    cmd->base.alt_port_num != cmd->base.alt_dest.port_num)) {
		ret = -EINVAL;
		goto release_qp;
	}

	/* Reject state values above IB_QPS_ERR when they are selected. */
	if ((cmd->base.attr_mask & IB_QP_CUR_STATE &&
	    cmd->base.cur_qp_state > IB_QPS_ERR) ||
	    (cmd->base.attr_mask & IB_QP_STATE &&
	    cmd->base.qp_state > IB_QPS_ERR)) {
		ret = -EINVAL;
		goto release_qp;
	}

	/* Copy only the attributes selected by attr_mask. */
	if (cmd->base.attr_mask & IB_QP_STATE)
		attr->qp_state = cmd->base.qp_state;
	if (cmd->base.attr_mask & IB_QP_CUR_STATE)
		attr->cur_qp_state = cmd->base.cur_qp_state;
	if (cmd->base.attr_mask & IB_QP_PATH_MTU)
		attr->path_mtu = cmd->base.path_mtu;
	if (cmd->base.attr_mask & IB_QP_PATH_MIG_STATE)
		attr->path_mig_state = cmd->base.path_mig_state;
	if (cmd->base.attr_mask & IB_QP_QKEY) {
		/*
		 * A qkey with IB_QP_SET_QKEY set is allowed only when
		 * rdma_nl_get_privileged_qkey() is true or the caller has the
		 * raw capability.
		 */
		if (cmd->base.qkey & IB_QP_SET_QKEY &&
		    !(rdma_nl_get_privileged_qkey() ||
		      rdma_uattrs_has_raw_cap(attrs))) {
			ret = -EPERM;
			goto release_qp;
		}
		attr->qkey = cmd->base.qkey;
	}
	if (cmd->base.attr_mask & IB_QP_RQ_PSN)
		attr->rq_psn = cmd->base.rq_psn;
	if (cmd->base.attr_mask & IB_QP_SQ_PSN)
		attr->sq_psn = cmd->base.sq_psn;
	if (cmd->base.attr_mask & IB_QP_DEST_QPN)
		attr->dest_qp_num =
cmd->base.dest_qp_num; 1896 if (cmd->base.attr_mask & IB_QP_ACCESS_FLAGS) 1897 attr->qp_access_flags = cmd->base.qp_access_flags; 1898 if (cmd->base.attr_mask & IB_QP_PKEY_INDEX) 1899 attr->pkey_index = cmd->base.pkey_index; 1900 if (cmd->base.attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY) 1901 attr->en_sqd_async_notify = cmd->base.en_sqd_async_notify; 1902 if (cmd->base.attr_mask & IB_QP_MAX_QP_RD_ATOMIC) 1903 attr->max_rd_atomic = cmd->base.max_rd_atomic; 1904 if (cmd->base.attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) 1905 attr->max_dest_rd_atomic = cmd->base.max_dest_rd_atomic; 1906 if (cmd->base.attr_mask & IB_QP_MIN_RNR_TIMER) 1907 attr->min_rnr_timer = cmd->base.min_rnr_timer; 1908 if (cmd->base.attr_mask & IB_QP_PORT) 1909 attr->port_num = cmd->base.port_num; 1910 if (cmd->base.attr_mask & IB_QP_TIMEOUT) 1911 attr->timeout = cmd->base.timeout; 1912 if (cmd->base.attr_mask & IB_QP_RETRY_CNT) 1913 attr->retry_cnt = cmd->base.retry_cnt; 1914 if (cmd->base.attr_mask & IB_QP_RNR_RETRY) 1915 attr->rnr_retry = cmd->base.rnr_retry; 1916 if (cmd->base.attr_mask & IB_QP_ALT_PATH) { 1917 attr->alt_port_num = cmd->base.alt_port_num; 1918 attr->alt_timeout = cmd->base.alt_timeout; 1919 attr->alt_pkey_index = cmd->base.alt_pkey_index; 1920 } 1921 if (cmd->base.attr_mask & IB_QP_RATE_LIMIT) 1922 attr->rate_limit = cmd->rate_limit; 1923 1924 if (cmd->base.attr_mask & IB_QP_AV) 1925 copy_ah_attr_from_uverbs(qp->device, &attr->ah_attr, 1926 &cmd->base.dest); 1927 1928 if (cmd->base.attr_mask & IB_QP_ALT_PATH) 1929 copy_ah_attr_from_uverbs(qp->device, &attr->alt_ah_attr, 1930 &cmd->base.alt_dest); 1931 1932 ret = ib_modify_qp_with_udata(qp, attr, 1933 modify_qp_mask(qp->qp_type, 1934 cmd->base.attr_mask), 1935 &attrs->driver_udata); 1936 1937 release_qp: 1938 rdma_lookup_put_uobject(&qp->uobject->uevent.uobject, 1939 UVERBS_LOOKUP_READ); 1940 out: 1941 kfree(attr); 1942 1943 return ret; 1944 } 1945 1946 static int ib_uverbs_modify_qp(struct uverbs_attr_bundle *attrs) 1947 { 1948 struct 
ib_uverbs_ex_modify_qp cmd; 1949 int ret; 1950 1951 ret = uverbs_request(attrs, &cmd.base, sizeof(cmd.base)); 1952 if (ret) 1953 return ret; 1954 1955 if (cmd.base.attr_mask & ~IB_QP_ATTR_STANDARD_BITS) 1956 return -EOPNOTSUPP; 1957 1958 return modify_qp(attrs, &cmd); 1959 } 1960 1961 static int ib_uverbs_ex_modify_qp(struct uverbs_attr_bundle *attrs) 1962 { 1963 struct ib_uverbs_ex_modify_qp cmd; 1964 struct ib_uverbs_ex_modify_qp_resp resp = { 1965 .response_length = uverbs_response_length(attrs, sizeof(resp)) 1966 }; 1967 int ret; 1968 1969 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1970 if (ret) 1971 return ret; 1972 1973 /* 1974 * Last bit is reserved for extending the attr_mask by 1975 * using another field. 1976 */ 1977 if (cmd.base.attr_mask & ~(IB_QP_ATTR_STANDARD_BITS | IB_QP_RATE_LIMIT)) 1978 return -EOPNOTSUPP; 1979 1980 ret = modify_qp(attrs, &cmd); 1981 if (ret) 1982 return ret; 1983 1984 return uverbs_response(attrs, &resp, sizeof(resp)); 1985 } 1986 1987 static int ib_uverbs_destroy_qp(struct uverbs_attr_bundle *attrs) 1988 { 1989 struct ib_uverbs_destroy_qp cmd; 1990 struct ib_uverbs_destroy_qp_resp resp; 1991 struct ib_uobject *uobj; 1992 struct ib_uqp_object *obj; 1993 int ret; 1994 1995 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 1996 if (ret) 1997 return ret; 1998 1999 uobj = uobj_get_destroy(UVERBS_OBJECT_QP, cmd.qp_handle, attrs); 2000 if (IS_ERR(uobj)) 2001 return PTR_ERR(uobj); 2002 2003 obj = container_of(uobj, struct ib_uqp_object, uevent.uobject); 2004 memset(&resp, 0, sizeof(resp)); 2005 resp.events_reported = obj->uevent.events_reported; 2006 2007 uobj_put_destroy(uobj); 2008 2009 return uverbs_response(attrs, &resp, sizeof(resp)); 2010 } 2011 2012 static void *alloc_wr(size_t wr_size, __u32 num_sge) 2013 { 2014 if (num_sge >= (U32_MAX - ALIGN(wr_size, sizeof(struct ib_sge))) / 2015 sizeof(struct ib_sge)) 2016 return NULL; 2017 2018 return kmalloc(ALIGN(wr_size, sizeof(struct ib_sge)) + 2019 num_sge * sizeof(struct ib_sge), 
2020 GFP_KERNEL); 2021 } 2022 2023 static int ib_uverbs_post_send(struct uverbs_attr_bundle *attrs) 2024 { 2025 struct ib_uverbs_post_send cmd; 2026 struct ib_uverbs_post_send_resp resp; 2027 struct ib_uverbs_send_wr *user_wr; 2028 struct ib_send_wr *wr = NULL, *last, *next; 2029 const struct ib_send_wr *bad_wr; 2030 struct ib_qp *qp; 2031 int i, sg_ind; 2032 int is_ud; 2033 int ret, ret2; 2034 size_t next_size; 2035 const struct ib_sge __user *sgls; 2036 const void __user *wqes; 2037 struct uverbs_req_iter iter; 2038 2039 ret = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd)); 2040 if (ret) 2041 return ret; 2042 wqes = uverbs_request_next_ptr(&iter, size_mul(cmd.wqe_size, 2043 cmd.wr_count)); 2044 if (IS_ERR(wqes)) 2045 return PTR_ERR(wqes); 2046 sgls = uverbs_request_next_ptr(&iter, 2047 size_mul(cmd.sge_count, 2048 sizeof(struct ib_uverbs_sge))); 2049 if (IS_ERR(sgls)) 2050 return PTR_ERR(sgls); 2051 ret = uverbs_request_finish(&iter); 2052 if (ret) 2053 return ret; 2054 2055 if (cmd.wqe_size < sizeof(struct ib_uverbs_send_wr)) 2056 return -EINVAL; 2057 2058 user_wr = kmalloc(cmd.wqe_size, GFP_KERNEL | __GFP_NOWARN); 2059 if (!user_wr) 2060 return -ENOMEM; 2061 2062 qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs); 2063 if (IS_ERR(qp)) { 2064 ret = PTR_ERR(qp); 2065 goto out; 2066 } 2067 2068 is_ud = qp->qp_type == IB_QPT_UD; 2069 sg_ind = 0; 2070 last = NULL; 2071 for (i = 0; i < cmd.wr_count; ++i) { 2072 if (copy_from_user(user_wr, wqes + i * cmd.wqe_size, 2073 cmd.wqe_size)) { 2074 ret = -EFAULT; 2075 goto out_put; 2076 } 2077 2078 if (user_wr->num_sge + sg_ind > cmd.sge_count) { 2079 ret = -EINVAL; 2080 goto out_put; 2081 } 2082 2083 if (is_ud) { 2084 struct ib_ud_wr *ud; 2085 2086 if (user_wr->opcode != IB_WR_SEND && 2087 user_wr->opcode != IB_WR_SEND_WITH_IMM) { 2088 ret = -EINVAL; 2089 goto out_put; 2090 } 2091 2092 next_size = sizeof(*ud); 2093 ud = alloc_wr(next_size, user_wr->num_sge); 2094 if (!ud) { 2095 ret = -ENOMEM; 2096 
goto out_put;
			}

			/*
			 * Take a read lookup on the AH; it is released in
			 * the cleanup loop once the WR is on the list.
			 */
			ud->ah = uobj_get_obj_read(ah, UVERBS_OBJECT_AH,
						   user_wr->wr.ud.ah, attrs);
			if (IS_ERR(ud->ah)) {
				ret = PTR_ERR(ud->ah);
				/* Not linked into the list yet: free it here. */
				kfree(ud);
				goto out_put;
			}
			ud->remote_qpn = user_wr->wr.ud.remote_qpn;
			ud->remote_qkey = user_wr->wr.ud.remote_qkey;

			next = &ud->wr;
		} else if (user_wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM ||
			   user_wr->opcode == IB_WR_RDMA_WRITE ||
			   user_wr->opcode == IB_WR_RDMA_READ) {
			struct ib_rdma_wr *rdma;

			next_size = sizeof(*rdma);
			rdma = alloc_wr(next_size, user_wr->num_sge);
			if (!rdma) {
				ret = -ENOMEM;
				goto out_put;
			}

			rdma->remote_addr = user_wr->wr.rdma.remote_addr;
			rdma->rkey = user_wr->wr.rdma.rkey;

			next = &rdma->wr;
		} else if (user_wr->opcode == IB_WR_ATOMIC_CMP_AND_SWP ||
			   user_wr->opcode == IB_WR_ATOMIC_FETCH_AND_ADD) {
			struct ib_atomic_wr *atomic;

			next_size = sizeof(*atomic);
			atomic = alloc_wr(next_size, user_wr->num_sge);
			if (!atomic) {
				ret = -ENOMEM;
				goto out_put;
			}

			atomic->remote_addr = user_wr->wr.atomic.remote_addr;
			atomic->compare_add = user_wr->wr.atomic.compare_add;
			atomic->swap = user_wr->wr.atomic.swap;
			atomic->rkey = user_wr->wr.atomic.rkey;

			next = &atomic->wr;
		} else if (user_wr->opcode == IB_WR_SEND ||
			   user_wr->opcode == IB_WR_SEND_WITH_IMM ||
			   user_wr->opcode == IB_WR_SEND_WITH_INV) {
			/* Plain sends use the bare ib_send_wr with no wrapper. */
			next_size = sizeof(*next);
			next = alloc_wr(next_size, user_wr->num_sge);
			if (!next) {
				ret = -ENOMEM;
				goto out_put;
			}
		} else {
			/* Any other opcode is not accepted on this path. */
			ret = -EINVAL;
			goto out_put;
		}

		/* Opcode-specific extra word: immediate data or rkey to invalidate. */
		if (user_wr->opcode == IB_WR_SEND_WITH_IMM ||
		    user_wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM) {
			next->ex.imm_data =
					(__be32 __force) user_wr->ex.imm_data;
		} else if (user_wr->opcode == IB_WR_SEND_WITH_INV) {
			next->ex.invalidate_rkey = user_wr->ex.invalidate_rkey;
}

		/* Append the new WR to the singly linked list headed by 'wr'. */
		if (!last)
			wr = next;
		else
			last->next = next;
		last = next;

		next->next = NULL;
		next->wr_id = user_wr->wr_id;
		next->num_sge = user_wr->num_sge;
		next->opcode = user_wr->opcode;
		next->send_flags = user_wr->send_flags;

		if (next->num_sge) {
			/*
			 * The SGE array lives in the same allocation, after
			 * the WR structure rounded up to sizeof(struct ib_sge)
			 * (see alloc_wr()).
			 */
			next->sg_list = (void *) next +
				ALIGN(next_size, sizeof(struct ib_sge));
			if (copy_from_user(next->sg_list, sgls + sg_ind,
					   next->num_sge *
						   sizeof(struct ib_sge))) {
				ret = -EFAULT;
				goto out_put;
			}
			sg_ind += next->num_sge;
		} else
			next->sg_list = NULL;
	}

	resp.bad_wr = 0;
	ret = qp->device->ops.post_send(qp->real_qp, wr, &bad_wr);
	/* On failure report the 1-based position of the WR the driver flagged. */
	if (ret)
		for (next = wr; next; next = next->next) {
			++resp.bad_wr;
			if (next == bad_wr)
				break;
		}

	/* A failure to write the response overrides the post result. */
	ret2 = uverbs_response(attrs, &resp, sizeof(resp));
	if (ret2)
		ret = ret2;

out_put:
	rdma_lookup_put_uobject(&qp->uobject->uevent.uobject,
				UVERBS_LOOKUP_READ);

	/* Free every WR on the list, dropping the AH lookup for UD WRs. */
	while (wr) {
		if (is_ud && ud_wr(wr)->ah)
			uobj_put_obj_read(ud_wr(wr)->ah);
		next = wr->next;
		kfree(wr);
		wr = next;
	}

out:
	kfree(user_wr);

	return ret;
}

/*
 * Read the receive work requests that follow the command header and build a
 * kernel list of ib_recv_wr from them. The request carries wr_count WQEs of
 * wqe_size bytes each, followed by sge_count scatter/gather entries.
 *
 * Returns the head of the list (NULL when wr_count is 0) or an ERR_PTR().
 * Each WR is a single allocation that also holds its SGE array; the caller
 * frees the list with kfree() on each element.
 */
static struct ib_recv_wr *
ib_uverbs_unmarshall_recv(struct uverbs_req_iter *iter, u32 wr_count,
			  u32 wqe_size, u32 sge_count)
{
	struct ib_uverbs_recv_wr *user_wr;
	struct ib_recv_wr *wr = NULL, *last, *next;
	int sg_ind;
	int i;
	int ret;
	const struct ib_sge __user *sgls;
	const void __user *wqes;

	if (wqe_size < sizeof(struct ib_uverbs_recv_wr))
		return ERR_PTR(-EINVAL);

	wqes = uverbs_request_next_ptr(iter, size_mul(wqe_size, wr_count));
	if (IS_ERR(wqes))
		return ERR_CAST(wqes);
	sgls = uverbs_request_next_ptr(iter, size_mul(sge_count,
						      sizeof(struct ib_uverbs_sge)));
	if (IS_ERR(sgls))
		return ERR_CAST(sgls);
	ret = uverbs_request_finish(iter);
	if (ret)
		return ERR_PTR(ret);

	/* Bounce buffer reused for each user WQE. */
	user_wr = kmalloc(wqe_size, GFP_KERNEL | __GFP_NOWARN);
	if (!user_wr)
		return ERR_PTR(-ENOMEM);

	sg_ind = 0;
	last = NULL;
	for (i = 0; i < wr_count; ++i) {
		if (copy_from_user(user_wr, wqes + i * wqe_size,
				   wqe_size)) {
			ret = -EFAULT;
			goto err;
		}

		/* The WR may not use more SGEs than the request supplied. */
		if (user_wr->num_sge + sg_ind > sge_count) {
			ret = -EINVAL;
			goto err;
		}

		/* Reject SGE counts whose allocation size would not fit in 32 bits. */
		if (user_wr->num_sge >=
		    (U32_MAX - ALIGN(sizeof(*next), sizeof(struct ib_sge))) /
		    sizeof(struct ib_sge)) {
			ret = -EINVAL;
			goto err;
		}

		next = kmalloc(ALIGN(sizeof(*next), sizeof(struct ib_sge)) +
				       user_wr->num_sge * sizeof(struct ib_sge),
			       GFP_KERNEL);
		if (!next) {
			ret = -ENOMEM;
			goto err;
		}

		/* Link before filling so the err path frees it with the list. */
		if (!last)
			wr = next;
		else
			last->next = next;
		last = next;

		next->next = NULL;
		next->wr_id = user_wr->wr_id;
		next->num_sge = user_wr->num_sge;

		if (next->num_sge) {
			next->sg_list = (void *)next +
				ALIGN(sizeof(*next), sizeof(struct ib_sge));
			if (copy_from_user(next->sg_list, sgls + sg_ind,
					   next->num_sge *
						   sizeof(struct ib_sge))) {
				ret = -EFAULT;
				goto err;
			}
			sg_ind += next->num_sge;
		} else
			next->sg_list = NULL;
	}

	kfree(user_wr);
	return wr;

err:
	kfree(user_wr);

	while (wr) {
		next = wr->next;
		kfree(wr);
		wr = next;
	}

	return ERR_PTR(ret);
}

/*
 * Post a list of receive work requests to a QP. On a driver failure
 * resp.bad_wr holds the 1-based position of the WR the driver flagged.
 */
static int ib_uverbs_post_recv(struct uverbs_attr_bundle *attrs)
{
	struct ib_uverbs_post_recv cmd;
	struct ib_uverbs_post_recv_resp resp;
	struct ib_recv_wr *wr, *next;
	const struct ib_recv_wr *bad_wr;
	struct ib_qp *qp;
	int ret, ret2;
	struct uverbs_req_iter iter;

	ret = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
	if (ret)
		return ret;

	wr = ib_uverbs_unmarshall_recv(&iter, cmd.wr_count, cmd.wqe_size,
				       cmd.sge_count);
	if (IS_ERR(wr))
		return PTR_ERR(wr);

	qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs);
	if (IS_ERR(qp)) {
		ret = PTR_ERR(qp);
		goto out;
	}

	resp.bad_wr = 0;
	ret = qp->device->ops.post_recv(qp->real_qp, wr, &bad_wr);

	rdma_lookup_put_uobject(&qp->uobject->uevent.uobject,
				UVERBS_LOOKUP_READ);
	if (ret) {
		for (next = wr; next; next = next->next) {
			++resp.bad_wr;
			if (next == bad_wr)
				break;
		}
	}

	/* A failure to write the response overrides the post result. */
	ret2 = uverbs_response(attrs, &resp, sizeof(resp));
	if (ret2)
		ret = ret2;
out:
	/* The WR list is always freed here, whether or not the post succeeded. */
	while (wr) {
		next = wr->next;
		kfree(wr);
		wr = next;
	}

	return ret;
}

/*
 * Post a list of receive work requests to an SRQ. On a driver failure
 * resp.bad_wr holds the 1-based position of the WR the driver flagged.
 */
static int ib_uverbs_post_srq_recv(struct uverbs_attr_bundle *attrs)
{
	struct ib_uverbs_post_srq_recv cmd;
	struct ib_uverbs_post_srq_recv_resp resp;
	struct ib_recv_wr *wr, *next;
	const struct ib_recv_wr *bad_wr;
	struct ib_srq *srq;
	int ret, ret2;
	struct uverbs_req_iter iter;

	ret = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd));
	if (ret)
		return ret;

	wr = ib_uverbs_unmarshall_recv(&iter, cmd.wr_count, cmd.wqe_size,
				       cmd.sge_count);
	if (IS_ERR(wr))
		return PTR_ERR(wr);

	srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs);
	if (IS_ERR(srq)) {
		ret = PTR_ERR(srq);
		goto out;
	}

	resp.bad_wr = 0;
	ret = srq->device->ops.post_srq_recv(srq, wr, &bad_wr);

	rdma_lookup_put_uobject(&srq->uobject->uevent.uobject,
				UVERBS_LOOKUP_READ);

	if (ret)
		for (next = wr; next; next = next->next) {
			++resp.bad_wr;
			if (next == bad_wr)
				break;
		}

	/* A failure to write the response overrides the post result. */
	ret2 = uverbs_response(attrs, &resp, sizeof(resp));
	if (ret2)
		ret = ret2;

out:
	/* The WR list is always freed here, whether or not the post succeeded. */
	while (wr) {
		next = wr->next;
		kfree(wr);
		wr = next;
	}

	return ret;
}

/*
 * Create an address handle on the PD named by cmd.pd_handle from the
 * attributes in cmd.attr and return its handle to userspace.
 */
static int ib_uverbs_create_ah(struct uverbs_attr_bundle *attrs)
{
	struct ib_uverbs_create_ah cmd;
	struct ib_uverbs_create_ah_resp resp;
	struct ib_uobject *uobj;
	struct ib_pd *pd;
	struct ib_ah *ah;
	struct rdma_ah_attr attr = {};
	int ret;
	struct ib_device *ib_dev;

	ret = uverbs_request(attrs, &cmd, sizeof(cmd));
	if (ret)
		return ret;

	uobj = uobj_alloc(UVERBS_OBJECT_AH, attrs, &ib_dev);
	if (IS_ERR(uobj))
		return PTR_ERR(uobj);

	if (!rdma_is_port_valid(ib_dev, cmd.attr.port_num)) {
		ret = -EINVAL;
		goto err;
	}

	pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs);
	if (IS_ERR(pd)) {
		ret = PTR_ERR(pd);
		goto err;
	}

	attr.type = rdma_ah_find_type(ib_dev, cmd.attr.port_num);
	rdma_ah_set_make_grd(&attr, false);
	rdma_ah_set_dlid(&attr, cmd.attr.dlid);
	rdma_ah_set_sl(&attr, cmd.attr.sl);
	rdma_ah_set_path_bits(&attr, cmd.attr.src_path_bits);
	rdma_ah_set_static_rate(&attr, cmd.attr.static_rate);
	rdma_ah_set_port_num(&attr, cmd.attr.port_num);

	if (cmd.attr.is_global) {
		rdma_ah_set_grh(&attr, NULL, cmd.attr.grh.flow_label,
				cmd.attr.grh.sgid_index,
				cmd.attr.grh.hop_limit,
				cmd.attr.grh.traffic_class);
		rdma_ah_set_dgid_raw(&attr, cmd.attr.grh.dgid);
	} else {
		rdma_ah_set_ah_flags(&attr, 0);
	}

	ah = rdma_create_user_ah(pd, &attr, &attrs->driver_udata);
	if (IS_ERR(ah)) {
		ret = PTR_ERR(ah);
		goto err_put;
	}

	ah->uobject = uobj;
	uobj->user_handle = cmd.user_handle;
	uobj->object = ah;
	uobj_put_obj_read(pd);
	uobj_finalize_uobj_create(uobj, attrs);

	resp.ah_handle = uobj->id;
	return uverbs_response(attrs, &resp, sizeof(resp));

err_put:
	uobj_put_obj_read(pd);
err:
	uobj_alloc_abort(uobj, attrs);
2490 return ret; 2491 } 2492 2493 static int ib_uverbs_destroy_ah(struct uverbs_attr_bundle *attrs) 2494 { 2495 struct ib_uverbs_destroy_ah cmd; 2496 int ret; 2497 2498 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 2499 if (ret) 2500 return ret; 2501 2502 return uobj_perform_destroy(UVERBS_OBJECT_AH, cmd.ah_handle, attrs); 2503 } 2504 2505 static int ib_uverbs_attach_mcast(struct uverbs_attr_bundle *attrs) 2506 { 2507 struct ib_uverbs_attach_mcast cmd; 2508 struct ib_qp *qp; 2509 struct ib_uqp_object *obj; 2510 struct ib_uverbs_mcast_entry *mcast; 2511 int ret; 2512 2513 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 2514 if (ret) 2515 return ret; 2516 2517 qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs); 2518 if (IS_ERR(qp)) 2519 return PTR_ERR(qp); 2520 2521 obj = qp->uobject; 2522 2523 mutex_lock(&obj->mcast_lock); 2524 list_for_each_entry(mcast, &obj->mcast_list, list) 2525 if (cmd.mlid == mcast->lid && 2526 !memcmp(cmd.gid, mcast->gid.raw, sizeof mcast->gid.raw)) { 2527 ret = 0; 2528 goto out_put; 2529 } 2530 2531 mcast = kmalloc_obj(*mcast); 2532 if (!mcast) { 2533 ret = -ENOMEM; 2534 goto out_put; 2535 } 2536 2537 mcast->lid = cmd.mlid; 2538 memcpy(mcast->gid.raw, cmd.gid, sizeof mcast->gid.raw); 2539 2540 ret = ib_attach_mcast(qp, &mcast->gid, cmd.mlid); 2541 if (!ret) 2542 list_add_tail(&mcast->list, &obj->mcast_list); 2543 else 2544 kfree(mcast); 2545 2546 out_put: 2547 mutex_unlock(&obj->mcast_lock); 2548 rdma_lookup_put_uobject(&qp->uobject->uevent.uobject, 2549 UVERBS_LOOKUP_READ); 2550 2551 return ret; 2552 } 2553 2554 static int ib_uverbs_detach_mcast(struct uverbs_attr_bundle *attrs) 2555 { 2556 struct ib_uverbs_detach_mcast cmd; 2557 struct ib_uqp_object *obj; 2558 struct ib_qp *qp; 2559 struct ib_uverbs_mcast_entry *mcast; 2560 int ret; 2561 bool found = false; 2562 2563 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 2564 if (ret) 2565 return ret; 2566 2567 qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs); 
2568 if (IS_ERR(qp)) 2569 return PTR_ERR(qp); 2570 2571 obj = qp->uobject; 2572 mutex_lock(&obj->mcast_lock); 2573 2574 list_for_each_entry(mcast, &obj->mcast_list, list) 2575 if (cmd.mlid == mcast->lid && 2576 !memcmp(cmd.gid, mcast->gid.raw, sizeof mcast->gid.raw)) { 2577 list_del(&mcast->list); 2578 kfree(mcast); 2579 found = true; 2580 break; 2581 } 2582 2583 if (!found) { 2584 ret = -EINVAL; 2585 goto out_put; 2586 } 2587 2588 ret = ib_detach_mcast(qp, (union ib_gid *)cmd.gid, cmd.mlid); 2589 2590 out_put: 2591 mutex_unlock(&obj->mcast_lock); 2592 rdma_lookup_put_uobject(&qp->uobject->uevent.uobject, 2593 UVERBS_LOOKUP_READ); 2594 return ret; 2595 } 2596 2597 struct ib_uflow_resources *flow_resources_alloc(size_t num_specs) 2598 { 2599 struct ib_uflow_resources *resources; 2600 2601 resources = kzalloc_obj(*resources); 2602 2603 if (!resources) 2604 return NULL; 2605 2606 if (!num_specs) 2607 goto out; 2608 2609 resources->counters = 2610 kzalloc_objs(*resources->counters, num_specs); 2611 resources->collection = 2612 kzalloc_objs(*resources->collection, num_specs); 2613 2614 if (!resources->counters || !resources->collection) 2615 goto err; 2616 2617 out: 2618 resources->max = num_specs; 2619 return resources; 2620 2621 err: 2622 kfree(resources->counters); 2623 kfree(resources); 2624 2625 return NULL; 2626 } 2627 EXPORT_SYMBOL(flow_resources_alloc); 2628 2629 void ib_uverbs_flow_resources_free(struct ib_uflow_resources *uflow_res) 2630 { 2631 unsigned int i; 2632 2633 if (!uflow_res) 2634 return; 2635 2636 for (i = 0; i < uflow_res->collection_num; i++) 2637 atomic_dec(&uflow_res->collection[i]->usecnt); 2638 2639 for (i = 0; i < uflow_res->counters_num; i++) 2640 atomic_dec(&uflow_res->counters[i]->usecnt); 2641 2642 kfree(uflow_res->collection); 2643 kfree(uflow_res->counters); 2644 kfree(uflow_res); 2645 } 2646 EXPORT_SYMBOL(ib_uverbs_flow_resources_free); 2647 2648 void flow_resources_add(struct ib_uflow_resources *uflow_res, 2649 enum ib_flow_spec_type 
type, 2650 void *ibobj) 2651 { 2652 WARN_ON(uflow_res->num >= uflow_res->max); 2653 2654 switch (type) { 2655 case IB_FLOW_SPEC_ACTION_HANDLE: 2656 atomic_inc(&((struct ib_flow_action *)ibobj)->usecnt); 2657 uflow_res->collection[uflow_res->collection_num++] = 2658 (struct ib_flow_action *)ibobj; 2659 break; 2660 case IB_FLOW_SPEC_ACTION_COUNT: 2661 atomic_inc(&((struct ib_counters *)ibobj)->usecnt); 2662 uflow_res->counters[uflow_res->counters_num++] = 2663 (struct ib_counters *)ibobj; 2664 break; 2665 default: 2666 WARN_ON(1); 2667 } 2668 2669 uflow_res->num++; 2670 } 2671 EXPORT_SYMBOL(flow_resources_add); 2672 2673 static int kern_spec_to_ib_spec_action(struct uverbs_attr_bundle *attrs, 2674 struct ib_uverbs_flow_spec *kern_spec, 2675 union ib_flow_spec *ib_spec, 2676 struct ib_uflow_resources *uflow_res) 2677 { 2678 ib_spec->type = kern_spec->type; 2679 switch (ib_spec->type) { 2680 case IB_FLOW_SPEC_ACTION_TAG: 2681 if (kern_spec->flow_tag.size != 2682 sizeof(struct ib_uverbs_flow_spec_action_tag)) 2683 return -EINVAL; 2684 2685 ib_spec->flow_tag.size = sizeof(struct ib_flow_spec_action_tag); 2686 ib_spec->flow_tag.tag_id = kern_spec->flow_tag.tag_id; 2687 break; 2688 case IB_FLOW_SPEC_ACTION_DROP: 2689 if (kern_spec->drop.size != 2690 sizeof(struct ib_uverbs_flow_spec_action_drop)) 2691 return -EINVAL; 2692 2693 ib_spec->drop.size = sizeof(struct ib_flow_spec_action_drop); 2694 break; 2695 case IB_FLOW_SPEC_ACTION_HANDLE: 2696 if (kern_spec->action.size != 2697 sizeof(struct ib_uverbs_flow_spec_action_handle)) 2698 return -EOPNOTSUPP; 2699 ib_spec->action.act = uobj_get_obj_read(flow_action, 2700 UVERBS_OBJECT_FLOW_ACTION, 2701 kern_spec->action.handle, 2702 attrs); 2703 if (IS_ERR(ib_spec->action.act)) 2704 return PTR_ERR(ib_spec->action.act); 2705 ib_spec->action.size = 2706 sizeof(struct ib_flow_spec_action_handle); 2707 flow_resources_add(uflow_res, 2708 IB_FLOW_SPEC_ACTION_HANDLE, 2709 ib_spec->action.act); 2710 uobj_put_obj_read(ib_spec->action.act); 
2711 break; 2712 case IB_FLOW_SPEC_ACTION_COUNT: 2713 if (kern_spec->flow_count.size != 2714 sizeof(struct ib_uverbs_flow_spec_action_count)) 2715 return -EINVAL; 2716 ib_spec->flow_count.counters = 2717 uobj_get_obj_read(counters, 2718 UVERBS_OBJECT_COUNTERS, 2719 kern_spec->flow_count.handle, 2720 attrs); 2721 if (IS_ERR(ib_spec->flow_count.counters)) 2722 return PTR_ERR(ib_spec->flow_count.counters); 2723 ib_spec->flow_count.size = 2724 sizeof(struct ib_flow_spec_action_count); 2725 flow_resources_add(uflow_res, 2726 IB_FLOW_SPEC_ACTION_COUNT, 2727 ib_spec->flow_count.counters); 2728 uobj_put_obj_read(ib_spec->flow_count.counters); 2729 break; 2730 default: 2731 return -EINVAL; 2732 } 2733 return 0; 2734 } 2735 2736 static ssize_t spec_filter_size(const void *kern_spec_filter, u16 kern_filter_size, 2737 u16 ib_real_filter_sz) 2738 { 2739 /* 2740 * User space filter structures must be 64 bit aligned, otherwise this 2741 * may pass, but we won't handle additional new attributes. 2742 */ 2743 2744 if (kern_filter_size > ib_real_filter_sz) { 2745 if (memchr_inv(kern_spec_filter + 2746 ib_real_filter_sz, 0, 2747 kern_filter_size - ib_real_filter_sz)) 2748 return -EINVAL; 2749 return ib_real_filter_sz; 2750 } 2751 return kern_filter_size; 2752 } 2753 2754 int ib_uverbs_kern_spec_to_ib_spec_filter(enum ib_flow_spec_type type, 2755 const void *kern_spec_mask, 2756 const void *kern_spec_val, 2757 size_t kern_filter_sz, 2758 union ib_flow_spec *ib_spec) 2759 { 2760 ssize_t actual_filter_sz; 2761 ssize_t ib_filter_sz; 2762 2763 /* User flow spec size must be aligned to 4 bytes */ 2764 if (kern_filter_sz != ALIGN(kern_filter_sz, 4)) 2765 return -EINVAL; 2766 2767 ib_spec->type = type; 2768 2769 if (ib_spec->type == (IB_FLOW_SPEC_INNER | IB_FLOW_SPEC_VXLAN_TUNNEL)) 2770 return -EINVAL; 2771 2772 switch (ib_spec->type & ~IB_FLOW_SPEC_INNER) { 2773 case IB_FLOW_SPEC_ETH: 2774 ib_filter_sz = sizeof(struct ib_flow_eth_filter); 2775 actual_filter_sz = 
spec_filter_size(kern_spec_mask, 2776 kern_filter_sz, 2777 ib_filter_sz); 2778 if (actual_filter_sz <= 0) 2779 return -EINVAL; 2780 ib_spec->size = sizeof(struct ib_flow_spec_eth); 2781 memcpy(&ib_spec->eth.val, kern_spec_val, actual_filter_sz); 2782 memcpy(&ib_spec->eth.mask, kern_spec_mask, actual_filter_sz); 2783 break; 2784 case IB_FLOW_SPEC_IPV4: 2785 ib_filter_sz = sizeof(struct ib_flow_ipv4_filter); 2786 actual_filter_sz = spec_filter_size(kern_spec_mask, 2787 kern_filter_sz, 2788 ib_filter_sz); 2789 if (actual_filter_sz <= 0) 2790 return -EINVAL; 2791 ib_spec->size = sizeof(struct ib_flow_spec_ipv4); 2792 memcpy(&ib_spec->ipv4.val, kern_spec_val, actual_filter_sz); 2793 memcpy(&ib_spec->ipv4.mask, kern_spec_mask, actual_filter_sz); 2794 break; 2795 case IB_FLOW_SPEC_IPV6: 2796 ib_filter_sz = sizeof(struct ib_flow_ipv6_filter); 2797 actual_filter_sz = spec_filter_size(kern_spec_mask, 2798 kern_filter_sz, 2799 ib_filter_sz); 2800 if (actual_filter_sz <= 0) 2801 return -EINVAL; 2802 ib_spec->size = sizeof(struct ib_flow_spec_ipv6); 2803 memcpy(&ib_spec->ipv6.val, kern_spec_val, actual_filter_sz); 2804 memcpy(&ib_spec->ipv6.mask, kern_spec_mask, actual_filter_sz); 2805 2806 if ((ntohl(ib_spec->ipv6.mask.flow_label)) >= BIT(20) || 2807 (ntohl(ib_spec->ipv6.val.flow_label)) >= BIT(20)) 2808 return -EINVAL; 2809 break; 2810 case IB_FLOW_SPEC_TCP: 2811 case IB_FLOW_SPEC_UDP: 2812 ib_filter_sz = sizeof(struct ib_flow_tcp_udp_filter); 2813 actual_filter_sz = spec_filter_size(kern_spec_mask, 2814 kern_filter_sz, 2815 ib_filter_sz); 2816 if (actual_filter_sz <= 0) 2817 return -EINVAL; 2818 ib_spec->size = sizeof(struct ib_flow_spec_tcp_udp); 2819 memcpy(&ib_spec->tcp_udp.val, kern_spec_val, actual_filter_sz); 2820 memcpy(&ib_spec->tcp_udp.mask, kern_spec_mask, actual_filter_sz); 2821 break; 2822 case IB_FLOW_SPEC_VXLAN_TUNNEL: 2823 ib_filter_sz = sizeof(struct ib_flow_tunnel_filter); 2824 actual_filter_sz = spec_filter_size(kern_spec_mask, 2825 kern_filter_sz, 2826 
ib_filter_sz); 2827 if (actual_filter_sz <= 0) 2828 return -EINVAL; 2829 ib_spec->tunnel.size = sizeof(struct ib_flow_spec_tunnel); 2830 memcpy(&ib_spec->tunnel.val, kern_spec_val, actual_filter_sz); 2831 memcpy(&ib_spec->tunnel.mask, kern_spec_mask, actual_filter_sz); 2832 2833 if ((ntohl(ib_spec->tunnel.mask.tunnel_id)) >= BIT(24) || 2834 (ntohl(ib_spec->tunnel.val.tunnel_id)) >= BIT(24)) 2835 return -EINVAL; 2836 break; 2837 case IB_FLOW_SPEC_ESP: 2838 ib_filter_sz = sizeof(struct ib_flow_esp_filter); 2839 actual_filter_sz = spec_filter_size(kern_spec_mask, 2840 kern_filter_sz, 2841 ib_filter_sz); 2842 if (actual_filter_sz <= 0) 2843 return -EINVAL; 2844 ib_spec->esp.size = sizeof(struct ib_flow_spec_esp); 2845 memcpy(&ib_spec->esp.val, kern_spec_val, actual_filter_sz); 2846 memcpy(&ib_spec->esp.mask, kern_spec_mask, actual_filter_sz); 2847 break; 2848 case IB_FLOW_SPEC_GRE: 2849 ib_filter_sz = sizeof(struct ib_flow_gre_filter); 2850 actual_filter_sz = spec_filter_size(kern_spec_mask, 2851 kern_filter_sz, 2852 ib_filter_sz); 2853 if (actual_filter_sz <= 0) 2854 return -EINVAL; 2855 ib_spec->gre.size = sizeof(struct ib_flow_spec_gre); 2856 memcpy(&ib_spec->gre.val, kern_spec_val, actual_filter_sz); 2857 memcpy(&ib_spec->gre.mask, kern_spec_mask, actual_filter_sz); 2858 break; 2859 case IB_FLOW_SPEC_MPLS: 2860 ib_filter_sz = sizeof(struct ib_flow_mpls_filter); 2861 actual_filter_sz = spec_filter_size(kern_spec_mask, 2862 kern_filter_sz, 2863 ib_filter_sz); 2864 if (actual_filter_sz <= 0) 2865 return -EINVAL; 2866 ib_spec->mpls.size = sizeof(struct ib_flow_spec_mpls); 2867 memcpy(&ib_spec->mpls.val, kern_spec_val, actual_filter_sz); 2868 memcpy(&ib_spec->mpls.mask, kern_spec_mask, actual_filter_sz); 2869 break; 2870 default: 2871 return -EINVAL; 2872 } 2873 return 0; 2874 } 2875 2876 static int kern_spec_to_ib_spec_filter(struct ib_uverbs_flow_spec *kern_spec, 2877 union ib_flow_spec *ib_spec) 2878 { 2879 size_t kern_filter_sz; 2880 void *kern_spec_mask; 2881 void 
*kern_spec_val; 2882 2883 if (check_sub_overflow((size_t)kern_spec->hdr.size, 2884 sizeof(struct ib_uverbs_flow_spec_hdr), 2885 &kern_filter_sz)) 2886 return -EINVAL; 2887 2888 kern_filter_sz /= 2; 2889 2890 kern_spec_val = (void *)kern_spec + 2891 sizeof(struct ib_uverbs_flow_spec_hdr); 2892 kern_spec_mask = kern_spec_val + kern_filter_sz; 2893 2894 return ib_uverbs_kern_spec_to_ib_spec_filter(kern_spec->type, 2895 kern_spec_mask, 2896 kern_spec_val, 2897 kern_filter_sz, ib_spec); 2898 } 2899 2900 static int kern_spec_to_ib_spec(struct uverbs_attr_bundle *attrs, 2901 struct ib_uverbs_flow_spec *kern_spec, 2902 union ib_flow_spec *ib_spec, 2903 struct ib_uflow_resources *uflow_res) 2904 { 2905 if (kern_spec->reserved) 2906 return -EINVAL; 2907 2908 if (kern_spec->type >= IB_FLOW_SPEC_ACTION_TAG) 2909 return kern_spec_to_ib_spec_action(attrs, kern_spec, ib_spec, 2910 uflow_res); 2911 else 2912 return kern_spec_to_ib_spec_filter(kern_spec, ib_spec); 2913 } 2914 2915 static int ib_uverbs_ex_create_wq(struct uverbs_attr_bundle *attrs) 2916 { 2917 struct ib_uverbs_ex_create_wq cmd; 2918 struct ib_uverbs_ex_create_wq_resp resp = {}; 2919 struct ib_uwq_object *obj; 2920 int err = 0; 2921 struct ib_cq *cq; 2922 struct ib_pd *pd; 2923 struct ib_wq *wq; 2924 struct ib_wq_init_attr wq_init_attr = {}; 2925 struct ib_device *ib_dev; 2926 2927 err = uverbs_request(attrs, &cmd, sizeof(cmd)); 2928 if (err) 2929 return err; 2930 2931 if (cmd.comp_mask) 2932 return -EOPNOTSUPP; 2933 2934 obj = (struct ib_uwq_object *)uobj_alloc(UVERBS_OBJECT_WQ, attrs, 2935 &ib_dev); 2936 if (IS_ERR(obj)) 2937 return PTR_ERR(obj); 2938 2939 pd = uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd.pd_handle, attrs); 2940 if (IS_ERR(pd)) { 2941 err = PTR_ERR(pd); 2942 goto err_uobj; 2943 } 2944 2945 cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, cmd.cq_handle, attrs); 2946 if (IS_ERR(cq)) { 2947 err = PTR_ERR(cq); 2948 goto err_put_pd; 2949 } 2950 2951 wq_init_attr.cq = cq; 2952 wq_init_attr.max_sge = 
cmd.max_sge; 2953 wq_init_attr.max_wr = cmd.max_wr; 2954 wq_init_attr.wq_type = cmd.wq_type; 2955 wq_init_attr.event_handler = ib_uverbs_wq_event_handler; 2956 wq_init_attr.create_flags = cmd.create_flags; 2957 INIT_LIST_HEAD(&obj->uevent.event_list); 2958 obj->uevent.uobject.user_handle = cmd.user_handle; 2959 2960 wq = pd->device->ops.create_wq(pd, &wq_init_attr, &attrs->driver_udata); 2961 if (IS_ERR(wq)) { 2962 err = PTR_ERR(wq); 2963 goto err_put_cq; 2964 } 2965 2966 wq->uobject = obj; 2967 obj->uevent.uobject.object = wq; 2968 wq->wq_type = wq_init_attr.wq_type; 2969 wq->cq = cq; 2970 wq->pd = pd; 2971 wq->device = pd->device; 2972 atomic_set(&wq->usecnt, 0); 2973 atomic_inc(&pd->usecnt); 2974 atomic_inc(&cq->usecnt); 2975 obj->uevent.event_file = READ_ONCE(attrs->ufile->default_async_file); 2976 if (obj->uevent.event_file) 2977 uverbs_uobject_get(&obj->uevent.event_file->uobj); 2978 2979 uobj_put_obj_read(pd); 2980 rdma_lookup_put_uobject(&cq->uobject->uevent.uobject, 2981 UVERBS_LOOKUP_READ); 2982 uobj_finalize_uobj_create(&obj->uevent.uobject, attrs); 2983 2984 resp.wq_handle = obj->uevent.uobject.id; 2985 resp.max_sge = wq_init_attr.max_sge; 2986 resp.max_wr = wq_init_attr.max_wr; 2987 resp.wqn = wq->wq_num; 2988 resp.response_length = uverbs_response_length(attrs, sizeof(resp)); 2989 return uverbs_response(attrs, &resp, sizeof(resp)); 2990 2991 err_put_cq: 2992 rdma_lookup_put_uobject(&cq->uobject->uevent.uobject, 2993 UVERBS_LOOKUP_READ); 2994 err_put_pd: 2995 uobj_put_obj_read(pd); 2996 err_uobj: 2997 uobj_alloc_abort(&obj->uevent.uobject, attrs); 2998 2999 return err; 3000 } 3001 3002 static int ib_uverbs_ex_destroy_wq(struct uverbs_attr_bundle *attrs) 3003 { 3004 struct ib_uverbs_ex_destroy_wq cmd; 3005 struct ib_uverbs_ex_destroy_wq_resp resp = {}; 3006 struct ib_uobject *uobj; 3007 struct ib_uwq_object *obj; 3008 int ret; 3009 3010 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3011 if (ret) 3012 return ret; 3013 3014 if (cmd.comp_mask) 3015 
return -EOPNOTSUPP; 3016 3017 resp.response_length = uverbs_response_length(attrs, sizeof(resp)); 3018 uobj = uobj_get_destroy(UVERBS_OBJECT_WQ, cmd.wq_handle, attrs); 3019 if (IS_ERR(uobj)) 3020 return PTR_ERR(uobj); 3021 3022 obj = container_of(uobj, struct ib_uwq_object, uevent.uobject); 3023 resp.events_reported = obj->uevent.events_reported; 3024 3025 uobj_put_destroy(uobj); 3026 3027 return uverbs_response(attrs, &resp, sizeof(resp)); 3028 } 3029 3030 static int ib_uverbs_ex_modify_wq(struct uverbs_attr_bundle *attrs) 3031 { 3032 struct ib_uverbs_ex_modify_wq cmd; 3033 struct ib_wq *wq; 3034 struct ib_wq_attr wq_attr = {}; 3035 int ret; 3036 3037 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3038 if (ret) 3039 return ret; 3040 3041 if (!cmd.attr_mask) 3042 return -EINVAL; 3043 3044 if (cmd.attr_mask > (IB_WQ_STATE | IB_WQ_CUR_STATE | IB_WQ_FLAGS)) 3045 return -EINVAL; 3046 3047 wq = uobj_get_obj_read(wq, UVERBS_OBJECT_WQ, cmd.wq_handle, attrs); 3048 if (IS_ERR(wq)) 3049 return PTR_ERR(wq); 3050 3051 if (cmd.attr_mask & IB_WQ_FLAGS) { 3052 wq_attr.flags = cmd.flags; 3053 wq_attr.flags_mask = cmd.flags_mask; 3054 } 3055 3056 if (cmd.attr_mask & IB_WQ_CUR_STATE) { 3057 if (cmd.curr_wq_state > IB_WQS_ERR) 3058 return -EINVAL; 3059 3060 wq_attr.curr_wq_state = cmd.curr_wq_state; 3061 } else { 3062 wq_attr.curr_wq_state = wq->state; 3063 } 3064 3065 if (cmd.attr_mask & IB_WQ_STATE) { 3066 if (cmd.wq_state > IB_WQS_ERR) 3067 return -EINVAL; 3068 3069 wq_attr.wq_state = cmd.wq_state; 3070 } else { 3071 wq_attr.wq_state = wq_attr.curr_wq_state; 3072 } 3073 3074 ret = wq->device->ops.modify_wq(wq, &wq_attr, cmd.attr_mask, 3075 &attrs->driver_udata); 3076 rdma_lookup_put_uobject(&wq->uobject->uevent.uobject, 3077 UVERBS_LOOKUP_READ); 3078 return ret; 3079 } 3080 3081 static int ib_uverbs_ex_create_rwq_ind_table(struct uverbs_attr_bundle *attrs) 3082 { 3083 struct ib_uverbs_ex_create_rwq_ind_table cmd; 3084 struct ib_uverbs_ex_create_rwq_ind_table_resp resp = {}; 3085 
struct ib_uobject *uobj; 3086 int err; 3087 struct ib_rwq_ind_table_init_attr init_attr = {}; 3088 struct ib_rwq_ind_table *rwq_ind_tbl; 3089 struct ib_wq **wqs = NULL; 3090 u32 *wqs_handles = NULL; 3091 struct ib_wq *wq = NULL; 3092 int i, num_read_wqs; 3093 u32 num_wq_handles; 3094 struct uverbs_req_iter iter; 3095 struct ib_device *ib_dev; 3096 3097 err = uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd)); 3098 if (err) 3099 return err; 3100 3101 if (cmd.comp_mask) 3102 return -EOPNOTSUPP; 3103 3104 if (cmd.log_ind_tbl_size > IB_USER_VERBS_MAX_LOG_IND_TBL_SIZE) 3105 return -EINVAL; 3106 3107 num_wq_handles = 1 << cmd.log_ind_tbl_size; 3108 wqs_handles = kcalloc(num_wq_handles, sizeof(*wqs_handles), 3109 GFP_KERNEL); 3110 if (!wqs_handles) 3111 return -ENOMEM; 3112 3113 err = uverbs_request_next(&iter, wqs_handles, 3114 num_wq_handles * sizeof(__u32)); 3115 if (err) 3116 goto err_free; 3117 3118 err = uverbs_request_finish(&iter); 3119 if (err) 3120 goto err_free; 3121 3122 wqs = kzalloc_objs(*wqs, num_wq_handles); 3123 if (!wqs) { 3124 err = -ENOMEM; 3125 goto err_free; 3126 } 3127 3128 for (num_read_wqs = 0; num_read_wqs < num_wq_handles; 3129 num_read_wqs++) { 3130 wq = uobj_get_obj_read(wq, UVERBS_OBJECT_WQ, 3131 wqs_handles[num_read_wqs], attrs); 3132 if (IS_ERR(wq)) { 3133 err = PTR_ERR(wq); 3134 goto put_wqs; 3135 } 3136 3137 wqs[num_read_wqs] = wq; 3138 atomic_inc(&wqs[num_read_wqs]->usecnt); 3139 } 3140 3141 uobj = uobj_alloc(UVERBS_OBJECT_RWQ_IND_TBL, attrs, &ib_dev); 3142 if (IS_ERR(uobj)) { 3143 err = PTR_ERR(uobj); 3144 goto put_wqs; 3145 } 3146 3147 rwq_ind_tbl = rdma_zalloc_drv_obj(ib_dev, ib_rwq_ind_table); 3148 if (!rwq_ind_tbl) { 3149 err = -ENOMEM; 3150 goto err_uobj; 3151 } 3152 3153 init_attr.log_ind_tbl_size = cmd.log_ind_tbl_size; 3154 init_attr.ind_tbl = wqs; 3155 3156 rwq_ind_tbl->ind_tbl = wqs; 3157 rwq_ind_tbl->log_ind_tbl_size = init_attr.log_ind_tbl_size; 3158 rwq_ind_tbl->uobject = uobj; 3159 uobj->object = rwq_ind_tbl; 3160 
rwq_ind_tbl->device = ib_dev; 3161 atomic_set(&rwq_ind_tbl->usecnt, 0); 3162 3163 err = ib_dev->ops.create_rwq_ind_table(rwq_ind_tbl, &init_attr, 3164 &attrs->driver_udata); 3165 if (err) 3166 goto err_create; 3167 3168 for (i = 0; i < num_wq_handles; i++) 3169 rdma_lookup_put_uobject(&wqs[i]->uobject->uevent.uobject, 3170 UVERBS_LOOKUP_READ); 3171 kfree(wqs_handles); 3172 uobj_finalize_uobj_create(uobj, attrs); 3173 3174 resp.ind_tbl_handle = uobj->id; 3175 resp.ind_tbl_num = rwq_ind_tbl->ind_tbl_num; 3176 resp.response_length = uverbs_response_length(attrs, sizeof(resp)); 3177 return uverbs_response(attrs, &resp, sizeof(resp)); 3178 3179 err_create: 3180 kfree(rwq_ind_tbl); 3181 err_uobj: 3182 uobj_alloc_abort(uobj, attrs); 3183 put_wqs: 3184 for (i = 0; i < num_read_wqs; i++) { 3185 rdma_lookup_put_uobject(&wqs[i]->uobject->uevent.uobject, 3186 UVERBS_LOOKUP_READ); 3187 atomic_dec(&wqs[i]->usecnt); 3188 } 3189 err_free: 3190 kfree(wqs_handles); 3191 kfree(wqs); 3192 return err; 3193 } 3194 3195 static int ib_uverbs_ex_destroy_rwq_ind_table(struct uverbs_attr_bundle *attrs) 3196 { 3197 struct ib_uverbs_ex_destroy_rwq_ind_table cmd; 3198 int ret; 3199 3200 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3201 if (ret) 3202 return ret; 3203 3204 if (cmd.comp_mask) 3205 return -EOPNOTSUPP; 3206 3207 return uobj_perform_destroy(UVERBS_OBJECT_RWQ_IND_TBL, 3208 cmd.ind_tbl_handle, attrs); 3209 } 3210 3211 static int ib_uverbs_ex_create_flow(struct uverbs_attr_bundle *attrs) 3212 { 3213 struct ib_uverbs_create_flow cmd; 3214 struct ib_uverbs_create_flow_resp resp = {}; 3215 struct ib_uobject *uobj; 3216 struct ib_flow *flow_id; 3217 struct ib_uverbs_flow_attr *kern_flow_attr; 3218 struct ib_flow_attr *flow_attr; 3219 struct ib_qp *qp; 3220 struct ib_uflow_resources *uflow_res; 3221 struct ib_uverbs_flow_spec_hdr *kern_spec; 3222 struct uverbs_req_iter iter; 3223 int err; 3224 void *ib_spec; 3225 int i; 3226 struct ib_device *ib_dev; 3227 3228 err = 
uverbs_request_start(attrs, &iter, &cmd, sizeof(cmd)); 3229 if (err) 3230 return err; 3231 3232 if (cmd.comp_mask) 3233 return -EINVAL; 3234 3235 if (!rdma_uattrs_has_raw_cap(attrs)) 3236 return -EPERM; 3237 3238 if (cmd.flow_attr.flags >= IB_FLOW_ATTR_FLAGS_RESERVED) 3239 return -EINVAL; 3240 3241 if ((cmd.flow_attr.flags & IB_FLOW_ATTR_FLAGS_DONT_TRAP) && 3242 ((cmd.flow_attr.type == IB_FLOW_ATTR_ALL_DEFAULT) || 3243 (cmd.flow_attr.type == IB_FLOW_ATTR_MC_DEFAULT))) 3244 return -EINVAL; 3245 3246 if (cmd.flow_attr.num_of_specs > IB_FLOW_SPEC_SUPPORT_LAYERS) 3247 return -EINVAL; 3248 3249 if (cmd.flow_attr.size > 3250 (cmd.flow_attr.num_of_specs * sizeof(struct ib_uverbs_flow_spec))) 3251 return -EINVAL; 3252 3253 if (cmd.flow_attr.reserved[0] || 3254 cmd.flow_attr.reserved[1]) 3255 return -EINVAL; 3256 3257 if (cmd.flow_attr.num_of_specs) { 3258 kern_flow_attr = kmalloc(sizeof(*kern_flow_attr) + cmd.flow_attr.size, 3259 GFP_KERNEL); 3260 if (!kern_flow_attr) 3261 return -ENOMEM; 3262 3263 *kern_flow_attr = cmd.flow_attr; 3264 err = uverbs_request_next(&iter, &kern_flow_attr->flow_specs, 3265 cmd.flow_attr.size); 3266 if (err) 3267 goto err_free_attr; 3268 } else { 3269 kern_flow_attr = &cmd.flow_attr; 3270 } 3271 3272 err = uverbs_request_finish(&iter); 3273 if (err) 3274 goto err_free_attr; 3275 3276 uobj = uobj_alloc(UVERBS_OBJECT_FLOW, attrs, &ib_dev); 3277 if (IS_ERR(uobj)) { 3278 err = PTR_ERR(uobj); 3279 goto err_free_attr; 3280 } 3281 3282 if (!rdma_is_port_valid(uobj->context->device, cmd.flow_attr.port)) { 3283 err = -EINVAL; 3284 goto err_uobj; 3285 } 3286 3287 qp = uobj_get_obj_read(qp, UVERBS_OBJECT_QP, cmd.qp_handle, attrs); 3288 if (IS_ERR(qp)) { 3289 err = PTR_ERR(qp); 3290 goto err_uobj; 3291 } 3292 3293 if (qp->qp_type != IB_QPT_UD && qp->qp_type != IB_QPT_RAW_PACKET) { 3294 err = -EINVAL; 3295 goto err_put; 3296 } 3297 3298 flow_attr = kzalloc_flex(*flow_attr, flows, cmd.flow_attr.num_of_specs); 3299 if (!flow_attr) { 3300 err = -ENOMEM; 3301 
goto err_put; 3302 } 3303 uflow_res = flow_resources_alloc(cmd.flow_attr.num_of_specs); 3304 if (!uflow_res) { 3305 err = -ENOMEM; 3306 goto err_free_flow_attr; 3307 } 3308 3309 flow_attr->type = kern_flow_attr->type; 3310 flow_attr->priority = kern_flow_attr->priority; 3311 flow_attr->num_of_specs = kern_flow_attr->num_of_specs; 3312 flow_attr->port = kern_flow_attr->port; 3313 flow_attr->flags = kern_flow_attr->flags; 3314 flow_attr->size = sizeof(*flow_attr); 3315 3316 kern_spec = kern_flow_attr->flow_specs; 3317 ib_spec = flow_attr + 1; 3318 for (i = 0; i < flow_attr->num_of_specs && 3319 cmd.flow_attr.size >= sizeof(*kern_spec) && 3320 cmd.flow_attr.size >= kern_spec->size; 3321 i++) { 3322 err = kern_spec_to_ib_spec( 3323 attrs, (struct ib_uverbs_flow_spec *)kern_spec, 3324 ib_spec, uflow_res); 3325 if (err) 3326 goto err_free; 3327 3328 flow_attr->size += 3329 ((union ib_flow_spec *) ib_spec)->size; 3330 cmd.flow_attr.size -= kern_spec->size; 3331 kern_spec = ((void *)kern_spec) + kern_spec->size; 3332 ib_spec += ((union ib_flow_spec *) ib_spec)->size; 3333 } 3334 if (cmd.flow_attr.size || (i != flow_attr->num_of_specs)) { 3335 pr_warn("create flow failed, flow %d: %u bytes left from uverb cmd\n", 3336 i, cmd.flow_attr.size); 3337 err = -EINVAL; 3338 goto err_free; 3339 } 3340 3341 flow_id = qp->device->ops.create_flow(qp, flow_attr, 3342 &attrs->driver_udata); 3343 3344 if (IS_ERR(flow_id)) { 3345 err = PTR_ERR(flow_id); 3346 goto err_free; 3347 } 3348 3349 ib_set_flow(uobj, flow_id, qp, qp->device, uflow_res); 3350 3351 rdma_lookup_put_uobject(&qp->uobject->uevent.uobject, 3352 UVERBS_LOOKUP_READ); 3353 kfree(flow_attr); 3354 3355 if (cmd.flow_attr.num_of_specs) 3356 kfree(kern_flow_attr); 3357 uobj_finalize_uobj_create(uobj, attrs); 3358 3359 resp.flow_handle = uobj->id; 3360 return uverbs_response(attrs, &resp, sizeof(resp)); 3361 3362 err_free: 3363 ib_uverbs_flow_resources_free(uflow_res); 3364 err_free_flow_attr: 3365 kfree(flow_attr); 3366 err_put: 
3367 rdma_lookup_put_uobject(&qp->uobject->uevent.uobject, 3368 UVERBS_LOOKUP_READ); 3369 err_uobj: 3370 uobj_alloc_abort(uobj, attrs); 3371 err_free_attr: 3372 if (cmd.flow_attr.num_of_specs) 3373 kfree(kern_flow_attr); 3374 return err; 3375 } 3376 3377 static int ib_uverbs_ex_destroy_flow(struct uverbs_attr_bundle *attrs) 3378 { 3379 struct ib_uverbs_destroy_flow cmd; 3380 int ret; 3381 3382 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3383 if (ret) 3384 return ret; 3385 3386 if (cmd.comp_mask) 3387 return -EINVAL; 3388 3389 return uobj_perform_destroy(UVERBS_OBJECT_FLOW, cmd.flow_handle, attrs); 3390 } 3391 3392 static int __uverbs_create_xsrq(struct uverbs_attr_bundle *attrs, 3393 struct ib_uverbs_create_xsrq *cmd, 3394 struct ib_udata *udata) 3395 { 3396 struct ib_uverbs_create_srq_resp resp = {}; 3397 struct ib_usrq_object *obj; 3398 struct ib_pd *pd; 3399 struct ib_srq *srq; 3400 struct ib_srq_init_attr attr; 3401 int ret; 3402 struct ib_uobject *xrcd_uobj; 3403 struct ib_device *ib_dev; 3404 3405 obj = (struct ib_usrq_object *)uobj_alloc(UVERBS_OBJECT_SRQ, attrs, 3406 &ib_dev); 3407 if (IS_ERR(obj)) 3408 return PTR_ERR(obj); 3409 3410 if (cmd->srq_type == IB_SRQT_TM) 3411 attr.ext.tag_matching.max_num_tags = cmd->max_num_tags; 3412 3413 if (cmd->srq_type == IB_SRQT_XRC) { 3414 xrcd_uobj = uobj_get_read(UVERBS_OBJECT_XRCD, cmd->xrcd_handle, 3415 attrs); 3416 if (IS_ERR(xrcd_uobj)) { 3417 ret = -EINVAL; 3418 goto err; 3419 } 3420 3421 attr.ext.xrc.xrcd = (struct ib_xrcd *)xrcd_uobj->object; 3422 if (!attr.ext.xrc.xrcd) { 3423 ret = -EINVAL; 3424 goto err_put_xrcd; 3425 } 3426 3427 obj->uxrcd = container_of(xrcd_uobj, struct ib_uxrcd_object, uobject); 3428 atomic_inc(&obj->uxrcd->refcnt); 3429 } 3430 3431 if (ib_srq_has_cq(cmd->srq_type)) { 3432 attr.ext.cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, 3433 cmd->cq_handle, attrs); 3434 if (IS_ERR(attr.ext.cq)) { 3435 ret = PTR_ERR(attr.ext.cq); 3436 goto err_put_xrcd; 3437 } 3438 } 3439 3440 pd = 
uobj_get_obj_read(pd, UVERBS_OBJECT_PD, cmd->pd_handle, attrs); 3441 if (IS_ERR(pd)) { 3442 ret = PTR_ERR(pd); 3443 goto err_put_cq; 3444 } 3445 3446 attr.event_handler = ib_uverbs_srq_event_handler; 3447 attr.srq_type = cmd->srq_type; 3448 attr.attr.max_wr = cmd->max_wr; 3449 attr.attr.max_sge = cmd->max_sge; 3450 attr.attr.srq_limit = cmd->srq_limit; 3451 3452 INIT_LIST_HEAD(&obj->uevent.event_list); 3453 obj->uevent.uobject.user_handle = cmd->user_handle; 3454 3455 srq = ib_create_srq_user(pd, &attr, obj, udata); 3456 if (IS_ERR(srq)) { 3457 ret = PTR_ERR(srq); 3458 goto err_put_pd; 3459 } 3460 3461 obj->uevent.uobject.object = srq; 3462 obj->uevent.uobject.user_handle = cmd->user_handle; 3463 obj->uevent.event_file = READ_ONCE(attrs->ufile->default_async_file); 3464 if (obj->uevent.event_file) 3465 uverbs_uobject_get(&obj->uevent.event_file->uobj); 3466 3467 if (cmd->srq_type == IB_SRQT_XRC) 3468 resp.srqn = srq->ext.xrc.srq_num; 3469 3470 if (cmd->srq_type == IB_SRQT_XRC) 3471 uobj_put_read(xrcd_uobj); 3472 3473 if (ib_srq_has_cq(cmd->srq_type)) 3474 rdma_lookup_put_uobject(&attr.ext.cq->uobject->uevent.uobject, 3475 UVERBS_LOOKUP_READ); 3476 3477 uobj_put_obj_read(pd); 3478 uobj_finalize_uobj_create(&obj->uevent.uobject, attrs); 3479 3480 resp.srq_handle = obj->uevent.uobject.id; 3481 resp.max_wr = attr.attr.max_wr; 3482 resp.max_sge = attr.attr.max_sge; 3483 return uverbs_response(attrs, &resp, sizeof(resp)); 3484 3485 err_put_pd: 3486 uobj_put_obj_read(pd); 3487 err_put_cq: 3488 if (ib_srq_has_cq(cmd->srq_type)) 3489 rdma_lookup_put_uobject(&attr.ext.cq->uobject->uevent.uobject, 3490 UVERBS_LOOKUP_READ); 3491 3492 err_put_xrcd: 3493 if (cmd->srq_type == IB_SRQT_XRC) { 3494 atomic_dec(&obj->uxrcd->refcnt); 3495 uobj_put_read(xrcd_uobj); 3496 } 3497 3498 err: 3499 uobj_alloc_abort(&obj->uevent.uobject, attrs); 3500 return ret; 3501 } 3502 3503 static int ib_uverbs_create_srq(struct uverbs_attr_bundle *attrs) 3504 { 3505 struct ib_uverbs_create_srq cmd; 3506 
struct ib_uverbs_create_xsrq xcmd; 3507 int ret; 3508 3509 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3510 if (ret) 3511 return ret; 3512 3513 memset(&xcmd, 0, sizeof(xcmd)); 3514 xcmd.response = cmd.response; 3515 xcmd.user_handle = cmd.user_handle; 3516 xcmd.srq_type = IB_SRQT_BASIC; 3517 xcmd.pd_handle = cmd.pd_handle; 3518 xcmd.max_wr = cmd.max_wr; 3519 xcmd.max_sge = cmd.max_sge; 3520 xcmd.srq_limit = cmd.srq_limit; 3521 3522 return __uverbs_create_xsrq(attrs, &xcmd, &attrs->driver_udata); 3523 } 3524 3525 static int ib_uverbs_create_xsrq(struct uverbs_attr_bundle *attrs) 3526 { 3527 struct ib_uverbs_create_xsrq cmd; 3528 int ret; 3529 3530 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3531 if (ret) 3532 return ret; 3533 3534 return __uverbs_create_xsrq(attrs, &cmd, &attrs->driver_udata); 3535 } 3536 3537 static int ib_uverbs_modify_srq(struct uverbs_attr_bundle *attrs) 3538 { 3539 struct ib_uverbs_modify_srq cmd; 3540 struct ib_srq *srq; 3541 struct ib_srq_attr attr; 3542 int ret; 3543 3544 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3545 if (ret) 3546 return ret; 3547 3548 srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs); 3549 if (IS_ERR(srq)) 3550 return PTR_ERR(srq); 3551 3552 attr.max_wr = cmd.max_wr; 3553 attr.srq_limit = cmd.srq_limit; 3554 3555 ret = srq->device->ops.modify_srq(srq, &attr, cmd.attr_mask, 3556 &attrs->driver_udata); 3557 3558 rdma_lookup_put_uobject(&srq->uobject->uevent.uobject, 3559 UVERBS_LOOKUP_READ); 3560 3561 return ret; 3562 } 3563 3564 static int ib_uverbs_query_srq(struct uverbs_attr_bundle *attrs) 3565 { 3566 struct ib_uverbs_query_srq cmd; 3567 struct ib_uverbs_query_srq_resp resp; 3568 struct ib_srq_attr attr; 3569 struct ib_srq *srq; 3570 int ret; 3571 3572 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3573 if (ret) 3574 return ret; 3575 3576 srq = uobj_get_obj_read(srq, UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs); 3577 if (IS_ERR(srq)) 3578 return PTR_ERR(srq); 3579 3580 ret = 
ib_query_srq(srq, &attr); 3581 3582 rdma_lookup_put_uobject(&srq->uobject->uevent.uobject, 3583 UVERBS_LOOKUP_READ); 3584 3585 if (ret) 3586 return ret; 3587 3588 memset(&resp, 0, sizeof resp); 3589 3590 resp.max_wr = attr.max_wr; 3591 resp.max_sge = attr.max_sge; 3592 resp.srq_limit = attr.srq_limit; 3593 3594 return uverbs_response(attrs, &resp, sizeof(resp)); 3595 } 3596 3597 static int ib_uverbs_destroy_srq(struct uverbs_attr_bundle *attrs) 3598 { 3599 struct ib_uverbs_destroy_srq cmd; 3600 struct ib_uverbs_destroy_srq_resp resp; 3601 struct ib_uobject *uobj; 3602 struct ib_uevent_object *obj; 3603 int ret; 3604 3605 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3606 if (ret) 3607 return ret; 3608 3609 uobj = uobj_get_destroy(UVERBS_OBJECT_SRQ, cmd.srq_handle, attrs); 3610 if (IS_ERR(uobj)) 3611 return PTR_ERR(uobj); 3612 3613 obj = container_of(uobj, struct ib_uevent_object, uobject); 3614 memset(&resp, 0, sizeof(resp)); 3615 resp.events_reported = obj->events_reported; 3616 3617 uobj_put_destroy(uobj); 3618 3619 return uverbs_response(attrs, &resp, sizeof(resp)); 3620 } 3621 3622 static int ib_uverbs_ex_query_device(struct uverbs_attr_bundle *attrs) 3623 { 3624 struct ib_uverbs_ex_query_device_resp resp = {}; 3625 struct ib_uverbs_ex_query_device cmd; 3626 struct ib_device_attr attr = {0}; 3627 struct ib_ucontext *ucontext; 3628 struct ib_device *ib_dev; 3629 int err; 3630 3631 ucontext = ib_uverbs_get_ucontext(attrs); 3632 if (IS_ERR(ucontext)) 3633 return PTR_ERR(ucontext); 3634 ib_dev = ucontext->device; 3635 3636 err = uverbs_request(attrs, &cmd, sizeof(cmd)); 3637 if (err) 3638 return err; 3639 3640 if (cmd.comp_mask) 3641 return -EINVAL; 3642 3643 if (cmd.reserved) 3644 return -EINVAL; 3645 3646 err = ib_dev->ops.query_device(ib_dev, &attr, &attrs->driver_udata); 3647 if (err) 3648 return err; 3649 3650 copy_query_dev_fields(ucontext, &resp.base, &attr); 3651 3652 resp.odp_caps.general_caps = attr.odp_caps.general_caps; 3653 
resp.odp_caps.per_transport_caps.rc_odp_caps = 3654 attr.odp_caps.per_transport_caps.rc_odp_caps; 3655 resp.odp_caps.per_transport_caps.uc_odp_caps = 3656 attr.odp_caps.per_transport_caps.uc_odp_caps; 3657 resp.odp_caps.per_transport_caps.ud_odp_caps = 3658 attr.odp_caps.per_transport_caps.ud_odp_caps; 3659 resp.xrc_odp_caps = attr.odp_caps.per_transport_caps.xrc_odp_caps; 3660 3661 resp.timestamp_mask = attr.timestamp_mask; 3662 resp.hca_core_clock = attr.hca_core_clock; 3663 resp.device_cap_flags_ex = attr.device_cap_flags; 3664 resp.rss_caps.supported_qpts = attr.rss_caps.supported_qpts; 3665 resp.rss_caps.max_rwq_indirection_tables = 3666 attr.rss_caps.max_rwq_indirection_tables; 3667 resp.rss_caps.max_rwq_indirection_table_size = 3668 attr.rss_caps.max_rwq_indirection_table_size; 3669 resp.max_wq_type_rq = attr.max_wq_type_rq; 3670 resp.raw_packet_caps = attr.raw_packet_caps; 3671 resp.tm_caps.max_rndv_hdr_size = attr.tm_caps.max_rndv_hdr_size; 3672 resp.tm_caps.max_num_tags = attr.tm_caps.max_num_tags; 3673 resp.tm_caps.max_ops = attr.tm_caps.max_ops; 3674 resp.tm_caps.max_sge = attr.tm_caps.max_sge; 3675 resp.tm_caps.flags = attr.tm_caps.flags; 3676 resp.cq_moderation_caps.max_cq_moderation_count = 3677 attr.cq_caps.max_cq_moderation_count; 3678 resp.cq_moderation_caps.max_cq_moderation_period = 3679 attr.cq_caps.max_cq_moderation_period; 3680 resp.max_dm_size = attr.max_dm_size; 3681 resp.response_length = uverbs_response_length(attrs, sizeof(resp)); 3682 3683 return uverbs_response(attrs, &resp, sizeof(resp)); 3684 } 3685 3686 static int ib_uverbs_ex_modify_cq(struct uverbs_attr_bundle *attrs) 3687 { 3688 struct ib_uverbs_ex_modify_cq cmd; 3689 struct ib_cq *cq; 3690 int ret; 3691 3692 ret = uverbs_request(attrs, &cmd, sizeof(cmd)); 3693 if (ret) 3694 return ret; 3695 3696 if (!cmd.attr_mask || cmd.reserved) 3697 return -EINVAL; 3698 3699 if (cmd.attr_mask > IB_CQ_MODERATE) 3700 return -EOPNOTSUPP; 3701 3702 cq = uobj_get_obj_read(cq, UVERBS_OBJECT_CQ, 
cmd.cq_handle, attrs); 3703 if (IS_ERR(cq)) 3704 return PTR_ERR(cq); 3705 3706 ret = rdma_set_cq_moderation(cq, cmd.attr.cq_count, cmd.attr.cq_period); 3707 3708 rdma_lookup_put_uobject(&cq->uobject->uevent.uobject, 3709 UVERBS_LOOKUP_READ); 3710 return ret; 3711 } 3712 3713 /* 3714 * Describe the input structs for write(). Some write methods have an input 3715 * only struct, most have an input and output. If the struct has an output then 3716 * the 'response' u64 must be the first field in the request structure. 3717 * 3718 * If udata is present then both the request and response structs have a 3719 * trailing driver_data flex array. In this case the size of the base struct 3720 * cannot be changed. 3721 */ 3722 #define UAPI_DEF_WRITE_IO(req, resp) \ 3723 .write.has_resp = 1 + \ 3724 BUILD_BUG_ON_ZERO(offsetof(req, response) != 0) + \ 3725 BUILD_BUG_ON_ZERO(sizeof_field(req, response) != \ 3726 sizeof(u64)), \ 3727 .write.req_size = sizeof(req), .write.resp_size = sizeof(resp) 3728 3729 #define UAPI_DEF_WRITE_I(req) .write.req_size = sizeof(req) 3730 3731 #define UAPI_DEF_WRITE_UDATA_IO(req, resp) \ 3732 UAPI_DEF_WRITE_IO(req, resp), \ 3733 .write.has_udata = \ 3734 1 + \ 3735 BUILD_BUG_ON_ZERO(offsetof(req, driver_data) != \ 3736 sizeof(req)) + \ 3737 BUILD_BUG_ON_ZERO(offsetof(resp, driver_data) != \ 3738 sizeof(resp)) 3739 3740 #define UAPI_DEF_WRITE_UDATA_I(req) \ 3741 UAPI_DEF_WRITE_I(req), \ 3742 .write.has_udata = \ 3743 1 + BUILD_BUG_ON_ZERO(offsetof(req, driver_data) != \ 3744 sizeof(req)) 3745 3746 /* 3747 * The _EX versions are for use with WRITE_EX and allow the last struct member 3748 * to be specified. Buffers that do not include that member will be rejected. 
3749 */ 3750 #define UAPI_DEF_WRITE_IO_EX(req, req_last_member, resp, resp_last_member) \ 3751 .write.has_resp = 1, \ 3752 .write.req_size = offsetofend(req, req_last_member), \ 3753 .write.resp_size = offsetofend(resp, resp_last_member) 3754 3755 #define UAPI_DEF_WRITE_I_EX(req, req_last_member) \ 3756 .write.req_size = offsetofend(req, req_last_member) 3757 3758 const struct uapi_definition uverbs_def_write_intf[] = { 3759 DECLARE_UVERBS_OBJECT( 3760 UVERBS_OBJECT_AH, 3761 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_AH, 3762 ib_uverbs_create_ah, 3763 UAPI_DEF_WRITE_UDATA_IO( 3764 struct ib_uverbs_create_ah, 3765 struct ib_uverbs_create_ah_resp)), 3766 DECLARE_UVERBS_WRITE( 3767 IB_USER_VERBS_CMD_DESTROY_AH, 3768 ib_uverbs_destroy_ah, 3769 UAPI_DEF_WRITE_I(struct ib_uverbs_destroy_ah)), 3770 UAPI_DEF_OBJ_NEEDS_FN(create_user_ah), 3771 UAPI_DEF_OBJ_NEEDS_FN(destroy_ah)), 3772 3773 DECLARE_UVERBS_OBJECT( 3774 UVERBS_OBJECT_COMP_CHANNEL, 3775 DECLARE_UVERBS_WRITE( 3776 IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL, 3777 ib_uverbs_create_comp_channel, 3778 UAPI_DEF_WRITE_IO( 3779 struct ib_uverbs_create_comp_channel, 3780 struct ib_uverbs_create_comp_channel_resp))), 3781 3782 DECLARE_UVERBS_OBJECT( 3783 UVERBS_OBJECT_CQ, 3784 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_CQ, 3785 ib_uverbs_create_cq, 3786 UAPI_DEF_WRITE_UDATA_IO( 3787 struct ib_uverbs_create_cq, 3788 struct ib_uverbs_create_cq_resp), 3789 UAPI_DEF_METHOD_NEEDS_FN(create_cq)), 3790 DECLARE_UVERBS_WRITE( 3791 IB_USER_VERBS_CMD_DESTROY_CQ, 3792 ib_uverbs_destroy_cq, 3793 UAPI_DEF_WRITE_IO(struct ib_uverbs_destroy_cq, 3794 struct ib_uverbs_destroy_cq_resp), 3795 UAPI_DEF_METHOD_NEEDS_FN(destroy_cq)), 3796 DECLARE_UVERBS_WRITE( 3797 IB_USER_VERBS_CMD_POLL_CQ, 3798 ib_uverbs_poll_cq, 3799 UAPI_DEF_WRITE_IO(struct ib_uverbs_poll_cq, 3800 struct ib_uverbs_poll_cq_resp), 3801 UAPI_DEF_METHOD_NEEDS_FN(poll_cq)), 3802 DECLARE_UVERBS_WRITE( 3803 IB_USER_VERBS_CMD_REQ_NOTIFY_CQ, 3804 ib_uverbs_req_notify_cq, 3805 
UAPI_DEF_WRITE_I(struct ib_uverbs_req_notify_cq), 3806 UAPI_DEF_METHOD_NEEDS_FN(req_notify_cq)), 3807 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_RESIZE_CQ, 3808 ib_uverbs_resize_cq, 3809 UAPI_DEF_WRITE_UDATA_IO( 3810 struct ib_uverbs_resize_cq, 3811 struct ib_uverbs_resize_cq_resp), 3812 UAPI_DEF_METHOD_NEEDS_FN(resize_user_cq)), 3813 DECLARE_UVERBS_WRITE_EX( 3814 IB_USER_VERBS_EX_CMD_CREATE_CQ, 3815 ib_uverbs_ex_create_cq, 3816 UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_create_cq, 3817 reserved, 3818 struct ib_uverbs_ex_create_cq_resp, 3819 response_length), 3820 UAPI_DEF_METHOD_NEEDS_FN(create_cq)), 3821 DECLARE_UVERBS_WRITE_EX( 3822 IB_USER_VERBS_EX_CMD_MODIFY_CQ, 3823 ib_uverbs_ex_modify_cq, 3824 UAPI_DEF_WRITE_I(struct ib_uverbs_ex_modify_cq), 3825 UAPI_DEF_METHOD_NEEDS_FN(modify_cq))), 3826 3827 DECLARE_UVERBS_OBJECT( 3828 UVERBS_OBJECT_DEVICE, 3829 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_GET_CONTEXT, 3830 ib_uverbs_get_context, 3831 UAPI_DEF_WRITE_UDATA_IO( 3832 struct ib_uverbs_get_context, 3833 struct ib_uverbs_get_context_resp)), 3834 DECLARE_UVERBS_WRITE( 3835 IB_USER_VERBS_CMD_QUERY_DEVICE, 3836 ib_uverbs_query_device, 3837 UAPI_DEF_WRITE_IO(struct ib_uverbs_query_device, 3838 struct ib_uverbs_query_device_resp)), 3839 DECLARE_UVERBS_WRITE( 3840 IB_USER_VERBS_CMD_QUERY_PORT, 3841 ib_uverbs_query_port, 3842 UAPI_DEF_WRITE_IO(struct ib_uverbs_query_port, 3843 struct ib_uverbs_query_port_resp), 3844 UAPI_DEF_METHOD_NEEDS_FN(query_port)), 3845 DECLARE_UVERBS_WRITE_EX( 3846 IB_USER_VERBS_EX_CMD_QUERY_DEVICE, 3847 ib_uverbs_ex_query_device, 3848 UAPI_DEF_WRITE_IO_EX( 3849 struct ib_uverbs_ex_query_device, 3850 reserved, 3851 struct ib_uverbs_ex_query_device_resp, 3852 response_length), 3853 UAPI_DEF_METHOD_NEEDS_FN(query_device)), 3854 UAPI_DEF_OBJ_NEEDS_FN(alloc_ucontext), 3855 UAPI_DEF_OBJ_NEEDS_FN(dealloc_ucontext)), 3856 3857 DECLARE_UVERBS_OBJECT( 3858 UVERBS_OBJECT_FLOW, 3859 DECLARE_UVERBS_WRITE_EX( 3860 IB_USER_VERBS_EX_CMD_CREATE_FLOW, 3861 
ib_uverbs_ex_create_flow, 3862 UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_create_flow, 3863 flow_attr, 3864 struct ib_uverbs_create_flow_resp, 3865 flow_handle), 3866 UAPI_DEF_METHOD_NEEDS_FN(create_flow)), 3867 DECLARE_UVERBS_WRITE_EX( 3868 IB_USER_VERBS_EX_CMD_DESTROY_FLOW, 3869 ib_uverbs_ex_destroy_flow, 3870 UAPI_DEF_WRITE_I(struct ib_uverbs_destroy_flow), 3871 UAPI_DEF_METHOD_NEEDS_FN(destroy_flow))), 3872 3873 DECLARE_UVERBS_OBJECT( 3874 UVERBS_OBJECT_MR, 3875 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_DEREG_MR, 3876 ib_uverbs_dereg_mr, 3877 UAPI_DEF_WRITE_I(struct ib_uverbs_dereg_mr), 3878 UAPI_DEF_METHOD_NEEDS_FN(dereg_mr)), 3879 DECLARE_UVERBS_WRITE( 3880 IB_USER_VERBS_CMD_REG_MR, 3881 ib_uverbs_reg_mr, 3882 UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_reg_mr, 3883 struct ib_uverbs_reg_mr_resp), 3884 UAPI_DEF_METHOD_NEEDS_FN(reg_user_mr)), 3885 DECLARE_UVERBS_WRITE( 3886 IB_USER_VERBS_CMD_REREG_MR, 3887 ib_uverbs_rereg_mr, 3888 UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_rereg_mr, 3889 struct ib_uverbs_rereg_mr_resp), 3890 UAPI_DEF_METHOD_NEEDS_FN(rereg_user_mr))), 3891 3892 DECLARE_UVERBS_OBJECT( 3893 UVERBS_OBJECT_MW, 3894 DECLARE_UVERBS_WRITE( 3895 IB_USER_VERBS_CMD_ALLOC_MW, 3896 ib_uverbs_alloc_mw, 3897 UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_alloc_mw, 3898 struct ib_uverbs_alloc_mw_resp), 3899 UAPI_DEF_METHOD_NEEDS_FN(alloc_mw)), 3900 DECLARE_UVERBS_WRITE( 3901 IB_USER_VERBS_CMD_DEALLOC_MW, 3902 ib_uverbs_dealloc_mw, 3903 UAPI_DEF_WRITE_I(struct ib_uverbs_dealloc_mw), 3904 UAPI_DEF_METHOD_NEEDS_FN(dealloc_mw))), 3905 3906 DECLARE_UVERBS_OBJECT( 3907 UVERBS_OBJECT_PD, 3908 DECLARE_UVERBS_WRITE( 3909 IB_USER_VERBS_CMD_ALLOC_PD, 3910 ib_uverbs_alloc_pd, 3911 UAPI_DEF_WRITE_UDATA_IO(struct ib_uverbs_alloc_pd, 3912 struct ib_uverbs_alloc_pd_resp), 3913 UAPI_DEF_METHOD_NEEDS_FN(alloc_pd)), 3914 DECLARE_UVERBS_WRITE( 3915 IB_USER_VERBS_CMD_DEALLOC_PD, 3916 ib_uverbs_dealloc_pd, 3917 UAPI_DEF_WRITE_I(struct ib_uverbs_dealloc_pd), 3918 
UAPI_DEF_METHOD_NEEDS_FN(dealloc_pd))), 3919 3920 DECLARE_UVERBS_OBJECT( 3921 UVERBS_OBJECT_QP, 3922 DECLARE_UVERBS_WRITE( 3923 IB_USER_VERBS_CMD_ATTACH_MCAST, 3924 ib_uverbs_attach_mcast, 3925 UAPI_DEF_WRITE_I(struct ib_uverbs_attach_mcast), 3926 UAPI_DEF_METHOD_NEEDS_FN(attach_mcast), 3927 UAPI_DEF_METHOD_NEEDS_FN(detach_mcast)), 3928 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_QP, 3929 ib_uverbs_create_qp, 3930 UAPI_DEF_WRITE_UDATA_IO( 3931 struct ib_uverbs_create_qp, 3932 struct ib_uverbs_create_qp_resp), 3933 UAPI_DEF_METHOD_NEEDS_FN(create_qp)), 3934 DECLARE_UVERBS_WRITE( 3935 IB_USER_VERBS_CMD_DESTROY_QP, 3936 ib_uverbs_destroy_qp, 3937 UAPI_DEF_WRITE_IO(struct ib_uverbs_destroy_qp, 3938 struct ib_uverbs_destroy_qp_resp), 3939 UAPI_DEF_METHOD_NEEDS_FN(destroy_qp)), 3940 DECLARE_UVERBS_WRITE( 3941 IB_USER_VERBS_CMD_DETACH_MCAST, 3942 ib_uverbs_detach_mcast, 3943 UAPI_DEF_WRITE_I(struct ib_uverbs_detach_mcast), 3944 UAPI_DEF_METHOD_NEEDS_FN(detach_mcast)), 3945 DECLARE_UVERBS_WRITE( 3946 IB_USER_VERBS_CMD_MODIFY_QP, 3947 ib_uverbs_modify_qp, 3948 UAPI_DEF_WRITE_I(struct ib_uverbs_modify_qp), 3949 UAPI_DEF_METHOD_NEEDS_FN(modify_qp)), 3950 DECLARE_UVERBS_WRITE( 3951 IB_USER_VERBS_CMD_POST_RECV, 3952 ib_uverbs_post_recv, 3953 UAPI_DEF_WRITE_IO(struct ib_uverbs_post_recv, 3954 struct ib_uverbs_post_recv_resp), 3955 UAPI_DEF_METHOD_NEEDS_FN(post_recv)), 3956 DECLARE_UVERBS_WRITE( 3957 IB_USER_VERBS_CMD_POST_SEND, 3958 ib_uverbs_post_send, 3959 UAPI_DEF_WRITE_IO(struct ib_uverbs_post_send, 3960 struct ib_uverbs_post_send_resp), 3961 UAPI_DEF_METHOD_NEEDS_FN(post_send)), 3962 DECLARE_UVERBS_WRITE( 3963 IB_USER_VERBS_CMD_QUERY_QP, 3964 ib_uverbs_query_qp, 3965 UAPI_DEF_WRITE_IO(struct ib_uverbs_query_qp, 3966 struct ib_uverbs_query_qp_resp), 3967 UAPI_DEF_METHOD_NEEDS_FN(query_qp)), 3968 DECLARE_UVERBS_WRITE_EX( 3969 IB_USER_VERBS_EX_CMD_CREATE_QP, 3970 ib_uverbs_ex_create_qp, 3971 UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_create_qp, 3972 comp_mask, 3973 struct 
ib_uverbs_ex_create_qp_resp, 3974 response_length), 3975 UAPI_DEF_METHOD_NEEDS_FN(create_qp)), 3976 DECLARE_UVERBS_WRITE_EX( 3977 IB_USER_VERBS_EX_CMD_MODIFY_QP, 3978 ib_uverbs_ex_modify_qp, 3979 UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_modify_qp, 3980 base, 3981 struct ib_uverbs_ex_modify_qp_resp, 3982 response_length), 3983 UAPI_DEF_METHOD_NEEDS_FN(modify_qp))), 3984 3985 DECLARE_UVERBS_OBJECT( 3986 UVERBS_OBJECT_RWQ_IND_TBL, 3987 DECLARE_UVERBS_WRITE_EX( 3988 IB_USER_VERBS_EX_CMD_CREATE_RWQ_IND_TBL, 3989 ib_uverbs_ex_create_rwq_ind_table, 3990 UAPI_DEF_WRITE_IO_EX( 3991 struct ib_uverbs_ex_create_rwq_ind_table, 3992 log_ind_tbl_size, 3993 struct ib_uverbs_ex_create_rwq_ind_table_resp, 3994 ind_tbl_num), 3995 UAPI_DEF_METHOD_NEEDS_FN(create_rwq_ind_table)), 3996 DECLARE_UVERBS_WRITE_EX( 3997 IB_USER_VERBS_EX_CMD_DESTROY_RWQ_IND_TBL, 3998 ib_uverbs_ex_destroy_rwq_ind_table, 3999 UAPI_DEF_WRITE_I( 4000 struct ib_uverbs_ex_destroy_rwq_ind_table), 4001 UAPI_DEF_METHOD_NEEDS_FN(destroy_rwq_ind_table))), 4002 4003 DECLARE_UVERBS_OBJECT( 4004 UVERBS_OBJECT_WQ, 4005 DECLARE_UVERBS_WRITE_EX( 4006 IB_USER_VERBS_EX_CMD_CREATE_WQ, 4007 ib_uverbs_ex_create_wq, 4008 UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_create_wq, 4009 max_sge, 4010 struct ib_uverbs_ex_create_wq_resp, 4011 wqn), 4012 UAPI_DEF_METHOD_NEEDS_FN(create_wq)), 4013 DECLARE_UVERBS_WRITE_EX( 4014 IB_USER_VERBS_EX_CMD_DESTROY_WQ, 4015 ib_uverbs_ex_destroy_wq, 4016 UAPI_DEF_WRITE_IO_EX(struct ib_uverbs_ex_destroy_wq, 4017 wq_handle, 4018 struct ib_uverbs_ex_destroy_wq_resp, 4019 reserved), 4020 UAPI_DEF_METHOD_NEEDS_FN(destroy_wq)), 4021 DECLARE_UVERBS_WRITE_EX( 4022 IB_USER_VERBS_EX_CMD_MODIFY_WQ, 4023 ib_uverbs_ex_modify_wq, 4024 UAPI_DEF_WRITE_I_EX(struct ib_uverbs_ex_modify_wq, 4025 curr_wq_state), 4026 UAPI_DEF_METHOD_NEEDS_FN(modify_wq))), 4027 4028 DECLARE_UVERBS_OBJECT( 4029 UVERBS_OBJECT_SRQ, 4030 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_SRQ, 4031 ib_uverbs_create_srq, 4032 UAPI_DEF_WRITE_UDATA_IO( 4033 
struct ib_uverbs_create_srq, 4034 struct ib_uverbs_create_srq_resp), 4035 UAPI_DEF_METHOD_NEEDS_FN(create_srq)), 4036 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_CREATE_XSRQ, 4037 ib_uverbs_create_xsrq, 4038 UAPI_DEF_WRITE_UDATA_IO( 4039 struct ib_uverbs_create_xsrq, 4040 struct ib_uverbs_create_srq_resp), 4041 UAPI_DEF_METHOD_NEEDS_FN(create_srq)), 4042 DECLARE_UVERBS_WRITE( 4043 IB_USER_VERBS_CMD_DESTROY_SRQ, 4044 ib_uverbs_destroy_srq, 4045 UAPI_DEF_WRITE_IO(struct ib_uverbs_destroy_srq, 4046 struct ib_uverbs_destroy_srq_resp), 4047 UAPI_DEF_METHOD_NEEDS_FN(destroy_srq)), 4048 DECLARE_UVERBS_WRITE( 4049 IB_USER_VERBS_CMD_MODIFY_SRQ, 4050 ib_uverbs_modify_srq, 4051 UAPI_DEF_WRITE_UDATA_I(struct ib_uverbs_modify_srq), 4052 UAPI_DEF_METHOD_NEEDS_FN(modify_srq)), 4053 DECLARE_UVERBS_WRITE( 4054 IB_USER_VERBS_CMD_POST_SRQ_RECV, 4055 ib_uverbs_post_srq_recv, 4056 UAPI_DEF_WRITE_IO(struct ib_uverbs_post_srq_recv, 4057 struct ib_uverbs_post_srq_recv_resp), 4058 UAPI_DEF_METHOD_NEEDS_FN(post_srq_recv)), 4059 DECLARE_UVERBS_WRITE( 4060 IB_USER_VERBS_CMD_QUERY_SRQ, 4061 ib_uverbs_query_srq, 4062 UAPI_DEF_WRITE_IO(struct ib_uverbs_query_srq, 4063 struct ib_uverbs_query_srq_resp), 4064 UAPI_DEF_METHOD_NEEDS_FN(query_srq))), 4065 4066 DECLARE_UVERBS_OBJECT( 4067 UVERBS_OBJECT_XRCD, 4068 DECLARE_UVERBS_WRITE( 4069 IB_USER_VERBS_CMD_CLOSE_XRCD, 4070 ib_uverbs_close_xrcd, 4071 UAPI_DEF_WRITE_I(struct ib_uverbs_close_xrcd)), 4072 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_OPEN_QP, 4073 ib_uverbs_open_qp, 4074 UAPI_DEF_WRITE_UDATA_IO( 4075 struct ib_uverbs_open_qp, 4076 struct ib_uverbs_create_qp_resp)), 4077 DECLARE_UVERBS_WRITE(IB_USER_VERBS_CMD_OPEN_XRCD, 4078 ib_uverbs_open_xrcd, 4079 UAPI_DEF_WRITE_UDATA_IO( 4080 struct ib_uverbs_open_xrcd, 4081 struct ib_uverbs_open_xrcd_resp)), 4082 UAPI_DEF_OBJ_NEEDS_FN(alloc_xrcd), 4083 UAPI_DEF_OBJ_NEEDS_FN(dealloc_xrcd)), 4084 4085 {}, 4086 }; 4087