1 /* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21 /* 22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 23 * Use is subject to license terms. 24 */ 25 26 /* 27 * Data-Link Driver 28 */ 29 #include <sys/sysmacros.h> 30 #include <sys/strsubr.h> 31 #include <sys/strsun.h> 32 #include <sys/vlan.h> 33 #include <sys/dld_impl.h> 34 #include <sys/mac_client.h> 35 #include <sys/mac_client_impl.h> 36 #include <sys/mac_client_priv.h> 37 38 typedef void proto_reqfunc_t(dld_str_t *, mblk_t *); 39 40 static proto_reqfunc_t proto_info_req, proto_attach_req, proto_detach_req, 41 proto_bind_req, proto_unbind_req, proto_promiscon_req, proto_promiscoff_req, 42 proto_enabmulti_req, proto_disabmulti_req, proto_physaddr_req, 43 proto_setphysaddr_req, proto_udqos_req, proto_req, proto_capability_req, 44 proto_notify_req, proto_passive_req; 45 46 static void proto_capability_advertise(dld_str_t *, mblk_t *); 47 static int dld_capab_poll_disable(dld_str_t *, dld_capab_poll_t *); 48 49 #define DL_ACK_PENDING(state) \ 50 ((state) == DL_ATTACH_PENDING || \ 51 (state) == DL_DETACH_PENDING || \ 52 (state) == DL_BIND_PENDING || \ 53 (state) == DL_UNBIND_PENDING) 54 55 /* 56 * Process a DLPI protocol message. 57 * The primitives DL_BIND_REQ, DL_ENABMULTI_REQ, DL_PROMISCON_REQ, 58 * DL_SET_PHYS_ADDR_REQ put the data link below our dld_str_t into an 59 * 'active' state. The primitive DL_PASSIVE_REQ marks our dld_str_t 60 * as 'passive' and forbids it from being subsequently made 'active' 61 * by the above primitives. 62 */ 63 void 64 dld_proto(dld_str_t *dsp, mblk_t *mp) 65 { 66 t_uscalar_t prim; 67 68 if (MBLKL(mp) < sizeof (t_uscalar_t)) { 69 freemsg(mp); 70 return; 71 } 72 prim = ((union DL_primitives *)mp->b_rptr)->dl_primitive; 73 74 switch (prim) { 75 case DL_INFO_REQ: 76 proto_info_req(dsp, mp); 77 break; 78 case DL_BIND_REQ: 79 proto_bind_req(dsp, mp); 80 break; 81 case DL_UNBIND_REQ: 82 proto_unbind_req(dsp, mp); 83 break; 84 case DL_UNITDATA_REQ: 85 proto_unitdata_req(dsp, mp); 86 break; 87 case DL_UDQOS_REQ: 88 proto_udqos_req(dsp, mp); 89 break; 90 case DL_ATTACH_REQ: 91 proto_attach_req(dsp, mp); 92 break; 93 case DL_DETACH_REQ: 94 proto_detach_req(dsp, mp); 95 break; 96 case DL_ENABMULTI_REQ: 97 proto_enabmulti_req(dsp, mp); 98 break; 99 case DL_DISABMULTI_REQ: 100 proto_disabmulti_req(dsp, mp); 101 break; 102 case DL_PROMISCON_REQ: 103 proto_promiscon_req(dsp, mp); 104 break; 105 case DL_PROMISCOFF_REQ: 106 proto_promiscoff_req(dsp, mp); 107 break; 108 case DL_PHYS_ADDR_REQ: 109 proto_physaddr_req(dsp, mp); 110 break; 111 case DL_SET_PHYS_ADDR_REQ: 112 proto_setphysaddr_req(dsp, mp); 113 break; 114 case DL_NOTIFY_REQ: 115 proto_notify_req(dsp, mp); 116 break; 117 case DL_CAPABILITY_REQ: 118 proto_capability_req(dsp, mp); 119 break; 120 case DL_PASSIVE_REQ: 121 proto_passive_req(dsp, mp); 122 break; 123 default: 124 proto_req(dsp, mp); 125 break; 126 } 127 } 128 129 #define NEG(x) -(x) 130 typedef struct dl_info_ack_wrapper { 131 dl_info_ack_t dl_info; 132 uint8_t dl_addr[MAXMACADDRLEN + sizeof (uint16_t)]; 133 uint8_t dl_brdcst_addr[MAXMACADDRLEN]; 134 dl_qos_cl_range1_t dl_qos_range1; 135 dl_qos_cl_sel1_t dl_qos_sel1; 136 } dl_info_ack_wrapper_t; 137 138 /* 139 * DL_INFO_REQ 140 */ 141 static void 142 proto_info_req(dld_str_t *dsp, mblk_t *mp) 143 { 144 dl_info_ack_wrapper_t *dlwp; 145 dl_info_ack_t *dlp; 146 dl_qos_cl_sel1_t *selp; 147 dl_qos_cl_range1_t *rangep; 148 uint8_t *addr; 149 uint8_t *brdcst_addr; 150 uint_t addr_length; 151 uint_t sap_length; 152 mac_info_t minfo; 153 mac_info_t *minfop; 154 queue_t *q = dsp->ds_wq; 155 156 /* 157 * Swap the request message for one large enough to contain the 158 * wrapper structure defined above. 159 */ 160 if ((mp = mexchange(q, mp, sizeof (dl_info_ack_wrapper_t), 161 M_PCPROTO, 0)) == NULL) 162 return; 163 164 bzero(mp->b_rptr, sizeof (dl_info_ack_wrapper_t)); 165 dlwp = (dl_info_ack_wrapper_t *)mp->b_rptr; 166 167 dlp = &(dlwp->dl_info); 168 ASSERT(dlp == (dl_info_ack_t *)mp->b_rptr); 169 170 dlp->dl_primitive = DL_INFO_ACK; 171 172 /* 173 * Set up the sub-structure pointers. 174 */ 175 addr = dlwp->dl_addr; 176 brdcst_addr = dlwp->dl_brdcst_addr; 177 rangep = &(dlwp->dl_qos_range1); 178 selp = &(dlwp->dl_qos_sel1); 179 180 /* 181 * This driver supports only version 2 connectionless DLPI provider 182 * nodes. 183 */ 184 dlp->dl_service_mode = DL_CLDLS; 185 dlp->dl_version = DL_VERSION_2; 186 187 /* 188 * Set the style of the provider 189 */ 190 dlp->dl_provider_style = dsp->ds_style; 191 ASSERT(dlp->dl_provider_style == DL_STYLE1 || 192 dlp->dl_provider_style == DL_STYLE2); 193 194 /* 195 * Set the current DLPI state. 196 */ 197 dlp->dl_current_state = dsp->ds_dlstate; 198 199 /* 200 * Gratuitously set the media type. This is to deal with modules 201 * that assume the media type is known prior to DL_ATTACH_REQ 202 * being completed. 203 */ 204 dlp->dl_mac_type = DL_ETHER; 205 206 /* 207 * If the stream is not at least attached we try to retrieve the 208 * mac_info using mac_info_get() 209 */ 210 if (dsp->ds_dlstate == DL_UNATTACHED || 211 dsp->ds_dlstate == DL_ATTACH_PENDING || 212 dsp->ds_dlstate == DL_DETACH_PENDING) { 213 if (!mac_info_get(ddi_major_to_name(dsp->ds_major), &minfo)) { 214 /* 215 * Cannot find mac_info. giving up. 216 */ 217 goto done; 218 } 219 minfop = &minfo; 220 } else { 221 minfop = (mac_info_t *)dsp->ds_mip; 222 /* We can only get the sdu if we're attached. */ 223 mac_sdu_get(dsp->ds_mh, &dlp->dl_min_sdu, &dlp->dl_max_sdu); 224 } 225 226 /* 227 * Set the media type (properly this time). 228 */ 229 if (dsp->ds_native) 230 dlp->dl_mac_type = minfop->mi_nativemedia; 231 else 232 dlp->dl_mac_type = minfop->mi_media; 233 234 /* 235 * Set the DLSAP length. We only support 16 bit values and they 236 * appear after the MAC address portion of DLSAP addresses. 237 */ 238 sap_length = sizeof (uint16_t); 239 dlp->dl_sap_length = NEG(sap_length); 240 241 addr_length = minfop->mi_addr_length; 242 243 /* 244 * Copy in the media broadcast address. 245 */ 246 if (minfop->mi_brdcst_addr != NULL) { 247 dlp->dl_brdcst_addr_offset = 248 (uintptr_t)brdcst_addr - (uintptr_t)dlp; 249 bcopy(minfop->mi_brdcst_addr, brdcst_addr, addr_length); 250 dlp->dl_brdcst_addr_length = addr_length; 251 } 252 253 /* Only VLAN links and links that have a normal tag mode support QOS. */ 254 if ((dsp->ds_mch != NULL && 255 mac_client_vid(dsp->ds_mch) != VLAN_ID_NONE) || 256 (dsp->ds_dlp != NULL && 257 dsp->ds_dlp->dl_tagmode == LINK_TAGMODE_NORMAL)) { 258 dlp->dl_qos_range_offset = (uintptr_t)rangep - (uintptr_t)dlp; 259 dlp->dl_qos_range_length = sizeof (dl_qos_cl_range1_t); 260 261 rangep->dl_qos_type = DL_QOS_CL_RANGE1; 262 rangep->dl_trans_delay.dl_target_value = DL_UNKNOWN; 263 rangep->dl_trans_delay.dl_accept_value = DL_UNKNOWN; 264 rangep->dl_protection.dl_min = DL_UNKNOWN; 265 rangep->dl_protection.dl_max = DL_UNKNOWN; 266 rangep->dl_residual_error = DL_UNKNOWN; 267 268 /* 269 * Specify the supported range of priorities. 270 */ 271 rangep->dl_priority.dl_min = 0; 272 rangep->dl_priority.dl_max = (1 << VLAN_PRI_SIZE) - 1; 273 274 dlp->dl_qos_offset = (uintptr_t)selp - (uintptr_t)dlp; 275 dlp->dl_qos_length = sizeof (dl_qos_cl_sel1_t); 276 277 selp->dl_qos_type = DL_QOS_CL_SEL1; 278 selp->dl_trans_delay = DL_UNKNOWN; 279 selp->dl_protection = DL_UNKNOWN; 280 selp->dl_residual_error = DL_UNKNOWN; 281 282 /* 283 * Specify the current priority (which can be changed by 284 * the DL_UDQOS_REQ primitive). 285 */ 286 selp->dl_priority = dsp->ds_pri; 287 } 288 289 dlp->dl_addr_length = addr_length + sizeof (uint16_t); 290 if (dsp->ds_dlstate == DL_IDLE) { 291 /* 292 * The stream is bound. Therefore we can formulate a valid 293 * DLSAP address. 294 */ 295 dlp->dl_addr_offset = (uintptr_t)addr - (uintptr_t)dlp; 296 if (addr_length > 0) 297 mac_unicast_primary_get(dsp->ds_mh, addr); 298 299 *(uint16_t *)(addr + addr_length) = dsp->ds_sap; 300 } 301 302 done: 303 ASSERT(IMPLY(dlp->dl_qos_offset != 0, dlp->dl_qos_length != 0)); 304 ASSERT(IMPLY(dlp->dl_qos_range_offset != 0, 305 dlp->dl_qos_range_length != 0)); 306 ASSERT(IMPLY(dlp->dl_addr_offset != 0, dlp->dl_addr_length != 0)); 307 ASSERT(IMPLY(dlp->dl_brdcst_addr_offset != 0, 308 dlp->dl_brdcst_addr_length != 0)); 309 310 qreply(q, mp); 311 } 312 313 /* 314 * DL_ATTACH_REQ 315 */ 316 static void 317 proto_attach_req(dld_str_t *dsp, mblk_t *mp) 318 { 319 dl_attach_req_t *dlp = (dl_attach_req_t *)mp->b_rptr; 320 int err = 0; 321 t_uscalar_t dl_err; 322 queue_t *q = dsp->ds_wq; 323 324 if (MBLKL(mp) < sizeof (dl_attach_req_t) || 325 dlp->dl_ppa < 0 || dsp->ds_style == DL_STYLE1) { 326 dl_err = DL_BADPRIM; 327 goto failed; 328 } 329 330 if (dsp->ds_dlstate != DL_UNATTACHED) { 331 dl_err = DL_OUTSTATE; 332 goto failed; 333 } 334 335 dsp->ds_dlstate = DL_ATTACH_PENDING; 336 337 err = dld_str_attach(dsp, dlp->dl_ppa); 338 if (err != 0) { 339 switch (err) { 340 case ENOENT: 341 dl_err = DL_BADPPA; 342 err = 0; 343 break; 344 default: 345 dl_err = DL_SYSERR; 346 break; 347 } 348 dsp->ds_dlstate = DL_UNATTACHED; 349 goto failed; 350 } 351 ASSERT(dsp->ds_dlstate == DL_UNBOUND); 352 dlokack(q, mp, DL_ATTACH_REQ); 353 return; 354 355 failed: 356 dlerrorack(q, mp, DL_ATTACH_REQ, dl_err, (t_uscalar_t)err); 357 } 358 359 /* 360 * DL_DETACH_REQ 361 */ 362 static void 363 proto_detach_req(dld_str_t *dsp, mblk_t *mp) 364 { 365 queue_t *q = dsp->ds_wq; 366 t_uscalar_t dl_err; 367 368 if (MBLKL(mp) < sizeof (dl_detach_req_t)) { 369 dl_err = DL_BADPRIM; 370 goto failed; 371 } 372 373 if (dsp->ds_dlstate != DL_UNBOUND) { 374 dl_err = DL_OUTSTATE; 375 goto failed; 376 } 377 378 if (dsp->ds_style == DL_STYLE1) { 379 dl_err = DL_BADPRIM; 380 goto failed; 381 } 382 383 ASSERT(dsp->ds_datathr_cnt == 0); 384 dsp->ds_dlstate = DL_DETACH_PENDING; 385 386 dld_str_detach(dsp); 387 dlokack(dsp->ds_wq, mp, DL_DETACH_REQ); 388 return; 389 390 failed: 391 dlerrorack(q, mp, DL_DETACH_REQ, dl_err, 0); 392 } 393 394 /* 395 * DL_BIND_REQ 396 */ 397 static void 398 proto_bind_req(dld_str_t *dsp, mblk_t *mp) 399 { 400 dl_bind_req_t *dlp = (dl_bind_req_t *)mp->b_rptr; 401 int err = 0; 402 uint8_t dlsap_addr[MAXMACADDRLEN + sizeof (uint16_t)]; 403 uint_t dlsap_addr_length; 404 t_uscalar_t dl_err; 405 t_scalar_t sap; 406 queue_t *q = dsp->ds_wq; 407 mac_perim_handle_t mph; 408 void *mdip; 409 int32_t intr_cpu; 410 411 if (MBLKL(mp) < sizeof (dl_bind_req_t)) { 412 dl_err = DL_BADPRIM; 413 goto failed; 414 } 415 416 if (dlp->dl_xidtest_flg != 0) { 417 dl_err = DL_NOAUTO; 418 goto failed; 419 } 420 421 if (dlp->dl_service_mode != DL_CLDLS) { 422 dl_err = DL_UNSUPPORTED; 423 goto failed; 424 } 425 426 if (dsp->ds_dlstate != DL_UNBOUND) { 427 dl_err = DL_OUTSTATE; 428 goto failed; 429 } 430 431 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 432 433 if (dsp->ds_passivestate == DLD_UNINITIALIZED && 434 ((err = dls_active_set(dsp)) != 0)) { 435 dl_err = DL_SYSERR; 436 goto failed2; 437 } 438 439 dsp->ds_dlstate = DL_BIND_PENDING; 440 /* 441 * Set the receive callback. 442 */ 443 dls_rx_set(dsp, (dsp->ds_mode == DLD_RAW) ? 444 dld_str_rx_raw : dld_str_rx_unitdata, dsp); 445 446 /* 447 * Bind the channel such that it can receive packets. 448 */ 449 sap = dlp->dl_sap; 450 err = dls_bind(dsp, sap); 451 if (err != 0) { 452 switch (err) { 453 case EINVAL: 454 dl_err = DL_BADADDR; 455 err = 0; 456 break; 457 default: 458 dl_err = DL_SYSERR; 459 break; 460 } 461 462 dsp->ds_dlstate = DL_UNBOUND; 463 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 464 dls_active_clear(dsp); 465 goto failed2; 466 } 467 468 intr_cpu = mac_client_intr_cpu(dsp->ds_mch); 469 mdip = mac_get_devinfo(dsp->ds_mh); 470 mac_perim_exit(mph); 471 472 /* 473 * We do this after we get out of the perim to avoid deadlocks 474 * etc. since part of mac_client_retarget_intr is to walk the 475 * device tree in order to find and retarget the interrupts. 476 */ 477 mac_client_set_intr_cpu(mdip, dsp->ds_mch, intr_cpu); 478 479 /* 480 * Copy in MAC address. 481 */ 482 dlsap_addr_length = dsp->ds_mip->mi_addr_length; 483 mac_unicast_primary_get(dsp->ds_mh, dlsap_addr); 484 485 /* 486 * Copy in the SAP. 487 */ 488 *(uint16_t *)(dlsap_addr + dlsap_addr_length) = sap; 489 dlsap_addr_length += sizeof (uint16_t); 490 491 dsp->ds_dlstate = DL_IDLE; 492 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 493 dsp->ds_passivestate = DLD_ACTIVE; 494 495 dlbindack(q, mp, sap, dlsap_addr, dlsap_addr_length, 0, 0); 496 return; 497 498 failed2: 499 mac_perim_exit(mph); 500 failed: 501 dlerrorack(q, mp, DL_BIND_REQ, dl_err, (t_uscalar_t)err); 502 } 503 504 /* 505 * DL_UNBIND_REQ 506 */ 507 static void 508 proto_unbind_req(dld_str_t *dsp, mblk_t *mp) 509 { 510 queue_t *q = dsp->ds_wq; 511 t_uscalar_t dl_err; 512 mac_perim_handle_t mph; 513 514 if (MBLKL(mp) < sizeof (dl_unbind_req_t)) { 515 dl_err = DL_BADPRIM; 516 goto failed; 517 } 518 519 if (dsp->ds_dlstate != DL_IDLE) { 520 dl_err = DL_OUTSTATE; 521 goto failed; 522 } 523 524 mutex_enter(&dsp->ds_lock); 525 while (dsp->ds_datathr_cnt != 0) 526 cv_wait(&dsp->ds_datathr_cv, &dsp->ds_lock); 527 528 dsp->ds_dlstate = DL_UNBIND_PENDING; 529 mutex_exit(&dsp->ds_lock); 530 531 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 532 /* 533 * Unbind the channel to stop packets being received. 534 */ 535 dls_unbind(dsp); 536 537 /* 538 * Disable polling mode, if it is enabled. 539 */ 540 (void) dld_capab_poll_disable(dsp, NULL); 541 542 /* 543 * Clear LSO flags. 544 */ 545 dsp->ds_lso = B_FALSE; 546 dsp->ds_lso_max = 0; 547 548 /* 549 * Clear the receive callback. 550 */ 551 dls_rx_set(dsp, NULL, NULL); 552 dsp->ds_direct = B_FALSE; 553 554 /* 555 * Set the mode back to the default (unitdata). 556 */ 557 dsp->ds_mode = DLD_UNITDATA; 558 dsp->ds_dlstate = DL_UNBOUND; 559 560 mac_perim_exit(mph); 561 dlokack(dsp->ds_wq, mp, DL_UNBIND_REQ); 562 return; 563 failed: 564 dlerrorack(q, mp, DL_UNBIND_REQ, dl_err, 0); 565 } 566 567 /* 568 * DL_PROMISCON_REQ 569 */ 570 static void 571 proto_promiscon_req(dld_str_t *dsp, mblk_t *mp) 572 { 573 dl_promiscon_req_t *dlp = (dl_promiscon_req_t *)mp->b_rptr; 574 int err = 0; 575 t_uscalar_t dl_err; 576 uint32_t promisc_saved; 577 queue_t *q = dsp->ds_wq; 578 mac_perim_handle_t mph; 579 580 if (MBLKL(mp) < sizeof (dl_promiscon_req_t)) { 581 dl_err = DL_BADPRIM; 582 goto failed; 583 } 584 585 if (dsp->ds_dlstate == DL_UNATTACHED || 586 DL_ACK_PENDING(dsp->ds_dlstate)) { 587 dl_err = DL_OUTSTATE; 588 goto failed; 589 } 590 591 promisc_saved = dsp->ds_promisc; 592 switch (dlp->dl_level) { 593 case DL_PROMISC_SAP: 594 dsp->ds_promisc |= DLS_PROMISC_SAP; 595 break; 596 597 case DL_PROMISC_MULTI: 598 dsp->ds_promisc |= DLS_PROMISC_MULTI; 599 break; 600 601 case DL_PROMISC_PHYS: 602 dsp->ds_promisc |= DLS_PROMISC_PHYS; 603 break; 604 605 default: 606 dl_err = DL_NOTSUPPORTED; 607 goto failed; 608 } 609 610 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 611 612 if (dsp->ds_passivestate == DLD_UNINITIALIZED && 613 ((err = dls_active_set(dsp)) != 0)) { 614 dsp->ds_promisc = promisc_saved; 615 dl_err = DL_SYSERR; 616 goto failed2; 617 } 618 619 /* 620 * Adjust channel promiscuity. 621 */ 622 err = dls_promisc(dsp, promisc_saved); 623 624 if (err != 0) { 625 dl_err = DL_SYSERR; 626 dsp->ds_promisc = promisc_saved; 627 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 628 dls_active_clear(dsp); 629 goto failed2; 630 } 631 632 mac_perim_exit(mph); 633 634 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 635 dsp->ds_passivestate = DLD_ACTIVE; 636 dlokack(q, mp, DL_PROMISCON_REQ); 637 return; 638 639 failed2: 640 mac_perim_exit(mph); 641 failed: 642 dlerrorack(q, mp, DL_PROMISCON_REQ, dl_err, (t_uscalar_t)err); 643 } 644 645 /* 646 * DL_PROMISCOFF_REQ 647 */ 648 static void 649 proto_promiscoff_req(dld_str_t *dsp, mblk_t *mp) 650 { 651 dl_promiscoff_req_t *dlp = (dl_promiscoff_req_t *)mp->b_rptr; 652 int err = 0; 653 t_uscalar_t dl_err; 654 uint32_t promisc_saved; 655 queue_t *q = dsp->ds_wq; 656 mac_perim_handle_t mph; 657 658 if (MBLKL(mp) < sizeof (dl_promiscoff_req_t)) { 659 dl_err = DL_BADPRIM; 660 goto failed; 661 } 662 663 if (dsp->ds_dlstate == DL_UNATTACHED || 664 DL_ACK_PENDING(dsp->ds_dlstate)) { 665 dl_err = DL_OUTSTATE; 666 goto failed; 667 } 668 669 promisc_saved = dsp->ds_promisc; 670 switch (dlp->dl_level) { 671 case DL_PROMISC_SAP: 672 if (!(dsp->ds_promisc & DLS_PROMISC_SAP)) { 673 dl_err = DL_NOTENAB; 674 goto failed; 675 } 676 dsp->ds_promisc &= ~DLS_PROMISC_SAP; 677 break; 678 679 case DL_PROMISC_MULTI: 680 if (!(dsp->ds_promisc & DLS_PROMISC_MULTI)) { 681 dl_err = DL_NOTENAB; 682 goto failed; 683 } 684 dsp->ds_promisc &= ~DLS_PROMISC_MULTI; 685 break; 686 687 case DL_PROMISC_PHYS: 688 if (!(dsp->ds_promisc & DLS_PROMISC_PHYS)) { 689 dl_err = DL_NOTENAB; 690 goto failed; 691 } 692 dsp->ds_promisc &= ~DLS_PROMISC_PHYS; 693 break; 694 695 default: 696 dl_err = DL_NOTSUPPORTED; 697 goto failed; 698 } 699 700 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 701 /* 702 * Adjust channel promiscuity. 703 */ 704 err = dls_promisc(dsp, promisc_saved); 705 mac_perim_exit(mph); 706 707 if (err != 0) { 708 dl_err = DL_SYSERR; 709 goto failed; 710 } 711 dlokack(q, mp, DL_PROMISCOFF_REQ); 712 return; 713 failed: 714 dlerrorack(q, mp, DL_PROMISCOFF_REQ, dl_err, (t_uscalar_t)err); 715 } 716 717 /* 718 * DL_ENABMULTI_REQ 719 */ 720 static void 721 proto_enabmulti_req(dld_str_t *dsp, mblk_t *mp) 722 { 723 dl_enabmulti_req_t *dlp = (dl_enabmulti_req_t *)mp->b_rptr; 724 int err = 0; 725 t_uscalar_t dl_err; 726 queue_t *q = dsp->ds_wq; 727 mac_perim_handle_t mph; 728 729 if (dsp->ds_dlstate == DL_UNATTACHED || 730 DL_ACK_PENDING(dsp->ds_dlstate)) { 731 dl_err = DL_OUTSTATE; 732 goto failed; 733 } 734 735 if (MBLKL(mp) < sizeof (dl_enabmulti_req_t) || 736 !MBLKIN(mp, dlp->dl_addr_offset, dlp->dl_addr_length) || 737 dlp->dl_addr_length != dsp->ds_mip->mi_addr_length) { 738 dl_err = DL_BADPRIM; 739 goto failed; 740 } 741 742 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 743 744 if (dsp->ds_passivestate == DLD_UNINITIALIZED && 745 ((err = dls_active_set(dsp)) != 0)) { 746 dl_err = DL_SYSERR; 747 goto failed2; 748 } 749 750 err = dls_multicst_add(dsp, mp->b_rptr + dlp->dl_addr_offset); 751 752 if (err != 0) { 753 switch (err) { 754 case EINVAL: 755 dl_err = DL_BADADDR; 756 err = 0; 757 break; 758 case ENOSPC: 759 dl_err = DL_TOOMANY; 760 err = 0; 761 break; 762 default: 763 dl_err = DL_SYSERR; 764 break; 765 } 766 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 767 dls_active_clear(dsp); 768 769 goto failed2; 770 } 771 772 mac_perim_exit(mph); 773 774 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 775 dsp->ds_passivestate = DLD_ACTIVE; 776 dlokack(q, mp, DL_ENABMULTI_REQ); 777 return; 778 779 failed2: 780 mac_perim_exit(mph); 781 failed: 782 dlerrorack(q, mp, DL_ENABMULTI_REQ, dl_err, (t_uscalar_t)err); 783 } 784 785 /* 786 * DL_DISABMULTI_REQ 787 */ 788 static void 789 proto_disabmulti_req(dld_str_t *dsp, mblk_t *mp) 790 { 791 dl_disabmulti_req_t *dlp = (dl_disabmulti_req_t *)mp->b_rptr; 792 int err = 0; 793 t_uscalar_t dl_err; 794 queue_t *q = dsp->ds_wq; 795 mac_perim_handle_t mph; 796 797 if (dsp->ds_dlstate == DL_UNATTACHED || 798 DL_ACK_PENDING(dsp->ds_dlstate)) { 799 dl_err = DL_OUTSTATE; 800 goto failed; 801 } 802 803 if (MBLKL(mp) < sizeof (dl_disabmulti_req_t) || 804 !MBLKIN(mp, dlp->dl_addr_offset, dlp->dl_addr_length) || 805 dlp->dl_addr_length != dsp->ds_mip->mi_addr_length) { 806 dl_err = DL_BADPRIM; 807 goto failed; 808 } 809 810 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 811 err = dls_multicst_remove(dsp, mp->b_rptr + dlp->dl_addr_offset); 812 mac_perim_exit(mph); 813 814 if (err != 0) { 815 switch (err) { 816 case EINVAL: 817 dl_err = DL_BADADDR; 818 err = 0; 819 break; 820 821 case ENOENT: 822 dl_err = DL_NOTENAB; 823 err = 0; 824 break; 825 826 default: 827 dl_err = DL_SYSERR; 828 break; 829 } 830 goto failed; 831 } 832 dlokack(q, mp, DL_DISABMULTI_REQ); 833 return; 834 failed: 835 dlerrorack(q, mp, DL_DISABMULTI_REQ, dl_err, (t_uscalar_t)err); 836 } 837 838 /* 839 * DL_PHYS_ADDR_REQ 840 */ 841 static void 842 proto_physaddr_req(dld_str_t *dsp, mblk_t *mp) 843 { 844 dl_phys_addr_req_t *dlp = (dl_phys_addr_req_t *)mp->b_rptr; 845 queue_t *q = dsp->ds_wq; 846 t_uscalar_t dl_err; 847 char *addr; 848 uint_t addr_length; 849 850 if (MBLKL(mp) < sizeof (dl_phys_addr_req_t)) { 851 dl_err = DL_BADPRIM; 852 goto failed; 853 } 854 855 if (dsp->ds_dlstate == DL_UNATTACHED || 856 DL_ACK_PENDING(dsp->ds_dlstate)) { 857 dl_err = DL_OUTSTATE; 858 goto failed; 859 } 860 861 if (dlp->dl_addr_type != DL_CURR_PHYS_ADDR && 862 dlp->dl_addr_type != DL_FACT_PHYS_ADDR) { 863 dl_err = DL_UNSUPPORTED; 864 goto failed; 865 } 866 867 addr_length = dsp->ds_mip->mi_addr_length; 868 if (addr_length > 0) { 869 addr = kmem_alloc(addr_length, KM_SLEEP); 870 if (dlp->dl_addr_type == DL_CURR_PHYS_ADDR) 871 mac_unicast_primary_get(dsp->ds_mh, (uint8_t *)addr); 872 else 873 bcopy(dsp->ds_mip->mi_unicst_addr, addr, addr_length); 874 875 dlphysaddrack(q, mp, addr, (t_uscalar_t)addr_length); 876 kmem_free(addr, addr_length); 877 } else { 878 dlphysaddrack(q, mp, NULL, 0); 879 } 880 return; 881 failed: 882 dlerrorack(q, mp, DL_PHYS_ADDR_REQ, dl_err, 0); 883 } 884 885 /* 886 * DL_SET_PHYS_ADDR_REQ 887 */ 888 static void 889 proto_setphysaddr_req(dld_str_t *dsp, mblk_t *mp) 890 { 891 dl_set_phys_addr_req_t *dlp = (dl_set_phys_addr_req_t *)mp->b_rptr; 892 int err = 0; 893 t_uscalar_t dl_err; 894 queue_t *q = dsp->ds_wq; 895 mac_perim_handle_t mph; 896 897 if (dsp->ds_dlstate == DL_UNATTACHED || 898 DL_ACK_PENDING(dsp->ds_dlstate)) { 899 dl_err = DL_OUTSTATE; 900 goto failed; 901 } 902 903 if (MBLKL(mp) < sizeof (dl_set_phys_addr_req_t) || 904 !MBLKIN(mp, dlp->dl_addr_offset, dlp->dl_addr_length) || 905 dlp->dl_addr_length != dsp->ds_mip->mi_addr_length) { 906 dl_err = DL_BADPRIM; 907 goto failed; 908 } 909 910 mac_perim_enter_by_mh(dsp->ds_mh, &mph); 911 912 if (dsp->ds_passivestate == DLD_UNINITIALIZED && 913 ((err = dls_active_set(dsp)) != 0)) { 914 dl_err = DL_SYSERR; 915 goto failed2; 916 } 917 918 err = mac_unicast_primary_set(dsp->ds_mh, 919 mp->b_rptr + dlp->dl_addr_offset); 920 if (err != 0) { 921 switch (err) { 922 case EINVAL: 923 dl_err = DL_BADADDR; 924 err = 0; 925 break; 926 927 default: 928 dl_err = DL_SYSERR; 929 break; 930 } 931 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 932 dls_active_clear(dsp); 933 934 goto failed2; 935 936 } 937 938 mac_perim_exit(mph); 939 940 if (dsp->ds_passivestate == DLD_UNINITIALIZED) 941 dsp->ds_passivestate = DLD_ACTIVE; 942 dlokack(q, mp, DL_SET_PHYS_ADDR_REQ); 943 return; 944 945 failed2: 946 mac_perim_exit(mph); 947 failed: 948 dlerrorack(q, mp, DL_SET_PHYS_ADDR_REQ, dl_err, (t_uscalar_t)err); 949 } 950 951 /* 952 * DL_UDQOS_REQ 953 */ 954 static void 955 proto_udqos_req(dld_str_t *dsp, mblk_t *mp) 956 { 957 dl_udqos_req_t *dlp = (dl_udqos_req_t *)mp->b_rptr; 958 dl_qos_cl_sel1_t *selp; 959 int off, len; 960 t_uscalar_t dl_err; 961 queue_t *q = dsp->ds_wq; 962 963 off = dlp->dl_qos_offset; 964 len = dlp->dl_qos_length; 965 966 if (MBLKL(mp) < sizeof (dl_udqos_req_t) || !MBLKIN(mp, off, len)) { 967 dl_err = DL_BADPRIM; 968 goto failed; 969 } 970 971 selp = (dl_qos_cl_sel1_t *)(mp->b_rptr + off); 972 if (selp->dl_qos_type != DL_QOS_CL_SEL1) { 973 dl_err = DL_BADQOSTYPE; 974 goto failed; 975 } 976 977 if (selp->dl_priority > (1 << VLAN_PRI_SIZE) - 1 || 978 selp->dl_priority < 0) { 979 dl_err = DL_BADQOSPARAM; 980 goto failed; 981 } 982 983 dsp->ds_pri = selp->dl_priority; 984 dlokack(q, mp, DL_UDQOS_REQ); 985 return; 986 failed: 987 dlerrorack(q, mp, DL_UDQOS_REQ, dl_err, 0); 988 } 989 990 static boolean_t 991 check_ip_above(queue_t *q) 992 { 993 queue_t *next_q; 994 boolean_t ret = B_TRUE; 995 996 claimstr(q); 997 next_q = q->q_next; 998 if (strcmp(next_q->q_qinfo->qi_minfo->mi_idname, "ip") != 0) 999 ret = B_FALSE; 1000 releasestr(q); 1001 return (ret); 1002 } 1003 1004 /* 1005 * DL_CAPABILITY_REQ 1006 */ 1007 static void 1008 proto_capability_req(dld_str_t *dsp, mblk_t *mp) 1009 { 1010 dl_capability_req_t *dlp = (dl_capability_req_t *)mp->b_rptr; 1011 dl_capability_sub_t *sp; 1012 size_t size, len; 1013 offset_t off, end; 1014 t_uscalar_t dl_err; 1015 queue_t *q = dsp->ds_wq; 1016 1017 if (MBLKL(mp) < sizeof (dl_capability_req_t)) { 1018 dl_err = DL_BADPRIM; 1019 goto failed; 1020 } 1021 1022 if (dsp->ds_dlstate == DL_UNATTACHED || 1023 DL_ACK_PENDING(dsp->ds_dlstate)) { 1024 dl_err = DL_OUTSTATE; 1025 goto failed; 1026 } 1027 1028 /* 1029 * This request is overloaded. If there are no requested capabilities 1030 * then we just want to acknowledge with all the capabilities we 1031 * support. Otherwise we enable the set of capabilities requested. 1032 */ 1033 if (dlp->dl_sub_length == 0) { 1034 proto_capability_advertise(dsp, mp); 1035 return; 1036 } 1037 1038 if (!MBLKIN(mp, dlp->dl_sub_offset, dlp->dl_sub_length)) { 1039 dl_err = DL_BADPRIM; 1040 goto failed; 1041 } 1042 1043 dlp->dl_primitive = DL_CAPABILITY_ACK; 1044 1045 off = dlp->dl_sub_offset; 1046 len = dlp->dl_sub_length; 1047 1048 /* 1049 * Walk the list of capabilities to be enabled. 1050 */ 1051 for (end = off + len; off < end; ) { 1052 sp = (dl_capability_sub_t *)(mp->b_rptr + off); 1053 size = sizeof (dl_capability_sub_t) + sp->dl_length; 1054 1055 if (off + size > end || 1056 !IS_P2ALIGNED(off, sizeof (uint32_t))) { 1057 dl_err = DL_BADPRIM; 1058 goto failed; 1059 } 1060 1061 switch (sp->dl_cap) { 1062 /* 1063 * TCP/IP checksum offload to hardware. 1064 */ 1065 case DL_CAPAB_HCKSUM: { 1066 dl_capab_hcksum_t *hcksump; 1067 dl_capab_hcksum_t hcksum; 1068 1069 hcksump = (dl_capab_hcksum_t *)&sp[1]; 1070 /* 1071 * Copy for alignment. 1072 */ 1073 bcopy(hcksump, &hcksum, sizeof (dl_capab_hcksum_t)); 1074 dlcapabsetqid(&(hcksum.hcksum_mid), dsp->ds_rq); 1075 bcopy(&hcksum, hcksump, sizeof (dl_capab_hcksum_t)); 1076 break; 1077 } 1078 1079 case DL_CAPAB_DLD: { 1080 dl_capab_dld_t *dldp; 1081 dl_capab_dld_t dld; 1082 1083 dldp = (dl_capab_dld_t *)&sp[1]; 1084 /* 1085 * Copy for alignment. 1086 */ 1087 bcopy(dldp, &dld, sizeof (dl_capab_dld_t)); 1088 dlcapabsetqid(&(dld.dld_mid), dsp->ds_rq); 1089 bcopy(&dld, dldp, sizeof (dl_capab_dld_t)); 1090 break; 1091 } 1092 default: 1093 break; 1094 } 1095 off += size; 1096 } 1097 qreply(q, mp); 1098 return; 1099 failed: 1100 dlerrorack(q, mp, DL_CAPABILITY_REQ, dl_err, 0); 1101 } 1102 1103 /* 1104 * DL_NOTIFY_REQ 1105 */ 1106 static void 1107 proto_notify_req(dld_str_t *dsp, mblk_t *mp) 1108 { 1109 dl_notify_req_t *dlp = (dl_notify_req_t *)mp->b_rptr; 1110 t_uscalar_t dl_err; 1111 queue_t *q = dsp->ds_wq; 1112 uint_t note = 1113 DL_NOTE_PROMISC_ON_PHYS | 1114 DL_NOTE_PROMISC_OFF_PHYS | 1115 DL_NOTE_PHYS_ADDR | 1116 DL_NOTE_LINK_UP | 1117 DL_NOTE_LINK_DOWN | 1118 DL_NOTE_CAPAB_RENEG | 1119 DL_NOTE_FASTPATH_FLUSH | 1120 DL_NOTE_SPEED; 1121 1122 if (MBLKL(mp) < sizeof (dl_notify_req_t)) { 1123 dl_err = DL_BADPRIM; 1124 goto failed; 1125 } 1126 1127 if (dsp->ds_dlstate == DL_UNATTACHED || 1128 DL_ACK_PENDING(dsp->ds_dlstate)) { 1129 dl_err = DL_OUTSTATE; 1130 goto failed; 1131 } 1132 1133 note &= ~(mac_no_notification(dsp->ds_mh)); 1134 1135 /* 1136 * Cache the notifications that are being enabled. 1137 */ 1138 dsp->ds_notifications = dlp->dl_notifications & note; 1139 /* 1140 * The ACK carries all notifications regardless of which set is 1141 * being enabled. 1142 */ 1143 dlnotifyack(q, mp, note); 1144 1145 /* 1146 * Generate DL_NOTIFY_IND messages for each enabled notification. 1147 */ 1148 if (dsp->ds_notifications != 0) { 1149 dld_str_notify_ind(dsp); 1150 } 1151 return; 1152 failed: 1153 dlerrorack(q, mp, DL_NOTIFY_REQ, dl_err, 0); 1154 } 1155 1156 /* 1157 * DL_UINTDATA_REQ 1158 */ 1159 void 1160 proto_unitdata_req(dld_str_t *dsp, mblk_t *mp) 1161 { 1162 queue_t *q = dsp->ds_wq; 1163 dl_unitdata_req_t *dlp = (dl_unitdata_req_t *)mp->b_rptr; 1164 off_t off; 1165 size_t len, size; 1166 const uint8_t *addr; 1167 uint16_t sap; 1168 uint_t addr_length; 1169 mblk_t *bp, *payload; 1170 uint32_t start, stuff, end, value, flags; 1171 t_uscalar_t dl_err; 1172 uint_t max_sdu; 1173 1174 if (MBLKL(mp) < sizeof (dl_unitdata_req_t) || mp->b_cont == NULL) { 1175 dlerrorack(q, mp, DL_UNITDATA_REQ, DL_BADPRIM, 0); 1176 return; 1177 } 1178 1179 mutex_enter(&dsp->ds_lock); 1180 if (dsp->ds_dlstate != DL_IDLE) { 1181 mutex_exit(&dsp->ds_lock); 1182 dlerrorack(q, mp, DL_UNITDATA_REQ, DL_OUTSTATE, 0); 1183 return; 1184 } 1185 DLD_DATATHR_INC(dsp); 1186 mutex_exit(&dsp->ds_lock); 1187 1188 addr_length = dsp->ds_mip->mi_addr_length; 1189 1190 off = dlp->dl_dest_addr_offset; 1191 len = dlp->dl_dest_addr_length; 1192 1193 if (!MBLKIN(mp, off, len) || !IS_P2ALIGNED(off, sizeof (uint16_t))) { 1194 dl_err = DL_BADPRIM; 1195 goto failed; 1196 } 1197 1198 if (len != addr_length + sizeof (uint16_t)) { 1199 dl_err = DL_BADADDR; 1200 goto failed; 1201 } 1202 1203 addr = mp->b_rptr + off; 1204 sap = *(uint16_t *)(mp->b_rptr + off + addr_length); 1205 1206 /* 1207 * Check the length of the packet and the block types. 1208 */ 1209 size = 0; 1210 payload = mp->b_cont; 1211 for (bp = payload; bp != NULL; bp = bp->b_cont) { 1212 if (DB_TYPE(bp) != M_DATA) 1213 goto baddata; 1214 1215 size += MBLKL(bp); 1216 } 1217 1218 mac_sdu_get(dsp->ds_mh, NULL, &max_sdu); 1219 if (size > max_sdu) 1220 goto baddata; 1221 1222 /* 1223 * Build a packet header. 1224 */ 1225 if ((bp = dls_header(dsp, addr, sap, dlp->dl_priority.dl_max, 1226 &payload)) == NULL) { 1227 dl_err = DL_BADADDR; 1228 goto failed; 1229 } 1230 1231 /* 1232 * We no longer need the M_PROTO header, so free it. 1233 */ 1234 freeb(mp); 1235 1236 /* 1237 * Transfer the checksum offload information if it is present. 1238 */ 1239 hcksum_retrieve(payload, NULL, NULL, &start, &stuff, &end, &value, 1240 &flags); 1241 (void) hcksum_assoc(bp, NULL, NULL, start, stuff, end, value, flags, 0); 1242 1243 /* 1244 * Link the payload onto the new header. 1245 */ 1246 ASSERT(bp->b_cont == NULL); 1247 bp->b_cont = payload; 1248 1249 /* 1250 * No lock can be held across modules and putnext()'s, 1251 * which can happen here with the call from DLD_TX(). 1252 */ 1253 if (DLD_TX(dsp, bp, 0, 0) != NULL) { 1254 /* flow-controlled */ 1255 DLD_SETQFULL(dsp); 1256 } 1257 DLD_DATATHR_DCR(dsp); 1258 return; 1259 1260 failed: 1261 dlerrorack(q, mp, DL_UNITDATA_REQ, dl_err, 0); 1262 DLD_DATATHR_DCR(dsp); 1263 return; 1264 1265 baddata: 1266 dluderrorind(q, mp, (void *)addr, len, DL_BADDATA, 0); 1267 DLD_DATATHR_DCR(dsp); 1268 } 1269 1270 /* 1271 * DL_PASSIVE_REQ 1272 */ 1273 static void 1274 proto_passive_req(dld_str_t *dsp, mblk_t *mp) 1275 { 1276 t_uscalar_t dl_err; 1277 1278 /* 1279 * If we've already become active by issuing an active primitive, 1280 * then it's too late to try to become passive. 1281 */ 1282 if (dsp->ds_passivestate == DLD_ACTIVE) { 1283 dl_err = DL_OUTSTATE; 1284 goto failed; 1285 } 1286 1287 if (MBLKL(mp) < sizeof (dl_passive_req_t)) { 1288 dl_err = DL_BADPRIM; 1289 goto failed; 1290 } 1291 1292 dsp->ds_passivestate = DLD_PASSIVE; 1293 dlokack(dsp->ds_wq, mp, DL_PASSIVE_REQ); 1294 return; 1295 failed: 1296 dlerrorack(dsp->ds_wq, mp, DL_PASSIVE_REQ, dl_err, 0); 1297 } 1298 1299 1300 /* 1301 * Catch-all handler. 1302 */ 1303 static void 1304 proto_req(dld_str_t *dsp, mblk_t *mp) 1305 { 1306 union DL_primitives *dlp = (union DL_primitives *)mp->b_rptr; 1307 1308 dlerrorack(dsp->ds_wq, mp, dlp->dl_primitive, DL_UNSUPPORTED, 0); 1309 } 1310 1311 static int 1312 dld_capab_perim(dld_str_t *dsp, void *data, uint_t flags) 1313 { 1314 switch (flags) { 1315 case DLD_ENABLE: 1316 mac_perim_enter_by_mh(dsp->ds_mh, (mac_perim_handle_t *)data); 1317 return (0); 1318 1319 case DLD_DISABLE: 1320 mac_perim_exit((mac_perim_handle_t)data); 1321 return (0); 1322 1323 case DLD_QUERY: 1324 return (mac_perim_held(dsp->ds_mh)); 1325 } 1326 return (0); 1327 } 1328 1329 static int 1330 dld_capab_direct(dld_str_t *dsp, void *data, uint_t flags) 1331 { 1332 dld_capab_direct_t *direct = data; 1333 1334 ASSERT(MAC_PERIM_HELD(dsp->ds_mh)); 1335 1336 switch (flags) { 1337 case DLD_ENABLE: 1338 dls_rx_set(dsp, (dls_rx_t)direct->di_rx_cf, 1339 direct->di_rx_ch); 1340 1341 direct->di_tx_df = (uintptr_t)str_mdata_fastpath_put; 1342 direct->di_tx_dh = dsp; 1343 direct->di_tx_cb_df = (uintptr_t)mac_client_tx_notify; 1344 direct->di_tx_cb_dh = dsp->ds_mch; 1345 direct->di_tx_fctl_df = (uintptr_t)mac_tx_is_flow_blocked; 1346 direct->di_tx_fctl_dh = dsp->ds_mch; 1347 1348 dsp->ds_direct = B_TRUE; 1349 1350 return (0); 1351 1352 case DLD_DISABLE: 1353 dls_rx_set(dsp, (dsp->ds_mode == DLD_FASTPATH) ? 1354 dld_str_rx_fastpath : dld_str_rx_unitdata, (void *)dsp); 1355 dsp->ds_direct = B_FALSE; 1356 1357 return (0); 1358 } 1359 return (ENOTSUP); 1360 } 1361 1362 /* 1363 * dld_capab_poll_enable() 1364 * 1365 * This function is misnamed. All polling and fanouts are run out of the 1366 * lower mac (in case of VNIC and the only mac in case of NICs). The 1367 * availability of Rx ring and promiscous mode is all taken care between 1368 * the soft ring set (mac_srs), the Rx ring, and S/W classifier. Any 1369 * fanout necessary is done by the soft rings that are part of the 1370 * mac_srs (by default mac_srs sends the packets up via a TCP and 1371 * non TCP soft ring). 1372 * 1373 * The mac_srs (or its associated soft rings) always store the ill_rx_ring 1374 * (the cookie returned when they registered with IP during plumb) as their 1375 * 2nd argument which is passed up as mac_resource_handle_t. The upcall 1376 * function and 1st argument is what the caller registered when they 1377 * called mac_rx_classify_flow_add() to register the flow. For VNIC, 1378 * the function is vnic_rx and argument is vnic_t. For regular NIC 1379 * case, it mac_rx_default and mac_handle_t. As explained above, the 1380 * mac_srs (or its soft ring) will add the ill_rx_ring (mac_resource_handle_t) 1381 * from its stored 2nd argument. 1382 */ 1383 static int 1384 dld_capab_poll_enable(dld_str_t *dsp, dld_capab_poll_t *poll) 1385 { 1386 if (dsp->ds_polling) 1387 return (EINVAL); 1388 1389 if ((dld_opt & DLD_OPT_NO_POLL) != 0 || dsp->ds_mode == DLD_RAW) 1390 return (ENOTSUP); 1391 1392 /* 1393 * Enable client polling if and only if DLS bypass is possible. 1394 * Special cases like VLANs need DLS processing in the Rx data path. 1395 * In such a case we can neither allow the client (IP) to directly 1396 * poll the softring (since DLS processing hasn't been done) nor can 1397 * we allow DLS bypass. 1398 */ 1399 if (!mac_rx_bypass_set(dsp->ds_mch, dsp->ds_rx, dsp->ds_rx_arg)) 1400 return (ENOTSUP); 1401 1402 /* 1403 * Register soft ring resources. This will come in handy later if 1404 * the user decides to modify CPU bindings to use more CPUs for the 1405 * device in which case we will switch to fanout using soft rings. 1406 */ 1407 mac_resource_set_common(dsp->ds_mch, 1408 (mac_resource_add_t)poll->poll_ring_add_cf, 1409 (mac_resource_remove_t)poll->poll_ring_remove_cf, 1410 (mac_resource_quiesce_t)poll->poll_ring_quiesce_cf, 1411 (mac_resource_restart_t)poll->poll_ring_restart_cf, 1412 (mac_resource_bind_t)poll->poll_ring_bind_cf, 1413 poll->poll_ring_ch); 1414 1415 mac_client_poll_enable(dsp->ds_mch); 1416 1417 dsp->ds_polling = B_TRUE; 1418 return (0); 1419 } 1420 1421 /* ARGSUSED */ 1422 static int 1423 dld_capab_poll_disable(dld_str_t *dsp, dld_capab_poll_t *poll) 1424 { 1425 if (!dsp->ds_polling) 1426 return (EINVAL); 1427 1428 mac_client_poll_disable(dsp->ds_mch); 1429 mac_resource_set(dsp->ds_mch, NULL, NULL); 1430 1431 dsp->ds_polling = B_FALSE; 1432 return (0); 1433 } 1434 1435 static int 1436 dld_capab_poll(dld_str_t *dsp, void *data, uint_t flags) 1437 { 1438 dld_capab_poll_t *poll = data; 1439 1440 ASSERT(MAC_PERIM_HELD(dsp->ds_mh)); 1441 1442 switch (flags) { 1443 case DLD_ENABLE: 1444 return (dld_capab_poll_enable(dsp, poll)); 1445 case DLD_DISABLE: 1446 return (dld_capab_poll_disable(dsp, poll)); 1447 } 1448 return (ENOTSUP); 1449 } 1450 1451 static int 1452 dld_capab_lso(dld_str_t *dsp, void *data, uint_t flags) 1453 { 1454 dld_capab_lso_t *lso = data; 1455 1456 ASSERT(MAC_PERIM_HELD(dsp->ds_mh)); 1457 1458 switch (flags) { 1459 case DLD_ENABLE: { 1460 mac_capab_lso_t mac_lso; 1461 1462 /* 1463 * Check if LSO is supported on this MAC & enable LSO 1464 * accordingly. 1465 */ 1466 if (mac_capab_get(dsp->ds_mh, MAC_CAPAB_LSO, &mac_lso)) { 1467 lso->lso_max = mac_lso.lso_basic_tcp_ipv4.lso_max; 1468 lso->lso_flags = 0; 1469 /* translate the flag for mac clients */ 1470 if ((mac_lso.lso_flags & LSO_TX_BASIC_TCP_IPV4) != 0) 1471 lso->lso_flags |= DLD_LSO_TX_BASIC_TCP_IPV4; 1472 dsp->ds_lso = B_TRUE; 1473 dsp->ds_lso_max = lso->lso_max; 1474 } else { 1475 dsp->ds_lso = B_FALSE; 1476 dsp->ds_lso_max = 0; 1477 return (ENOTSUP); 1478 } 1479 return (0); 1480 } 1481 case DLD_DISABLE: { 1482 dsp->ds_lso = B_FALSE; 1483 dsp->ds_lso_max = 0; 1484 return (0); 1485 } 1486 } 1487 return (ENOTSUP); 1488 } 1489 1490 static int 1491 dld_capab(dld_str_t *dsp, uint_t type, void *data, uint_t flags) 1492 { 1493 int err; 1494 1495 /* 1496 * Don't enable direct callback capabilities unless the caller is 1497 * the IP client. When a module is inserted in a stream (_I_INSERT) 1498 * the stack initiates capability disable, but due to races, the 1499 * module insertion may complete before the capability disable 1500 * completes. So we limit the check to DLD_ENABLE case. 1501 */ 1502 if ((flags == DLD_ENABLE && type != DLD_CAPAB_PERIM) && 1503 (dsp->ds_sap != ETHERTYPE_IP || !check_ip_above(dsp->ds_rq))) { 1504 return (ENOTSUP); 1505 } 1506 1507 switch (type) { 1508 case DLD_CAPAB_DIRECT: 1509 err = dld_capab_direct(dsp, data, flags); 1510 break; 1511 1512 case DLD_CAPAB_POLL: 1513 err = dld_capab_poll(dsp, data, flags); 1514 break; 1515 1516 case DLD_CAPAB_PERIM: 1517 err = dld_capab_perim(dsp, data, flags); 1518 break; 1519 1520 case DLD_CAPAB_LSO: 1521 err = dld_capab_lso(dsp, data, flags); 1522 break; 1523 1524 default: 1525 err = ENOTSUP; 1526 break; 1527 } 1528 1529 return (err); 1530 } 1531 1532 /* 1533 * DL_CAPABILITY_ACK/DL_ERROR_ACK 1534 */ 1535 static void 1536 proto_capability_advertise(dld_str_t *dsp, mblk_t *mp) 1537 { 1538 dl_capability_ack_t *dlap; 1539 dl_capability_sub_t *dlsp; 1540 size_t subsize; 1541 dl_capab_dld_t dld; 1542 dl_capab_hcksum_t hcksum; 1543 dl_capab_zerocopy_t zcopy; 1544 uint8_t *ptr; 1545 queue_t *q = dsp->ds_wq; 1546 mblk_t *mp1; 1547 boolean_t is_vlan; 1548 boolean_t hcksum_capable = B_FALSE; 1549 boolean_t zcopy_capable = B_FALSE; 1550 boolean_t dld_capable = B_FALSE; 1551 1552 /* 1553 * Initially assume no capabilities. 1554 */ 1555 subsize = 0; 1556 is_vlan = (mac_client_vid(dsp->ds_mch) != VLAN_ID_NONE); 1557 1558 /* 1559 * Check if checksum offload is supported on this MAC. Don't 1560 * advertise DL_CAPAB_HCKSUM if the underlying MAC is VLAN incapable, 1561 * since it might not be able to do the hardware checksum offload 1562 * with the correct offset. 1563 */ 1564 bzero(&hcksum, sizeof (dl_capab_hcksum_t)); 1565 if ((!is_vlan || (!mac_capab_get(dsp->ds_mh, MAC_CAPAB_NO_NATIVEVLAN, 1566 NULL))) && mac_capab_get(dsp->ds_mh, MAC_CAPAB_HCKSUM, 1567 &hcksum.hcksum_txflags)) { 1568 if (hcksum.hcksum_txflags != 0) { 1569 hcksum_capable = B_TRUE; 1570 subsize += sizeof (dl_capability_sub_t) + 1571 sizeof (dl_capab_hcksum_t); 1572 } 1573 } 1574 1575 /* 1576 * Check if zerocopy is supported on this interface. 1577 * If advertising DL_CAPAB_ZEROCOPY has not been explicitly disabled 1578 * then reserve space for that capability. 1579 */ 1580 if (!mac_capab_get(dsp->ds_mh, MAC_CAPAB_NO_ZCOPY, NULL) && 1581 !(dld_opt & DLD_OPT_NO_ZEROCOPY)) { 1582 zcopy_capable = B_TRUE; 1583 subsize += sizeof (dl_capability_sub_t) + 1584 sizeof (dl_capab_zerocopy_t); 1585 } 1586 1587 /* 1588 * Direct capability negotiation interface between IP and DLD 1589 */ 1590 if (dsp->ds_sap == ETHERTYPE_IP && check_ip_above(dsp->ds_rq)) { 1591 dld_capable = B_TRUE; 1592 subsize += sizeof (dl_capability_sub_t) + 1593 sizeof (dl_capab_dld_t); 1594 } 1595 1596 /* 1597 * If there are no capabilities to advertise or if we 1598 * can't allocate a response, send a DL_ERROR_ACK. 1599 */ 1600 if ((mp1 = reallocb(mp, 1601 sizeof (dl_capability_ack_t) + subsize, 0)) == NULL) { 1602 dlerrorack(q, mp, DL_CAPABILITY_REQ, DL_NOTSUPPORTED, 0); 1603 return; 1604 } 1605 1606 mp = mp1; 1607 DB_TYPE(mp) = M_PROTO; 1608 mp->b_wptr = mp->b_rptr + sizeof (dl_capability_ack_t) + subsize; 1609 bzero(mp->b_rptr, MBLKL(mp)); 1610 dlap = (dl_capability_ack_t *)mp->b_rptr; 1611 dlap->dl_primitive = DL_CAPABILITY_ACK; 1612 dlap->dl_sub_offset = sizeof (dl_capability_ack_t); 1613 dlap->dl_sub_length = subsize; 1614 ptr = (uint8_t *)&dlap[1]; 1615 1616 /* 1617 * TCP/IP checksum offload. 1618 */ 1619 if (hcksum_capable) { 1620 dlsp = (dl_capability_sub_t *)ptr; 1621 1622 dlsp->dl_cap = DL_CAPAB_HCKSUM; 1623 dlsp->dl_length = sizeof (dl_capab_hcksum_t); 1624 ptr += sizeof (dl_capability_sub_t); 1625 1626 hcksum.hcksum_version = HCKSUM_VERSION_1; 1627 dlcapabsetqid(&(hcksum.hcksum_mid), dsp->ds_rq); 1628 bcopy(&hcksum, ptr, sizeof (dl_capab_hcksum_t)); 1629 ptr += sizeof (dl_capab_hcksum_t); 1630 } 1631 1632 /* 1633 * Zero copy 1634 */ 1635 if (zcopy_capable) { 1636 dlsp = (dl_capability_sub_t *)ptr; 1637 1638 dlsp->dl_cap = DL_CAPAB_ZEROCOPY; 1639 dlsp->dl_length = sizeof (dl_capab_zerocopy_t); 1640 ptr += sizeof (dl_capability_sub_t); 1641 1642 bzero(&zcopy, sizeof (dl_capab_zerocopy_t)); 1643 zcopy.zerocopy_version = ZEROCOPY_VERSION_1; 1644 zcopy.zerocopy_flags = DL_CAPAB_VMSAFE_MEM; 1645 1646 dlcapabsetqid(&(zcopy.zerocopy_mid), dsp->ds_rq); 1647 bcopy(&zcopy, ptr, sizeof (dl_capab_zerocopy_t)); 1648 ptr += sizeof (dl_capab_zerocopy_t); 1649 } 1650 1651 /* 1652 * Direct capability negotiation interface between IP and DLD. 1653 * Refer to dld.h for details. 1654 */ 1655 if (dld_capable) { 1656 dlsp = (dl_capability_sub_t *)ptr; 1657 dlsp->dl_cap = DL_CAPAB_DLD; 1658 dlsp->dl_length = sizeof (dl_capab_dld_t); 1659 ptr += sizeof (dl_capability_sub_t); 1660 1661 bzero(&dld, sizeof (dl_capab_dld_t)); 1662 dld.dld_version = DLD_CURRENT_VERSION; 1663 dld.dld_capab = (uintptr_t)dld_capab; 1664 dld.dld_capab_handle = (uintptr_t)dsp; 1665 1666 dlcapabsetqid(&(dld.dld_mid), dsp->ds_rq); 1667 bcopy(&dld, ptr, sizeof (dl_capab_dld_t)); 1668 ptr += sizeof (dl_capab_dld_t); 1669 } 1670 1671 ASSERT(ptr == mp->b_rptr + sizeof (dl_capability_ack_t) + subsize); 1672 qreply(q, mp); 1673 } 1674 1675 /* 1676 * Disable any enabled capabilities. 1677 */ 1678 void 1679 dld_capabilities_disable(dld_str_t *dsp) 1680 { 1681 if (dsp->ds_polling) 1682 (void) dld_capab_poll_disable(dsp, NULL); 1683 } 1684