1 /*- 2 * Copyright (c) 1980, 1986, 1993 3 * The Regents of the University of California. All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution. 13 * 4. Neither the name of the University nor the names of its contributors 14 * may be used to endorse or promote products derived from this software 15 * without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27 * SUCH DAMAGE. 28 * 29 * @(#)if.c 8.5 (Berkeley) 1/9/95 30 * $FreeBSD$ 31 */ 32 33 #include "opt_compat.h" 34 #include "opt_inet6.h" 35 #include "opt_inet.h" 36 #include "opt_carp.h" 37 38 #include <sys/param.h> 39 #include <sys/types.h> 40 #include <sys/conf.h> 41 #include <sys/malloc.h> 42 #include <sys/sbuf.h> 43 #include <sys/bus.h> 44 #include <sys/mbuf.h> 45 #include <sys/systm.h> 46 #include <sys/priv.h> 47 #include <sys/proc.h> 48 #include <sys/socket.h> 49 #include <sys/socketvar.h> 50 #include <sys/protosw.h> 51 #include <sys/kernel.h> 52 #include <sys/lock.h> 53 #include <sys/refcount.h> 54 #include <sys/module.h> 55 #include <sys/rwlock.h> 56 #include <sys/sockio.h> 57 #include <sys/syslog.h> 58 #include <sys/sysctl.h> 59 #include <sys/taskqueue.h> 60 #include <sys/domain.h> 61 #include <sys/jail.h> 62 #include <machine/stdarg.h> 63 #include <vm/uma.h> 64 65 #include <net/if.h> 66 #include <net/if_arp.h> 67 #include <net/if_clone.h> 68 #include <net/if_dl.h> 69 #include <net/if_types.h> 70 #include <net/if_var.h> 71 #include <net/radix.h> 72 #include <net/route.h> 73 #include <net/vnet.h> 74 75 #if defined(INET) || defined(INET6) 76 /*XXX*/ 77 #include <netinet/in.h> 78 #include <netinet/in_var.h> 79 #ifdef INET6 80 #include <netinet6/in6_var.h> 81 #include <netinet6/in6_ifattach.h> 82 #endif 83 #endif 84 #ifdef INET 85 #include <netinet/if_ether.h> 86 #endif 87 #if defined(INET) || defined(INET6) 88 #ifdef DEV_CARP 89 #include <netinet/ip_carp.h> 90 #endif 91 #endif 92 93 #include <security/mac/mac_framework.h> 94 95 struct ifindex_entry { 96 struct ifnet *ife_ifnet; 97 }; 98 99 SYSCTL_NODE(_net, PF_LINK, link, CTLFLAG_RW, 0, "Link layers"); 100 SYSCTL_NODE(_net_link, 0, generic, CTLFLAG_RW, 0, "Generic link-management"); 101 102 /* Log link state change events */ 103 static int log_link_state_change = 1; 104 105 SYSCTL_INT(_net_link, OID_AUTO, log_link_state_change, CTLFLAG_RW, 106 &log_link_state_change, 0, 107 "log interface link state change events"); 108 109 /* Interface description */ 110 static unsigned int ifdescr_maxlen = 1024; 111 SYSCTL_UINT(_net, OID_AUTO, ifdescr_maxlen, CTLFLAG_RW, 112 &ifdescr_maxlen, 0, 113 "administrative maximum length for interface description"); 114 115 MALLOC_DEFINE(M_IFDESCR, "ifdescr", "ifnet descriptions"); 116 117 /* global sx for non-critical path ifdescr */ 118 static struct sx ifdescr_sx; 119 SX_SYSINIT(ifdescr_sx, &ifdescr_sx, "ifnet descr"); 120 121 void (*bstp_linkstate_p)(struct ifnet *ifp, int state); 122 void (*ng_ether_link_state_p)(struct ifnet *ifp, int state); 123 void (*lagg_linkstate_p)(struct ifnet *ifp, int state); 124 125 struct mbuf *(*tbr_dequeue_ptr)(struct ifaltq *, int) = NULL; 126 127 /* 128 * XXX: Style; these should be sorted alphabetically, and unprototyped 129 * static functions should be prototyped. Currently they are sorted by 130 * declaration order. 131 */ 132 static void if_attachdomain(void *); 133 static void if_attachdomain1(struct ifnet *); 134 static int ifconf(u_long, caddr_t); 135 static void if_freemulti(struct ifmultiaddr *); 136 static void if_init(void *); 137 static void if_grow(void); 138 static void if_route(struct ifnet *, int flag, int fam); 139 static int if_setflag(struct ifnet *, int, int, int *, int); 140 static int if_transmit(struct ifnet *ifp, struct mbuf *m); 141 static void if_unroute(struct ifnet *, int flag, int fam); 142 static void link_rtrequest(int, struct rtentry *, struct rt_addrinfo *); 143 static int if_rtdel(struct radix_node *, void *); 144 static int ifhwioctl(u_long, struct ifnet *, caddr_t, struct thread *); 145 static int if_delmulti_locked(struct ifnet *, struct ifmultiaddr *, int); 146 static void do_link_state_change(void *, int); 147 static int if_getgroup(struct ifgroupreq *, struct ifnet *); 148 static int if_getgroupmembers(struct ifgroupreq *); 149 static void if_delgroups(struct ifnet *); 150 static void if_attach_internal(struct ifnet *, int); 151 static void if_detach_internal(struct ifnet *, int); 152 153 #ifdef INET6 154 /* 155 * XXX: declare here to avoid to include many inet6 related files.. 156 * should be more generalized? 157 */ 158 extern void nd6_setmtu(struct ifnet *); 159 #endif 160 161 VNET_DEFINE(struct ifnethead, ifnet); /* depend on static init XXX */ 162 VNET_DEFINE(struct ifgrouphead, ifg_head); 163 VNET_DEFINE(int, if_index); 164 static VNET_DEFINE(int, if_indexlim) = 8; 165 166 /* Table of ifnet by index. */ 167 static VNET_DEFINE(struct ifindex_entry *, ifindex_table); 168 169 #define V_if_indexlim VNET(if_indexlim) 170 #define V_ifindex_table VNET(ifindex_table) 171 172 int ifqmaxlen = IFQ_MAXLEN; 173 174 /* 175 * The global network interface list (V_ifnet) and related state (such as 176 * if_index, if_indexlim, and ifindex_table) are protected by an sxlock and 177 * an rwlock. Either may be acquired shared to stablize the list, but both 178 * must be acquired writable to modify the list. This model allows us to 179 * both stablize the interface list during interrupt thread processing, but 180 * also to stablize it over long-running ioctls, without introducing priority 181 * inversions and deadlocks. 182 */ 183 struct rwlock ifnet_rwlock; 184 struct sx ifnet_sxlock; 185 186 /* 187 * The allocation of network interfaces is a rather non-atomic affair; we 188 * need to select an index before we are ready to expose the interface for 189 * use, so will use this pointer value to indicate reservation. 190 */ 191 #define IFNET_HOLD (void *)(uintptr_t)(-1) 192 193 static if_com_alloc_t *if_com_alloc[256]; 194 static if_com_free_t *if_com_free[256]; 195 196 MALLOC_DEFINE(M_IFNET, "ifnet", "interface internals"); 197 MALLOC_DEFINE(M_IFADDR, "ifaddr", "interface address"); 198 MALLOC_DEFINE(M_IFMADDR, "ether_multi", "link-level multicast address"); 199 200 struct ifnet * 201 ifnet_byindex_locked(u_short idx) 202 { 203 204 if (idx > V_if_index) 205 return (NULL); 206 if (V_ifindex_table[idx].ife_ifnet == IFNET_HOLD) 207 return (NULL); 208 return (V_ifindex_table[idx].ife_ifnet); 209 } 210 211 struct ifnet * 212 ifnet_byindex(u_short idx) 213 { 214 struct ifnet *ifp; 215 216 IFNET_RLOCK_NOSLEEP(); 217 ifp = ifnet_byindex_locked(idx); 218 IFNET_RUNLOCK_NOSLEEP(); 219 return (ifp); 220 } 221 222 struct ifnet * 223 ifnet_byindex_ref(u_short idx) 224 { 225 struct ifnet *ifp; 226 227 IFNET_RLOCK_NOSLEEP(); 228 ifp = ifnet_byindex_locked(idx); 229 if (ifp == NULL || (ifp->if_flags & IFF_DYING)) { 230 IFNET_RUNLOCK_NOSLEEP(); 231 return (NULL); 232 } 233 if_ref(ifp); 234 IFNET_RUNLOCK_NOSLEEP(); 235 return (ifp); 236 } 237 238 /* 239 * Allocate an ifindex array entry; return 0 on success or an error on 240 * failure. 241 */ 242 static int 243 ifindex_alloc_locked(u_short *idxp) 244 { 245 u_short idx; 246 247 IFNET_WLOCK_ASSERT(); 248 249 /* 250 * Try to find an empty slot below V_if_index. If we fail, take the 251 * next slot. 252 */ 253 for (idx = 1; idx <= V_if_index; idx++) { 254 if (V_ifindex_table[idx].ife_ifnet == NULL) 255 break; 256 } 257 258 /* Catch if_index overflow. */ 259 if (idx < 1) 260 return (ENOSPC); 261 if (idx > V_if_index) 262 V_if_index = idx; 263 if (V_if_index >= V_if_indexlim) 264 if_grow(); 265 *idxp = idx; 266 return (0); 267 } 268 269 static void 270 ifindex_free_locked(u_short idx) 271 { 272 273 IFNET_WLOCK_ASSERT(); 274 275 V_ifindex_table[idx].ife_ifnet = NULL; 276 while (V_if_index > 0 && 277 V_ifindex_table[V_if_index].ife_ifnet == NULL) 278 V_if_index--; 279 } 280 281 static void 282 ifindex_free(u_short idx) 283 { 284 285 IFNET_WLOCK(); 286 ifindex_free_locked(idx); 287 IFNET_WUNLOCK(); 288 } 289 290 static void 291 ifnet_setbyindex_locked(u_short idx, struct ifnet *ifp) 292 { 293 294 IFNET_WLOCK_ASSERT(); 295 296 V_ifindex_table[idx].ife_ifnet = ifp; 297 } 298 299 static void 300 ifnet_setbyindex(u_short idx, struct ifnet *ifp) 301 { 302 303 IFNET_WLOCK(); 304 ifnet_setbyindex_locked(idx, ifp); 305 IFNET_WUNLOCK(); 306 } 307 308 struct ifaddr * 309 ifaddr_byindex(u_short idx) 310 { 311 struct ifaddr *ifa; 312 313 IFNET_RLOCK_NOSLEEP(); 314 ifa = ifnet_byindex_locked(idx)->if_addr; 315 if (ifa != NULL) 316 ifa_ref(ifa); 317 IFNET_RUNLOCK_NOSLEEP(); 318 return (ifa); 319 } 320 321 /* 322 * Network interface utility routines. 323 * 324 * Routines with ifa_ifwith* names take sockaddr *'s as 325 * parameters. 326 */ 327 328 static void 329 vnet_if_init(const void *unused __unused) 330 { 331 332 TAILQ_INIT(&V_ifnet); 333 TAILQ_INIT(&V_ifg_head); 334 if_grow(); /* create initial table */ 335 vnet_if_clone_init(); 336 } 337 VNET_SYSINIT(vnet_if_init, SI_SUB_INIT_IF, SI_ORDER_FIRST, vnet_if_init, 338 NULL); 339 340 /* ARGSUSED*/ 341 static void 342 if_init(void *dummy __unused) 343 { 344 345 IFNET_LOCK_INIT(); 346 if_clone_init(); 347 } 348 SYSINIT(interfaces, SI_SUB_INIT_IF, SI_ORDER_SECOND, if_init, NULL); 349 350 351 #ifdef VIMAGE 352 static void 353 vnet_if_uninit(const void *unused __unused) 354 { 355 356 VNET_ASSERT(TAILQ_EMPTY(&V_ifnet)); 357 VNET_ASSERT(TAILQ_EMPTY(&V_ifg_head)); 358 359 free((caddr_t)V_ifindex_table, M_IFNET); 360 } 361 VNET_SYSUNINIT(vnet_if_uninit, SI_SUB_INIT_IF, SI_ORDER_FIRST, 362 vnet_if_uninit, NULL); 363 #endif 364 365 static void 366 if_grow(void) 367 { 368 u_int n; 369 struct ifindex_entry *e; 370 371 V_if_indexlim <<= 1; 372 n = V_if_indexlim * sizeof(*e); 373 e = malloc(n, M_IFNET, M_WAITOK | M_ZERO); 374 if (V_ifindex_table != NULL) { 375 memcpy((caddr_t)e, (caddr_t)V_ifindex_table, n/2); 376 free((caddr_t)V_ifindex_table, M_IFNET); 377 } 378 V_ifindex_table = e; 379 } 380 381 /* 382 * Allocate a struct ifnet and an index for an interface. A layer 2 383 * common structure will also be allocated if an allocation routine is 384 * registered for the passed type. 385 */ 386 struct ifnet * 387 if_alloc(u_char type) 388 { 389 struct ifnet *ifp; 390 u_short idx; 391 392 ifp = malloc(sizeof(struct ifnet), M_IFNET, M_WAITOK|M_ZERO); 393 IFNET_WLOCK(); 394 if (ifindex_alloc_locked(&idx) != 0) { 395 IFNET_WUNLOCK(); 396 free(ifp, M_IFNET); 397 return (NULL); 398 } 399 ifnet_setbyindex_locked(idx, IFNET_HOLD); 400 IFNET_WUNLOCK(); 401 ifp->if_index = idx; 402 ifp->if_type = type; 403 ifp->if_alloctype = type; 404 if (if_com_alloc[type] != NULL) { 405 ifp->if_l2com = if_com_alloc[type](type, ifp); 406 if (ifp->if_l2com == NULL) { 407 free(ifp, M_IFNET); 408 ifindex_free(idx); 409 return (NULL); 410 } 411 } 412 413 IF_ADDR_LOCK_INIT(ifp); 414 TASK_INIT(&ifp->if_linktask, 0, do_link_state_change, ifp); 415 ifp->if_afdata_initialized = 0; 416 IF_AFDATA_LOCK_INIT(ifp); 417 TAILQ_INIT(&ifp->if_addrhead); 418 TAILQ_INIT(&ifp->if_prefixhead); 419 TAILQ_INIT(&ifp->if_multiaddrs); 420 TAILQ_INIT(&ifp->if_groups); 421 #ifdef MAC 422 mac_ifnet_init(ifp); 423 #endif 424 ifq_init(&ifp->if_snd, ifp); 425 426 refcount_init(&ifp->if_refcount, 1); /* Index reference. */ 427 ifnet_setbyindex(ifp->if_index, ifp); 428 return (ifp); 429 } 430 431 /* 432 * Do the actual work of freeing a struct ifnet, associated index, and layer 433 * 2 common structure. This call is made when the last reference to an 434 * interface is released. 435 */ 436 static void 437 if_free_internal(struct ifnet *ifp) 438 { 439 440 KASSERT((ifp->if_flags & IFF_DYING), 441 ("if_free_internal: interface not dying")); 442 443 IFNET_WLOCK(); 444 KASSERT(ifp == ifnet_byindex_locked(ifp->if_index), 445 ("%s: freeing unallocated ifnet", ifp->if_xname)); 446 447 ifindex_free_locked(ifp->if_index); 448 IFNET_WUNLOCK(); 449 450 if (if_com_free[ifp->if_alloctype] != NULL) 451 if_com_free[ifp->if_alloctype](ifp->if_l2com, 452 ifp->if_alloctype); 453 454 #ifdef MAC 455 mac_ifnet_destroy(ifp); 456 #endif /* MAC */ 457 if (ifp->if_description != NULL) 458 free(ifp->if_description, M_IFDESCR); 459 IF_AFDATA_DESTROY(ifp); 460 IF_ADDR_LOCK_DESTROY(ifp); 461 ifq_delete(&ifp->if_snd); 462 free(ifp, M_IFNET); 463 } 464 465 /* 466 * This version should only be called by intefaces that switch their type 467 * after calling if_alloc(). if_free_type() will go away again now that we 468 * have if_alloctype to cache the original allocation type. For now, assert 469 * that they match, since we require that in practice. 470 */ 471 void 472 if_free_type(struct ifnet *ifp, u_char type) 473 { 474 475 KASSERT(ifp->if_alloctype == type, 476 ("if_free_type: type (%d) != alloctype (%d)", type, 477 ifp->if_alloctype)); 478 479 ifp->if_flags |= IFF_DYING; /* XXX: Locking */ 480 if (!refcount_release(&ifp->if_refcount)) 481 return; 482 if_free_internal(ifp); 483 } 484 485 /* 486 * This is the normal version of if_free(), used by device drivers to free a 487 * detached network interface. The contents of if_free_type() will move into 488 * here when if_free_type() goes away. 489 */ 490 void 491 if_free(struct ifnet *ifp) 492 { 493 494 if_free_type(ifp, ifp->if_alloctype); 495 } 496 497 /* 498 * Interfaces to keep an ifnet type-stable despite the possibility of the 499 * driver calling if_free(). If there are additional references, we defer 500 * freeing the underlying data structure. 501 */ 502 void 503 if_ref(struct ifnet *ifp) 504 { 505 506 /* We don't assert the ifnet list lock here, but arguably should. */ 507 refcount_acquire(&ifp->if_refcount); 508 } 509 510 void 511 if_rele(struct ifnet *ifp) 512 { 513 514 if (!refcount_release(&ifp->if_refcount)) 515 return; 516 if_free_internal(ifp); 517 } 518 519 void 520 ifq_init(struct ifaltq *ifq, struct ifnet *ifp) 521 { 522 523 mtx_init(&ifq->ifq_mtx, ifp->if_xname, "if send queue", MTX_DEF); 524 525 if (ifq->ifq_maxlen == 0) 526 ifq->ifq_maxlen = ifqmaxlen; 527 528 ifq->altq_type = 0; 529 ifq->altq_disc = NULL; 530 ifq->altq_flags &= ALTQF_CANTCHANGE; 531 ifq->altq_tbr = NULL; 532 ifq->altq_ifp = ifp; 533 } 534 535 void 536 ifq_delete(struct ifaltq *ifq) 537 { 538 mtx_destroy(&ifq->ifq_mtx); 539 } 540 541 /* 542 * Perform generic interface initalization tasks and attach the interface 543 * to the list of "active" interfaces. If vmove flag is set on entry 544 * to if_attach_internal(), perform only a limited subset of initialization 545 * tasks, given that we are moving from one vnet to another an ifnet which 546 * has already been fully initialized. 547 * 548 * XXX: 549 * - The decision to return void and thus require this function to 550 * succeed is questionable. 551 * - We should probably do more sanity checking. For instance we don't 552 * do anything to insure if_xname is unique or non-empty. 553 */ 554 void 555 if_attach(struct ifnet *ifp) 556 { 557 558 if_attach_internal(ifp, 0); 559 } 560 561 static void 562 if_attach_internal(struct ifnet *ifp, int vmove) 563 { 564 unsigned socksize, ifasize; 565 int namelen, masklen; 566 struct sockaddr_dl *sdl; 567 struct ifaddr *ifa; 568 569 if (ifp->if_index == 0 || ifp != ifnet_byindex(ifp->if_index)) 570 panic ("%s: BUG: if_attach called without if_alloc'd input()\n", 571 ifp->if_xname); 572 573 #ifdef VIMAGE 574 ifp->if_vnet = curvnet; 575 if (ifp->if_home_vnet == NULL) 576 ifp->if_home_vnet = curvnet; 577 #endif 578 579 if_addgroup(ifp, IFG_ALL); 580 581 getmicrotime(&ifp->if_lastchange); 582 ifp->if_data.ifi_epoch = time_uptime; 583 ifp->if_data.ifi_datalen = sizeof(struct if_data); 584 585 KASSERT((ifp->if_transmit == NULL && ifp->if_qflush == NULL) || 586 (ifp->if_transmit != NULL && ifp->if_qflush != NULL), 587 ("transmit and qflush must both either be set or both be NULL")); 588 if (ifp->if_transmit == NULL) { 589 ifp->if_transmit = if_transmit; 590 ifp->if_qflush = if_qflush; 591 } 592 593 if (!vmove) { 594 #ifdef MAC 595 mac_ifnet_create(ifp); 596 #endif 597 598 /* 599 * Create a Link Level name for this device. 600 */ 601 namelen = strlen(ifp->if_xname); 602 /* 603 * Always save enough space for any possiable name so we 604 * can do a rename in place later. 605 */ 606 masklen = offsetof(struct sockaddr_dl, sdl_data[0]) + IFNAMSIZ; 607 socksize = masklen + ifp->if_addrlen; 608 if (socksize < sizeof(*sdl)) 609 socksize = sizeof(*sdl); 610 socksize = roundup2(socksize, sizeof(long)); 611 ifasize = sizeof(*ifa) + 2 * socksize; 612 ifa = malloc(ifasize, M_IFADDR, M_WAITOK | M_ZERO); 613 ifa_init(ifa); 614 sdl = (struct sockaddr_dl *)(ifa + 1); 615 sdl->sdl_len = socksize; 616 sdl->sdl_family = AF_LINK; 617 bcopy(ifp->if_xname, sdl->sdl_data, namelen); 618 sdl->sdl_nlen = namelen; 619 sdl->sdl_index = ifp->if_index; 620 sdl->sdl_type = ifp->if_type; 621 ifp->if_addr = ifa; 622 ifa->ifa_ifp = ifp; 623 ifa->ifa_rtrequest = link_rtrequest; 624 ifa->ifa_addr = (struct sockaddr *)sdl; 625 sdl = (struct sockaddr_dl *)(socksize + (caddr_t)sdl); 626 ifa->ifa_netmask = (struct sockaddr *)sdl; 627 sdl->sdl_len = masklen; 628 while (namelen != 0) 629 sdl->sdl_data[--namelen] = 0xff; 630 TAILQ_INSERT_HEAD(&ifp->if_addrhead, ifa, ifa_link); 631 /* Reliably crash if used uninitialized. */ 632 ifp->if_broadcastaddr = NULL; 633 } 634 #ifdef VIMAGE 635 else { 636 /* 637 * Update the interface index in the link layer address 638 * of the interface. 639 */ 640 for (ifa = ifp->if_addr; ifa != NULL; 641 ifa = TAILQ_NEXT(ifa, ifa_link)) { 642 if (ifa->ifa_addr->sa_family == AF_LINK) { 643 sdl = (struct sockaddr_dl *)ifa->ifa_addr; 644 sdl->sdl_index = ifp->if_index; 645 } 646 } 647 } 648 #endif 649 650 IFNET_WLOCK(); 651 TAILQ_INSERT_TAIL(&V_ifnet, ifp, if_link); 652 #ifdef VIMAGE 653 curvnet->vnet_ifcnt++; 654 #endif 655 IFNET_WUNLOCK(); 656 657 if (domain_init_status >= 2) 658 if_attachdomain1(ifp); 659 660 EVENTHANDLER_INVOKE(ifnet_arrival_event, ifp); 661 if (IS_DEFAULT_VNET(curvnet)) 662 devctl_notify("IFNET", ifp->if_xname, "ATTACH", NULL); 663 664 /* Announce the interface. */ 665 rt_ifannouncemsg(ifp, IFAN_ARRIVAL); 666 } 667 668 static void 669 if_attachdomain(void *dummy) 670 { 671 struct ifnet *ifp; 672 int s; 673 674 s = splnet(); 675 TAILQ_FOREACH(ifp, &V_ifnet, if_link) 676 if_attachdomain1(ifp); 677 splx(s); 678 } 679 SYSINIT(domainifattach, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_SECOND, 680 if_attachdomain, NULL); 681 682 static void 683 if_attachdomain1(struct ifnet *ifp) 684 { 685 struct domain *dp; 686 int s; 687 688 s = splnet(); 689 690 /* 691 * Since dp->dom_ifattach calls malloc() with M_WAITOK, we 692 * cannot lock ifp->if_afdata initialization, entirely. 693 */ 694 if (IF_AFDATA_TRYLOCK(ifp) == 0) { 695 splx(s); 696 return; 697 } 698 if (ifp->if_afdata_initialized >= domain_init_status) { 699 IF_AFDATA_UNLOCK(ifp); 700 splx(s); 701 printf("if_attachdomain called more than once on %s\n", 702 ifp->if_xname); 703 return; 704 } 705 ifp->if_afdata_initialized = domain_init_status; 706 IF_AFDATA_UNLOCK(ifp); 707 708 /* address family dependent data region */ 709 bzero(ifp->if_afdata, sizeof(ifp->if_afdata)); 710 for (dp = domains; dp; dp = dp->dom_next) { 711 if (dp->dom_ifattach) 712 ifp->if_afdata[dp->dom_family] = 713 (*dp->dom_ifattach)(ifp); 714 } 715 716 splx(s); 717 } 718 719 /* 720 * Remove any unicast or broadcast network addresses from an interface. 721 */ 722 void 723 if_purgeaddrs(struct ifnet *ifp) 724 { 725 struct ifaddr *ifa, *next; 726 727 TAILQ_FOREACH_SAFE(ifa, &ifp->if_addrhead, ifa_link, next) { 728 if (ifa->ifa_addr->sa_family == AF_LINK) 729 continue; 730 #ifdef INET 731 /* XXX: Ugly!! ad hoc just for INET */ 732 if (ifa->ifa_addr->sa_family == AF_INET) { 733 struct ifaliasreq ifr; 734 735 bzero(&ifr, sizeof(ifr)); 736 ifr.ifra_addr = *ifa->ifa_addr; 737 if (ifa->ifa_dstaddr) 738 ifr.ifra_broadaddr = *ifa->ifa_dstaddr; 739 if (in_control(NULL, SIOCDIFADDR, (caddr_t)&ifr, ifp, 740 NULL) == 0) 741 continue; 742 } 743 #endif /* INET */ 744 #ifdef INET6 745 if (ifa->ifa_addr->sa_family == AF_INET6) { 746 in6_purgeaddr(ifa); 747 /* ifp_addrhead is already updated */ 748 continue; 749 } 750 #endif /* INET6 */ 751 TAILQ_REMOVE(&ifp->if_addrhead, ifa, ifa_link); 752 ifa_free(ifa); 753 } 754 } 755 756 /* 757 * Remove any multicast network addresses from an interface when an ifnet 758 * is going away. 759 */ 760 static void 761 if_purgemaddrs(struct ifnet *ifp) 762 { 763 struct ifmultiaddr *ifma; 764 struct ifmultiaddr *next; 765 766 IF_ADDR_LOCK(ifp); 767 TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, next) 768 if_delmulti_locked(ifp, ifma, 1); 769 IF_ADDR_UNLOCK(ifp); 770 } 771 772 /* 773 * Detach an interface, removing it from the list of "active" interfaces. 774 * If vmove flag is set on entry to if_detach_internal(), perform only a 775 * limited subset of cleanup tasks, given that we are moving an ifnet from 776 * one vnet to another, where it must be fully operational. 777 * 778 * XXXRW: There are some significant questions about event ordering, and 779 * how to prevent things from starting to use the interface during detach. 780 */ 781 void 782 if_detach(struct ifnet *ifp) 783 { 784 785 if_detach_internal(ifp, 0); 786 } 787 788 static void 789 if_detach_internal(struct ifnet *ifp, int vmove) 790 { 791 struct ifaddr *ifa; 792 struct radix_node_head *rnh; 793 int i, j; 794 struct domain *dp; 795 struct ifnet *iter; 796 int found = 0; 797 798 IFNET_WLOCK(); 799 TAILQ_FOREACH(iter, &V_ifnet, if_link) 800 if (iter == ifp) { 801 TAILQ_REMOVE(&V_ifnet, ifp, if_link); 802 found = 1; 803 break; 804 } 805 #ifdef VIMAGE 806 if (found) 807 curvnet->vnet_ifcnt--; 808 #endif 809 IFNET_WUNLOCK(); 810 if (!found) { 811 if (vmove) 812 panic("interface not in it's own ifnet list"); 813 else 814 return; /* XXX this should panic as well? */ 815 } 816 817 /* 818 * Remove/wait for pending events. 819 */ 820 taskqueue_drain(taskqueue_swi, &ifp->if_linktask); 821 822 /* 823 * Remove routes and flush queues. 824 */ 825 if_down(ifp); 826 #ifdef ALTQ 827 if (ALTQ_IS_ENABLED(&ifp->if_snd)) 828 altq_disable(&ifp->if_snd); 829 if (ALTQ_IS_ATTACHED(&ifp->if_snd)) 830 altq_detach(&ifp->if_snd); 831 #endif 832 833 if_purgeaddrs(ifp); 834 835 #ifdef INET 836 in_ifdetach(ifp); 837 #endif 838 839 #ifdef INET6 840 /* 841 * Remove all IPv6 kernel structs related to ifp. This should be done 842 * before removing routing entries below, since IPv6 interface direct 843 * routes are expected to be removed by the IPv6-specific kernel API. 844 * Otherwise, the kernel will detect some inconsistency and bark it. 845 */ 846 in6_ifdetach(ifp); 847 #endif 848 if_purgemaddrs(ifp); 849 850 if (!vmove) { 851 /* 852 * Prevent further calls into the device driver via ifnet. 853 */ 854 if_dead(ifp); 855 856 /* 857 * Remove link ifaddr pointer and maybe decrement if_index. 858 * Clean up all addresses. 859 */ 860 ifp->if_addr = NULL; 861 862 /* We can now free link ifaddr. */ 863 if (!TAILQ_EMPTY(&ifp->if_addrhead)) { 864 ifa = TAILQ_FIRST(&ifp->if_addrhead); 865 TAILQ_REMOVE(&ifp->if_addrhead, ifa, ifa_link); 866 ifa_free(ifa); 867 } 868 } 869 870 /* 871 * Delete all remaining routes using this interface 872 * Unfortuneatly the only way to do this is to slog through 873 * the entire routing table looking for routes which point 874 * to this interface...oh well... 875 */ 876 for (i = 1; i <= AF_MAX; i++) { 877 for (j = 0; j < rt_numfibs; j++) { 878 rnh = rt_tables_get_rnh(j, i); 879 if (rnh == NULL) 880 continue; 881 RADIX_NODE_HEAD_LOCK(rnh); 882 (void) rnh->rnh_walktree(rnh, if_rtdel, ifp); 883 RADIX_NODE_HEAD_UNLOCK(rnh); 884 } 885 } 886 887 /* Announce that the interface is gone. */ 888 rt_ifannouncemsg(ifp, IFAN_DEPARTURE); 889 EVENTHANDLER_INVOKE(ifnet_departure_event, ifp); 890 if (IS_DEFAULT_VNET(curvnet)) 891 devctl_notify("IFNET", ifp->if_xname, "DETACH", NULL); 892 if_delgroups(ifp); 893 894 IF_AFDATA_LOCK(ifp); 895 for (dp = domains; dp; dp = dp->dom_next) { 896 if (dp->dom_ifdetach && ifp->if_afdata[dp->dom_family]) 897 (*dp->dom_ifdetach)(ifp, 898 ifp->if_afdata[dp->dom_family]); 899 } 900 ifp->if_afdata_initialized = 0; 901 IF_AFDATA_UNLOCK(ifp); 902 } 903 904 #ifdef VIMAGE 905 /* 906 * if_vmove() performs a limited version of if_detach() in current 907 * vnet and if_attach()es the ifnet to the vnet specified as 2nd arg. 908 * An attempt is made to shrink if_index in current vnet, find an 909 * unused if_index in target vnet and calls if_grow() if necessary, 910 * and finally find an unused if_xname for the target vnet. 911 */ 912 void 913 if_vmove(struct ifnet *ifp, struct vnet *new_vnet) 914 { 915 u_short idx; 916 917 /* 918 * Detach from current vnet, but preserve LLADDR info, do not 919 * mark as dead etc. so that the ifnet can be reattached later. 920 */ 921 if_detach_internal(ifp, 1); 922 923 /* 924 * Unlink the ifnet from ifindex_table[] in current vnet, and shrink 925 * the if_index for that vnet if possible. 926 * 927 * NOTE: IFNET_WLOCK/IFNET_WUNLOCK() are assumed to be unvirtualized, 928 * or we'd lock on one vnet and unlock on another. 929 */ 930 IFNET_WLOCK(); 931 ifindex_free_locked(ifp->if_index); 932 933 /* 934 * Switch to the context of the target vnet. 935 */ 936 CURVNET_SET_QUIET(new_vnet); 937 938 if (ifindex_alloc_locked(&idx) != 0) { 939 IFNET_WUNLOCK(); 940 panic("if_index overflow"); 941 } 942 ifp->if_index = idx; 943 ifnet_setbyindex_locked(ifp->if_index, ifp); 944 IFNET_WUNLOCK(); 945 946 if_attach_internal(ifp, 1); 947 948 CURVNET_RESTORE(); 949 } 950 951 /* 952 * Move an ifnet to or from another child prison/vnet, specified by the jail id. 953 */ 954 static int 955 if_vmove_loan(struct thread *td, struct ifnet *ifp, char *ifname, int jid) 956 { 957 struct prison *pr; 958 struct ifnet *difp; 959 960 /* Try to find the prison within our visibility. */ 961 sx_slock(&allprison_lock); 962 pr = prison_find_child(td->td_ucred->cr_prison, jid); 963 sx_sunlock(&allprison_lock); 964 if (pr == NULL) 965 return (ENXIO); 966 prison_hold_locked(pr); 967 mtx_unlock(&pr->pr_mtx); 968 969 /* Do not try to move the iface from and to the same prison. */ 970 if (pr->pr_vnet == ifp->if_vnet) { 971 prison_free(pr); 972 return (EEXIST); 973 } 974 975 /* Make sure the named iface does not exists in the dst. prison/vnet. */ 976 /* XXX Lock interfaces to avoid races. */ 977 CURVNET_SET_QUIET(pr->pr_vnet); 978 difp = ifunit(ifname); 979 CURVNET_RESTORE(); 980 if (difp != NULL) { 981 prison_free(pr); 982 return (EEXIST); 983 } 984 985 /* Move the interface into the child jail/vnet. */ 986 if_vmove(ifp, pr->pr_vnet); 987 988 /* Report the new if_xname back to the userland. */ 989 sprintf(ifname, "%s", ifp->if_xname); 990 991 prison_free(pr); 992 return (0); 993 } 994 995 static int 996 if_vmove_reclaim(struct thread *td, char *ifname, int jid) 997 { 998 struct prison *pr; 999 struct vnet *vnet_dst; 1000 struct ifnet *ifp; 1001 1002 /* Try to find the prison within our visibility. */ 1003 sx_slock(&allprison_lock); 1004 pr = prison_find_child(td->td_ucred->cr_prison, jid); 1005 sx_sunlock(&allprison_lock); 1006 if (pr == NULL) 1007 return (ENXIO); 1008 prison_hold_locked(pr); 1009 mtx_unlock(&pr->pr_mtx); 1010 1011 /* Make sure the named iface exists in the source prison/vnet. */ 1012 CURVNET_SET(pr->pr_vnet); 1013 ifp = ifunit(ifname); /* XXX Lock to avoid races. */ 1014 if (ifp == NULL) { 1015 CURVNET_RESTORE(); 1016 prison_free(pr); 1017 return (ENXIO); 1018 } 1019 1020 /* Do not try to move the iface from and to the same prison. */ 1021 vnet_dst = TD_TO_VNET(td); 1022 if (vnet_dst == ifp->if_vnet) { 1023 CURVNET_RESTORE(); 1024 prison_free(pr); 1025 return (EEXIST); 1026 } 1027 1028 /* Get interface back from child jail/vnet. */ 1029 if_vmove(ifp, vnet_dst); 1030 CURVNET_RESTORE(); 1031 1032 /* Report the new if_xname back to the userland. */ 1033 sprintf(ifname, "%s", ifp->if_xname); 1034 1035 prison_free(pr); 1036 return (0); 1037 } 1038 #endif /* VIMAGE */ 1039 1040 /* 1041 * Add a group to an interface 1042 */ 1043 int 1044 if_addgroup(struct ifnet *ifp, const char *groupname) 1045 { 1046 struct ifg_list *ifgl; 1047 struct ifg_group *ifg = NULL; 1048 struct ifg_member *ifgm; 1049 1050 if (groupname[0] && groupname[strlen(groupname) - 1] >= '0' && 1051 groupname[strlen(groupname) - 1] <= '9') 1052 return (EINVAL); 1053 1054 IFNET_WLOCK(); 1055 TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next) 1056 if (!strcmp(ifgl->ifgl_group->ifg_group, groupname)) { 1057 IFNET_WUNLOCK(); 1058 return (EEXIST); 1059 } 1060 1061 if ((ifgl = (struct ifg_list *)malloc(sizeof(struct ifg_list), M_TEMP, 1062 M_NOWAIT)) == NULL) { 1063 IFNET_WUNLOCK(); 1064 return (ENOMEM); 1065 } 1066 1067 if ((ifgm = (struct ifg_member *)malloc(sizeof(struct ifg_member), 1068 M_TEMP, M_NOWAIT)) == NULL) { 1069 free(ifgl, M_TEMP); 1070 IFNET_WUNLOCK(); 1071 return (ENOMEM); 1072 } 1073 1074 TAILQ_FOREACH(ifg, &V_ifg_head, ifg_next) 1075 if (!strcmp(ifg->ifg_group, groupname)) 1076 break; 1077 1078 if (ifg == NULL) { 1079 if ((ifg = (struct ifg_group *)malloc(sizeof(struct ifg_group), 1080 M_TEMP, M_NOWAIT)) == NULL) { 1081 free(ifgl, M_TEMP); 1082 free(ifgm, M_TEMP); 1083 IFNET_WUNLOCK(); 1084 return (ENOMEM); 1085 } 1086 strlcpy(ifg->ifg_group, groupname, sizeof(ifg->ifg_group)); 1087 ifg->ifg_refcnt = 0; 1088 TAILQ_INIT(&ifg->ifg_members); 1089 EVENTHANDLER_INVOKE(group_attach_event, ifg); 1090 TAILQ_INSERT_TAIL(&V_ifg_head, ifg, ifg_next); 1091 } 1092 1093 ifg->ifg_refcnt++; 1094 ifgl->ifgl_group = ifg; 1095 ifgm->ifgm_ifp = ifp; 1096 1097 IF_ADDR_LOCK(ifp); 1098 TAILQ_INSERT_TAIL(&ifg->ifg_members, ifgm, ifgm_next); 1099 TAILQ_INSERT_TAIL(&ifp->if_groups, ifgl, ifgl_next); 1100 IF_ADDR_UNLOCK(ifp); 1101 1102 IFNET_WUNLOCK(); 1103 1104 EVENTHANDLER_INVOKE(group_change_event, groupname); 1105 1106 return (0); 1107 } 1108 1109 /* 1110 * Remove a group from an interface 1111 */ 1112 int 1113 if_delgroup(struct ifnet *ifp, const char *groupname) 1114 { 1115 struct ifg_list *ifgl; 1116 struct ifg_member *ifgm; 1117 1118 IFNET_WLOCK(); 1119 TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next) 1120 if (!strcmp(ifgl->ifgl_group->ifg_group, groupname)) 1121 break; 1122 if (ifgl == NULL) { 1123 IFNET_WUNLOCK(); 1124 return (ENOENT); 1125 } 1126 1127 IF_ADDR_LOCK(ifp); 1128 TAILQ_REMOVE(&ifp->if_groups, ifgl, ifgl_next); 1129 IF_ADDR_UNLOCK(ifp); 1130 1131 TAILQ_FOREACH(ifgm, &ifgl->ifgl_group->ifg_members, ifgm_next) 1132 if (ifgm->ifgm_ifp == ifp) 1133 break; 1134 1135 if (ifgm != NULL) { 1136 TAILQ_REMOVE(&ifgl->ifgl_group->ifg_members, ifgm, ifgm_next); 1137 free(ifgm, M_TEMP); 1138 } 1139 1140 if (--ifgl->ifgl_group->ifg_refcnt == 0) { 1141 TAILQ_REMOVE(&V_ifg_head, ifgl->ifgl_group, ifg_next); 1142 EVENTHANDLER_INVOKE(group_detach_event, ifgl->ifgl_group); 1143 free(ifgl->ifgl_group, M_TEMP); 1144 } 1145 IFNET_WUNLOCK(); 1146 1147 free(ifgl, M_TEMP); 1148 1149 EVENTHANDLER_INVOKE(group_change_event, groupname); 1150 1151 return (0); 1152 } 1153 1154 /* 1155 * Remove an interface from all groups 1156 */ 1157 static void 1158 if_delgroups(struct ifnet *ifp) 1159 { 1160 struct ifg_list *ifgl; 1161 struct ifg_member *ifgm; 1162 char groupname[IFNAMSIZ]; 1163 1164 IFNET_WLOCK(); 1165 while (!TAILQ_EMPTY(&ifp->if_groups)) { 1166 ifgl = TAILQ_FIRST(&ifp->if_groups); 1167 1168 strlcpy(groupname, ifgl->ifgl_group->ifg_group, IFNAMSIZ); 1169 1170 IF_ADDR_LOCK(ifp); 1171 TAILQ_REMOVE(&ifp->if_groups, ifgl, ifgl_next); 1172 IF_ADDR_UNLOCK(ifp); 1173 1174 TAILQ_FOREACH(ifgm, &ifgl->ifgl_group->ifg_members, ifgm_next) 1175 if (ifgm->ifgm_ifp == ifp) 1176 break; 1177 1178 if (ifgm != NULL) { 1179 TAILQ_REMOVE(&ifgl->ifgl_group->ifg_members, ifgm, 1180 ifgm_next); 1181 free(ifgm, M_TEMP); 1182 } 1183 1184 if (--ifgl->ifgl_group->ifg_refcnt == 0) { 1185 TAILQ_REMOVE(&V_ifg_head, ifgl->ifgl_group, ifg_next); 1186 EVENTHANDLER_INVOKE(group_detach_event, 1187 ifgl->ifgl_group); 1188 free(ifgl->ifgl_group, M_TEMP); 1189 } 1190 IFNET_WUNLOCK(); 1191 1192 free(ifgl, M_TEMP); 1193 1194 EVENTHANDLER_INVOKE(group_change_event, groupname); 1195 1196 IFNET_WLOCK(); 1197 } 1198 IFNET_WUNLOCK(); 1199 } 1200 1201 /* 1202 * Stores all groups from an interface in memory pointed 1203 * to by data 1204 */ 1205 static int 1206 if_getgroup(struct ifgroupreq *data, struct ifnet *ifp) 1207 { 1208 int len, error; 1209 struct ifg_list *ifgl; 1210 struct ifg_req ifgrq, *ifgp; 1211 struct ifgroupreq *ifgr = data; 1212 1213 if (ifgr->ifgr_len == 0) { 1214 IF_ADDR_LOCK(ifp); 1215 TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next) 1216 ifgr->ifgr_len += sizeof(struct ifg_req); 1217 IF_ADDR_UNLOCK(ifp); 1218 return (0); 1219 } 1220 1221 len = ifgr->ifgr_len; 1222 ifgp = ifgr->ifgr_groups; 1223 /* XXX: wire */ 1224 IF_ADDR_LOCK(ifp); 1225 TAILQ_FOREACH(ifgl, &ifp->if_groups, ifgl_next) { 1226 if (len < sizeof(ifgrq)) { 1227 IF_ADDR_UNLOCK(ifp); 1228 return (EINVAL); 1229 } 1230 bzero(&ifgrq, sizeof ifgrq); 1231 strlcpy(ifgrq.ifgrq_group, ifgl->ifgl_group->ifg_group, 1232 sizeof(ifgrq.ifgrq_group)); 1233 if ((error = copyout(&ifgrq, ifgp, sizeof(struct ifg_req)))) { 1234 IF_ADDR_UNLOCK(ifp); 1235 return (error); 1236 } 1237 len -= sizeof(ifgrq); 1238 ifgp++; 1239 } 1240 IF_ADDR_UNLOCK(ifp); 1241 1242 return (0); 1243 } 1244 1245 /* 1246 * Stores all members of a group in memory pointed to by data 1247 */ 1248 static int 1249 if_getgroupmembers(struct ifgroupreq *data) 1250 { 1251 struct ifgroupreq *ifgr = data; 1252 struct ifg_group *ifg; 1253 struct ifg_member *ifgm; 1254 struct ifg_req ifgrq, *ifgp; 1255 int len, error; 1256 1257 IFNET_RLOCK(); 1258 TAILQ_FOREACH(ifg, &V_ifg_head, ifg_next) 1259 if (!strcmp(ifg->ifg_group, ifgr->ifgr_name)) 1260 break; 1261 if (ifg == NULL) { 1262 IFNET_RUNLOCK(); 1263 return (ENOENT); 1264 } 1265 1266 if (ifgr->ifgr_len == 0) { 1267 TAILQ_FOREACH(ifgm, &ifg->ifg_members, ifgm_next) 1268 ifgr->ifgr_len += sizeof(ifgrq); 1269 IFNET_RUNLOCK(); 1270 return (0); 1271 } 1272 1273 len = ifgr->ifgr_len; 1274 ifgp = ifgr->ifgr_groups; 1275 TAILQ_FOREACH(ifgm, &ifg->ifg_members, ifgm_next) { 1276 if (len < sizeof(ifgrq)) { 1277 IFNET_RUNLOCK(); 1278 return (EINVAL); 1279 } 1280 bzero(&ifgrq, sizeof ifgrq); 1281 strlcpy(ifgrq.ifgrq_member, ifgm->ifgm_ifp->if_xname, 1282 sizeof(ifgrq.ifgrq_member)); 1283 if ((error = copyout(&ifgrq, ifgp, sizeof(struct ifg_req)))) { 1284 IFNET_RUNLOCK(); 1285 return (error); 1286 } 1287 len -= sizeof(ifgrq); 1288 ifgp++; 1289 } 1290 IFNET_RUNLOCK(); 1291 1292 return (0); 1293 } 1294 1295 /* 1296 * Delete Routes for a Network Interface 1297 * 1298 * Called for each routing entry via the rnh->rnh_walktree() call above 1299 * to delete all route entries referencing a detaching network interface. 1300 * 1301 * Arguments: 1302 * rn pointer to node in the routing table 1303 * arg argument passed to rnh->rnh_walktree() - detaching interface 1304 * 1305 * Returns: 1306 * 0 successful 1307 * errno failed - reason indicated 1308 * 1309 */ 1310 static int 1311 if_rtdel(struct radix_node *rn, void *arg) 1312 { 1313 struct rtentry *rt = (struct rtentry *)rn; 1314 struct ifnet *ifp = arg; 1315 int err; 1316 1317 if (rt->rt_ifp == ifp) { 1318 1319 /* 1320 * Protect (sorta) against walktree recursion problems 1321 * with cloned routes 1322 */ 1323 if ((rt->rt_flags & RTF_UP) == 0) 1324 return (0); 1325 1326 err = rtrequest_fib(RTM_DELETE, rt_key(rt), rt->rt_gateway, 1327 rt_mask(rt), rt->rt_flags|RTF_RNH_LOCKED, 1328 (struct rtentry **) NULL, rt->rt_fibnum); 1329 if (err) { 1330 log(LOG_WARNING, "if_rtdel: error %d\n", err); 1331 } 1332 } 1333 1334 return (0); 1335 } 1336 1337 /* 1338 * Wrapper functions for struct ifnet address list locking macros. These are 1339 * used by kernel modules to avoid encoding programming interface or binary 1340 * interface assumptions that may be violated when kernel-internal locking 1341 * approaches change. 1342 */ 1343 void 1344 if_addr_rlock(struct ifnet *ifp) 1345 { 1346 1347 IF_ADDR_LOCK(ifp); 1348 } 1349 1350 void 1351 if_addr_runlock(struct ifnet *ifp) 1352 { 1353 1354 IF_ADDR_UNLOCK(ifp); 1355 } 1356 1357 void 1358 if_maddr_rlock(struct ifnet *ifp) 1359 { 1360 1361 IF_ADDR_LOCK(ifp); 1362 } 1363 1364 void 1365 if_maddr_runlock(struct ifnet *ifp) 1366 { 1367 1368 IF_ADDR_UNLOCK(ifp); 1369 } 1370 1371 /* 1372 * Reference count functions for ifaddrs. 1373 */ 1374 void 1375 ifa_init(struct ifaddr *ifa) 1376 { 1377 1378 mtx_init(&ifa->ifa_mtx, "ifaddr", NULL, MTX_DEF); 1379 refcount_init(&ifa->ifa_refcnt, 1); 1380 } 1381 1382 void 1383 ifa_ref(struct ifaddr *ifa) 1384 { 1385 1386 refcount_acquire(&ifa->ifa_refcnt); 1387 } 1388 1389 void 1390 ifa_free(struct ifaddr *ifa) 1391 { 1392 1393 if (refcount_release(&ifa->ifa_refcnt)) { 1394 mtx_destroy(&ifa->ifa_mtx); 1395 free(ifa, M_IFADDR); 1396 } 1397 } 1398 1399 int 1400 ifa_add_loopback_route(struct ifaddr *ifa, struct sockaddr *ia) 1401 { 1402 int error = 0; 1403 struct rtentry *rt = NULL; 1404 struct rt_addrinfo info; 1405 static struct sockaddr_dl null_sdl = {sizeof(null_sdl), AF_LINK}; 1406 1407 bzero(&info, sizeof(info)); 1408 info.rti_ifp = V_loif; 1409 info.rti_flags = ifa->ifa_flags | RTF_HOST | RTF_STATIC; 1410 info.rti_info[RTAX_DST] = ia; 1411 info.rti_info[RTAX_GATEWAY] = (struct sockaddr *)&null_sdl; 1412 error = rtrequest1_fib(RTM_ADD, &info, &rt, 0); 1413 1414 if (error == 0 && rt != NULL) { 1415 RT_LOCK(rt); 1416 ((struct sockaddr_dl *)rt->rt_gateway)->sdl_type = 1417 ifa->ifa_ifp->if_type; 1418 ((struct sockaddr_dl *)rt->rt_gateway)->sdl_index = 1419 ifa->ifa_ifp->if_index; 1420 RT_REMREF(rt); 1421 RT_UNLOCK(rt); 1422 } else if (error != 0) 1423 log(LOG_INFO, "ifa_add_loopback_route: insertion failed\n"); 1424 1425 return (error); 1426 } 1427 1428 int 1429 ifa_del_loopback_route(struct ifaddr *ifa, struct sockaddr *ia) 1430 { 1431 int error = 0; 1432 struct rt_addrinfo info; 1433 struct sockaddr_dl null_sdl; 1434 1435 bzero(&null_sdl, sizeof(null_sdl)); 1436 null_sdl.sdl_len = sizeof(null_sdl); 1437 null_sdl.sdl_family = AF_LINK; 1438 null_sdl.sdl_type = ifa->ifa_ifp->if_type; 1439 null_sdl.sdl_index = ifa->ifa_ifp->if_index; 1440 bzero(&info, sizeof(info)); 1441 info.rti_flags = ifa->ifa_flags | RTF_HOST | RTF_STATIC; 1442 info.rti_info[RTAX_DST] = ia; 1443 info.rti_info[RTAX_GATEWAY] = (struct sockaddr *)&null_sdl; 1444 error = rtrequest1_fib(RTM_DELETE, &info, NULL, 0); 1445 1446 if (error != 0) 1447 log(LOG_INFO, "ifa_del_loopback_route: deletion failed\n"); 1448 1449 return (error); 1450 } 1451 1452 /* 1453 * XXX: Because sockaddr_dl has deeper structure than the sockaddr 1454 * structs used to represent other address families, it is necessary 1455 * to perform a different comparison. 1456 */ 1457 1458 #define sa_equal(a1, a2) \ 1459 (bcmp((a1), (a2), ((a1))->sa_len) == 0) 1460 1461 #define sa_dl_equal(a1, a2) \ 1462 ((((struct sockaddr_dl *)(a1))->sdl_len == \ 1463 ((struct sockaddr_dl *)(a2))->sdl_len) && \ 1464 (bcmp(LLADDR((struct sockaddr_dl *)(a1)), \ 1465 LLADDR((struct sockaddr_dl *)(a2)), \ 1466 ((struct sockaddr_dl *)(a1))->sdl_alen) == 0)) 1467 1468 /* 1469 * Locate an interface based on a complete address. 1470 */ 1471 /*ARGSUSED*/ 1472 static struct ifaddr * 1473 ifa_ifwithaddr_internal(struct sockaddr *addr, int getref) 1474 { 1475 struct ifnet *ifp; 1476 struct ifaddr *ifa; 1477 1478 IFNET_RLOCK_NOSLEEP(); 1479 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 1480 IF_ADDR_LOCK(ifp); 1481 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 1482 if (ifa->ifa_addr->sa_family != addr->sa_family) 1483 continue; 1484 if (sa_equal(addr, ifa->ifa_addr)) { 1485 if (getref) 1486 ifa_ref(ifa); 1487 IF_ADDR_UNLOCK(ifp); 1488 goto done; 1489 } 1490 /* IP6 doesn't have broadcast */ 1491 if ((ifp->if_flags & IFF_BROADCAST) && 1492 ifa->ifa_broadaddr && 1493 ifa->ifa_broadaddr->sa_len != 0 && 1494 sa_equal(ifa->ifa_broadaddr, addr)) { 1495 if (getref) 1496 ifa_ref(ifa); 1497 IF_ADDR_UNLOCK(ifp); 1498 goto done; 1499 } 1500 } 1501 IF_ADDR_UNLOCK(ifp); 1502 } 1503 ifa = NULL; 1504 done: 1505 IFNET_RUNLOCK_NOSLEEP(); 1506 return (ifa); 1507 } 1508 1509 struct ifaddr * 1510 ifa_ifwithaddr(struct sockaddr *addr) 1511 { 1512 1513 return (ifa_ifwithaddr_internal(addr, 1)); 1514 } 1515 1516 int 1517 ifa_ifwithaddr_check(struct sockaddr *addr) 1518 { 1519 1520 return (ifa_ifwithaddr_internal(addr, 0) != NULL); 1521 } 1522 1523 /* 1524 * Locate an interface based on the broadcast address. 1525 */ 1526 /* ARGSUSED */ 1527 struct ifaddr * 1528 ifa_ifwithbroadaddr(struct sockaddr *addr) 1529 { 1530 struct ifnet *ifp; 1531 struct ifaddr *ifa; 1532 1533 IFNET_RLOCK_NOSLEEP(); 1534 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 1535 IF_ADDR_LOCK(ifp); 1536 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 1537 if (ifa->ifa_addr->sa_family != addr->sa_family) 1538 continue; 1539 if ((ifp->if_flags & IFF_BROADCAST) && 1540 ifa->ifa_broadaddr && 1541 ifa->ifa_broadaddr->sa_len != 0 && 1542 sa_equal(ifa->ifa_broadaddr, addr)) { 1543 ifa_ref(ifa); 1544 IF_ADDR_UNLOCK(ifp); 1545 goto done; 1546 } 1547 } 1548 IF_ADDR_UNLOCK(ifp); 1549 } 1550 ifa = NULL; 1551 done: 1552 IFNET_RUNLOCK_NOSLEEP(); 1553 return (ifa); 1554 } 1555 1556 /* 1557 * Locate the point to point interface with a given destination address. 1558 */ 1559 /*ARGSUSED*/ 1560 struct ifaddr * 1561 ifa_ifwithdstaddr(struct sockaddr *addr) 1562 { 1563 struct ifnet *ifp; 1564 struct ifaddr *ifa; 1565 1566 IFNET_RLOCK_NOSLEEP(); 1567 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 1568 if ((ifp->if_flags & IFF_POINTOPOINT) == 0) 1569 continue; 1570 IF_ADDR_LOCK(ifp); 1571 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 1572 if (ifa->ifa_addr->sa_family != addr->sa_family) 1573 continue; 1574 if (ifa->ifa_dstaddr != NULL && 1575 sa_equal(addr, ifa->ifa_dstaddr)) { 1576 ifa_ref(ifa); 1577 IF_ADDR_UNLOCK(ifp); 1578 goto done; 1579 } 1580 } 1581 IF_ADDR_UNLOCK(ifp); 1582 } 1583 ifa = NULL; 1584 done: 1585 IFNET_RUNLOCK_NOSLEEP(); 1586 return (ifa); 1587 } 1588 1589 /* 1590 * Find an interface on a specific network. If many, choice 1591 * is most specific found. 1592 */ 1593 struct ifaddr * 1594 ifa_ifwithnet(struct sockaddr *addr) 1595 { 1596 struct ifnet *ifp; 1597 struct ifaddr *ifa; 1598 struct ifaddr *ifa_maybe = NULL; 1599 u_int af = addr->sa_family; 1600 char *addr_data = addr->sa_data, *cplim; 1601 1602 /* 1603 * AF_LINK addresses can be looked up directly by their index number, 1604 * so do that if we can. 1605 */ 1606 if (af == AF_LINK) { 1607 struct sockaddr_dl *sdl = (struct sockaddr_dl *)addr; 1608 if (sdl->sdl_index && sdl->sdl_index <= V_if_index) 1609 return (ifaddr_byindex(sdl->sdl_index)); 1610 } 1611 1612 /* 1613 * Scan though each interface, looking for ones that have addresses 1614 * in this address family. Maintain a reference on ifa_maybe once 1615 * we find one, as we release the IF_ADDR_LOCK() that kept it stable 1616 * when we move onto the next interface. 1617 */ 1618 IFNET_RLOCK_NOSLEEP(); 1619 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 1620 IF_ADDR_LOCK(ifp); 1621 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 1622 char *cp, *cp2, *cp3; 1623 1624 if (ifa->ifa_addr->sa_family != af) 1625 next: continue; 1626 if (af == AF_INET && ifp->if_flags & IFF_POINTOPOINT) { 1627 /* 1628 * This is a bit broken as it doesn't 1629 * take into account that the remote end may 1630 * be a single node in the network we are 1631 * looking for. 1632 * The trouble is that we don't know the 1633 * netmask for the remote end. 1634 */ 1635 if (ifa->ifa_dstaddr != NULL && 1636 sa_equal(addr, ifa->ifa_dstaddr)) { 1637 ifa_ref(ifa); 1638 IF_ADDR_UNLOCK(ifp); 1639 goto done; 1640 } 1641 } else { 1642 /* 1643 * if we have a special address handler, 1644 * then use it instead of the generic one. 1645 */ 1646 if (ifa->ifa_claim_addr) { 1647 if ((*ifa->ifa_claim_addr)(ifa, addr)) { 1648 ifa_ref(ifa); 1649 IF_ADDR_UNLOCK(ifp); 1650 goto done; 1651 } 1652 continue; 1653 } 1654 1655 /* 1656 * Scan all the bits in the ifa's address. 1657 * If a bit dissagrees with what we are 1658 * looking for, mask it with the netmask 1659 * to see if it really matters. 1660 * (A byte at a time) 1661 */ 1662 if (ifa->ifa_netmask == 0) 1663 continue; 1664 cp = addr_data; 1665 cp2 = ifa->ifa_addr->sa_data; 1666 cp3 = ifa->ifa_netmask->sa_data; 1667 cplim = ifa->ifa_netmask->sa_len 1668 + (char *)ifa->ifa_netmask; 1669 while (cp3 < cplim) 1670 if ((*cp++ ^ *cp2++) & *cp3++) 1671 goto next; /* next address! */ 1672 /* 1673 * If the netmask of what we just found 1674 * is more specific than what we had before 1675 * (if we had one) then remember the new one 1676 * before continuing to search 1677 * for an even better one. 1678 */ 1679 if (ifa_maybe == NULL || 1680 rn_refines((caddr_t)ifa->ifa_netmask, 1681 (caddr_t)ifa_maybe->ifa_netmask)) { 1682 if (ifa_maybe != NULL) 1683 ifa_free(ifa_maybe); 1684 ifa_maybe = ifa; 1685 ifa_ref(ifa_maybe); 1686 } 1687 } 1688 } 1689 IF_ADDR_UNLOCK(ifp); 1690 } 1691 ifa = ifa_maybe; 1692 ifa_maybe = NULL; 1693 done: 1694 IFNET_RUNLOCK_NOSLEEP(); 1695 if (ifa_maybe != NULL) 1696 ifa_free(ifa_maybe); 1697 return (ifa); 1698 } 1699 1700 /* 1701 * Find an interface address specific to an interface best matching 1702 * a given address. 1703 */ 1704 struct ifaddr * 1705 ifaof_ifpforaddr(struct sockaddr *addr, struct ifnet *ifp) 1706 { 1707 struct ifaddr *ifa; 1708 char *cp, *cp2, *cp3; 1709 char *cplim; 1710 struct ifaddr *ifa_maybe = NULL; 1711 u_int af = addr->sa_family; 1712 1713 if (af >= AF_MAX) 1714 return (0); 1715 IF_ADDR_LOCK(ifp); 1716 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 1717 if (ifa->ifa_addr->sa_family != af) 1718 continue; 1719 if (ifa_maybe == NULL) 1720 ifa_maybe = ifa; 1721 if (ifa->ifa_netmask == 0) { 1722 if (sa_equal(addr, ifa->ifa_addr) || 1723 (ifa->ifa_dstaddr && 1724 sa_equal(addr, ifa->ifa_dstaddr))) 1725 goto done; 1726 continue; 1727 } 1728 if (ifp->if_flags & IFF_POINTOPOINT) { 1729 if (sa_equal(addr, ifa->ifa_dstaddr)) 1730 goto done; 1731 } else { 1732 cp = addr->sa_data; 1733 cp2 = ifa->ifa_addr->sa_data; 1734 cp3 = ifa->ifa_netmask->sa_data; 1735 cplim = ifa->ifa_netmask->sa_len + (char *)ifa->ifa_netmask; 1736 for (; cp3 < cplim; cp3++) 1737 if ((*cp++ ^ *cp2++) & *cp3) 1738 break; 1739 if (cp3 == cplim) 1740 goto done; 1741 } 1742 } 1743 ifa = ifa_maybe; 1744 done: 1745 if (ifa != NULL) 1746 ifa_ref(ifa); 1747 IF_ADDR_UNLOCK(ifp); 1748 return (ifa); 1749 } 1750 1751 #include <net/if_llatbl.h> 1752 1753 /* 1754 * Default action when installing a route with a Link Level gateway. 1755 * Lookup an appropriate real ifa to point to. 1756 * This should be moved to /sys/net/link.c eventually. 1757 */ 1758 static void 1759 link_rtrequest(int cmd, struct rtentry *rt, struct rt_addrinfo *info) 1760 { 1761 struct ifaddr *ifa, *oifa; 1762 struct sockaddr *dst; 1763 struct ifnet *ifp; 1764 1765 RT_LOCK_ASSERT(rt); 1766 1767 if (cmd != RTM_ADD || ((ifa = rt->rt_ifa) == 0) || 1768 ((ifp = ifa->ifa_ifp) == 0) || ((dst = rt_key(rt)) == 0)) 1769 return; 1770 ifa = ifaof_ifpforaddr(dst, ifp); 1771 if (ifa) { 1772 oifa = rt->rt_ifa; 1773 rt->rt_ifa = ifa; 1774 ifa_free(oifa); 1775 if (ifa->ifa_rtrequest && ifa->ifa_rtrequest != link_rtrequest) 1776 ifa->ifa_rtrequest(cmd, rt, info); 1777 } 1778 } 1779 1780 /* 1781 * Mark an interface down and notify protocols of 1782 * the transition. 1783 * NOTE: must be called at splnet or eqivalent. 1784 */ 1785 static void 1786 if_unroute(struct ifnet *ifp, int flag, int fam) 1787 { 1788 struct ifaddr *ifa; 1789 1790 KASSERT(flag == IFF_UP, ("if_unroute: flag != IFF_UP")); 1791 1792 ifp->if_flags &= ~flag; 1793 getmicrotime(&ifp->if_lastchange); 1794 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) 1795 if (fam == PF_UNSPEC || (fam == ifa->ifa_addr->sa_family)) 1796 pfctlinput(PRC_IFDOWN, ifa->ifa_addr); 1797 ifp->if_qflush(ifp); 1798 1799 #if defined(INET) || defined(INET6) 1800 #ifdef DEV_CARP 1801 if (ifp->if_carp) 1802 carp_carpdev_state(ifp->if_carp); 1803 #endif 1804 #endif 1805 rt_ifmsg(ifp); 1806 } 1807 1808 /* 1809 * Mark an interface up and notify protocols of 1810 * the transition. 1811 * NOTE: must be called at splnet or eqivalent. 1812 */ 1813 static void 1814 if_route(struct ifnet *ifp, int flag, int fam) 1815 { 1816 struct ifaddr *ifa; 1817 1818 KASSERT(flag == IFF_UP, ("if_route: flag != IFF_UP")); 1819 1820 ifp->if_flags |= flag; 1821 getmicrotime(&ifp->if_lastchange); 1822 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) 1823 if (fam == PF_UNSPEC || (fam == ifa->ifa_addr->sa_family)) 1824 pfctlinput(PRC_IFUP, ifa->ifa_addr); 1825 #if defined(INET) || defined(INET6) 1826 #ifdef DEV_CARP 1827 if (ifp->if_carp) 1828 carp_carpdev_state(ifp->if_carp); 1829 #endif 1830 #endif 1831 rt_ifmsg(ifp); 1832 #ifdef INET6 1833 in6_if_up(ifp); 1834 #endif 1835 } 1836 1837 void (*vlan_link_state_p)(struct ifnet *); /* XXX: private from if_vlan */ 1838 void (*vlan_trunk_cap_p)(struct ifnet *); /* XXX: private from if_vlan */ 1839 1840 /* 1841 * Handle a change in the interface link state. To avoid LORs 1842 * between driver lock and upper layer locks, as well as possible 1843 * recursions, we post event to taskqueue, and all job 1844 * is done in static do_link_state_change(). 1845 */ 1846 void 1847 if_link_state_change(struct ifnet *ifp, int link_state) 1848 { 1849 /* Return if state hasn't changed. */ 1850 if (ifp->if_link_state == link_state) 1851 return; 1852 1853 ifp->if_link_state = link_state; 1854 1855 taskqueue_enqueue(taskqueue_swi, &ifp->if_linktask); 1856 } 1857 1858 static void 1859 do_link_state_change(void *arg, int pending) 1860 { 1861 struct ifnet *ifp = (struct ifnet *)arg; 1862 int link_state = ifp->if_link_state; 1863 CURVNET_SET(ifp->if_vnet); 1864 1865 /* Notify that the link state has changed. */ 1866 rt_ifmsg(ifp); 1867 if (ifp->if_vlantrunk != NULL) 1868 (*vlan_link_state_p)(ifp); 1869 1870 if ((ifp->if_type == IFT_ETHER || ifp->if_type == IFT_L2VLAN) && 1871 IFP2AC(ifp)->ac_netgraph != NULL) 1872 (*ng_ether_link_state_p)(ifp, link_state); 1873 #if defined(INET) || defined(INET6) 1874 #ifdef DEV_CARP 1875 if (ifp->if_carp) 1876 carp_carpdev_state(ifp->if_carp); 1877 #endif 1878 #endif 1879 if (ifp->if_bridge) { 1880 KASSERT(bstp_linkstate_p != NULL,("if_bridge bstp not loaded!")); 1881 (*bstp_linkstate_p)(ifp, link_state); 1882 } 1883 if (ifp->if_lagg) { 1884 KASSERT(lagg_linkstate_p != NULL,("if_lagg not loaded!")); 1885 (*lagg_linkstate_p)(ifp, link_state); 1886 } 1887 1888 if (IS_DEFAULT_VNET(curvnet)) 1889 devctl_notify("IFNET", ifp->if_xname, 1890 (link_state == LINK_STATE_UP) ? "LINK_UP" : "LINK_DOWN", 1891 NULL); 1892 if (pending > 1) 1893 if_printf(ifp, "%d link states coalesced\n", pending); 1894 if (log_link_state_change) 1895 log(LOG_NOTICE, "%s: link state changed to %s\n", ifp->if_xname, 1896 (link_state == LINK_STATE_UP) ? "UP" : "DOWN" ); 1897 CURVNET_RESTORE(); 1898 } 1899 1900 /* 1901 * Mark an interface down and notify protocols of 1902 * the transition. 1903 * NOTE: must be called at splnet or eqivalent. 1904 */ 1905 void 1906 if_down(struct ifnet *ifp) 1907 { 1908 1909 if_unroute(ifp, IFF_UP, AF_UNSPEC); 1910 } 1911 1912 /* 1913 * Mark an interface up and notify protocols of 1914 * the transition. 1915 * NOTE: must be called at splnet or eqivalent. 1916 */ 1917 void 1918 if_up(struct ifnet *ifp) 1919 { 1920 1921 if_route(ifp, IFF_UP, AF_UNSPEC); 1922 } 1923 1924 /* 1925 * Flush an interface queue. 1926 */ 1927 void 1928 if_qflush(struct ifnet *ifp) 1929 { 1930 struct mbuf *m, *n; 1931 struct ifaltq *ifq; 1932 1933 ifq = &ifp->if_snd; 1934 IFQ_LOCK(ifq); 1935 #ifdef ALTQ 1936 if (ALTQ_IS_ENABLED(ifq)) 1937 ALTQ_PURGE(ifq); 1938 #endif 1939 n = ifq->ifq_head; 1940 while ((m = n) != 0) { 1941 n = m->m_act; 1942 m_freem(m); 1943 } 1944 ifq->ifq_head = 0; 1945 ifq->ifq_tail = 0; 1946 ifq->ifq_len = 0; 1947 IFQ_UNLOCK(ifq); 1948 } 1949 1950 /* 1951 * Map interface name to interface structure pointer, with or without 1952 * returning a reference. 1953 */ 1954 struct ifnet * 1955 ifunit_ref(const char *name) 1956 { 1957 struct ifnet *ifp; 1958 1959 IFNET_RLOCK_NOSLEEP(); 1960 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 1961 if (strncmp(name, ifp->if_xname, IFNAMSIZ) == 0 && 1962 !(ifp->if_flags & IFF_DYING)) 1963 break; 1964 } 1965 if (ifp != NULL) 1966 if_ref(ifp); 1967 IFNET_RUNLOCK_NOSLEEP(); 1968 return (ifp); 1969 } 1970 1971 struct ifnet * 1972 ifunit(const char *name) 1973 { 1974 struct ifnet *ifp; 1975 1976 IFNET_RLOCK_NOSLEEP(); 1977 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 1978 if (strncmp(name, ifp->if_xname, IFNAMSIZ) == 0) 1979 break; 1980 } 1981 IFNET_RUNLOCK_NOSLEEP(); 1982 return (ifp); 1983 } 1984 1985 /* 1986 * Hardware specific interface ioctls. 1987 */ 1988 static int 1989 ifhwioctl(u_long cmd, struct ifnet *ifp, caddr_t data, struct thread *td) 1990 { 1991 struct ifreq *ifr; 1992 struct ifstat *ifs; 1993 int error = 0; 1994 int new_flags, temp_flags; 1995 size_t namelen, onamelen; 1996 size_t descrlen; 1997 char *descrbuf, *odescrbuf; 1998 char new_name[IFNAMSIZ]; 1999 struct ifaddr *ifa; 2000 struct sockaddr_dl *sdl; 2001 2002 ifr = (struct ifreq *)data; 2003 switch (cmd) { 2004 case SIOCGIFINDEX: 2005 ifr->ifr_index = ifp->if_index; 2006 break; 2007 2008 case SIOCGIFFLAGS: 2009 temp_flags = ifp->if_flags | ifp->if_drv_flags; 2010 ifr->ifr_flags = temp_flags & 0xffff; 2011 ifr->ifr_flagshigh = temp_flags >> 16; 2012 break; 2013 2014 case SIOCGIFCAP: 2015 ifr->ifr_reqcap = ifp->if_capabilities; 2016 ifr->ifr_curcap = ifp->if_capenable; 2017 break; 2018 2019 #ifdef MAC 2020 case SIOCGIFMAC: 2021 error = mac_ifnet_ioctl_get(td->td_ucred, ifr, ifp); 2022 break; 2023 #endif 2024 2025 case SIOCGIFMETRIC: 2026 ifr->ifr_metric = ifp->if_metric; 2027 break; 2028 2029 case SIOCGIFMTU: 2030 ifr->ifr_mtu = ifp->if_mtu; 2031 break; 2032 2033 case SIOCGIFPHYS: 2034 ifr->ifr_phys = ifp->if_physical; 2035 break; 2036 2037 case SIOCGIFDESCR: 2038 error = 0; 2039 sx_slock(&ifdescr_sx); 2040 if (ifp->if_description == NULL) { 2041 ifr->ifr_buffer.length = 0; 2042 error = ENOMSG; 2043 } else { 2044 /* space for terminating nul */ 2045 descrlen = strlen(ifp->if_description) + 1; 2046 if (ifr->ifr_buffer.length < descrlen) 2047 error = ENAMETOOLONG; 2048 else 2049 error = copyout(ifp->if_description, 2050 ifr->ifr_buffer.buffer, descrlen); 2051 ifr->ifr_buffer.length = descrlen; 2052 } 2053 sx_sunlock(&ifdescr_sx); 2054 break; 2055 2056 case SIOCSIFDESCR: 2057 error = priv_check(td, PRIV_NET_SETIFDESCR); 2058 if (error) 2059 return (error); 2060 2061 /* 2062 * Copy only (length-1) bytes to make sure that 2063 * if_description is always nul terminated. The 2064 * length parameter is supposed to count the 2065 * terminating nul in. 2066 */ 2067 if (ifr->ifr_buffer.length > ifdescr_maxlen) 2068 return (ENAMETOOLONG); 2069 else if (ifr->ifr_buffer.length == 0) 2070 descrbuf = NULL; 2071 else { 2072 descrbuf = malloc(ifr->ifr_buffer.length, M_IFDESCR, 2073 M_WAITOK | M_ZERO); 2074 error = copyin(ifr->ifr_buffer.buffer, descrbuf, 2075 ifr->ifr_buffer.length - 1); 2076 if (error) { 2077 free(descrbuf, M_IFDESCR); 2078 break; 2079 } 2080 } 2081 2082 sx_xlock(&ifdescr_sx); 2083 odescrbuf = ifp->if_description; 2084 ifp->if_description = descrbuf; 2085 sx_xunlock(&ifdescr_sx); 2086 2087 getmicrotime(&ifp->if_lastchange); 2088 free(odescrbuf, M_IFDESCR); 2089 break; 2090 2091 case SIOCSIFFLAGS: 2092 error = priv_check(td, PRIV_NET_SETIFFLAGS); 2093 if (error) 2094 return (error); 2095 /* 2096 * Currently, no driver owned flags pass the IFF_CANTCHANGE 2097 * check, so we don't need special handling here yet. 2098 */ 2099 new_flags = (ifr->ifr_flags & 0xffff) | 2100 (ifr->ifr_flagshigh << 16); 2101 if (ifp->if_flags & IFF_SMART) { 2102 /* Smart drivers twiddle their own routes */ 2103 } else if (ifp->if_flags & IFF_UP && 2104 (new_flags & IFF_UP) == 0) { 2105 int s = splimp(); 2106 if_down(ifp); 2107 splx(s); 2108 } else if (new_flags & IFF_UP && 2109 (ifp->if_flags & IFF_UP) == 0) { 2110 int s = splimp(); 2111 if_up(ifp); 2112 splx(s); 2113 } 2114 /* See if permanently promiscuous mode bit is about to flip */ 2115 if ((ifp->if_flags ^ new_flags) & IFF_PPROMISC) { 2116 if (new_flags & IFF_PPROMISC) 2117 ifp->if_flags |= IFF_PROMISC; 2118 else if (ifp->if_pcount == 0) 2119 ifp->if_flags &= ~IFF_PROMISC; 2120 log(LOG_INFO, "%s: permanently promiscuous mode %s\n", 2121 ifp->if_xname, 2122 (new_flags & IFF_PPROMISC) ? "enabled" : "disabled"); 2123 } 2124 ifp->if_flags = (ifp->if_flags & IFF_CANTCHANGE) | 2125 (new_flags &~ IFF_CANTCHANGE); 2126 if (ifp->if_ioctl) { 2127 (void) (*ifp->if_ioctl)(ifp, cmd, data); 2128 } 2129 getmicrotime(&ifp->if_lastchange); 2130 break; 2131 2132 case SIOCSIFCAP: 2133 error = priv_check(td, PRIV_NET_SETIFCAP); 2134 if (error) 2135 return (error); 2136 if (ifp->if_ioctl == NULL) 2137 return (EOPNOTSUPP); 2138 if (ifr->ifr_reqcap & ~ifp->if_capabilities) 2139 return (EINVAL); 2140 error = (*ifp->if_ioctl)(ifp, cmd, data); 2141 if (error == 0) 2142 getmicrotime(&ifp->if_lastchange); 2143 break; 2144 2145 #ifdef MAC 2146 case SIOCSIFMAC: 2147 error = mac_ifnet_ioctl_set(td->td_ucred, ifr, ifp); 2148 break; 2149 #endif 2150 2151 case SIOCSIFNAME: 2152 error = priv_check(td, PRIV_NET_SETIFNAME); 2153 if (error) 2154 return (error); 2155 error = copyinstr(ifr->ifr_data, new_name, IFNAMSIZ, NULL); 2156 if (error != 0) 2157 return (error); 2158 if (new_name[0] == '\0') 2159 return (EINVAL); 2160 if (ifunit(new_name) != NULL) 2161 return (EEXIST); 2162 2163 /* 2164 * XXX: Locking. Nothing else seems to lock if_flags, 2165 * and there are numerous other races with the 2166 * ifunit() checks not being atomic with namespace 2167 * changes (renames, vmoves, if_attach, etc). 2168 */ 2169 ifp->if_flags |= IFF_RENAMING; 2170 2171 /* Announce the departure of the interface. */ 2172 rt_ifannouncemsg(ifp, IFAN_DEPARTURE); 2173 EVENTHANDLER_INVOKE(ifnet_departure_event, ifp); 2174 2175 log(LOG_INFO, "%s: changing name to '%s'\n", 2176 ifp->if_xname, new_name); 2177 2178 strlcpy(ifp->if_xname, new_name, sizeof(ifp->if_xname)); 2179 ifa = ifp->if_addr; 2180 IFA_LOCK(ifa); 2181 sdl = (struct sockaddr_dl *)ifa->ifa_addr; 2182 namelen = strlen(new_name); 2183 onamelen = sdl->sdl_nlen; 2184 /* 2185 * Move the address if needed. This is safe because we 2186 * allocate space for a name of length IFNAMSIZ when we 2187 * create this in if_attach(). 2188 */ 2189 if (namelen != onamelen) { 2190 bcopy(sdl->sdl_data + onamelen, 2191 sdl->sdl_data + namelen, sdl->sdl_alen); 2192 } 2193 bcopy(new_name, sdl->sdl_data, namelen); 2194 sdl->sdl_nlen = namelen; 2195 sdl = (struct sockaddr_dl *)ifa->ifa_netmask; 2196 bzero(sdl->sdl_data, onamelen); 2197 while (namelen != 0) 2198 sdl->sdl_data[--namelen] = 0xff; 2199 IFA_UNLOCK(ifa); 2200 2201 EVENTHANDLER_INVOKE(ifnet_arrival_event, ifp); 2202 /* Announce the return of the interface. */ 2203 rt_ifannouncemsg(ifp, IFAN_ARRIVAL); 2204 2205 ifp->if_flags &= ~IFF_RENAMING; 2206 break; 2207 2208 #ifdef VIMAGE 2209 case SIOCSIFVNET: 2210 error = priv_check(td, PRIV_NET_SETIFVNET); 2211 if (error) 2212 return (error); 2213 error = if_vmove_loan(td, ifp, ifr->ifr_name, ifr->ifr_jid); 2214 break; 2215 #endif 2216 2217 case SIOCSIFMETRIC: 2218 error = priv_check(td, PRIV_NET_SETIFMETRIC); 2219 if (error) 2220 return (error); 2221 ifp->if_metric = ifr->ifr_metric; 2222 getmicrotime(&ifp->if_lastchange); 2223 break; 2224 2225 case SIOCSIFPHYS: 2226 error = priv_check(td, PRIV_NET_SETIFPHYS); 2227 if (error) 2228 return (error); 2229 if (ifp->if_ioctl == NULL) 2230 return (EOPNOTSUPP); 2231 error = (*ifp->if_ioctl)(ifp, cmd, data); 2232 if (error == 0) 2233 getmicrotime(&ifp->if_lastchange); 2234 break; 2235 2236 case SIOCSIFMTU: 2237 { 2238 u_long oldmtu = ifp->if_mtu; 2239 2240 error = priv_check(td, PRIV_NET_SETIFMTU); 2241 if (error) 2242 return (error); 2243 if (ifr->ifr_mtu < IF_MINMTU || ifr->ifr_mtu > IF_MAXMTU) 2244 return (EINVAL); 2245 if (ifp->if_ioctl == NULL) 2246 return (EOPNOTSUPP); 2247 error = (*ifp->if_ioctl)(ifp, cmd, data); 2248 if (error == 0) { 2249 getmicrotime(&ifp->if_lastchange); 2250 rt_ifmsg(ifp); 2251 } 2252 /* 2253 * If the link MTU changed, do network layer specific procedure. 2254 */ 2255 if (ifp->if_mtu != oldmtu) { 2256 #ifdef INET6 2257 nd6_setmtu(ifp); 2258 #endif 2259 } 2260 break; 2261 } 2262 2263 case SIOCADDMULTI: 2264 case SIOCDELMULTI: 2265 if (cmd == SIOCADDMULTI) 2266 error = priv_check(td, PRIV_NET_ADDMULTI); 2267 else 2268 error = priv_check(td, PRIV_NET_DELMULTI); 2269 if (error) 2270 return (error); 2271 2272 /* Don't allow group membership on non-multicast interfaces. */ 2273 if ((ifp->if_flags & IFF_MULTICAST) == 0) 2274 return (EOPNOTSUPP); 2275 2276 /* Don't let users screw up protocols' entries. */ 2277 if (ifr->ifr_addr.sa_family != AF_LINK) 2278 return (EINVAL); 2279 2280 if (cmd == SIOCADDMULTI) { 2281 struct ifmultiaddr *ifma; 2282 2283 /* 2284 * Userland is only permitted to join groups once 2285 * via the if_addmulti() KPI, because it cannot hold 2286 * struct ifmultiaddr * between calls. It may also 2287 * lose a race while we check if the membership 2288 * already exists. 2289 */ 2290 IF_ADDR_LOCK(ifp); 2291 ifma = if_findmulti(ifp, &ifr->ifr_addr); 2292 IF_ADDR_UNLOCK(ifp); 2293 if (ifma != NULL) 2294 error = EADDRINUSE; 2295 else 2296 error = if_addmulti(ifp, &ifr->ifr_addr, &ifma); 2297 } else { 2298 error = if_delmulti(ifp, &ifr->ifr_addr); 2299 } 2300 if (error == 0) 2301 getmicrotime(&ifp->if_lastchange); 2302 break; 2303 2304 case SIOCSIFPHYADDR: 2305 case SIOCDIFPHYADDR: 2306 #ifdef INET6 2307 case SIOCSIFPHYADDR_IN6: 2308 #endif 2309 case SIOCSLIFPHYADDR: 2310 case SIOCSIFMEDIA: 2311 case SIOCSIFGENERIC: 2312 error = priv_check(td, PRIV_NET_HWIOCTL); 2313 if (error) 2314 return (error); 2315 if (ifp->if_ioctl == NULL) 2316 return (EOPNOTSUPP); 2317 error = (*ifp->if_ioctl)(ifp, cmd, data); 2318 if (error == 0) 2319 getmicrotime(&ifp->if_lastchange); 2320 break; 2321 2322 case SIOCGIFSTATUS: 2323 ifs = (struct ifstat *)data; 2324 ifs->ascii[0] = '\0'; 2325 2326 case SIOCGIFPSRCADDR: 2327 case SIOCGIFPDSTADDR: 2328 case SIOCGLIFPHYADDR: 2329 case SIOCGIFMEDIA: 2330 case SIOCGIFGENERIC: 2331 if (ifp->if_ioctl == NULL) 2332 return (EOPNOTSUPP); 2333 error = (*ifp->if_ioctl)(ifp, cmd, data); 2334 break; 2335 2336 case SIOCSIFLLADDR: 2337 error = priv_check(td, PRIV_NET_SETLLADDR); 2338 if (error) 2339 return (error); 2340 error = if_setlladdr(ifp, 2341 ifr->ifr_addr.sa_data, ifr->ifr_addr.sa_len); 2342 EVENTHANDLER_INVOKE(iflladdr_event, ifp); 2343 break; 2344 2345 case SIOCAIFGROUP: 2346 { 2347 struct ifgroupreq *ifgr = (struct ifgroupreq *)ifr; 2348 2349 error = priv_check(td, PRIV_NET_ADDIFGROUP); 2350 if (error) 2351 return (error); 2352 if ((error = if_addgroup(ifp, ifgr->ifgr_group))) 2353 return (error); 2354 break; 2355 } 2356 2357 case SIOCGIFGROUP: 2358 if ((error = if_getgroup((struct ifgroupreq *)ifr, ifp))) 2359 return (error); 2360 break; 2361 2362 case SIOCDIFGROUP: 2363 { 2364 struct ifgroupreq *ifgr = (struct ifgroupreq *)ifr; 2365 2366 error = priv_check(td, PRIV_NET_DELIFGROUP); 2367 if (error) 2368 return (error); 2369 if ((error = if_delgroup(ifp, ifgr->ifgr_group))) 2370 return (error); 2371 break; 2372 } 2373 2374 default: 2375 error = ENOIOCTL; 2376 break; 2377 } 2378 return (error); 2379 } 2380 2381 /* 2382 * Interface ioctls. 2383 */ 2384 int 2385 ifioctl(struct socket *so, u_long cmd, caddr_t data, struct thread *td) 2386 { 2387 struct ifnet *ifp; 2388 struct ifreq *ifr; 2389 int error; 2390 int oif_flags; 2391 2392 switch (cmd) { 2393 case SIOCGIFCONF: 2394 case OSIOCGIFCONF: 2395 #ifdef __amd64__ 2396 case SIOCGIFCONF32: 2397 #endif 2398 return (ifconf(cmd, data)); 2399 } 2400 ifr = (struct ifreq *)data; 2401 2402 switch (cmd) { 2403 #ifdef VIMAGE 2404 case SIOCSIFRVNET: 2405 error = priv_check(td, PRIV_NET_SETIFVNET); 2406 if (error) 2407 return (error); 2408 return (if_vmove_reclaim(td, ifr->ifr_name, ifr->ifr_jid)); 2409 #endif 2410 case SIOCIFCREATE: 2411 case SIOCIFCREATE2: 2412 error = priv_check(td, PRIV_NET_IFCREATE); 2413 if (error) 2414 return (error); 2415 return (if_clone_create(ifr->ifr_name, sizeof(ifr->ifr_name), 2416 cmd == SIOCIFCREATE2 ? ifr->ifr_data : NULL)); 2417 case SIOCIFDESTROY: 2418 error = priv_check(td, PRIV_NET_IFDESTROY); 2419 if (error) 2420 return (error); 2421 return if_clone_destroy(ifr->ifr_name); 2422 2423 case SIOCIFGCLONERS: 2424 return (if_clone_list((struct if_clonereq *)data)); 2425 case SIOCGIFGMEMB: 2426 return (if_getgroupmembers((struct ifgroupreq *)data)); 2427 } 2428 2429 ifp = ifunit_ref(ifr->ifr_name); 2430 if (ifp == NULL) 2431 return (ENXIO); 2432 2433 error = ifhwioctl(cmd, ifp, data, td); 2434 if (error != ENOIOCTL) { 2435 if_rele(ifp); 2436 return (error); 2437 } 2438 2439 oif_flags = ifp->if_flags; 2440 if (so->so_proto == NULL) { 2441 if_rele(ifp); 2442 return (EOPNOTSUPP); 2443 } 2444 #ifndef COMPAT_43 2445 error = ((*so->so_proto->pr_usrreqs->pru_control)(so, cmd, 2446 data, 2447 ifp, td)); 2448 if (error == EOPNOTSUPP && ifp != NULL && ifp->if_ioctl != NULL) 2449 error = (*ifp->if_ioctl)(ifp, cmd, data); 2450 #else 2451 { 2452 u_long ocmd = cmd; 2453 2454 switch (cmd) { 2455 2456 case SIOCSIFDSTADDR: 2457 case SIOCSIFADDR: 2458 case SIOCSIFBRDADDR: 2459 case SIOCSIFNETMASK: 2460 #if BYTE_ORDER != BIG_ENDIAN 2461 if (ifr->ifr_addr.sa_family == 0 && 2462 ifr->ifr_addr.sa_len < 16) { 2463 ifr->ifr_addr.sa_family = ifr->ifr_addr.sa_len; 2464 ifr->ifr_addr.sa_len = 16; 2465 } 2466 #else 2467 if (ifr->ifr_addr.sa_len == 0) 2468 ifr->ifr_addr.sa_len = 16; 2469 #endif 2470 break; 2471 2472 case OSIOCGIFADDR: 2473 cmd = SIOCGIFADDR; 2474 break; 2475 2476 case OSIOCGIFDSTADDR: 2477 cmd = SIOCGIFDSTADDR; 2478 break; 2479 2480 case OSIOCGIFBRDADDR: 2481 cmd = SIOCGIFBRDADDR; 2482 break; 2483 2484 case OSIOCGIFNETMASK: 2485 cmd = SIOCGIFNETMASK; 2486 } 2487 error = ((*so->so_proto->pr_usrreqs->pru_control)(so, 2488 cmd, 2489 data, 2490 ifp, td)); 2491 if (error == EOPNOTSUPP && ifp != NULL && 2492 ifp->if_ioctl != NULL) 2493 error = (*ifp->if_ioctl)(ifp, cmd, data); 2494 switch (ocmd) { 2495 2496 case OSIOCGIFADDR: 2497 case OSIOCGIFDSTADDR: 2498 case OSIOCGIFBRDADDR: 2499 case OSIOCGIFNETMASK: 2500 *(u_short *)&ifr->ifr_addr = ifr->ifr_addr.sa_family; 2501 2502 } 2503 } 2504 #endif /* COMPAT_43 */ 2505 2506 if ((oif_flags ^ ifp->if_flags) & IFF_UP) { 2507 #ifdef INET6 2508 if (ifp->if_flags & IFF_UP) { 2509 int s = splimp(); 2510 in6_if_up(ifp); 2511 splx(s); 2512 } 2513 #endif 2514 } 2515 if_rele(ifp); 2516 return (error); 2517 } 2518 2519 /* 2520 * The code common to handling reference counted flags, 2521 * e.g., in ifpromisc() and if_allmulti(). 2522 * The "pflag" argument can specify a permanent mode flag to check, 2523 * such as IFF_PPROMISC for promiscuous mode; should be 0 if none. 2524 * 2525 * Only to be used on stack-owned flags, not driver-owned flags. 2526 */ 2527 static int 2528 if_setflag(struct ifnet *ifp, int flag, int pflag, int *refcount, int onswitch) 2529 { 2530 struct ifreq ifr; 2531 int error; 2532 int oldflags, oldcount; 2533 2534 /* Sanity checks to catch programming errors */ 2535 KASSERT((flag & (IFF_DRV_OACTIVE|IFF_DRV_RUNNING)) == 0, 2536 ("%s: setting driver-owned flag %d", __func__, flag)); 2537 2538 if (onswitch) 2539 KASSERT(*refcount >= 0, 2540 ("%s: increment negative refcount %d for flag %d", 2541 __func__, *refcount, flag)); 2542 else 2543 KASSERT(*refcount > 0, 2544 ("%s: decrement non-positive refcount %d for flag %d", 2545 __func__, *refcount, flag)); 2546 2547 /* In case this mode is permanent, just touch refcount */ 2548 if (ifp->if_flags & pflag) { 2549 *refcount += onswitch ? 1 : -1; 2550 return (0); 2551 } 2552 2553 /* Save ifnet parameters for if_ioctl() may fail */ 2554 oldcount = *refcount; 2555 oldflags = ifp->if_flags; 2556 2557 /* 2558 * See if we aren't the only and touching refcount is enough. 2559 * Actually toggle interface flag if we are the first or last. 2560 */ 2561 if (onswitch) { 2562 if ((*refcount)++) 2563 return (0); 2564 ifp->if_flags |= flag; 2565 } else { 2566 if (--(*refcount)) 2567 return (0); 2568 ifp->if_flags &= ~flag; 2569 } 2570 2571 /* Call down the driver since we've changed interface flags */ 2572 if (ifp->if_ioctl == NULL) { 2573 error = EOPNOTSUPP; 2574 goto recover; 2575 } 2576 ifr.ifr_flags = ifp->if_flags & 0xffff; 2577 ifr.ifr_flagshigh = ifp->if_flags >> 16; 2578 error = (*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr); 2579 if (error) 2580 goto recover; 2581 /* Notify userland that interface flags have changed */ 2582 rt_ifmsg(ifp); 2583 return (0); 2584 2585 recover: 2586 /* Recover after driver error */ 2587 *refcount = oldcount; 2588 ifp->if_flags = oldflags; 2589 return (error); 2590 } 2591 2592 /* 2593 * Set/clear promiscuous mode on interface ifp based on the truth value 2594 * of pswitch. The calls are reference counted so that only the first 2595 * "on" request actually has an effect, as does the final "off" request. 2596 * Results are undefined if the "off" and "on" requests are not matched. 2597 */ 2598 int 2599 ifpromisc(struct ifnet *ifp, int pswitch) 2600 { 2601 int error; 2602 int oldflags = ifp->if_flags; 2603 2604 error = if_setflag(ifp, IFF_PROMISC, IFF_PPROMISC, 2605 &ifp->if_pcount, pswitch); 2606 /* If promiscuous mode status has changed, log a message */ 2607 if (error == 0 && ((ifp->if_flags ^ oldflags) & IFF_PROMISC)) 2608 log(LOG_INFO, "%s: promiscuous mode %s\n", 2609 ifp->if_xname, 2610 (ifp->if_flags & IFF_PROMISC) ? "enabled" : "disabled"); 2611 return (error); 2612 } 2613 2614 /* 2615 * Return interface configuration 2616 * of system. List may be used 2617 * in later ioctl's (above) to get 2618 * other information. 2619 */ 2620 /*ARGSUSED*/ 2621 static int 2622 ifconf(u_long cmd, caddr_t data) 2623 { 2624 struct ifconf *ifc = (struct ifconf *)data; 2625 #ifdef __amd64__ 2626 struct ifconf32 *ifc32 = (struct ifconf32 *)data; 2627 struct ifconf ifc_swab; 2628 #endif 2629 struct ifnet *ifp; 2630 struct ifaddr *ifa; 2631 struct ifreq ifr; 2632 struct sbuf *sb; 2633 int error, full = 0, valid_len, max_len; 2634 2635 #ifdef __amd64__ 2636 if (cmd == SIOCGIFCONF32) { 2637 ifc_swab.ifc_len = ifc32->ifc_len; 2638 ifc_swab.ifc_buf = (caddr_t)(uintptr_t)ifc32->ifc_buf; 2639 ifc = &ifc_swab; 2640 } 2641 #endif 2642 /* Limit initial buffer size to MAXPHYS to avoid DoS from userspace. */ 2643 max_len = MAXPHYS - 1; 2644 2645 /* Prevent hostile input from being able to crash the system */ 2646 if (ifc->ifc_len <= 0) 2647 return (EINVAL); 2648 2649 again: 2650 if (ifc->ifc_len <= max_len) { 2651 max_len = ifc->ifc_len; 2652 full = 1; 2653 } 2654 sb = sbuf_new(NULL, NULL, max_len + 1, SBUF_FIXEDLEN); 2655 max_len = 0; 2656 valid_len = 0; 2657 2658 IFNET_RLOCK(); 2659 TAILQ_FOREACH(ifp, &V_ifnet, if_link) { 2660 int addrs; 2661 2662 /* 2663 * Zero the ifr_name buffer to make sure we don't 2664 * disclose the contents of the stack. 2665 */ 2666 memset(ifr.ifr_name, 0, sizeof(ifr.ifr_name)); 2667 2668 if (strlcpy(ifr.ifr_name, ifp->if_xname, sizeof(ifr.ifr_name)) 2669 >= sizeof(ifr.ifr_name)) { 2670 sbuf_delete(sb); 2671 IFNET_RUNLOCK(); 2672 return (ENAMETOOLONG); 2673 } 2674 2675 addrs = 0; 2676 IF_ADDR_LOCK(ifp); 2677 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 2678 struct sockaddr *sa = ifa->ifa_addr; 2679 2680 if (prison_if(curthread->td_ucred, sa) != 0) 2681 continue; 2682 addrs++; 2683 #ifdef COMPAT_43 2684 if (cmd == OSIOCGIFCONF) { 2685 struct osockaddr *osa = 2686 (struct osockaddr *)&ifr.ifr_addr; 2687 ifr.ifr_addr = *sa; 2688 osa->sa_family = sa->sa_family; 2689 sbuf_bcat(sb, &ifr, sizeof(ifr)); 2690 max_len += sizeof(ifr); 2691 } else 2692 #endif 2693 if (sa->sa_len <= sizeof(*sa)) { 2694 ifr.ifr_addr = *sa; 2695 sbuf_bcat(sb, &ifr, sizeof(ifr)); 2696 max_len += sizeof(ifr); 2697 } else { 2698 sbuf_bcat(sb, &ifr, 2699 offsetof(struct ifreq, ifr_addr)); 2700 max_len += offsetof(struct ifreq, ifr_addr); 2701 sbuf_bcat(sb, sa, sa->sa_len); 2702 max_len += sa->sa_len; 2703 } 2704 2705 if (!sbuf_overflowed(sb)) 2706 valid_len = sbuf_len(sb); 2707 } 2708 IF_ADDR_UNLOCK(ifp); 2709 if (addrs == 0) { 2710 bzero((caddr_t)&ifr.ifr_addr, sizeof(ifr.ifr_addr)); 2711 sbuf_bcat(sb, &ifr, sizeof(ifr)); 2712 max_len += sizeof(ifr); 2713 2714 if (!sbuf_overflowed(sb)) 2715 valid_len = sbuf_len(sb); 2716 } 2717 } 2718 IFNET_RUNLOCK(); 2719 2720 /* 2721 * If we didn't allocate enough space (uncommon), try again. If 2722 * we have already allocated as much space as we are allowed, 2723 * return what we've got. 2724 */ 2725 if (valid_len != max_len && !full) { 2726 sbuf_delete(sb); 2727 goto again; 2728 } 2729 2730 ifc->ifc_len = valid_len; 2731 #ifdef __amd64__ 2732 if (cmd == SIOCGIFCONF32) 2733 ifc32->ifc_len = valid_len; 2734 #endif 2735 sbuf_finish(sb); 2736 error = copyout(sbuf_data(sb), ifc->ifc_req, ifc->ifc_len); 2737 sbuf_delete(sb); 2738 return (error); 2739 } 2740 2741 /* 2742 * Just like ifpromisc(), but for all-multicast-reception mode. 2743 */ 2744 int 2745 if_allmulti(struct ifnet *ifp, int onswitch) 2746 { 2747 2748 return (if_setflag(ifp, IFF_ALLMULTI, 0, &ifp->if_amcount, onswitch)); 2749 } 2750 2751 struct ifmultiaddr * 2752 if_findmulti(struct ifnet *ifp, struct sockaddr *sa) 2753 { 2754 struct ifmultiaddr *ifma; 2755 2756 IF_ADDR_LOCK_ASSERT(ifp); 2757 2758 TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) { 2759 if (sa->sa_family == AF_LINK) { 2760 if (sa_dl_equal(ifma->ifma_addr, sa)) 2761 break; 2762 } else { 2763 if (sa_equal(ifma->ifma_addr, sa)) 2764 break; 2765 } 2766 } 2767 2768 return ifma; 2769 } 2770 2771 /* 2772 * Allocate a new ifmultiaddr and initialize based on passed arguments. We 2773 * make copies of passed sockaddrs. The ifmultiaddr will not be added to 2774 * the ifnet multicast address list here, so the caller must do that and 2775 * other setup work (such as notifying the device driver). The reference 2776 * count is initialized to 1. 2777 */ 2778 static struct ifmultiaddr * 2779 if_allocmulti(struct ifnet *ifp, struct sockaddr *sa, struct sockaddr *llsa, 2780 int mflags) 2781 { 2782 struct ifmultiaddr *ifma; 2783 struct sockaddr *dupsa; 2784 2785 ifma = malloc(sizeof *ifma, M_IFMADDR, mflags | 2786 M_ZERO); 2787 if (ifma == NULL) 2788 return (NULL); 2789 2790 dupsa = malloc(sa->sa_len, M_IFMADDR, mflags); 2791 if (dupsa == NULL) { 2792 free(ifma, M_IFMADDR); 2793 return (NULL); 2794 } 2795 bcopy(sa, dupsa, sa->sa_len); 2796 ifma->ifma_addr = dupsa; 2797 2798 ifma->ifma_ifp = ifp; 2799 ifma->ifma_refcount = 1; 2800 ifma->ifma_protospec = NULL; 2801 2802 if (llsa == NULL) { 2803 ifma->ifma_lladdr = NULL; 2804 return (ifma); 2805 } 2806 2807 dupsa = malloc(llsa->sa_len, M_IFMADDR, mflags); 2808 if (dupsa == NULL) { 2809 free(ifma->ifma_addr, M_IFMADDR); 2810 free(ifma, M_IFMADDR); 2811 return (NULL); 2812 } 2813 bcopy(llsa, dupsa, llsa->sa_len); 2814 ifma->ifma_lladdr = dupsa; 2815 2816 return (ifma); 2817 } 2818 2819 /* 2820 * if_freemulti: free ifmultiaddr structure and possibly attached related 2821 * addresses. The caller is responsible for implementing reference 2822 * counting, notifying the driver, handling routing messages, and releasing 2823 * any dependent link layer state. 2824 */ 2825 static void 2826 if_freemulti(struct ifmultiaddr *ifma) 2827 { 2828 2829 KASSERT(ifma->ifma_refcount == 0, ("if_freemulti: refcount %d", 2830 ifma->ifma_refcount)); 2831 KASSERT(ifma->ifma_protospec == NULL, 2832 ("if_freemulti: protospec not NULL")); 2833 2834 if (ifma->ifma_lladdr != NULL) 2835 free(ifma->ifma_lladdr, M_IFMADDR); 2836 free(ifma->ifma_addr, M_IFMADDR); 2837 free(ifma, M_IFMADDR); 2838 } 2839 2840 /* 2841 * Register an additional multicast address with a network interface. 2842 * 2843 * - If the address is already present, bump the reference count on the 2844 * address and return. 2845 * - If the address is not link-layer, look up a link layer address. 2846 * - Allocate address structures for one or both addresses, and attach to the 2847 * multicast address list on the interface. If automatically adding a link 2848 * layer address, the protocol address will own a reference to the link 2849 * layer address, to be freed when it is freed. 2850 * - Notify the network device driver of an addition to the multicast address 2851 * list. 2852 * 2853 * 'sa' points to caller-owned memory with the desired multicast address. 2854 * 2855 * 'retifma' will be used to return a pointer to the resulting multicast 2856 * address reference, if desired. 2857 */ 2858 int 2859 if_addmulti(struct ifnet *ifp, struct sockaddr *sa, 2860 struct ifmultiaddr **retifma) 2861 { 2862 struct ifmultiaddr *ifma, *ll_ifma; 2863 struct sockaddr *llsa; 2864 int error; 2865 2866 /* 2867 * If the address is already present, return a new reference to it; 2868 * otherwise, allocate storage and set up a new address. 2869 */ 2870 IF_ADDR_LOCK(ifp); 2871 ifma = if_findmulti(ifp, sa); 2872 if (ifma != NULL) { 2873 ifma->ifma_refcount++; 2874 if (retifma != NULL) 2875 *retifma = ifma; 2876 IF_ADDR_UNLOCK(ifp); 2877 return (0); 2878 } 2879 2880 /* 2881 * The address isn't already present; resolve the protocol address 2882 * into a link layer address, and then look that up, bump its 2883 * refcount or allocate an ifma for that also. If 'llsa' was 2884 * returned, we will need to free it later. 2885 */ 2886 llsa = NULL; 2887 ll_ifma = NULL; 2888 if (ifp->if_resolvemulti != NULL) { 2889 error = ifp->if_resolvemulti(ifp, &llsa, sa); 2890 if (error) 2891 goto unlock_out; 2892 } 2893 2894 /* 2895 * Allocate the new address. Don't hook it up yet, as we may also 2896 * need to allocate a link layer multicast address. 2897 */ 2898 ifma = if_allocmulti(ifp, sa, llsa, M_NOWAIT); 2899 if (ifma == NULL) { 2900 error = ENOMEM; 2901 goto free_llsa_out; 2902 } 2903 2904 /* 2905 * If a link layer address is found, we'll need to see if it's 2906 * already present in the address list, or allocate is as well. 2907 * When this block finishes, the link layer address will be on the 2908 * list. 2909 */ 2910 if (llsa != NULL) { 2911 ll_ifma = if_findmulti(ifp, llsa); 2912 if (ll_ifma == NULL) { 2913 ll_ifma = if_allocmulti(ifp, llsa, NULL, M_NOWAIT); 2914 if (ll_ifma == NULL) { 2915 --ifma->ifma_refcount; 2916 if_freemulti(ifma); 2917 error = ENOMEM; 2918 goto free_llsa_out; 2919 } 2920 TAILQ_INSERT_HEAD(&ifp->if_multiaddrs, ll_ifma, 2921 ifma_link); 2922 } else 2923 ll_ifma->ifma_refcount++; 2924 ifma->ifma_llifma = ll_ifma; 2925 } 2926 2927 /* 2928 * We now have a new multicast address, ifma, and possibly a new or 2929 * referenced link layer address. Add the primary address to the 2930 * ifnet address list. 2931 */ 2932 TAILQ_INSERT_HEAD(&ifp->if_multiaddrs, ifma, ifma_link); 2933 2934 if (retifma != NULL) 2935 *retifma = ifma; 2936 2937 /* 2938 * Must generate the message while holding the lock so that 'ifma' 2939 * pointer is still valid. 2940 */ 2941 rt_newmaddrmsg(RTM_NEWMADDR, ifma); 2942 IF_ADDR_UNLOCK(ifp); 2943 2944 /* 2945 * We are certain we have added something, so call down to the 2946 * interface to let them know about it. 2947 */ 2948 if (ifp->if_ioctl != NULL) { 2949 (void) (*ifp->if_ioctl)(ifp, SIOCADDMULTI, 0); 2950 } 2951 2952 if (llsa != NULL) 2953 free(llsa, M_IFMADDR); 2954 2955 return (0); 2956 2957 free_llsa_out: 2958 if (llsa != NULL) 2959 free(llsa, M_IFMADDR); 2960 2961 unlock_out: 2962 IF_ADDR_UNLOCK(ifp); 2963 return (error); 2964 } 2965 2966 /* 2967 * Delete a multicast group membership by network-layer group address. 2968 * 2969 * Returns ENOENT if the entry could not be found. If ifp no longer 2970 * exists, results are undefined. This entry point should only be used 2971 * from subsystems which do appropriate locking to hold ifp for the 2972 * duration of the call. 2973 * Network-layer protocol domains must use if_delmulti_ifma(). 2974 */ 2975 int 2976 if_delmulti(struct ifnet *ifp, struct sockaddr *sa) 2977 { 2978 struct ifmultiaddr *ifma; 2979 int lastref; 2980 #ifdef INVARIANTS 2981 struct ifnet *oifp; 2982 2983 IFNET_RLOCK_NOSLEEP(); 2984 TAILQ_FOREACH(oifp, &V_ifnet, if_link) 2985 if (ifp == oifp) 2986 break; 2987 if (ifp != oifp) 2988 ifp = NULL; 2989 IFNET_RUNLOCK_NOSLEEP(); 2990 2991 KASSERT(ifp != NULL, ("%s: ifnet went away", __func__)); 2992 #endif 2993 if (ifp == NULL) 2994 return (ENOENT); 2995 2996 IF_ADDR_LOCK(ifp); 2997 lastref = 0; 2998 ifma = if_findmulti(ifp, sa); 2999 if (ifma != NULL) 3000 lastref = if_delmulti_locked(ifp, ifma, 0); 3001 IF_ADDR_UNLOCK(ifp); 3002 3003 if (ifma == NULL) 3004 return (ENOENT); 3005 3006 if (lastref && ifp->if_ioctl != NULL) { 3007 (void)(*ifp->if_ioctl)(ifp, SIOCDELMULTI, 0); 3008 } 3009 3010 return (0); 3011 } 3012 3013 /* 3014 * Delete all multicast group membership for an interface. 3015 * Should be used to quickly flush all multicast filters. 3016 */ 3017 void 3018 if_delallmulti(struct ifnet *ifp) 3019 { 3020 struct ifmultiaddr *ifma; 3021 struct ifmultiaddr *next; 3022 3023 IF_ADDR_LOCK(ifp); 3024 TAILQ_FOREACH_SAFE(ifma, &ifp->if_multiaddrs, ifma_link, next) 3025 if_delmulti_locked(ifp, ifma, 0); 3026 IF_ADDR_UNLOCK(ifp); 3027 } 3028 3029 /* 3030 * Delete a multicast group membership by group membership pointer. 3031 * Network-layer protocol domains must use this routine. 3032 * 3033 * It is safe to call this routine if the ifp disappeared. 3034 */ 3035 void 3036 if_delmulti_ifma(struct ifmultiaddr *ifma) 3037 { 3038 struct ifnet *ifp; 3039 int lastref; 3040 3041 ifp = ifma->ifma_ifp; 3042 #ifdef DIAGNOSTIC 3043 if (ifp == NULL) { 3044 printf("%s: ifma_ifp seems to be detached\n", __func__); 3045 } else { 3046 struct ifnet *oifp; 3047 3048 IFNET_RLOCK_NOSLEEP(); 3049 TAILQ_FOREACH(oifp, &V_ifnet, if_link) 3050 if (ifp == oifp) 3051 break; 3052 if (ifp != oifp) { 3053 printf("%s: ifnet %p disappeared\n", __func__, ifp); 3054 ifp = NULL; 3055 } 3056 IFNET_RUNLOCK_NOSLEEP(); 3057 } 3058 #endif 3059 /* 3060 * If and only if the ifnet instance exists: Acquire the address lock. 3061 */ 3062 if (ifp != NULL) 3063 IF_ADDR_LOCK(ifp); 3064 3065 lastref = if_delmulti_locked(ifp, ifma, 0); 3066 3067 if (ifp != NULL) { 3068 /* 3069 * If and only if the ifnet instance exists: 3070 * Release the address lock. 3071 * If the group was left: update the hardware hash filter. 3072 */ 3073 IF_ADDR_UNLOCK(ifp); 3074 if (lastref && ifp->if_ioctl != NULL) { 3075 (void)(*ifp->if_ioctl)(ifp, SIOCDELMULTI, 0); 3076 } 3077 } 3078 } 3079 3080 /* 3081 * Perform deletion of network-layer and/or link-layer multicast address. 3082 * 3083 * Return 0 if the reference count was decremented. 3084 * Return 1 if the final reference was released, indicating that the 3085 * hardware hash filter should be reprogrammed. 3086 */ 3087 static int 3088 if_delmulti_locked(struct ifnet *ifp, struct ifmultiaddr *ifma, int detaching) 3089 { 3090 struct ifmultiaddr *ll_ifma; 3091 3092 if (ifp != NULL && ifma->ifma_ifp != NULL) { 3093 KASSERT(ifma->ifma_ifp == ifp, 3094 ("%s: inconsistent ifp %p", __func__, ifp)); 3095 IF_ADDR_LOCK_ASSERT(ifp); 3096 } 3097 3098 ifp = ifma->ifma_ifp; 3099 3100 /* 3101 * If the ifnet is detaching, null out references to ifnet, 3102 * so that upper protocol layers will notice, and not attempt 3103 * to obtain locks for an ifnet which no longer exists. The 3104 * routing socket announcement must happen before the ifnet 3105 * instance is detached from the system. 3106 */ 3107 if (detaching) { 3108 #ifdef DIAGNOSTIC 3109 printf("%s: detaching ifnet instance %p\n", __func__, ifp); 3110 #endif 3111 /* 3112 * ifp may already be nulled out if we are being reentered 3113 * to delete the ll_ifma. 3114 */ 3115 if (ifp != NULL) { 3116 rt_newmaddrmsg(RTM_DELMADDR, ifma); 3117 ifma->ifma_ifp = NULL; 3118 } 3119 } 3120 3121 if (--ifma->ifma_refcount > 0) 3122 return 0; 3123 3124 /* 3125 * If this ifma is a network-layer ifma, a link-layer ifma may 3126 * have been associated with it. Release it first if so. 3127 */ 3128 ll_ifma = ifma->ifma_llifma; 3129 if (ll_ifma != NULL) { 3130 KASSERT(ifma->ifma_lladdr != NULL, 3131 ("%s: llifma w/o lladdr", __func__)); 3132 if (detaching) 3133 ll_ifma->ifma_ifp = NULL; /* XXX */ 3134 if (--ll_ifma->ifma_refcount == 0) { 3135 if (ifp != NULL) { 3136 TAILQ_REMOVE(&ifp->if_multiaddrs, ll_ifma, 3137 ifma_link); 3138 } 3139 if_freemulti(ll_ifma); 3140 } 3141 } 3142 3143 if (ifp != NULL) 3144 TAILQ_REMOVE(&ifp->if_multiaddrs, ifma, ifma_link); 3145 3146 if_freemulti(ifma); 3147 3148 /* 3149 * The last reference to this instance of struct ifmultiaddr 3150 * was released; the hardware should be notified of this change. 3151 */ 3152 return 1; 3153 } 3154 3155 /* 3156 * Set the link layer address on an interface. 3157 * 3158 * At this time we only support certain types of interfaces, 3159 * and we don't allow the length of the address to change. 3160 */ 3161 int 3162 if_setlladdr(struct ifnet *ifp, const u_char *lladdr, int len) 3163 { 3164 struct sockaddr_dl *sdl; 3165 struct ifaddr *ifa; 3166 struct ifreq ifr; 3167 3168 IF_ADDR_LOCK(ifp); 3169 ifa = ifp->if_addr; 3170 if (ifa == NULL) { 3171 IF_ADDR_UNLOCK(ifp); 3172 return (EINVAL); 3173 } 3174 ifa_ref(ifa); 3175 IF_ADDR_UNLOCK(ifp); 3176 sdl = (struct sockaddr_dl *)ifa->ifa_addr; 3177 if (sdl == NULL) { 3178 ifa_free(ifa); 3179 return (EINVAL); 3180 } 3181 if (len != sdl->sdl_alen) { /* don't allow length to change */ 3182 ifa_free(ifa); 3183 return (EINVAL); 3184 } 3185 switch (ifp->if_type) { 3186 case IFT_ETHER: 3187 case IFT_FDDI: 3188 case IFT_XETHER: 3189 case IFT_ISO88025: 3190 case IFT_L2VLAN: 3191 case IFT_BRIDGE: 3192 case IFT_ARCNET: 3193 case IFT_IEEE8023ADLAG: 3194 case IFT_IEEE80211: 3195 bcopy(lladdr, LLADDR(sdl), len); 3196 ifa_free(ifa); 3197 break; 3198 default: 3199 ifa_free(ifa); 3200 return (ENODEV); 3201 } 3202 3203 /* 3204 * If the interface is already up, we need 3205 * to re-init it in order to reprogram its 3206 * address filter. 3207 */ 3208 if ((ifp->if_flags & IFF_UP) != 0) { 3209 if (ifp->if_ioctl) { 3210 ifp->if_flags &= ~IFF_UP; 3211 ifr.ifr_flags = ifp->if_flags & 0xffff; 3212 ifr.ifr_flagshigh = ifp->if_flags >> 16; 3213 (*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr); 3214 ifp->if_flags |= IFF_UP; 3215 ifr.ifr_flags = ifp->if_flags & 0xffff; 3216 ifr.ifr_flagshigh = ifp->if_flags >> 16; 3217 (*ifp->if_ioctl)(ifp, SIOCSIFFLAGS, (caddr_t)&ifr); 3218 } 3219 #ifdef INET 3220 /* 3221 * Also send gratuitous ARPs to notify other nodes about 3222 * the address change. 3223 */ 3224 TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 3225 if (ifa->ifa_addr->sa_family == AF_INET) 3226 arp_ifinit(ifp, ifa); 3227 } 3228 #endif 3229 } 3230 return (0); 3231 } 3232 3233 /* 3234 * The name argument must be a pointer to storage which will last as 3235 * long as the interface does. For physical devices, the result of 3236 * device_get_name(dev) is a good choice and for pseudo-devices a 3237 * static string works well. 3238 */ 3239 void 3240 if_initname(struct ifnet *ifp, const char *name, int unit) 3241 { 3242 ifp->if_dname = name; 3243 ifp->if_dunit = unit; 3244 if (unit != IF_DUNIT_NONE) 3245 snprintf(ifp->if_xname, IFNAMSIZ, "%s%d", name, unit); 3246 else 3247 strlcpy(ifp->if_xname, name, IFNAMSIZ); 3248 } 3249 3250 int 3251 if_printf(struct ifnet *ifp, const char * fmt, ...) 3252 { 3253 va_list ap; 3254 int retval; 3255 3256 retval = printf("%s: ", ifp->if_xname); 3257 va_start(ap, fmt); 3258 retval += vprintf(fmt, ap); 3259 va_end(ap); 3260 return (retval); 3261 } 3262 3263 void 3264 if_start(struct ifnet *ifp) 3265 { 3266 3267 (*(ifp)->if_start)(ifp); 3268 } 3269 3270 /* 3271 * Backwards compatibility interface for drivers 3272 * that have not implemented it 3273 */ 3274 static int 3275 if_transmit(struct ifnet *ifp, struct mbuf *m) 3276 { 3277 int error; 3278 3279 IFQ_HANDOFF(ifp, m, error); 3280 return (error); 3281 } 3282 3283 int 3284 if_handoff(struct ifqueue *ifq, struct mbuf *m, struct ifnet *ifp, int adjust) 3285 { 3286 int active = 0; 3287 3288 IF_LOCK(ifq); 3289 if (_IF_QFULL(ifq)) { 3290 _IF_DROP(ifq); 3291 IF_UNLOCK(ifq); 3292 m_freem(m); 3293 return (0); 3294 } 3295 if (ifp != NULL) { 3296 ifp->if_obytes += m->m_pkthdr.len + adjust; 3297 if (m->m_flags & (M_BCAST|M_MCAST)) 3298 ifp->if_omcasts++; 3299 active = ifp->if_drv_flags & IFF_DRV_OACTIVE; 3300 } 3301 _IF_ENQUEUE(ifq, m); 3302 IF_UNLOCK(ifq); 3303 if (ifp != NULL && !active) 3304 (*(ifp)->if_start)(ifp); 3305 return (1); 3306 } 3307 3308 void 3309 if_register_com_alloc(u_char type, 3310 if_com_alloc_t *a, if_com_free_t *f) 3311 { 3312 3313 KASSERT(if_com_alloc[type] == NULL, 3314 ("if_register_com_alloc: %d already registered", type)); 3315 KASSERT(if_com_free[type] == NULL, 3316 ("if_register_com_alloc: %d free already registered", type)); 3317 3318 if_com_alloc[type] = a; 3319 if_com_free[type] = f; 3320 } 3321 3322 void 3323 if_deregister_com_alloc(u_char type) 3324 { 3325 3326 KASSERT(if_com_alloc[type] != NULL, 3327 ("if_deregister_com_alloc: %d not registered", type)); 3328 KASSERT(if_com_free[type] != NULL, 3329 ("if_deregister_com_alloc: %d free not registered", type)); 3330 if_com_alloc[type] = NULL; 3331 if_com_free[type] = NULL; 3332 } 3333