1caf43b02SWarner Losh /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 482cd038dSYoshinobu Inoue * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 5fa046d87SRobert Watson * Copyright (c) 2010-2011 Juniper Networks, Inc. 682cd038dSYoshinobu Inoue * All rights reserved. 782cd038dSYoshinobu Inoue * 8fa046d87SRobert Watson * Portions of this software were developed by Robert N. M. Watson under 9fa046d87SRobert Watson * contract to Juniper Networks, Inc. 10fa046d87SRobert Watson * 1182cd038dSYoshinobu Inoue * Redistribution and use in source and binary forms, with or without 1282cd038dSYoshinobu Inoue * modification, are permitted provided that the following conditions 1382cd038dSYoshinobu Inoue * are met: 1482cd038dSYoshinobu Inoue * 1. Redistributions of source code must retain the above copyright 1582cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer. 1682cd038dSYoshinobu Inoue * 2. Redistributions in binary form must reproduce the above copyright 1782cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer in the 1882cd038dSYoshinobu Inoue * documentation and/or other materials provided with the distribution. 1982cd038dSYoshinobu Inoue * 3. Neither the name of the project nor the names of its contributors 2082cd038dSYoshinobu Inoue * may be used to endorse or promote products derived from this software 2182cd038dSYoshinobu Inoue * without specific prior written permission. 2282cd038dSYoshinobu Inoue * 2382cd038dSYoshinobu Inoue * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 2482cd038dSYoshinobu Inoue * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2582cd038dSYoshinobu Inoue * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2682cd038dSYoshinobu Inoue * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 2782cd038dSYoshinobu Inoue * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 2882cd038dSYoshinobu Inoue * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 2982cd038dSYoshinobu Inoue * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 3082cd038dSYoshinobu Inoue * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 3182cd038dSYoshinobu Inoue * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 3282cd038dSYoshinobu Inoue * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 3382cd038dSYoshinobu Inoue * SUCH DAMAGE. 3482cd038dSYoshinobu Inoue * 35b48287a3SDavid E. O'Brien * $KAME: in6_pcb.c,v 1.31 2001/05/21 05:45:10 jinmei Exp $ 3682cd038dSYoshinobu Inoue */ 3782cd038dSYoshinobu Inoue 38caf43b02SWarner Losh /*- 3982cd038dSYoshinobu Inoue * Copyright (c) 1982, 1986, 1991, 1993 4082cd038dSYoshinobu Inoue * The Regents of the University of California. All rights reserved. 4182cd038dSYoshinobu Inoue * 4282cd038dSYoshinobu Inoue * Redistribution and use in source and binary forms, with or without 4382cd038dSYoshinobu Inoue * modification, are permitted provided that the following conditions 4482cd038dSYoshinobu Inoue * are met: 4582cd038dSYoshinobu Inoue * 1. Redistributions of source code must retain the above copyright 4682cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer. 4782cd038dSYoshinobu Inoue * 2. Redistributions in binary form must reproduce the above copyright 4882cd038dSYoshinobu Inoue * notice, this list of conditions and the following disclaimer in the 4982cd038dSYoshinobu Inoue * documentation and/or other materials provided with the distribution. 50fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 5182cd038dSYoshinobu Inoue * may be used to endorse or promote products derived from this software 5282cd038dSYoshinobu Inoue * without specific prior written permission. 5382cd038dSYoshinobu Inoue * 5482cd038dSYoshinobu Inoue * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 5582cd038dSYoshinobu Inoue * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 5682cd038dSYoshinobu Inoue * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 5782cd038dSYoshinobu Inoue * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 5882cd038dSYoshinobu Inoue * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 5982cd038dSYoshinobu Inoue * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 6082cd038dSYoshinobu Inoue * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 6182cd038dSYoshinobu Inoue * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 6282cd038dSYoshinobu Inoue * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 6382cd038dSYoshinobu Inoue * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 6482cd038dSYoshinobu Inoue * SUCH DAMAGE. 6582cd038dSYoshinobu Inoue */ 6682cd038dSYoshinobu Inoue 67b48287a3SDavid E. O'Brien #include <sys/cdefs.h> 6833841545SHajimu UMEMOTO #include "opt_inet.h" 6933841545SHajimu UMEMOTO #include "opt_inet6.h" 706a800098SYoshinobu Inoue #include "opt_ipsec.h" 710c325f53SAlexander V. Chernikov #include "opt_route.h" 727527624eSRobert Watson #include "opt_rss.h" 7382cd038dSYoshinobu Inoue 74a0577692SGleb Smirnoff #include <sys/hash.h> 7582cd038dSYoshinobu Inoue #include <sys/param.h> 7682cd038dSYoshinobu Inoue #include <sys/systm.h> 7782cd038dSYoshinobu Inoue #include <sys/malloc.h> 7882cd038dSYoshinobu Inoue #include <sys/mbuf.h> 79fb59c426SYoshinobu Inoue #include <sys/domain.h> 80fdb987beSMark Johnston #include <sys/proc.h> 8182cd038dSYoshinobu Inoue #include <sys/protosw.h> 82fdb987beSMark Johnston #include <sys/smr.h> 8382cd038dSYoshinobu Inoue #include <sys/socket.h> 8482cd038dSYoshinobu Inoue #include <sys/socketvar.h> 8582cd038dSYoshinobu Inoue #include <sys/sockio.h> 8682cd038dSYoshinobu Inoue #include <sys/errno.h> 8782cd038dSYoshinobu Inoue #include <sys/time.h> 88acd3428bSRobert Watson #include <sys/priv.h> 8982cd038dSYoshinobu Inoue #include <sys/proc.h> 9082cd038dSYoshinobu Inoue #include <sys/jail.h> 9182cd038dSYoshinobu Inoue 9294540027SJeff Roberson #include <vm/uma.h> 9382cd038dSYoshinobu Inoue 9482cd038dSYoshinobu Inoue #include <net/if.h> 9576039bc8SGleb Smirnoff #include <net/if_var.h> 966d768226SGeorge V. Neville-Neil #include <net/if_llatbl.h> 9782cd038dSYoshinobu Inoue #include <net/if_types.h> 9882cd038dSYoshinobu Inoue #include <net/route.h> 99983066f0SAlexander V. Chernikov #include <net/route/nhop.h> 10082cd038dSYoshinobu Inoue 10182cd038dSYoshinobu Inoue #include <netinet/in.h> 10282cd038dSYoshinobu Inoue #include <netinet/in_var.h> 10382cd038dSYoshinobu Inoue #include <netinet/in_systm.h> 104686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h> 105fb59c426SYoshinobu Inoue #include <netinet/ip_var.h> 106ac957cd2SJulian Elischer 10782cd038dSYoshinobu Inoue #include <netinet6/ip6_var.h> 10882cd038dSYoshinobu Inoue #include <netinet6/nd6.h> 10982cd038dSYoshinobu Inoue #include <netinet/in_pcb.h> 1100f617ae4SGleb Smirnoff #include <netinet/in_pcb_var.h> 11182cd038dSYoshinobu Inoue #include <netinet6/in6_pcb.h> 112983066f0SAlexander V. Chernikov #include <netinet6/in6_fib.h> 113a1f7e5f8SHajimu UMEMOTO #include <netinet6/scope6_var.h> 11482cd038dSYoshinobu Inoue 11582cd038dSYoshinobu Inoue int 116147f018aSGleb Smirnoff in6_pcbsetport(struct in6_addr *laddr, struct inpcb *inp, struct ucred *cred) 117147f018aSGleb Smirnoff { 118147f018aSGleb Smirnoff struct socket *so = inp->inp_socket; 119147f018aSGleb Smirnoff u_int16_t lport = 0; 120147f018aSGleb Smirnoff int error, lookupflags = 0; 121147f018aSGleb Smirnoff #ifdef INVARIANTS 122147f018aSGleb Smirnoff struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 123147f018aSGleb Smirnoff #endif 124147f018aSGleb Smirnoff 125147f018aSGleb Smirnoff INP_WLOCK_ASSERT(inp); 126147f018aSGleb Smirnoff INP_HASH_WLOCK_ASSERT(pcbinfo); 127147f018aSGleb Smirnoff 128147f018aSGleb Smirnoff error = prison_local_ip6(cred, laddr, 129147f018aSGleb Smirnoff ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0)); 130147f018aSGleb Smirnoff if (error) 131147f018aSGleb Smirnoff return(error); 132147f018aSGleb Smirnoff 133147f018aSGleb Smirnoff /* XXX: this is redundant when called from in6_pcbbind */ 134147f018aSGleb Smirnoff if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT|SO_REUSEPORT_LB)) == 0) 135147f018aSGleb Smirnoff lookupflags = INPLOOKUP_WILDCARD; 136147f018aSGleb Smirnoff 137147f018aSGleb Smirnoff inp->inp_flags |= INP_ANONPORT; 138147f018aSGleb Smirnoff 139147f018aSGleb Smirnoff error = in_pcb_lport(inp, NULL, &lport, cred, lookupflags); 140147f018aSGleb Smirnoff if (error != 0) 141147f018aSGleb Smirnoff return (error); 142147f018aSGleb Smirnoff 143147f018aSGleb Smirnoff inp->inp_lport = lport; 144147f018aSGleb Smirnoff if (in_pcbinshash(inp) != 0) { 145147f018aSGleb Smirnoff inp->in6p_laddr = in6addr_any; 146147f018aSGleb Smirnoff inp->inp_lport = 0; 147147f018aSGleb Smirnoff return (EAGAIN); 148147f018aSGleb Smirnoff } 149147f018aSGleb Smirnoff 150147f018aSGleb Smirnoff return (0); 151147f018aSGleb Smirnoff } 152147f018aSGleb Smirnoff 153147f018aSGleb Smirnoff int 15496871af0SGleb Smirnoff in6_pcbbind(struct inpcb *inp, struct sockaddr_in6 *sin6, struct ucred *cred) 15582cd038dSYoshinobu Inoue { 15682cd038dSYoshinobu Inoue struct socket *so = inp->inp_socket; 15782cd038dSYoshinobu Inoue struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 15882cd038dSYoshinobu Inoue u_short lport = 0; 15968e0d7e0SRobert Watson int error, lookupflags = 0; 16068e0d7e0SRobert Watson int reuseport = (so->so_options & SO_REUSEPORT); 16182cd038dSYoshinobu Inoue 1621a43cff9SSean Bruno /* 1631a43cff9SSean Bruno * XXX: Maybe we could let SO_REUSEPORT_LB set SO_REUSEPORT bit here 1641a43cff9SSean Bruno * so that we don't have to add to the (already messy) code below. 1651a43cff9SSean Bruno */ 1661a43cff9SSean Bruno int reuseport_lb = (so->so_options & SO_REUSEPORT_LB); 1671a43cff9SSean Bruno 1688501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 169fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(pcbinfo); 17007385abdSRobert Watson 17182cd038dSYoshinobu Inoue if (inp->inp_lport || !IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 17282cd038dSYoshinobu Inoue return (EINVAL); 1731a43cff9SSean Bruno if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT|SO_REUSEPORT_LB)) == 0) 17468e0d7e0SRobert Watson lookupflags = INPLOOKUP_WILDCARD; 17596871af0SGleb Smirnoff if (sin6 == NULL) { 1767c2f3cb9SJamie Gritton if ((error = prison_local_ip6(cred, &inp->in6p_laddr, 1777c2f3cb9SJamie Gritton ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0))) != 0) 1787c2f3cb9SJamie Gritton return (error); 1797c2f3cb9SJamie Gritton } else { 180f161d294SMark Johnston KASSERT(sin6->sin6_family == AF_INET6, 181f161d294SMark Johnston ("%s: invalid address family for %p", __func__, sin6)); 182f161d294SMark Johnston KASSERT(sin6->sin6_len == sizeof(*sin6), 183f161d294SMark Johnston ("%s: invalid address length for %p", __func__, sin6)); 18482cd038dSYoshinobu Inoue 185603724d3SBjoern A. Zeeb if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0) 186a1f7e5f8SHajimu UMEMOTO return(error); 18782cd038dSYoshinobu Inoue 188b89e82ddSJamie Gritton if ((error = prison_local_ip6(cred, &sin6->sin6_addr, 189b89e82ddSJamie Gritton ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0))) != 0) 190b89e82ddSJamie Gritton return (error); 191413628a7SBjoern A. Zeeb 19282cd038dSYoshinobu Inoue lport = sin6->sin6_port; 19382cd038dSYoshinobu Inoue if (IN6_IS_ADDR_MULTICAST(&sin6->sin6_addr)) { 19482cd038dSYoshinobu Inoue /* 19582cd038dSYoshinobu Inoue * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 19682cd038dSYoshinobu Inoue * allow compepte duplication of binding if 19782cd038dSYoshinobu Inoue * SO_REUSEPORT is set, or if SO_REUSEADDR is set 19882cd038dSYoshinobu Inoue * and a multicast address is bound on both 19982cd038dSYoshinobu Inoue * new and duplicated sockets. 20082cd038dSYoshinobu Inoue */ 201f122b319SMikolaj Golub if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) != 0) 20282cd038dSYoshinobu Inoue reuseport = SO_REUSEADDR|SO_REUSEPORT; 2031a43cff9SSean Bruno /* 2041a43cff9SSean Bruno * XXX: How to deal with SO_REUSEPORT_LB here? 2051a43cff9SSean Bruno * Treat same as SO_REUSEPORT for now. 2061a43cff9SSean Bruno */ 2071a43cff9SSean Bruno if ((so->so_options & 2081a43cff9SSean Bruno (SO_REUSEADDR|SO_REUSEPORT_LB)) != 0) 2091a43cff9SSean Bruno reuseport_lb = SO_REUSEADDR|SO_REUSEPORT_LB; 21082cd038dSYoshinobu Inoue } else if (!IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 211a68cc388SGleb Smirnoff struct epoch_tracker et; 2128c0fec80SRobert Watson struct ifaddr *ifa; 21382cd038dSYoshinobu Inoue 21482cd038dSYoshinobu Inoue sin6->sin6_port = 0; /* yech... */ 215a68cc388SGleb Smirnoff NET_EPOCH_ENTER(et); 2168c0fec80SRobert Watson if ((ifa = ifa_ifwithaddr((struct sockaddr *)sin6)) == 2178c0fec80SRobert Watson NULL && 218f44270e7SPawel Jakub Dawidek (inp->inp_flags & INP_BINDANY) == 0) { 219a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 22082cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 221f44270e7SPawel Jakub Dawidek } 22282cd038dSYoshinobu Inoue 22382cd038dSYoshinobu Inoue /* 22482cd038dSYoshinobu Inoue * XXX: bind to an anycast address might accidentally 22582cd038dSYoshinobu Inoue * cause sending a packet with anycast source address. 22633841545SHajimu UMEMOTO * We should allow to bind to a deprecated address, since 2277efe5d92SHajimu UMEMOTO * the application dares to use it. 22882cd038dSYoshinobu Inoue */ 2298c0fec80SRobert Watson if (ifa != NULL && 2308c0fec80SRobert Watson ((struct in6_ifaddr *)ifa)->ia6_flags & 23133841545SHajimu UMEMOTO (IN6_IFF_ANYCAST|IN6_IFF_NOTREADY|IN6_IFF_DETACHED)) { 232a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 23382cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 23482cd038dSYoshinobu Inoue } 235a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 23682cd038dSYoshinobu Inoue } 23782cd038dSYoshinobu Inoue if (lport) { 23882cd038dSYoshinobu Inoue struct inpcb *t; 23982cd038dSYoshinobu Inoue 24082cd038dSYoshinobu Inoue /* GROSS */ 241603724d3SBjoern A. Zeeb if (ntohs(lport) <= V_ipport_reservedhigh && 242603724d3SBjoern A. Zeeb ntohs(lport) >= V_ipport_reservedlow && 243cc426dd3SMateusz Guzik priv_check_cred(cred, PRIV_NETINET_RESERVEDPORT)) 24482cd038dSYoshinobu Inoue return (EACCES); 245835d4b89SPawel Jakub Dawidek if (!IN6_IS_ADDR_MULTICAST(&sin6->sin6_addr) && 246cc426dd3SMateusz Guzik priv_check_cred(inp->inp_cred, PRIV_NETINET_REUSEPORT) != 0) { 247fb59c426SYoshinobu Inoue t = in6_pcblookup_local(pcbinfo, 24882cd038dSYoshinobu Inoue &sin6->sin6_addr, lport, 249078b7042SBjoern A. Zeeb INPLOOKUP_WILDCARD, cred); 2503aff4ccdSMark Johnston if (t != NULL && 251f66145c6SYaroslav Tykhiy (so->so_type != SOCK_STREAM || 252f66145c6SYaroslav Tykhiy IN6_IS_ADDR_UNSPECIFIED(&t->in6p_faddr)) && 2534cc20ab1SSeigo Tanimura (!IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr) || 25482cd038dSYoshinobu Inoue !IN6_IS_ADDR_UNSPECIFIED(&t->in6p_laddr) || 255e3ba0d6aSGleb Smirnoff (t->inp_socket->so_options & SO_REUSEPORT) || 256e3ba0d6aSGleb Smirnoff (t->inp_socket->so_options & SO_REUSEPORT_LB) == 0) && 257fc06cd42SMikolaj Golub (inp->inp_cred->cr_uid != 25886d02c5cSBjoern A. Zeeb t->inp_cred->cr_uid)) 25982cd038dSYoshinobu Inoue return (EADDRINUSE); 260c7c0d948SAdrian Chadd 26167107f45SBjoern A. Zeeb #ifdef INET 26233841545SHajimu UMEMOTO if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 263fb59c426SYoshinobu Inoue IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 264fb59c426SYoshinobu Inoue struct sockaddr_in sin; 265fb59c426SYoshinobu Inoue 266fb59c426SYoshinobu Inoue in6_sin6_2_sin(&sin, sin6); 267fb59c426SYoshinobu Inoue t = in_pcblookup_local(pcbinfo, 268fb59c426SYoshinobu Inoue sin.sin_addr, lport, 269078b7042SBjoern A. Zeeb INPLOOKUP_WILDCARD, cred); 2703aff4ccdSMark Johnston if (t != NULL && 271f66145c6SYaroslav Tykhiy (so->so_type != SOCK_STREAM || 272f66145c6SYaroslav Tykhiy ntohl(t->inp_faddr.s_addr) == 273f66145c6SYaroslav Tykhiy INADDR_ANY) && 27486d02c5cSBjoern A. Zeeb (inp->inp_cred->cr_uid != 27586d02c5cSBjoern A. Zeeb t->inp_cred->cr_uid)) 276fb59c426SYoshinobu Inoue return (EADDRINUSE); 277fb59c426SYoshinobu Inoue } 27867107f45SBjoern A. Zeeb #endif 27982cd038dSYoshinobu Inoue } 28082cd038dSYoshinobu Inoue t = in6_pcblookup_local(pcbinfo, &sin6->sin6_addr, 28168e0d7e0SRobert Watson lport, lookupflags, cred); 282e3ba0d6aSGleb Smirnoff if (t && (reuseport & t->inp_socket->so_options) == 0 && 283e3ba0d6aSGleb Smirnoff (reuseport_lb & t->inp_socket->so_options) == 0) { 28429381b36SMikolaj Golub return (EADDRINUSE); 28529381b36SMikolaj Golub } 28667107f45SBjoern A. Zeeb #ifdef INET 28733841545SHajimu UMEMOTO if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 288fb59c426SYoshinobu Inoue IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 289fb59c426SYoshinobu Inoue struct sockaddr_in sin; 290fb59c426SYoshinobu Inoue 291fb59c426SYoshinobu Inoue in6_sin6_2_sin(&sin, sin6); 292fb59c426SYoshinobu Inoue t = in_pcblookup_local(pcbinfo, sin.sin_addr, 29368e0d7e0SRobert Watson lport, lookupflags, cred); 2940d744519SGleb Smirnoff if (t && 295e3ba0d6aSGleb Smirnoff (reuseport & t->inp_socket->so_options) == 0 && 296e3ba0d6aSGleb Smirnoff (reuseport_lb & t->inp_socket->so_options) == 0 && 297fc06cd42SMikolaj Golub (ntohl(t->inp_laddr.s_addr) != INADDR_ANY || 2981a43cff9SSean Bruno (t->inp_vflag & INP_IPV6PROTO) != 0)) { 299fb59c426SYoshinobu Inoue return (EADDRINUSE); 300fb59c426SYoshinobu Inoue } 3011a43cff9SSean Bruno } 30267107f45SBjoern A. Zeeb #endif 30382cd038dSYoshinobu Inoue } 30482cd038dSYoshinobu Inoue inp->in6p_laddr = sin6->sin6_addr; 30582cd038dSYoshinobu Inoue } 30682cd038dSYoshinobu Inoue if (lport == 0) { 3074616026fSErmal Luçi if ((error = in6_pcbsetport(&inp->in6p_laddr, inp, cred)) != 0) { 3084a2b2562SBjoern A. Zeeb /* Undo an address bind that may have occurred. */ 3094a2b2562SBjoern A. Zeeb inp->in6p_laddr = in6addr_any; 310b89e82ddSJamie Gritton return (error); 3114a2b2562SBjoern A. Zeeb } 31255fd3bafSBjoern A. Zeeb } else { 31382cd038dSYoshinobu Inoue inp->inp_lport = lport; 31482cd038dSYoshinobu Inoue if (in_pcbinshash(inp) != 0) { 31582cd038dSYoshinobu Inoue inp->in6p_laddr = in6addr_any; 31682cd038dSYoshinobu Inoue inp->inp_lport = 0; 31782cd038dSYoshinobu Inoue return (EAGAIN); 31882cd038dSYoshinobu Inoue } 319686cdd19SJun-ichiro itojun Hagino } 32082cd038dSYoshinobu Inoue return (0); 32182cd038dSYoshinobu Inoue } 32282cd038dSYoshinobu Inoue 32382cd038dSYoshinobu Inoue /* 32482cd038dSYoshinobu Inoue * Transform old in6_pcbconnect() into an inner subroutine for new 32582cd038dSYoshinobu Inoue * in6_pcbconnect(): Do some validity-checking on the remote 32682cd038dSYoshinobu Inoue * address (in mbuf 'nam') and then determine local host address 32782cd038dSYoshinobu Inoue * (i.e., which interface) to use to access that remote host. 32882cd038dSYoshinobu Inoue * 32982cd038dSYoshinobu Inoue * This preserves definition of in6_pcbconnect(), while supporting a 33082cd038dSYoshinobu Inoue * slightly different version for T/TCP. (This is more than 33182cd038dSYoshinobu Inoue * a bit of a kludge, but cleaning up the internal interfaces would 33282cd038dSYoshinobu Inoue * have forced minor changes in every protocol). 33382cd038dSYoshinobu Inoue */ 334a7e201bbSAndrey V. Elsukov static int 335f161d294SMark Johnston in6_pcbladdr(struct inpcb *inp, struct sockaddr_in6 *sin6, 3360bf5377bSAndrey V. Elsukov struct in6_addr *plocal_addr6, bool sas_required) 33782cd038dSYoshinobu Inoue { 33882cd038dSYoshinobu Inoue int error = 0; 339a1f7e5f8SHajimu UMEMOTO int scope_ambiguous = 0; 34088d166bfSBjoern A. Zeeb struct in6_addr in6a; 34182cd038dSYoshinobu Inoue 3423d76be28SGleb Smirnoff NET_EPOCH_ASSERT(); 3438501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 344fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); /* XXXRW: why? */ 3458deea4a8SRobert Watson 34682cd038dSYoshinobu Inoue if (sin6->sin6_port == 0) 34782cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 34882cd038dSYoshinobu Inoue 349603724d3SBjoern A. Zeeb if (sin6->sin6_scope_id == 0 && !V_ip6_use_defzone) 350a1f7e5f8SHajimu UMEMOTO scope_ambiguous = 1; 351603724d3SBjoern A. Zeeb if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0) 352a1f7e5f8SHajimu UMEMOTO return(error); 353a1f7e5f8SHajimu UMEMOTO 354d7c5a620SMatt Macy if (!CK_STAILQ_EMPTY(&V_in6_ifaddrhead)) { 35582cd038dSYoshinobu Inoue /* 35682cd038dSYoshinobu Inoue * If the destination address is UNSPECIFIED addr, 35782cd038dSYoshinobu Inoue * use the loopback addr, e.g ::1. 35882cd038dSYoshinobu Inoue */ 35982cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) 36082cd038dSYoshinobu Inoue sin6->sin6_addr = in6addr_loopback; 36182cd038dSYoshinobu Inoue } 362b89e82ddSJamie Gritton if ((error = prison_remote_ip6(inp->inp_cred, &sin6->sin6_addr)) != 0) 363b89e82ddSJamie Gritton return (error); 364a1f7e5f8SHajimu UMEMOTO 3650bf5377bSAndrey V. Elsukov if (sas_required) { 366601c0b8bSAlexander V. Chernikov error = in6_selectsrc_socket(sin6, inp->in6p_outputopts, 367601c0b8bSAlexander V. Chernikov inp, inp->inp_cred, scope_ambiguous, &in6a, NULL); 36888d166bfSBjoern A. Zeeb if (error) 36988d166bfSBjoern A. Zeeb return (error); 3700bf5377bSAndrey V. Elsukov } else { 3710bf5377bSAndrey V. Elsukov /* 3720bf5377bSAndrey V. Elsukov * Source address selection isn't required when syncache 3730bf5377bSAndrey V. Elsukov * has already established connection and both source and 3740bf5377bSAndrey V. Elsukov * destination addresses was chosen. 3750bf5377bSAndrey V. Elsukov * 3760bf5377bSAndrey V. Elsukov * This also includes the case when fwd_tag was used to 3770bf5377bSAndrey V. Elsukov * select source address in tcp_input(). 3780bf5377bSAndrey V. Elsukov */ 3790bf5377bSAndrey V. Elsukov in6a = inp->in6p_laddr; 3800bf5377bSAndrey V. Elsukov } 3810bf5377bSAndrey V. Elsukov 382713264f6SMark Johnston if (IN6_IS_ADDR_UNSPECIFIED(&in6a)) 383713264f6SMark Johnston return (EHOSTUNREACH); 38488d166bfSBjoern A. Zeeb /* 38588d166bfSBjoern A. Zeeb * Do not update this earlier, in case we return with an error. 38688d166bfSBjoern A. Zeeb * 387601c0b8bSAlexander V. Chernikov * XXX: this in6_selectsrc_socket result might replace the bound local 388681ffdf9SBjoern A. Zeeb * address with the address specified by setsockopt(IPV6_PKTINFO). 38988d166bfSBjoern A. Zeeb * Is it the intended behavior? 39088d166bfSBjoern A. Zeeb */ 39188d166bfSBjoern A. Zeeb *plocal_addr6 = in6a; 39288d166bfSBjoern A. Zeeb 39382cd038dSYoshinobu Inoue /* 39482cd038dSYoshinobu Inoue * Don't do pcblookup call here; return interface in 39582cd038dSYoshinobu Inoue * plocal_addr6 39682cd038dSYoshinobu Inoue * and exit to caller, that will do the lookup. 39782cd038dSYoshinobu Inoue */ 398a1f7e5f8SHajimu UMEMOTO 39982cd038dSYoshinobu Inoue return (0); 40082cd038dSYoshinobu Inoue } 40182cd038dSYoshinobu Inoue 40282cd038dSYoshinobu Inoue /* 40382cd038dSYoshinobu Inoue * Outer subroutine: 40482cd038dSYoshinobu Inoue * Connect from a socket to a specified address. 40582cd038dSYoshinobu Inoue * Both address and port must be specified in argument sin. 40682cd038dSYoshinobu Inoue * If don't have a local address for this socket yet, 40782cd038dSYoshinobu Inoue * then pick one. 40882cd038dSYoshinobu Inoue */ 40982cd038dSYoshinobu Inoue int 410a9d22cceSGleb Smirnoff in6_pcbconnect(struct inpcb *inp, struct sockaddr_in6 *sin6, struct ucred *cred, 4110bf5377bSAndrey V. Elsukov bool sas_required) 41282cd038dSYoshinobu Inoue { 413fa046d87SRobert Watson struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 41425102351SMike Karels struct sockaddr_in6 laddr6; 41582cd038dSYoshinobu Inoue int error; 41682cd038dSYoshinobu Inoue 4173d76be28SGleb Smirnoff NET_EPOCH_ASSERT(); 4183d76be28SGleb Smirnoff INP_WLOCK_ASSERT(inp); 4193d76be28SGleb Smirnoff INP_HASH_WLOCK_ASSERT(pcbinfo); 420f161d294SMark Johnston KASSERT(sin6->sin6_family == AF_INET6, 421f161d294SMark Johnston ("%s: invalid address family for %p", __func__, sin6)); 422f161d294SMark Johnston KASSERT(sin6->sin6_len == sizeof(*sin6), 423f161d294SMark Johnston ("%s: invalid address length for %p", __func__, sin6)); 424fdb987beSMark Johnston KASSERT(IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr), 425fdb987beSMark Johnston ("%s: inp is already connected", __func__)); 426f161d294SMark Johnston 42725102351SMike Karels bzero(&laddr6, sizeof(laddr6)); 42825102351SMike Karels laddr6.sin6_family = AF_INET6; 42925102351SMike Karels 4300c325f53SAlexander V. Chernikov #ifdef ROUTE_MPATH 4310c325f53SAlexander V. Chernikov if (CALC_FLOWID_OUTBOUND) { 4320c325f53SAlexander V. Chernikov uint32_t hash_type, hash_val; 4330c325f53SAlexander V. Chernikov 4340c325f53SAlexander V. Chernikov hash_val = fib6_calc_software_hash(&inp->in6p_laddr, 4350c325f53SAlexander V. Chernikov &sin6->sin6_addr, 0, sin6->sin6_port, 4360c325f53SAlexander V. Chernikov inp->inp_socket->so_proto->pr_protocol, &hash_type); 4370c325f53SAlexander V. Chernikov inp->inp_flowid = hash_val; 4380c325f53SAlexander V. Chernikov inp->inp_flowtype = hash_type; 4390c325f53SAlexander V. Chernikov } 4400c325f53SAlexander V. Chernikov #endif 44182cd038dSYoshinobu Inoue /* 44282cd038dSYoshinobu Inoue * Call inner routine, to assign local interface address. 44388ff5695SSUZUKI Shinsuke * in6_pcbladdr() may automatically fill in sin6_scope_id. 44482cd038dSYoshinobu Inoue */ 4450bf5377bSAndrey V. Elsukov if ((error = in6_pcbladdr(inp, sin6, &laddr6.sin6_addr, 4460bf5377bSAndrey V. Elsukov sas_required)) != 0) 44782cd038dSYoshinobu Inoue return (error); 44882cd038dSYoshinobu Inoue 449fa046d87SRobert Watson if (in6_pcblookup_hash_locked(pcbinfo, &sin6->sin6_addr, 4504130ea61SMark Johnston sin6->sin6_port, IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) ? 4514130ea61SMark Johnston &laddr6.sin6_addr : &inp->in6p_laddr, inp->inp_lport, 0, 4524130ea61SMark Johnston M_NODOM) != NULL) 45382cd038dSYoshinobu Inoue return (EADDRINUSE); 45482cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) { 45582cd038dSYoshinobu Inoue if (inp->inp_lport == 0) { 45625102351SMike Karels error = in_pcb_lport_dest(inp, 45725102351SMike Karels (struct sockaddr *) &laddr6, &inp->inp_lport, 458440598ddSJonathan T. Looney (struct sockaddr *) sin6, sin6->sin6_port, cred, 459440598ddSJonathan T. Looney INPLOOKUP_WILDCARD); 4604616026fSErmal Luçi if (error) 46182cd038dSYoshinobu Inoue return (error); 46282cd038dSYoshinobu Inoue } 46325102351SMike Karels inp->in6p_laddr = laddr6.sin6_addr; 46482cd038dSYoshinobu Inoue } 46582cd038dSYoshinobu Inoue inp->in6p_faddr = sin6->sin6_addr; 46682cd038dSYoshinobu Inoue inp->inp_fport = sin6->sin6_port; 46733841545SHajimu UMEMOTO /* update flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 468fc384fa5SBjoern A. Zeeb inp->inp_flow &= ~IPV6_FLOWLABEL_MASK; 469fc384fa5SBjoern A. Zeeb if (inp->inp_flags & IN6P_AUTOFLOWLABEL) 470fc384fa5SBjoern A. Zeeb inp->inp_flow |= 471b79274baSHajimu UMEMOTO (htonl(ip6_randomflowlabel()) & IPV6_FLOWLABEL_MASK); 47282cd038dSYoshinobu Inoue 473fdb987beSMark Johnston if ((inp->inp_flags & INP_INHASHLIST) != 0) { 474db0ac6deSCy Schubert in_pcbrehash(inp); 475fe1274eeSMichael Tuexen } else { 476db0ac6deSCy Schubert in_pcbinshash(inp); 477fe1274eeSMichael Tuexen } 4782cb64cb2SGeorge V. Neville-Neil 47982cd038dSYoshinobu Inoue return (0); 48082cd038dSYoshinobu Inoue } 48182cd038dSYoshinobu Inoue 48282cd038dSYoshinobu Inoue void 4831272577eSXin LI in6_pcbdisconnect(struct inpcb *inp) 48482cd038dSYoshinobu Inoue { 48507385abdSRobert Watson 4868501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 487fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); 488fdb987beSMark Johnston KASSERT(inp->inp_smr == SMR_SEQ_INVALID, 489fdb987beSMark Johnston ("%s: inp %p was already disconnected", __func__, inp)); 49007385abdSRobert Watson 491fdb987beSMark Johnston in_pcbremhash_locked(inp); 492fdb987beSMark Johnston 493fdb987beSMark Johnston /* See the comment in in_pcbinshash(). */ 494fdb987beSMark Johnston inp->inp_smr = smr_advance(inp->inp_pcbinfo->ipi_smr); 495fdb987beSMark Johnston 496fdb987beSMark Johnston /* XXX-MJ torn writes are visible to SMR lookup */ 4972589ec0fSMark Johnston memset(&inp->in6p_laddr, 0, sizeof(inp->in6p_laddr)); 4982589ec0fSMark Johnston memset(&inp->in6p_faddr, 0, sizeof(inp->in6p_faddr)); 49982cd038dSYoshinobu Inoue inp->inp_fport = 0; 50033841545SHajimu UMEMOTO /* clear flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 501fc384fa5SBjoern A. Zeeb inp->inp_flow &= ~IPV6_FLOWLABEL_MASK; 50282cd038dSYoshinobu Inoue } 50382cd038dSYoshinobu Inoue 50482cd038dSYoshinobu Inoue int 505*0fac350cSGleb Smirnoff in6_getsockaddr(struct socket *so, struct sockaddr *sa) 50682cd038dSYoshinobu Inoue { 5073e85b721SEd Maste struct inpcb *inp; 50882cd038dSYoshinobu Inoue 50982cd038dSYoshinobu Inoue inp = sotoinpcb(so); 51054d642bbSRobert Watson KASSERT(inp != NULL, ("in6_getsockaddr: inp == NULL")); 51148477723SRobert Watson 512*0fac350cSGleb Smirnoff *(struct sockaddr_in6 *)sa = (struct sockaddr_in6 ){ 513*0fac350cSGleb Smirnoff .sin6_len = sizeof(struct sockaddr_in6), 514*0fac350cSGleb Smirnoff .sin6_family = AF_INET6, 515*0fac350cSGleb Smirnoff .sin6_port = inp->inp_lport, 516*0fac350cSGleb Smirnoff .sin6_addr = inp->in6p_laddr, 517*0fac350cSGleb Smirnoff }; 518*0fac350cSGleb Smirnoff /* XXX: should catch errors */ 519*0fac350cSGleb Smirnoff (void)sa6_recoverscope((struct sockaddr_in6 *)sa); 52082cd038dSYoshinobu Inoue 521*0fac350cSGleb Smirnoff return (0); 52282cd038dSYoshinobu Inoue } 52382cd038dSYoshinobu Inoue 52482cd038dSYoshinobu Inoue int 525*0fac350cSGleb Smirnoff in6_getpeeraddr(struct socket *so, struct sockaddr *sa) 52682cd038dSYoshinobu Inoue { 52782cd038dSYoshinobu Inoue struct inpcb *inp; 52882cd038dSYoshinobu Inoue 52982cd038dSYoshinobu Inoue inp = sotoinpcb(so); 53054d642bbSRobert Watson KASSERT(inp != NULL, ("in6_getpeeraddr: inp == NULL")); 53148477723SRobert Watson 532*0fac350cSGleb Smirnoff *(struct sockaddr_in6 *)sa = (struct sockaddr_in6 ){ 533*0fac350cSGleb Smirnoff .sin6_len = sizeof(struct sockaddr_in6), 534*0fac350cSGleb Smirnoff .sin6_family = AF_INET6, 535*0fac350cSGleb Smirnoff .sin6_port = inp->inp_fport, 536*0fac350cSGleb Smirnoff .sin6_addr = inp->in6p_faddr, 537*0fac350cSGleb Smirnoff }; 538*0fac350cSGleb Smirnoff /* XXX: should catch errors */ 539*0fac350cSGleb Smirnoff (void)sa6_recoverscope((struct sockaddr_in6 *)sa); 54082cd038dSYoshinobu Inoue 541*0fac350cSGleb Smirnoff return (0); 54282cd038dSYoshinobu Inoue } 54382cd038dSYoshinobu Inoue 54482cd038dSYoshinobu Inoue int 545*0fac350cSGleb Smirnoff in6_mapped_sockaddr(struct socket *so, struct sockaddr *sa) 54682cd038dSYoshinobu Inoue { 54748477723SRobert Watson struct inpcb *inp; 54882cd038dSYoshinobu Inoue int error; 54982cd038dSYoshinobu Inoue 55048477723SRobert Watson inp = sotoinpcb(so); 55148477723SRobert Watson KASSERT(inp != NULL, ("in6_mapped_sockaddr: inp == NULL")); 55248477723SRobert Watson 55367107f45SBjoern A. Zeeb #ifdef INET 5545fac4178SHajimu UMEMOTO if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 555*0fac350cSGleb Smirnoff struct sockaddr_in sin; 556*0fac350cSGleb Smirnoff 557*0fac350cSGleb Smirnoff error = in_getsockaddr(so, (struct sockaddr *)&sin); 558369dc8ceSEivind Eklund if (error == 0) 559*0fac350cSGleb Smirnoff in6_sin_2_v4mapsin6(&sin, (struct sockaddr_in6 *)sa); 56067107f45SBjoern A. Zeeb } else 56167107f45SBjoern A. Zeeb #endif 56267107f45SBjoern A. Zeeb { 56354d642bbSRobert Watson /* scope issues will be handled in in6_getsockaddr(). */ 564*0fac350cSGleb Smirnoff error = in6_getsockaddr(so, sa); 5657efe5d92SHajimu UMEMOTO } 56682cd038dSYoshinobu Inoue 56782cd038dSYoshinobu Inoue return error; 56882cd038dSYoshinobu Inoue } 56982cd038dSYoshinobu Inoue 57082cd038dSYoshinobu Inoue int 571*0fac350cSGleb Smirnoff in6_mapped_peeraddr(struct socket *so, struct sockaddr *sa) 57282cd038dSYoshinobu Inoue { 57348477723SRobert Watson struct inpcb *inp; 57482cd038dSYoshinobu Inoue int error; 57582cd038dSYoshinobu Inoue 57648477723SRobert Watson inp = sotoinpcb(so); 57748477723SRobert Watson KASSERT(inp != NULL, ("in6_mapped_peeraddr: inp == NULL")); 57848477723SRobert Watson 57967107f45SBjoern A. Zeeb #ifdef INET 5805fac4178SHajimu UMEMOTO if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 581*0fac350cSGleb Smirnoff struct sockaddr_in sin; 582*0fac350cSGleb Smirnoff 583*0fac350cSGleb Smirnoff error = in_getpeeraddr(so, (struct sockaddr *)&sin); 584369dc8ceSEivind Eklund if (error == 0) 585*0fac350cSGleb Smirnoff in6_sin_2_v4mapsin6(&sin, (struct sockaddr_in6 *)sa); 58682cd038dSYoshinobu Inoue } else 58767107f45SBjoern A. Zeeb #endif 58854d642bbSRobert Watson /* scope issues will be handled in in6_getpeeraddr(). */ 589*0fac350cSGleb Smirnoff error = in6_getpeeraddr(so, sa); 59082cd038dSYoshinobu Inoue 59182cd038dSYoshinobu Inoue return error; 59282cd038dSYoshinobu Inoue } 59382cd038dSYoshinobu Inoue 59482cd038dSYoshinobu Inoue /* 59582cd038dSYoshinobu Inoue * Pass some notification to all connections of a protocol 59682cd038dSYoshinobu Inoue * associated with address dst. The local address and/or port numbers 59782cd038dSYoshinobu Inoue * may be specified to limit the search. The "usual action" will be 59882cd038dSYoshinobu Inoue * taken, depending on the ctlinput cmd. The caller must filter any 59982cd038dSYoshinobu Inoue * cmds that are uninteresting (e.g., no error in the map). 60082cd038dSYoshinobu Inoue * Call the protocol specific routine (if any) to report 60182cd038dSYoshinobu Inoue * any errors for each matching socket. 60282cd038dSYoshinobu Inoue */ 603db0ac6deSCy Schubert static bool 604db0ac6deSCy Schubert inp_match6(const struct inpcb *inp, void *v __unused) 605db0ac6deSCy Schubert { 606db0ac6deSCy Schubert 607db0ac6deSCy Schubert return ((inp->inp_vflag & INP_IPV6) != 0); 608db0ac6deSCy Schubert } 609fcb3f813SGleb Smirnoff 61082cd038dSYoshinobu Inoue void 61143d39ca7SGleb Smirnoff in6_pcbnotify(struct inpcbinfo *pcbinfo, struct sockaddr_in6 *sa6_dst, 61243d39ca7SGleb Smirnoff u_int fport_arg, const struct sockaddr_in6 *src, u_int lport_arg, 613fcb3f813SGleb Smirnoff int errno, void *cmdarg, 6149233d8f3SDavid E. O'Brien struct inpcb *(*notify)(struct inpcb *, int)) 61582cd038dSYoshinobu Inoue { 616db0ac6deSCy Schubert struct inpcb_iterator inpi = INP_ITERATOR(pcbinfo, INPLOOKUP_WLOCKPCB, 617db0ac6deSCy Schubert inp_match6, NULL); 618db0ac6deSCy Schubert struct inpcb *inp; 61943d39ca7SGleb Smirnoff struct sockaddr_in6 sa6_src; 62082cd038dSYoshinobu Inoue u_short fport = fport_arg, lport = lport_arg; 62133841545SHajimu UMEMOTO u_int32_t flowinfo; 62233841545SHajimu UMEMOTO 62333841545SHajimu UMEMOTO if (IN6_IS_ADDR_UNSPECIFIED(&sa6_dst->sin6_addr)) 62482cd038dSYoshinobu Inoue return; 62582cd038dSYoshinobu Inoue 62682cd038dSYoshinobu Inoue /* 62733841545SHajimu UMEMOTO * note that src can be NULL when we get notify by local fragmentation. 62833841545SHajimu UMEMOTO */ 62943d39ca7SGleb Smirnoff sa6_src = (src == NULL) ? sa6_any : *src; 63033841545SHajimu UMEMOTO flowinfo = sa6_src.sin6_flowinfo; 63133841545SHajimu UMEMOTO 632db0ac6deSCy Schubert while ((inp = inp_next(&inpi)) != NULL) { 633db0ac6deSCy Schubert INP_WLOCK_ASSERT(inp); 634686cdd19SJun-ichiro itojun Hagino /* 635efddf5c6SHajimu UMEMOTO * If the error designates a new path MTU for a destination 636efddf5c6SHajimu UMEMOTO * and the application (associated with this socket) wanted to 6378f1beb88SAndrey V. Elsukov * know the value, notify. 638efddf5c6SHajimu UMEMOTO * XXX: should we avoid to notify the value to TCP sockets? 639efddf5c6SHajimu UMEMOTO */ 640fcb3f813SGleb Smirnoff if (errno == EMSGSIZE && cmdarg != NULL) 64143d39ca7SGleb Smirnoff ip6_notify_pmtu(inp, sa6_dst, *(uint32_t *)cmdarg); 642efddf5c6SHajimu UMEMOTO 643efddf5c6SHajimu UMEMOTO /* 64433841545SHajimu UMEMOTO * Detect if we should notify the error. If no source and 64504389c85SGordon Bergling * destination ports are specified, but non-zero flowinfo and 64633841545SHajimu UMEMOTO * local address match, notify the error. This is the case 64733841545SHajimu UMEMOTO * when the error is delivered with an encrypted buffer 64833841545SHajimu UMEMOTO * by ESP. Otherwise, just compare addresses and ports 64933841545SHajimu UMEMOTO * as usual. 650686cdd19SJun-ichiro itojun Hagino */ 65133841545SHajimu UMEMOTO if (lport == 0 && fport == 0 && flowinfo && 65233841545SHajimu UMEMOTO inp->inp_socket != NULL && 653fc384fa5SBjoern A. Zeeb flowinfo == (inp->inp_flow & IPV6_FLOWLABEL_MASK) && 65433841545SHajimu UMEMOTO IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, &sa6_src.sin6_addr)) 65533841545SHajimu UMEMOTO goto do_notify; 65633841545SHajimu UMEMOTO else if (!IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, 65733841545SHajimu UMEMOTO &sa6_dst->sin6_addr) || 65882cd038dSYoshinobu Inoue inp->inp_socket == 0 || 65982cd038dSYoshinobu Inoue (lport && inp->inp_lport != lport) || 66033841545SHajimu UMEMOTO (!IN6_IS_ADDR_UNSPECIFIED(&sa6_src.sin6_addr) && 66133841545SHajimu UMEMOTO !IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, 66233841545SHajimu UMEMOTO &sa6_src.sin6_addr)) || 663f31f65a7SRobert Watson (fport && inp->inp_fport != fport)) { 66482cd038dSYoshinobu Inoue continue; 665f31f65a7SRobert Watson } 666686cdd19SJun-ichiro itojun Hagino 66733841545SHajimu UMEMOTO do_notify: 668db0ac6deSCy Schubert if (notify) 669db0ac6deSCy Schubert (*notify)(inp, errno); 67082cd038dSYoshinobu Inoue } 67182cd038dSYoshinobu Inoue } 67282cd038dSYoshinobu Inoue 67382cd038dSYoshinobu Inoue /* 674fa046d87SRobert Watson * Lookup a PCB based on the local address and port. Caller must hold the 675fa046d87SRobert Watson * hash lock. No inpcb locks or references are acquired. 67682cd038dSYoshinobu Inoue */ 67782cd038dSYoshinobu Inoue struct inpcb * 6781272577eSXin LI in6_pcblookup_local(struct inpcbinfo *pcbinfo, struct in6_addr *laddr, 67968e0d7e0SRobert Watson u_short lport, int lookupflags, struct ucred *cred) 68082cd038dSYoshinobu Inoue { 6813e85b721SEd Maste struct inpcb *inp; 68282cd038dSYoshinobu Inoue int matchwild = 3, wildcard; 68382cd038dSYoshinobu Inoue 68468e0d7e0SRobert Watson KASSERT((lookupflags & ~(INPLOOKUP_WILDCARD)) == 0, 68568e0d7e0SRobert Watson ("%s: invalid lookup flags %d", __func__, lookupflags)); 68668e0d7e0SRobert Watson 687c17cd08fSGleb Smirnoff INP_HASH_LOCK_ASSERT(pcbinfo); 6888deea4a8SRobert Watson 68968e0d7e0SRobert Watson if ((lookupflags & INPLOOKUP_WILDCARD) == 0) { 69082cd038dSYoshinobu Inoue struct inpcbhead *head; 69182cd038dSYoshinobu Inoue /* 69282cd038dSYoshinobu Inoue * Look for an unconnected (wildcard foreign addr) PCB that 69382cd038dSYoshinobu Inoue * matches the local address and port we're looking for. 69482cd038dSYoshinobu Inoue */ 695fdb987beSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 6961b44e5ffSAndrey V. Elsukov pcbinfo->ipi_hashmask)]; 697fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 698413628a7SBjoern A. Zeeb /* XXX inp locking */ 699369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV6) == 0) 70082cd038dSYoshinobu Inoue continue; 70182cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) && 70282cd038dSYoshinobu Inoue IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 70382cd038dSYoshinobu Inoue inp->inp_lport == lport) { 704413628a7SBjoern A. Zeeb /* Found. */ 705ac1750ddSMark Johnston if (prison_equal_ip6(cred->cr_prison, 7060304c731SJamie Gritton inp->inp_cred->cr_prison)) 70782cd038dSYoshinobu Inoue return (inp); 70882cd038dSYoshinobu Inoue } 70982cd038dSYoshinobu Inoue } 71082cd038dSYoshinobu Inoue /* 71182cd038dSYoshinobu Inoue * Not found. 71282cd038dSYoshinobu Inoue */ 71382cd038dSYoshinobu Inoue return (NULL); 71482cd038dSYoshinobu Inoue } else { 71582cd038dSYoshinobu Inoue struct inpcbporthead *porthash; 71682cd038dSYoshinobu Inoue struct inpcbport *phd; 71782cd038dSYoshinobu Inoue struct inpcb *match = NULL; 71882cd038dSYoshinobu Inoue /* 71982cd038dSYoshinobu Inoue * Best fit PCB lookup. 72082cd038dSYoshinobu Inoue * 72182cd038dSYoshinobu Inoue * First see if this local port is in use by looking on the 72282cd038dSYoshinobu Inoue * port hash list. 72382cd038dSYoshinobu Inoue */ 724712fc218SRobert Watson porthash = &pcbinfo->ipi_porthashbase[INP_PCBPORTHASH(lport, 725712fc218SRobert Watson pcbinfo->ipi_porthashmask)]; 726b872626dSMatt Macy CK_LIST_FOREACH(phd, porthash, phd_hash) { 72782cd038dSYoshinobu Inoue if (phd->phd_port == lport) 72882cd038dSYoshinobu Inoue break; 72982cd038dSYoshinobu Inoue } 73082cd038dSYoshinobu Inoue if (phd != NULL) { 73182cd038dSYoshinobu Inoue /* 73282cd038dSYoshinobu Inoue * Port is in use by one or more PCBs. Look for best 73382cd038dSYoshinobu Inoue * fit. 73482cd038dSYoshinobu Inoue */ 735b872626dSMatt Macy CK_LIST_FOREACH(inp, &phd->phd_pcblist, inp_portlist) { 73682cd038dSYoshinobu Inoue wildcard = 0; 737ac1750ddSMark Johnston if (!prison_equal_ip6(cred->cr_prison, 7380304c731SJamie Gritton inp->inp_cred->cr_prison)) 739413628a7SBjoern A. Zeeb continue; 740413628a7SBjoern A. Zeeb /* XXX inp locking */ 741369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV6) == 0) 74282cd038dSYoshinobu Inoue continue; 74382cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) 74482cd038dSYoshinobu Inoue wildcard++; 74582cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED( 74682cd038dSYoshinobu Inoue &inp->in6p_laddr)) { 74782cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(laddr)) 74882cd038dSYoshinobu Inoue wildcard++; 74982cd038dSYoshinobu Inoue else if (!IN6_ARE_ADDR_EQUAL( 75082cd038dSYoshinobu Inoue &inp->in6p_laddr, laddr)) 75182cd038dSYoshinobu Inoue continue; 75282cd038dSYoshinobu Inoue } else { 75382cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED(laddr)) 75482cd038dSYoshinobu Inoue wildcard++; 75582cd038dSYoshinobu Inoue } 75682cd038dSYoshinobu Inoue if (wildcard < matchwild) { 75782cd038dSYoshinobu Inoue match = inp; 75882cd038dSYoshinobu Inoue matchwild = wildcard; 759413628a7SBjoern A. Zeeb if (matchwild == 0) 76082cd038dSYoshinobu Inoue break; 76182cd038dSYoshinobu Inoue } 76282cd038dSYoshinobu Inoue } 76382cd038dSYoshinobu Inoue } 76482cd038dSYoshinobu Inoue return (match); 76582cd038dSYoshinobu Inoue } 76682cd038dSYoshinobu Inoue } 76782cd038dSYoshinobu Inoue 768db0ac6deSCy Schubert static bool 769db0ac6deSCy Schubert in6_multi_match(const struct inpcb *inp, void *v __unused) 770db0ac6deSCy Schubert { 771db0ac6deSCy Schubert 772db0ac6deSCy Schubert if ((inp->inp_vflag & INP_IPV6) && inp->in6p_moptions != NULL) 773db0ac6deSCy Schubert return (true); 774db0ac6deSCy Schubert else 775db0ac6deSCy Schubert return (false); 776db0ac6deSCy Schubert } 777db0ac6deSCy Schubert 778e43cc4aeSHajimu UMEMOTO void 7791272577eSXin LI in6_pcbpurgeif0(struct inpcbinfo *pcbinfo, struct ifnet *ifp) 780e43cc4aeSHajimu UMEMOTO { 781db0ac6deSCy Schubert struct inpcb_iterator inpi = INP_ITERATOR(pcbinfo, INPLOOKUP_RLOCKPCB, 782db0ac6deSCy Schubert in6_multi_match, NULL); 7830ecd976eSBjoern A. Zeeb struct inpcb *inp; 78459854ecfSHans Petter Selasky struct in6_multi *inm; 78559854ecfSHans Petter Selasky struct in6_mfilter *imf; 786e43cc4aeSHajimu UMEMOTO struct ip6_moptions *im6o; 787e43cc4aeSHajimu UMEMOTO 788db0ac6deSCy Schubert IN6_MULTI_LOCK_ASSERT(); 789db0ac6deSCy Schubert 790db0ac6deSCy Schubert while ((inp = inp_next(&inpi)) != NULL) { 791db0ac6deSCy Schubert INP_RLOCK_ASSERT(inp); 792db0ac6deSCy Schubert 7930ecd976eSBjoern A. Zeeb im6o = inp->in6p_moptions; 794e43cc4aeSHajimu UMEMOTO /* 79533cde130SBruce M Simpson * Unselect the outgoing ifp for multicast if it 79633cde130SBruce M Simpson * is being detached. 797e43cc4aeSHajimu UMEMOTO */ 798e43cc4aeSHajimu UMEMOTO if (im6o->im6o_multicast_ifp == ifp) 799e43cc4aeSHajimu UMEMOTO im6o->im6o_multicast_ifp = NULL; 800e43cc4aeSHajimu UMEMOTO /* 801e43cc4aeSHajimu UMEMOTO * Drop multicast group membership if we joined 802e43cc4aeSHajimu UMEMOTO * through the interface being detached. 803e43cc4aeSHajimu UMEMOTO */ 80459854ecfSHans Petter Selasky restart: 80559854ecfSHans Petter Selasky IP6_MFILTER_FOREACH(imf, &im6o->im6o_head) { 80659854ecfSHans Petter Selasky if ((inm = imf->im6f_in6m) == NULL) 80759854ecfSHans Petter Selasky continue; 80859854ecfSHans Petter Selasky if (inm->in6m_ifp != ifp) 80959854ecfSHans Petter Selasky continue; 81059854ecfSHans Petter Selasky ip6_mfilter_remove(&im6o->im6o_head, imf); 81159854ecfSHans Petter Selasky in6_leavegroup_locked(inm, NULL); 81259854ecfSHans Petter Selasky ip6_mfilter_free(imf); 81359854ecfSHans Petter Selasky goto restart; 814e43cc4aeSHajimu UMEMOTO } 815e43cc4aeSHajimu UMEMOTO } 816e43cc4aeSHajimu UMEMOTO } 817e43cc4aeSHajimu UMEMOTO 81882cd038dSYoshinobu Inoue /* 81982cd038dSYoshinobu Inoue * Check for alternatives when higher level complains 82082cd038dSYoshinobu Inoue * about service problems. For now, invalidate cached 82182cd038dSYoshinobu Inoue * routing information. If the route was created dynamically 82282cd038dSYoshinobu Inoue * (by a redirect), time to try a default gateway again. 82382cd038dSYoshinobu Inoue */ 82482cd038dSYoshinobu Inoue void 825ec86402eSBjoern A. Zeeb in6_losing(struct inpcb *inp) 82682cd038dSYoshinobu Inoue { 8271272577eSXin LI 828ec86402eSBjoern A. Zeeb RO_INVALIDATE_CACHE(&inp->inp_route6); 82982cd038dSYoshinobu Inoue } 83082cd038dSYoshinobu Inoue 83182cd038dSYoshinobu Inoue /* 83282cd038dSYoshinobu Inoue * After a routing change, flush old routing 83382cd038dSYoshinobu Inoue * and allocate a (hopefully) better one. 83482cd038dSYoshinobu Inoue */ 8353ce144eaSJeffrey Hsu struct inpcb * 836ec86402eSBjoern A. Zeeb in6_rtchange(struct inpcb *inp, int errno __unused) 83782cd038dSYoshinobu Inoue { 83884cc0778SGeorge V. Neville-Neil 839ec86402eSBjoern A. Zeeb RO_INVALIDATE_CACHE(&inp->inp_route6); 8403ce144eaSJeffrey Hsu return inp; 84182cd038dSYoshinobu Inoue } 84282cd038dSYoshinobu Inoue 843d93ec8cbSMark Johnston static bool 844d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(const struct inpcblbgroup *grp, int domain) 845d93ec8cbSMark Johnston { 846d93ec8cbSMark Johnston return (domain == M_NODOM || domain == grp->il_numa_domain); 847d93ec8cbSMark Johnston } 848d93ec8cbSMark Johnston 8491a43cff9SSean Bruno static struct inpcb * 8501a43cff9SSean Bruno in6_pcblookup_lbgroup(const struct inpcbinfo *pcbinfo, 8514130ea61SMark Johnston const struct in6_addr *faddr, uint16_t fport, const struct in6_addr *laddr, 8524130ea61SMark Johnston uint16_t lport, uint8_t domain) 8531a43cff9SSean Bruno { 8541a43cff9SSean Bruno const struct inpcblbgrouphead *hdr; 8551a43cff9SSean Bruno struct inpcblbgroup *grp; 856d93ec8cbSMark Johnston struct inpcblbgroup *jail_exact, *jail_wild, *local_exact, *local_wild; 8571a43cff9SSean Bruno 8581a43cff9SSean Bruno INP_HASH_LOCK_ASSERT(pcbinfo); 8591a43cff9SSean Bruno 8609d2877fcSMark Johnston hdr = &pcbinfo->ipi_lbgrouphashbase[ 8619d2877fcSMark Johnston INP_PCBPORTHASH(lport, pcbinfo->ipi_lbgrouphashmask)]; 8621a43cff9SSean Bruno 8631a43cff9SSean Bruno /* 864d93ec8cbSMark Johnston * Search for an LB group match based on the following criteria: 865d93ec8cbSMark Johnston * - prefer jailed groups to non-jailed groups 866d93ec8cbSMark Johnston * - prefer exact source address matches to wildcard matches 867d93ec8cbSMark Johnston * - prefer groups bound to the specified NUMA domain 8681a43cff9SSean Bruno */ 869d93ec8cbSMark Johnston jail_exact = jail_wild = local_exact = local_wild = NULL; 87054af3d0dSMark Johnston CK_LIST_FOREACH(grp, hdr, il_list) { 871d93ec8cbSMark Johnston bool injail; 872d93ec8cbSMark Johnston 8734b82a7b6SAndrew Gallatin #ifdef INET 8744b82a7b6SAndrew Gallatin if (!(grp->il_vflag & INP_IPV6)) 8754b82a7b6SAndrew Gallatin continue; 8764b82a7b6SAndrew Gallatin #endif 877d3a4b0daSMark Johnston if (grp->il_lport != lport) 878d3a4b0daSMark Johnston continue; 8791a43cff9SSean Bruno 880d93ec8cbSMark Johnston injail = prison_flag(grp->il_cred, PR_IP6) != 0; 881d93ec8cbSMark Johnston if (injail && prison_check_ip6_locked(grp->il_cred->cr_prison, 882d93ec8cbSMark Johnston laddr) != 0) 883d93ec8cbSMark Johnston continue; 884d93ec8cbSMark Johnston 885a034518aSAndrew Gallatin if (IN6_ARE_ADDR_EQUAL(&grp->il6_laddr, laddr)) { 886d93ec8cbSMark Johnston if (injail) { 887d93ec8cbSMark Johnston jail_exact = grp; 888d93ec8cbSMark Johnston if (in6_pcblookup_lb_numa_match(grp, domain)) 889d93ec8cbSMark Johnston /* This is a perfect match. */ 890d93ec8cbSMark Johnston goto out; 891d93ec8cbSMark Johnston } else if (local_exact == NULL || 892d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) { 893d93ec8cbSMark Johnston local_exact = grp; 894a034518aSAndrew Gallatin } 8954130ea61SMark Johnston } else if (IN6_IS_ADDR_UNSPECIFIED(&grp->il6_laddr)) { 896d93ec8cbSMark Johnston if (injail) { 897d93ec8cbSMark Johnston if (jail_wild == NULL || 898d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) 899d93ec8cbSMark Johnston jail_wild = grp; 900d93ec8cbSMark Johnston } else if (local_wild == NULL || 901d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) { 902d93ec8cbSMark Johnston local_wild = grp; 903d93ec8cbSMark Johnston } 904d93ec8cbSMark Johnston } 905d93ec8cbSMark Johnston } 906d93ec8cbSMark Johnston 907d93ec8cbSMark Johnston if (jail_exact != NULL) 908d93ec8cbSMark Johnston grp = jail_exact; 909d93ec8cbSMark Johnston else if (jail_wild != NULL) 910d93ec8cbSMark Johnston grp = jail_wild; 911d93ec8cbSMark Johnston else if (local_exact != NULL) 912d93ec8cbSMark Johnston grp = local_exact; 913a034518aSAndrew Gallatin else 914d93ec8cbSMark Johnston grp = local_wild; 915d93ec8cbSMark Johnston if (grp == NULL) 916d93ec8cbSMark Johnston return (NULL); 917d93ec8cbSMark Johnston out: 918d93ec8cbSMark Johnston return (grp->il_inp[INP6_PCBLBGROUP_PKTHASH(faddr, lport, fport) % 919d93ec8cbSMark Johnston grp->il_inpcnt]); 9201a43cff9SSean Bruno } 9211a43cff9SSean Bruno 9223e98dcb3SMark Johnston static bool 9233e98dcb3SMark Johnston in6_pcblookup_exact_match(const struct inpcb *inp, const struct in6_addr *faddr, 9243e98dcb3SMark Johnston u_short fport, const struct in6_addr *laddr, u_short lport) 9253e98dcb3SMark Johnston { 9263e98dcb3SMark Johnston /* XXX inp locking */ 9273e98dcb3SMark Johnston if ((inp->inp_vflag & INP_IPV6) == 0) 9283e98dcb3SMark Johnston return (false); 9293e98dcb3SMark Johnston if (IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, faddr) && 9303e98dcb3SMark Johnston IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 9313e98dcb3SMark Johnston inp->inp_fport == fport && inp->inp_lport == lport) 9323e98dcb3SMark Johnston return (true); 9333e98dcb3SMark Johnston return (false); 9343e98dcb3SMark Johnston } 9353e98dcb3SMark Johnston 9364130ea61SMark Johnston static struct inpcb * 9377b92493aSMark Johnston in6_pcblookup_hash_exact(struct inpcbinfo *pcbinfo, 9387b92493aSMark Johnston const struct in6_addr *faddr, u_short fport, 9397b92493aSMark Johnston const struct in6_addr *laddr, u_short lport) 94082cd038dSYoshinobu Inoue { 94182cd038dSYoshinobu Inoue struct inpcbhead *head; 9423e98dcb3SMark Johnston struct inpcb *inp; 94368e0d7e0SRobert Watson 944fa046d87SRobert Watson INP_HASH_LOCK_ASSERT(pcbinfo); 9458deea4a8SRobert Watson 94682cd038dSYoshinobu Inoue /* 94782cd038dSYoshinobu Inoue * First look for an exact match. 94882cd038dSYoshinobu Inoue */ 949fdb987beSMark Johnston head = &pcbinfo->ipi_hash_exact[INP6_PCBHASH(faddr, lport, fport, 950a0577692SGleb Smirnoff pcbinfo->ipi_hashmask)]; 951fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_exact) { 9523e98dcb3SMark Johnston if (in6_pcblookup_exact_match(inp, faddr, fport, laddr, lport)) 95382cd038dSYoshinobu Inoue return (inp); 95482cd038dSYoshinobu Inoue } 9553e98dcb3SMark Johnston return (NULL); 9563e98dcb3SMark Johnston } 9573e98dcb3SMark Johnston 9583e98dcb3SMark Johnston typedef enum { 9593e98dcb3SMark Johnston INPLOOKUP_MATCH_NONE = 0, 9603e98dcb3SMark Johnston INPLOOKUP_MATCH_WILD = 1, 9613e98dcb3SMark Johnston INPLOOKUP_MATCH_LADDR = 2, 9623e98dcb3SMark Johnston } inp_lookup_match_t; 9633e98dcb3SMark Johnston 9643e98dcb3SMark Johnston static inp_lookup_match_t 9653e98dcb3SMark Johnston in6_pcblookup_wild_match(const struct inpcb *inp, const struct in6_addr *laddr, 9663e98dcb3SMark Johnston u_short lport) 9673e98dcb3SMark Johnston { 9683e98dcb3SMark Johnston /* XXX inp locking */ 9693e98dcb3SMark Johnston if ((inp->inp_vflag & INP_IPV6) == 0) 9703e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 9713e98dcb3SMark Johnston if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) || 9723e98dcb3SMark Johnston inp->inp_lport != lport) 9733e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 9743e98dcb3SMark Johnston if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 9753e98dcb3SMark Johnston return (INPLOOKUP_MATCH_WILD); 9763e98dcb3SMark Johnston if (IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr)) 9773e98dcb3SMark Johnston return (INPLOOKUP_MATCH_LADDR); 9783e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 9794130ea61SMark Johnston } 98082cd038dSYoshinobu Inoue 9817b92493aSMark Johnston #define INP_LOOKUP_AGAIN ((struct inpcb *)(uintptr_t)-1) 9827b92493aSMark Johnston 9837b92493aSMark Johnston static struct inpcb * 9847b92493aSMark Johnston in6_pcblookup_hash_wild_smr(struct inpcbinfo *pcbinfo, 9857b92493aSMark Johnston const struct in6_addr *faddr, u_short fport, const struct in6_addr *laddr, 9867b92493aSMark Johnston u_short lport, const inp_lookup_t lockflags) 9877b92493aSMark Johnston { 9887b92493aSMark Johnston struct inpcbhead *head; 9897b92493aSMark Johnston struct inpcb *inp; 9907b92493aSMark Johnston 9917b92493aSMark Johnston KASSERT(SMR_ENTERED(pcbinfo->ipi_smr), 9927b92493aSMark Johnston ("%s: not in SMR read section", __func__)); 9937b92493aSMark Johnston 9947b92493aSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 9957b92493aSMark Johnston pcbinfo->ipi_hashmask)]; 9967b92493aSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 9977b92493aSMark Johnston inp_lookup_match_t match; 9987b92493aSMark Johnston 9997b92493aSMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 10007b92493aSMark Johnston if (match == INPLOOKUP_MATCH_NONE) 10017b92493aSMark Johnston continue; 10027b92493aSMark Johnston 10037b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 1004a306ed50SMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 1005a306ed50SMark Johnston if (match != INPLOOKUP_MATCH_NONE && 1006a306ed50SMark Johnston prison_check_ip6_locked(inp->inp_cred->cr_prison, 1007a306ed50SMark Johnston laddr) == 0) 10087b92493aSMark Johnston return (inp); 10097b92493aSMark Johnston inp_unlock(inp, lockflags); 10107b92493aSMark Johnston } 10117b92493aSMark Johnston 10127b92493aSMark Johnston /* 10137b92493aSMark Johnston * The matching socket disappeared out from under us. Fall back 10147b92493aSMark Johnston * to a serialized lookup. 10157b92493aSMark Johnston */ 10167b92493aSMark Johnston return (INP_LOOKUP_AGAIN); 10177b92493aSMark Johnston } 10187b92493aSMark Johnston return (NULL); 10197b92493aSMark Johnston } 10207b92493aSMark Johnston 10214130ea61SMark Johnston static struct inpcb * 10224130ea61SMark Johnston in6_pcblookup_hash_wild_locked(struct inpcbinfo *pcbinfo, 10237b92493aSMark Johnston const struct in6_addr *faddr, u_short fport, const struct in6_addr *laddr, 10244130ea61SMark Johnston u_short lport) 10254130ea61SMark Johnston { 10264130ea61SMark Johnston struct inpcbhead *head; 10274130ea61SMark Johnston struct inpcb *inp, *jail_wild, *local_exact, *local_wild; 1028d93ec8cbSMark Johnston 10293e98dcb3SMark Johnston INP_HASH_LOCK_ASSERT(pcbinfo); 10303e98dcb3SMark Johnston 1031d93ec8cbSMark Johnston /* 1032413628a7SBjoern A. Zeeb * Order of socket selection - we always prefer jails. 1033413628a7SBjoern A. Zeeb * 1. jailed, non-wild. 1034413628a7SBjoern A. Zeeb * 2. jailed, wild. 1035413628a7SBjoern A. Zeeb * 3. non-jailed, non-wild. 1036413628a7SBjoern A. Zeeb * 4. non-jailed, wild. 1037413628a7SBjoern A. Zeeb */ 1038fdb987beSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 10391b44e5ffSAndrey V. Elsukov pcbinfo->ipi_hashmask)]; 10404130ea61SMark Johnston local_wild = local_exact = jail_wild = NULL; 1041fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 10423e98dcb3SMark Johnston inp_lookup_match_t match; 10434130ea61SMark Johnston bool injail; 10444130ea61SMark Johnston 10453e98dcb3SMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 10463e98dcb3SMark Johnston if (match == INPLOOKUP_MATCH_NONE) 104782cd038dSYoshinobu Inoue continue; 1048413628a7SBjoern A. Zeeb 10494130ea61SMark Johnston injail = prison_flag(inp->inp_cred, PR_IP6) != 0; 1050413628a7SBjoern A. Zeeb if (injail) { 1051185e659cSGleb Smirnoff if (prison_check_ip6_locked( 1052185e659cSGleb Smirnoff inp->inp_cred->cr_prison, laddr) != 0) 1053413628a7SBjoern A. Zeeb continue; 1054413628a7SBjoern A. Zeeb } else { 1055413628a7SBjoern A. Zeeb if (local_exact != NULL) 1056413628a7SBjoern A. Zeeb continue; 1057413628a7SBjoern A. Zeeb } 1058413628a7SBjoern A. Zeeb 10593e98dcb3SMark Johnston if (match == INPLOOKUP_MATCH_LADDR) { 1060413628a7SBjoern A. Zeeb if (injail) 106182cd038dSYoshinobu Inoue return (inp); 1062413628a7SBjoern A. Zeeb else 1063413628a7SBjoern A. Zeeb local_exact = inp; 10643e98dcb3SMark Johnston } else { 1065413628a7SBjoern A. Zeeb if (injail) 1066413628a7SBjoern A. Zeeb jail_wild = inp; 1067413628a7SBjoern A. Zeeb else 106882cd038dSYoshinobu Inoue local_wild = inp; 106982cd038dSYoshinobu Inoue } 10704130ea61SMark Johnston } 1071413628a7SBjoern A. Zeeb 1072413628a7SBjoern A. Zeeb if (jail_wild != NULL) 1073413628a7SBjoern A. Zeeb return (jail_wild); 1074413628a7SBjoern A. Zeeb if (local_exact != NULL) 1075413628a7SBjoern A. Zeeb return (local_exact); 1076413628a7SBjoern A. Zeeb if (local_wild != NULL) 107782cd038dSYoshinobu Inoue return (local_wild); 107882cd038dSYoshinobu Inoue return (NULL); 107982cd038dSYoshinobu Inoue } 108082cd038dSYoshinobu Inoue 10814130ea61SMark Johnston struct inpcb * 10827b92493aSMark Johnston in6_pcblookup_hash_locked(struct inpcbinfo *pcbinfo, 10837b92493aSMark Johnston const struct in6_addr *faddr, u_int fport_arg, 10847b92493aSMark Johnston const struct in6_addr *laddr, u_int lport_arg, 10854130ea61SMark Johnston int lookupflags, uint8_t numa_domain) 10864130ea61SMark Johnston { 10874130ea61SMark Johnston struct inpcb *inp; 10884130ea61SMark Johnston u_short fport = fport_arg, lport = lport_arg; 10894130ea61SMark Johnston 10904130ea61SMark Johnston KASSERT((lookupflags & ~INPLOOKUP_WILDCARD) == 0, 10914130ea61SMark Johnston ("%s: invalid lookup flags %d", __func__, lookupflags)); 10924130ea61SMark Johnston KASSERT(!IN6_IS_ADDR_UNSPECIFIED(faddr), 10934130ea61SMark Johnston ("%s: invalid foreign address", __func__)); 10944130ea61SMark Johnston KASSERT(!IN6_IS_ADDR_UNSPECIFIED(laddr), 10954130ea61SMark Johnston ("%s: invalid local address", __func__)); 10964130ea61SMark Johnston INP_HASH_LOCK_ASSERT(pcbinfo); 10974130ea61SMark Johnston 10984130ea61SMark Johnston inp = in6_pcblookup_hash_exact(pcbinfo, faddr, fport, laddr, lport); 10994130ea61SMark Johnston if (inp != NULL) 11004130ea61SMark Johnston return (inp); 11014130ea61SMark Johnston 11024130ea61SMark Johnston if ((lookupflags & INPLOOKUP_WILDCARD) != 0) { 11034130ea61SMark Johnston inp = in6_pcblookup_lbgroup(pcbinfo, faddr, fport, laddr, 11044130ea61SMark Johnston lport, numa_domain); 11054130ea61SMark Johnston if (inp == NULL) { 11064130ea61SMark Johnston inp = in6_pcblookup_hash_wild_locked(pcbinfo, faddr, 11074130ea61SMark Johnston fport, laddr, lport); 11084130ea61SMark Johnston } 11094130ea61SMark Johnston } 11104130ea61SMark Johnston return (inp); 11114130ea61SMark Johnston } 11124130ea61SMark Johnston 1113fa046d87SRobert Watson static struct inpcb * 11147b92493aSMark Johnston in6_pcblookup_hash(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr, 11157b92493aSMark Johnston u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags, 11164130ea61SMark Johnston uint8_t numa_domain) 1117fa046d87SRobert Watson { 1118fa046d87SRobert Watson struct inpcb *inp; 11197b92493aSMark Johnston const inp_lookup_t lockflags = lookupflags & INPLOOKUP_LOCKMASK; 11207b92493aSMark Johnston 11217b92493aSMark Johnston KASSERT((lookupflags & (INPLOOKUP_RLOCKPCB | INPLOOKUP_WLOCKPCB)) != 0, 11227b92493aSMark Johnston ("%s: LOCKPCB not set", __func__)); 11237b92493aSMark Johnston 11247b92493aSMark Johnston INP_HASH_WLOCK(pcbinfo); 11257b92493aSMark Johnston inp = in6_pcblookup_hash_locked(pcbinfo, faddr, fport, laddr, lport, 11267b92493aSMark Johnston lookupflags & ~INPLOOKUP_LOCKMASK, numa_domain); 11277b92493aSMark Johnston if (inp != NULL && !inp_trylock(inp, lockflags)) { 11287b92493aSMark Johnston in_pcbref(inp); 11297b92493aSMark Johnston INP_HASH_WUNLOCK(pcbinfo); 11307b92493aSMark Johnston inp_lock(inp, lockflags); 11317b92493aSMark Johnston if (in_pcbrele(inp, lockflags)) 11327b92493aSMark Johnston /* XXX-MJ or retry until we get a negative match? */ 11337b92493aSMark Johnston inp = NULL; 11347b92493aSMark Johnston } else { 11357b92493aSMark Johnston INP_HASH_WUNLOCK(pcbinfo); 11367b92493aSMark Johnston } 11377b92493aSMark Johnston return (inp); 11387b92493aSMark Johnston } 11397b92493aSMark Johnston 11407b92493aSMark Johnston static struct inpcb * 11417b92493aSMark Johnston in6_pcblookup_hash_smr(struct inpcbinfo *pcbinfo, struct in6_addr *faddr, 11427b92493aSMark Johnston u_int fport_arg, struct in6_addr *laddr, u_int lport_arg, int lookupflags, 11437b92493aSMark Johnston uint8_t numa_domain) 11447b92493aSMark Johnston { 11457b92493aSMark Johnston struct inpcb *inp; 11467b92493aSMark Johnston const inp_lookup_t lockflags = lookupflags & INPLOOKUP_LOCKMASK; 11477b92493aSMark Johnston const u_short fport = fport_arg, lport = lport_arg; 1148fa046d87SRobert Watson 1149675e2618SMark Johnston KASSERT((lookupflags & ~INPLOOKUP_MASK) == 0, 1150675e2618SMark Johnston ("%s: invalid lookup flags %d", __func__, lookupflags)); 1151675e2618SMark Johnston KASSERT((lookupflags & (INPLOOKUP_RLOCKPCB | INPLOOKUP_WLOCKPCB)) != 0, 1152675e2618SMark Johnston ("%s: LOCKPCB not set", __func__)); 1153675e2618SMark Johnston 1154db0ac6deSCy Schubert smr_enter(pcbinfo->ipi_smr); 11557b92493aSMark Johnston inp = in6_pcblookup_hash_exact(pcbinfo, faddr, fport, laddr, lport); 1156fa046d87SRobert Watson if (inp != NULL) { 11577b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 11587b92493aSMark Johnston if (__predict_true(in6_pcblookup_exact_match(inp, 11597b92493aSMark Johnston faddr, fport, laddr, lport))) 11607b92493aSMark Johnston return (inp); 11617b92493aSMark Johnston inp_unlock(inp, lockflags); 11627b92493aSMark Johnston } 11637b92493aSMark Johnston /* 11647b92493aSMark Johnston * We failed to lock the inpcb, or its connection state changed 11657b92493aSMark Johnston * out from under us. Fall back to a precise search. 11667b92493aSMark Johnston */ 11677b92493aSMark Johnston return (in6_pcblookup_hash(pcbinfo, faddr, fport, laddr, lport, 11687b92493aSMark Johnston lookupflags, numa_domain)); 11697b92493aSMark Johnston } 11707b92493aSMark Johnston 11717b92493aSMark Johnston if ((lookupflags & INPLOOKUP_WILDCARD) != 0) { 11727b92493aSMark Johnston inp = in6_pcblookup_lbgroup(pcbinfo, faddr, fport, 11737b92493aSMark Johnston laddr, lport, numa_domain); 11747b92493aSMark Johnston if (inp != NULL) { 11757b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 11767b92493aSMark Johnston if (__predict_true(in6_pcblookup_wild_match(inp, 11777b92493aSMark Johnston laddr, lport) != INPLOOKUP_MATCH_NONE)) 11787b92493aSMark Johnston return (inp); 11797b92493aSMark Johnston inp_unlock(inp, lockflags); 11807b92493aSMark Johnston } 11817b92493aSMark Johnston inp = INP_LOOKUP_AGAIN; 11827b92493aSMark Johnston } else { 11837b92493aSMark Johnston inp = in6_pcblookup_hash_wild_smr(pcbinfo, faddr, fport, 11847b92493aSMark Johnston laddr, lport, lockflags); 11857b92493aSMark Johnston } 11867b92493aSMark Johnston if (inp == INP_LOOKUP_AGAIN) { 11877b92493aSMark Johnston return (in6_pcblookup_hash(pcbinfo, faddr, fport, laddr, 11887b92493aSMark Johnston lport, lookupflags, numa_domain)); 11897b92493aSMark Johnston } 11907b92493aSMark Johnston } 11917b92493aSMark Johnston 11927b92493aSMark Johnston if (inp == NULL) 1193db0ac6deSCy Schubert smr_exit(pcbinfo->ipi_smr); 1194db0ac6deSCy Schubert 1195fa046d87SRobert Watson return (inp); 1196fa046d87SRobert Watson } 1197fa046d87SRobert Watson 1198fa046d87SRobert Watson /* 1199d3c1f003SRobert Watson * Public inpcb lookup routines, accepting a 4-tuple, and optionally, an mbuf 1200d3c1f003SRobert Watson * from which a pre-calculated hash value may be extracted. 1201fa046d87SRobert Watson */ 1202fa046d87SRobert Watson struct inpcb * 1203fa046d87SRobert Watson in6_pcblookup(struct inpcbinfo *pcbinfo, struct in6_addr *faddr, u_int fport, 12044130ea61SMark Johnston struct in6_addr *laddr, u_int lport, int lookupflags, 12054130ea61SMark Johnston struct ifnet *ifp __unused) 1206fa046d87SRobert Watson { 12074130ea61SMark Johnston return (in6_pcblookup_hash_smr(pcbinfo, faddr, fport, laddr, lport, 12084130ea61SMark Johnston lookupflags, M_NODOM)); 1209d3c1f003SRobert Watson } 1210d3c1f003SRobert Watson 1211d3c1f003SRobert Watson struct inpcb * 1212d3c1f003SRobert Watson in6_pcblookup_mbuf(struct inpcbinfo *pcbinfo, struct in6_addr *faddr, 1213d3c1f003SRobert Watson u_int fport, struct in6_addr *laddr, u_int lport, int lookupflags, 12144130ea61SMark Johnston struct ifnet *ifp __unused, struct mbuf *m) 1215d3c1f003SRobert Watson { 12164130ea61SMark Johnston return (in6_pcblookup_hash_smr(pcbinfo, faddr, fport, laddr, lport, 12174130ea61SMark Johnston lookupflags, m->m_pkthdr.numa_domain)); 1218fa046d87SRobert Watson } 1219fa046d87SRobert Watson 122082cd038dSYoshinobu Inoue void 1221dce33a45SErmal Luçi init_sin6(struct sockaddr_in6 *sin6, struct mbuf *m, int srcordst) 122282cd038dSYoshinobu Inoue { 122382cd038dSYoshinobu Inoue struct ip6_hdr *ip; 122482cd038dSYoshinobu Inoue 122582cd038dSYoshinobu Inoue ip = mtod(m, struct ip6_hdr *); 122682cd038dSYoshinobu Inoue bzero(sin6, sizeof(*sin6)); 122782cd038dSYoshinobu Inoue sin6->sin6_len = sizeof(*sin6); 122882cd038dSYoshinobu Inoue sin6->sin6_family = AF_INET6; 1229dce33a45SErmal Luçi sin6->sin6_addr = srcordst ? ip->ip6_dst : ip->ip6_src; 1230a1f7e5f8SHajimu UMEMOTO 1231a1f7e5f8SHajimu UMEMOTO (void)sa6_recoverscope(sin6); /* XXX: should catch errors... */ 123282cd038dSYoshinobu Inoue 123382cd038dSYoshinobu Inoue return; 123482cd038dSYoshinobu Inoue } 1235