/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
 * Copyright (c) 2010-2011 Juniper Networks, Inc.
 * All rights reserved.
 *
 * Portions of this software were developed by Robert N. M. Watson under
 * contract to Juniper Networks, Inc.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the project nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	$KAME: in6_pcb.c,v 1.31 2001/05/21 05:45:10 jinmei Exp $
 */

/*-
 * Copyright (c) 1982, 1986, 1991, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <sys/cdefs.h>
#include "opt_inet.h"
#include "opt_inet6.h"
#include "opt_ipsec.h"
#include "opt_route.h"
#include "opt_rss.h"

#include <sys/hash.h>
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/malloc.h>
#include <sys/mbuf.h>
#include <sys/domain.h>
#include <sys/proc.h>
#include <sys/protosw.h>
#include <sys/smr.h>
#include <sys/socket.h>
#include <sys/socketvar.h>
#include <sys/sockio.h>
#include <sys/sysctl.h>
#include <sys/errno.h>
#include <sys/time.h>
#include <sys/priv.h>
#include <sys/proc.h>
#include <sys/jail.h>

#include <vm/uma.h>

#include <net/if.h>
#include <net/if_var.h>
#include <net/if_llatbl.h>
#include <net/if_types.h>
#include <net/route.h>
Chernikov #include <net/route/nhop.h> 101417b35a9SMark Johnston #include <net/vnet.h> 10282cd038dSYoshinobu Inoue 10382cd038dSYoshinobu Inoue #include <netinet/in.h> 10482cd038dSYoshinobu Inoue #include <netinet/in_var.h> 10582cd038dSYoshinobu Inoue #include <netinet/in_systm.h> 106686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h> 107fb59c426SYoshinobu Inoue #include <netinet/ip_var.h> 108ac957cd2SJulian Elischer 10982cd038dSYoshinobu Inoue #include <netinet6/ip6_var.h> 11082cd038dSYoshinobu Inoue #include <netinet6/nd6.h> 11182cd038dSYoshinobu Inoue #include <netinet/in_pcb.h> 1120f617ae4SGleb Smirnoff #include <netinet/in_pcb_var.h> 11382cd038dSYoshinobu Inoue #include <netinet6/in6_pcb.h> 114983066f0SAlexander V. Chernikov #include <netinet6/in6_fib.h> 115a1f7e5f8SHajimu UMEMOTO #include <netinet6/scope6_var.h> 11682cd038dSYoshinobu Inoue 117417b35a9SMark Johnston SYSCTL_DECL(_net_inet6); 118417b35a9SMark Johnston SYSCTL_DECL(_net_inet6_ip6); 119417b35a9SMark Johnston VNET_DEFINE_STATIC(int, connect_in6addr_wild) = 1; 120417b35a9SMark Johnston #define V_connect_in6addr_wild VNET(connect_in6addr_wild) 121417b35a9SMark Johnston SYSCTL_INT(_net_inet6_ip6, OID_AUTO, connect_in6addr_wild, 122417b35a9SMark Johnston CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(connect_in6addr_wild), 0, 123417b35a9SMark Johnston "Allow connecting to the unspecified address for connect(2)"); 124417b35a9SMark Johnston 12582cd038dSYoshinobu Inoue int 126147f018aSGleb Smirnoff in6_pcbsetport(struct in6_addr *laddr, struct inpcb *inp, struct ucred *cred) 127147f018aSGleb Smirnoff { 128147f018aSGleb Smirnoff struct socket *so = inp->inp_socket; 129147f018aSGleb Smirnoff u_int16_t lport = 0; 130147f018aSGleb Smirnoff int error, lookupflags = 0; 131147f018aSGleb Smirnoff #ifdef INVARIANTS 132147f018aSGleb Smirnoff struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 133147f018aSGleb Smirnoff #endif 134147f018aSGleb Smirnoff 135147f018aSGleb Smirnoff INP_WLOCK_ASSERT(inp); 136147f018aSGleb Smirnoff 
INP_HASH_WLOCK_ASSERT(pcbinfo); 137147f018aSGleb Smirnoff 138147f018aSGleb Smirnoff error = prison_local_ip6(cred, laddr, 139147f018aSGleb Smirnoff ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0)); 140147f018aSGleb Smirnoff if (error) 141147f018aSGleb Smirnoff return(error); 142147f018aSGleb Smirnoff 143147f018aSGleb Smirnoff /* XXX: this is redundant when called from in6_pcbbind */ 144147f018aSGleb Smirnoff if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT|SO_REUSEPORT_LB)) == 0) 145147f018aSGleb Smirnoff lookupflags = INPLOOKUP_WILDCARD; 146147f018aSGleb Smirnoff 147147f018aSGleb Smirnoff inp->inp_flags |= INP_ANONPORT; 148147f018aSGleb Smirnoff 149147f018aSGleb Smirnoff error = in_pcb_lport(inp, NULL, &lport, cred, lookupflags); 150147f018aSGleb Smirnoff if (error != 0) 151147f018aSGleb Smirnoff return (error); 152147f018aSGleb Smirnoff 153147f018aSGleb Smirnoff inp->inp_lport = lport; 154147f018aSGleb Smirnoff if (in_pcbinshash(inp) != 0) { 155147f018aSGleb Smirnoff inp->in6p_laddr = in6addr_any; 156147f018aSGleb Smirnoff inp->inp_lport = 0; 157147f018aSGleb Smirnoff return (EAGAIN); 158147f018aSGleb Smirnoff } 159147f018aSGleb Smirnoff 160147f018aSGleb Smirnoff return (0); 161147f018aSGleb Smirnoff } 162147f018aSGleb Smirnoff 1631a43cff9SSean Bruno /* 16401f8ce83SMark Johnston * Determine whether the inpcb can be bound to the specified address/port tuple. 
1651a43cff9SSean Bruno */ 16601f8ce83SMark Johnston static int 16701f8ce83SMark Johnston in6_pcbbind_avail(struct inpcb *inp, const struct sockaddr_in6 *sin6, 16801f8ce83SMark Johnston int sooptions, int lookupflags, struct ucred *cred) 16901f8ce83SMark Johnston { 17001f8ce83SMark Johnston const struct in6_addr *laddr; 17101f8ce83SMark Johnston int reuseport, reuseport_lb; 17201f8ce83SMark Johnston u_short lport; 1731a43cff9SSean Bruno 17401f8ce83SMark Johnston INP_LOCK_ASSERT(inp); 17501f8ce83SMark Johnston INP_HASH_LOCK_ASSERT(inp->inp_pcbinfo); 17607385abdSRobert Watson 17701f8ce83SMark Johnston laddr = &sin6->sin6_addr; 17882cd038dSYoshinobu Inoue lport = sin6->sin6_port; 17901f8ce83SMark Johnston 18001f8ce83SMark Johnston reuseport = (sooptions & SO_REUSEPORT); 18101f8ce83SMark Johnston reuseport_lb = (sooptions & SO_REUSEPORT_LB); 18201f8ce83SMark Johnston 18301f8ce83SMark Johnston if (IN6_IS_ADDR_MULTICAST(laddr)) { 18482cd038dSYoshinobu Inoue /* 18582cd038dSYoshinobu Inoue * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 18682cd038dSYoshinobu Inoue * allow compepte duplication of binding if 18782cd038dSYoshinobu Inoue * SO_REUSEPORT is set, or if SO_REUSEADDR is set 18882cd038dSYoshinobu Inoue * and a multicast address is bound on both 18982cd038dSYoshinobu Inoue * new and duplicated sockets. 19082cd038dSYoshinobu Inoue */ 19101f8ce83SMark Johnston if ((sooptions & (SO_REUSEADDR | SO_REUSEPORT)) != 0) 19282cd038dSYoshinobu Inoue reuseport = SO_REUSEADDR | SO_REUSEPORT; 1931a43cff9SSean Bruno /* 1941a43cff9SSean Bruno * XXX: How to deal with SO_REUSEPORT_LB here? 1951a43cff9SSean Bruno * Treat same as SO_REUSEPORT for now. 
1961a43cff9SSean Bruno */ 19701f8ce83SMark Johnston if ((sooptions & (SO_REUSEADDR | SO_REUSEPORT_LB)) != 0) 1981a43cff9SSean Bruno reuseport_lb = SO_REUSEADDR | SO_REUSEPORT_LB; 19901f8ce83SMark Johnston } else if (!IN6_IS_ADDR_UNSPECIFIED(laddr)) { 20001f8ce83SMark Johnston struct sockaddr_in6 sin6; 201a68cc388SGleb Smirnoff struct epoch_tracker et; 2028c0fec80SRobert Watson struct ifaddr *ifa; 20382cd038dSYoshinobu Inoue 20401f8ce83SMark Johnston memset(&sin6, 0, sizeof(sin6)); 20501f8ce83SMark Johnston sin6.sin6_family = AF_INET6; 20601f8ce83SMark Johnston sin6.sin6_len = sizeof(sin6); 20701f8ce83SMark Johnston sin6.sin6_addr = *laddr; 20801f8ce83SMark Johnston 209a68cc388SGleb Smirnoff NET_EPOCH_ENTER(et); 21001f8ce83SMark Johnston if ((ifa = ifa_ifwithaddr((const struct sockaddr *)&sin6)) == 21101f8ce83SMark Johnston NULL && (inp->inp_flags & INP_BINDANY) == 0) { 212a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 21382cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 214f44270e7SPawel Jakub Dawidek } 21582cd038dSYoshinobu Inoue 21682cd038dSYoshinobu Inoue /* 21782cd038dSYoshinobu Inoue * XXX: bind to an anycast address might accidentally 21882cd038dSYoshinobu Inoue * cause sending a packet with anycast source address. 21933841545SHajimu UMEMOTO * We should allow to bind to a deprecated address, since 2207efe5d92SHajimu UMEMOTO * the application dares to use it. 22182cd038dSYoshinobu Inoue */ 2228c0fec80SRobert Watson if (ifa != NULL && 2238c0fec80SRobert Watson ((struct in6_ifaddr *)ifa)->ia6_flags & 22433841545SHajimu UMEMOTO (IN6_IFF_ANYCAST | IN6_IFF_NOTREADY | IN6_IFF_DETACHED)) { 225a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 22682cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 22782cd038dSYoshinobu Inoue } 228a68cc388SGleb Smirnoff NET_EPOCH_EXIT(et); 22982cd038dSYoshinobu Inoue } 23001f8ce83SMark Johnston 23101f8ce83SMark Johnston if (lport != 0) { 23282cd038dSYoshinobu Inoue struct inpcb *t; 23382cd038dSYoshinobu Inoue 234603724d3SBjoern A. 
Zeeb if (ntohs(lport) <= V_ipport_reservedhigh && 235603724d3SBjoern A. Zeeb ntohs(lport) >= V_ipport_reservedlow && 236cc426dd3SMateusz Guzik priv_check_cred(cred, PRIV_NETINET_RESERVEDPORT)) 23782cd038dSYoshinobu Inoue return (EACCES); 23845a77bf2SMark Johnston 23901f8ce83SMark Johnston if (!IN6_IS_ADDR_MULTICAST(laddr) && 24001f8ce83SMark Johnston priv_check_cred(inp->inp_cred, PRIV_NETINET_REUSEPORT) != 24101f8ce83SMark Johnston 0) { 24201f8ce83SMark Johnston t = in6_pcblookup_local(inp->inp_pcbinfo, laddr, lport, 243078b7042SBjoern A. Zeeb INPLOOKUP_WILDCARD, cred); 2443aff4ccdSMark Johnston if (t != NULL && 24501f8ce83SMark Johnston (inp->inp_socket->so_type != SOCK_STREAM || 246f66145c6SYaroslav Tykhiy IN6_IS_ADDR_UNSPECIFIED(&t->in6p_faddr)) && 24701f8ce83SMark Johnston (!IN6_IS_ADDR_UNSPECIFIED(laddr) || 24882cd038dSYoshinobu Inoue !IN6_IS_ADDR_UNSPECIFIED(&t->in6p_laddr) || 249e3ba0d6aSGleb Smirnoff (t->inp_socket->so_options & SO_REUSEPORT) || 250e3ba0d6aSGleb Smirnoff (t->inp_socket->so_options & SO_REUSEPORT_LB) == 0) && 25101f8ce83SMark Johnston (inp->inp_cred->cr_uid != t->inp_cred->cr_uid)) 25282cd038dSYoshinobu Inoue return (EADDRINUSE); 253c7c0d948SAdrian Chadd 25467107f45SBjoern A. Zeeb #ifdef INET 25533841545SHajimu UMEMOTO if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 25601f8ce83SMark Johnston IN6_IS_ADDR_UNSPECIFIED(laddr)) { 257fb59c426SYoshinobu Inoue struct sockaddr_in sin; 258fb59c426SYoshinobu Inoue 259fb59c426SYoshinobu Inoue in6_sin6_2_sin(&sin, sin6); 26001f8ce83SMark Johnston t = in_pcblookup_local(inp->inp_pcbinfo, 26101f8ce83SMark Johnston sin.sin_addr, lport, INPLOOKUP_WILDCARD, 26201f8ce83SMark Johnston cred); 2633aff4ccdSMark Johnston if (t != NULL && 26401f8ce83SMark Johnston (inp->inp_socket->so_type != SOCK_STREAM || 26545a77bf2SMark Johnston in_nullhost(t->inp_faddr)) && 26686d02c5cSBjoern A. Zeeb (inp->inp_cred->cr_uid != 26786d02c5cSBjoern A. 
Zeeb t->inp_cred->cr_uid)) 268fb59c426SYoshinobu Inoue return (EADDRINUSE); 269fb59c426SYoshinobu Inoue } 27067107f45SBjoern A. Zeeb #endif 27182cd038dSYoshinobu Inoue } 27201f8ce83SMark Johnston t = in6_pcblookup_local(inp->inp_pcbinfo, laddr, lport, 27301f8ce83SMark Johnston lookupflags, cred); 27445a77bf2SMark Johnston if (t != NULL && ((reuseport | reuseport_lb) & 27545a77bf2SMark Johnston t->inp_socket->so_options) == 0) 27629381b36SMikolaj Golub return (EADDRINUSE); 27767107f45SBjoern A. Zeeb #ifdef INET 27833841545SHajimu UMEMOTO if ((inp->inp_flags & IN6P_IPV6_V6ONLY) == 0 && 27901f8ce83SMark Johnston IN6_IS_ADDR_UNSPECIFIED(laddr)) { 280fb59c426SYoshinobu Inoue struct sockaddr_in sin; 281fb59c426SYoshinobu Inoue 282fb59c426SYoshinobu Inoue in6_sin6_2_sin(&sin, sin6); 28301f8ce83SMark Johnston t = in_pcblookup_local(inp->inp_pcbinfo, sin.sin_addr, 28468e0d7e0SRobert Watson lport, lookupflags, cred); 28545a77bf2SMark Johnston if (t != NULL && ((reuseport | reuseport_lb) & 28645a77bf2SMark Johnston t->inp_socket->so_options) == 0 && 28745a77bf2SMark Johnston (!in_nullhost(t->inp_laddr) || 2881a43cff9SSean Bruno (t->inp_vflag & INP_IPV6PROTO) != 0)) { 289fb59c426SYoshinobu Inoue return (EADDRINUSE); 290fb59c426SYoshinobu Inoue } 2911a43cff9SSean Bruno } 29267107f45SBjoern A. 
Zeeb #endif 29382cd038dSYoshinobu Inoue } 29401f8ce83SMark Johnston return (0); 29501f8ce83SMark Johnston } 29601f8ce83SMark Johnston 29701f8ce83SMark Johnston int 29801f8ce83SMark Johnston in6_pcbbind(struct inpcb *inp, struct sockaddr_in6 *sin6, struct ucred *cred) 29901f8ce83SMark Johnston { 30001f8ce83SMark Johnston struct socket *so = inp->inp_socket; 30101f8ce83SMark Johnston u_short lport = 0; 30201f8ce83SMark Johnston int error, lookupflags, sooptions; 30301f8ce83SMark Johnston 30401f8ce83SMark Johnston INP_WLOCK_ASSERT(inp); 305ffb3d384SMark Johnston INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); 30601f8ce83SMark Johnston 30701f8ce83SMark Johnston if (inp->inp_lport || !IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 30801f8ce83SMark Johnston return (EINVAL); 30901f8ce83SMark Johnston 31001f8ce83SMark Johnston lookupflags = 0; 31101f8ce83SMark Johnston sooptions = atomic_load_int(&so->so_options); 31201f8ce83SMark Johnston if ((sooptions & (SO_REUSEADDR | SO_REUSEPORT | SO_REUSEPORT_LB)) == 0) 31301f8ce83SMark Johnston lookupflags = INPLOOKUP_WILDCARD; 31401f8ce83SMark Johnston if (sin6 == NULL) { 31501f8ce83SMark Johnston if ((error = prison_local_ip6(cred, &inp->in6p_laddr, 31601f8ce83SMark Johnston ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0))) != 0) 31701f8ce83SMark Johnston return (error); 31801f8ce83SMark Johnston } else { 31901f8ce83SMark Johnston KASSERT(sin6->sin6_family == AF_INET6, 32001f8ce83SMark Johnston ("%s: invalid address family for %p", __func__, sin6)); 32101f8ce83SMark Johnston KASSERT(sin6->sin6_len == sizeof(*sin6), 32201f8ce83SMark Johnston ("%s: invalid address length for %p", __func__, sin6)); 32301f8ce83SMark Johnston 32401f8ce83SMark Johnston if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0) 32501f8ce83SMark Johnston return(error); 32601f8ce83SMark Johnston 32701f8ce83SMark Johnston if ((error = prison_local_ip6(cred, &sin6->sin6_addr, 32801f8ce83SMark Johnston ((inp->inp_flags & IN6P_IPV6_V6ONLY) != 0))) != 0) 32901f8ce83SMark 
Johnston return (error); 33001f8ce83SMark Johnston 33101f8ce83SMark Johnston /* See if this address/port combo is available. */ 33201f8ce83SMark Johnston error = in6_pcbbind_avail(inp, sin6, sooptions, lookupflags, 33301f8ce83SMark Johnston cred); 33401f8ce83SMark Johnston if (error != 0) 33501f8ce83SMark Johnston return (error); 33601f8ce83SMark Johnston 33701f8ce83SMark Johnston lport = sin6->sin6_port; 33882cd038dSYoshinobu Inoue inp->in6p_laddr = sin6->sin6_addr; 33982cd038dSYoshinobu Inoue } 34082cd038dSYoshinobu Inoue if (lport == 0) { 3414616026fSErmal Luçi if ((error = in6_pcbsetport(&inp->in6p_laddr, inp, cred)) != 0) { 3424a2b2562SBjoern A. Zeeb /* Undo an address bind that may have occurred. */ 3434a2b2562SBjoern A. Zeeb inp->in6p_laddr = in6addr_any; 344b89e82ddSJamie Gritton return (error); 3454a2b2562SBjoern A. Zeeb } 34655fd3bafSBjoern A. Zeeb } else { 34782cd038dSYoshinobu Inoue inp->inp_lport = lport; 34882cd038dSYoshinobu Inoue if (in_pcbinshash(inp) != 0) { 34982cd038dSYoshinobu Inoue inp->in6p_laddr = in6addr_any; 35082cd038dSYoshinobu Inoue inp->inp_lport = 0; 35182cd038dSYoshinobu Inoue return (EAGAIN); 35282cd038dSYoshinobu Inoue } 353686cdd19SJun-ichiro itojun Hagino } 35482cd038dSYoshinobu Inoue return (0); 35582cd038dSYoshinobu Inoue } 35682cd038dSYoshinobu Inoue 35782cd038dSYoshinobu Inoue /* 35882cd038dSYoshinobu Inoue * Transform old in6_pcbconnect() into an inner subroutine for new 35982cd038dSYoshinobu Inoue * in6_pcbconnect(): Do some validity-checking on the remote 36082cd038dSYoshinobu Inoue * address (in mbuf 'nam') and then determine local host address 36182cd038dSYoshinobu Inoue * (i.e., which interface) to use to access that remote host. 36282cd038dSYoshinobu Inoue * 36382cd038dSYoshinobu Inoue * This preserves definition of in6_pcbconnect(), while supporting a 36482cd038dSYoshinobu Inoue * slightly different version for T/TCP. 
(This is more than 36582cd038dSYoshinobu Inoue * a bit of a kludge, but cleaning up the internal interfaces would 36682cd038dSYoshinobu Inoue * have forced minor changes in every protocol). 36782cd038dSYoshinobu Inoue */ 368a7e201bbSAndrey V. Elsukov static int 369f161d294SMark Johnston in6_pcbladdr(struct inpcb *inp, struct sockaddr_in6 *sin6, 3700bf5377bSAndrey V. Elsukov struct in6_addr *plocal_addr6, bool sas_required) 37182cd038dSYoshinobu Inoue { 37282cd038dSYoshinobu Inoue int error = 0; 373a1f7e5f8SHajimu UMEMOTO int scope_ambiguous = 0; 37488d166bfSBjoern A. Zeeb struct in6_addr in6a; 37582cd038dSYoshinobu Inoue 3763d76be28SGleb Smirnoff NET_EPOCH_ASSERT(); 3778501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 378fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); /* XXXRW: why? */ 3798deea4a8SRobert Watson 38082cd038dSYoshinobu Inoue if (sin6->sin6_port == 0) 38182cd038dSYoshinobu Inoue return (EADDRNOTAVAIL); 38282cd038dSYoshinobu Inoue 383603724d3SBjoern A. Zeeb if (sin6->sin6_scope_id == 0 && !V_ip6_use_defzone) 384a1f7e5f8SHajimu UMEMOTO scope_ambiguous = 1; 385603724d3SBjoern A. Zeeb if ((error = sa6_embedscope(sin6, V_ip6_use_defzone)) != 0) 386a1f7e5f8SHajimu UMEMOTO return(error); 387a1f7e5f8SHajimu UMEMOTO 388417b35a9SMark Johnston if (V_connect_in6addr_wild && !CK_STAILQ_EMPTY(&V_in6_ifaddrhead)) { 38982cd038dSYoshinobu Inoue /* 39082cd038dSYoshinobu Inoue * If the destination address is UNSPECIFIED addr, 39182cd038dSYoshinobu Inoue * use the loopback addr, e.g ::1. 
39282cd038dSYoshinobu Inoue */ 39382cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) 39482cd038dSYoshinobu Inoue sin6->sin6_addr = in6addr_loopback; 3950c605af3SMark Johnston } else if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) { 3960c605af3SMark Johnston return (ENETUNREACH); 39782cd038dSYoshinobu Inoue } 3980c605af3SMark Johnston 399b89e82ddSJamie Gritton if ((error = prison_remote_ip6(inp->inp_cred, &sin6->sin6_addr)) != 0) 400b89e82ddSJamie Gritton return (error); 401a1f7e5f8SHajimu UMEMOTO 4020bf5377bSAndrey V. Elsukov if (sas_required) { 403601c0b8bSAlexander V. Chernikov error = in6_selectsrc_socket(sin6, inp->in6p_outputopts, 404601c0b8bSAlexander V. Chernikov inp, inp->inp_cred, scope_ambiguous, &in6a, NULL); 40588d166bfSBjoern A. Zeeb if (error) 40688d166bfSBjoern A. Zeeb return (error); 4070bf5377bSAndrey V. Elsukov } else { 4080bf5377bSAndrey V. Elsukov /* 4090bf5377bSAndrey V. Elsukov * Source address selection isn't required when syncache 4100bf5377bSAndrey V. Elsukov * has already established connection and both source and 4110bf5377bSAndrey V. Elsukov * destination addresses was chosen. 4120bf5377bSAndrey V. Elsukov * 4130bf5377bSAndrey V. Elsukov * This also includes the case when fwd_tag was used to 4140bf5377bSAndrey V. Elsukov * select source address in tcp_input(). 4150bf5377bSAndrey V. Elsukov */ 4160bf5377bSAndrey V. Elsukov in6a = inp->in6p_laddr; 4170bf5377bSAndrey V. Elsukov } 4180bf5377bSAndrey V. Elsukov 419713264f6SMark Johnston if (IN6_IS_ADDR_UNSPECIFIED(&in6a)) 420713264f6SMark Johnston return (EHOSTUNREACH); 42188d166bfSBjoern A. Zeeb /* 42288d166bfSBjoern A. Zeeb * Do not update this earlier, in case we return with an error. 42388d166bfSBjoern A. Zeeb * 424601c0b8bSAlexander V. Chernikov * XXX: this in6_selectsrc_socket result might replace the bound local 425681ffdf9SBjoern A. Zeeb * address with the address specified by setsockopt(IPV6_PKTINFO). 42688d166bfSBjoern A. Zeeb * Is it the intended behavior? 
42788d166bfSBjoern A. Zeeb */ 42888d166bfSBjoern A. Zeeb *plocal_addr6 = in6a; 42988d166bfSBjoern A. Zeeb 43082cd038dSYoshinobu Inoue /* 43182cd038dSYoshinobu Inoue * Don't do pcblookup call here; return interface in 43282cd038dSYoshinobu Inoue * plocal_addr6 43382cd038dSYoshinobu Inoue * and exit to caller, that will do the lookup. 43482cd038dSYoshinobu Inoue */ 435a1f7e5f8SHajimu UMEMOTO 43682cd038dSYoshinobu Inoue return (0); 43782cd038dSYoshinobu Inoue } 43882cd038dSYoshinobu Inoue 43982cd038dSYoshinobu Inoue /* 44082cd038dSYoshinobu Inoue * Outer subroutine: 44182cd038dSYoshinobu Inoue * Connect from a socket to a specified address. 44282cd038dSYoshinobu Inoue * Both address and port must be specified in argument sin. 44382cd038dSYoshinobu Inoue * If don't have a local address for this socket yet, 44482cd038dSYoshinobu Inoue * then pick one. 44582cd038dSYoshinobu Inoue */ 44682cd038dSYoshinobu Inoue int 447a9d22cceSGleb Smirnoff in6_pcbconnect(struct inpcb *inp, struct sockaddr_in6 *sin6, struct ucred *cred, 4480bf5377bSAndrey V. 
Elsukov bool sas_required) 44982cd038dSYoshinobu Inoue { 450fa046d87SRobert Watson struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 45125102351SMike Karels struct sockaddr_in6 laddr6; 45282cd038dSYoshinobu Inoue int error; 45382cd038dSYoshinobu Inoue 4543d76be28SGleb Smirnoff NET_EPOCH_ASSERT(); 4553d76be28SGleb Smirnoff INP_WLOCK_ASSERT(inp); 4563d76be28SGleb Smirnoff INP_HASH_WLOCK_ASSERT(pcbinfo); 457f161d294SMark Johnston KASSERT(sin6->sin6_family == AF_INET6, 458f161d294SMark Johnston ("%s: invalid address family for %p", __func__, sin6)); 459f161d294SMark Johnston KASSERT(sin6->sin6_len == sizeof(*sin6), 460f161d294SMark Johnston ("%s: invalid address length for %p", __func__, sin6)); 461fdb987beSMark Johnston KASSERT(IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr), 462fdb987beSMark Johnston ("%s: inp is already connected", __func__)); 463f161d294SMark Johnston 46425102351SMike Karels bzero(&laddr6, sizeof(laddr6)); 46525102351SMike Karels laddr6.sin6_family = AF_INET6; 46625102351SMike Karels 4670c325f53SAlexander V. Chernikov #ifdef ROUTE_MPATH 4680c325f53SAlexander V. Chernikov if (CALC_FLOWID_OUTBOUND) { 4690c325f53SAlexander V. Chernikov uint32_t hash_type, hash_val; 4700c325f53SAlexander V. Chernikov 4710c325f53SAlexander V. Chernikov hash_val = fib6_calc_software_hash(&inp->in6p_laddr, 4720c325f53SAlexander V. Chernikov &sin6->sin6_addr, 0, sin6->sin6_port, 4730c325f53SAlexander V. Chernikov inp->inp_socket->so_proto->pr_protocol, &hash_type); 4740c325f53SAlexander V. Chernikov inp->inp_flowid = hash_val; 4750c325f53SAlexander V. Chernikov inp->inp_flowtype = hash_type; 4760c325f53SAlexander V. Chernikov } 4770c325f53SAlexander V. Chernikov #endif 47882cd038dSYoshinobu Inoue /* 47982cd038dSYoshinobu Inoue * Call inner routine, to assign local interface address. 48088ff5695SSUZUKI Shinsuke * in6_pcbladdr() may automatically fill in sin6_scope_id. 48182cd038dSYoshinobu Inoue */ 4820bf5377bSAndrey V. 
Elsukov if ((error = in6_pcbladdr(inp, sin6, &laddr6.sin6_addr, 4830bf5377bSAndrey V. Elsukov sas_required)) != 0) 48482cd038dSYoshinobu Inoue return (error); 48582cd038dSYoshinobu Inoue 486fa046d87SRobert Watson if (in6_pcblookup_hash_locked(pcbinfo, &sin6->sin6_addr, 4874130ea61SMark Johnston sin6->sin6_port, IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) ? 4884130ea61SMark Johnston &laddr6.sin6_addr : &inp->in6p_laddr, inp->inp_lport, 0, 4894130ea61SMark Johnston M_NODOM) != NULL) 49082cd038dSYoshinobu Inoue return (EADDRINUSE); 49182cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) { 49282cd038dSYoshinobu Inoue if (inp->inp_lport == 0) { 49325102351SMike Karels error = in_pcb_lport_dest(inp, 49425102351SMike Karels (struct sockaddr *) &laddr6, &inp->inp_lport, 495440598ddSJonathan T. Looney (struct sockaddr *) sin6, sin6->sin6_port, cred, 496440598ddSJonathan T. Looney INPLOOKUP_WILDCARD); 4974616026fSErmal Luçi if (error) 49882cd038dSYoshinobu Inoue return (error); 49982cd038dSYoshinobu Inoue } 50025102351SMike Karels inp->in6p_laddr = laddr6.sin6_addr; 50182cd038dSYoshinobu Inoue } 50282cd038dSYoshinobu Inoue inp->in6p_faddr = sin6->sin6_addr; 50382cd038dSYoshinobu Inoue inp->inp_fport = sin6->sin6_port; 50433841545SHajimu UMEMOTO /* update flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 505fc384fa5SBjoern A. Zeeb inp->inp_flow &= ~IPV6_FLOWLABEL_MASK; 506fc384fa5SBjoern A. Zeeb if (inp->inp_flags & IN6P_AUTOFLOWLABEL) 507fc384fa5SBjoern A. Zeeb inp->inp_flow |= 508b79274baSHajimu UMEMOTO (htonl(ip6_randomflowlabel()) & IPV6_FLOWLABEL_MASK); 50982cd038dSYoshinobu Inoue 510fdb987beSMark Johnston if ((inp->inp_flags & INP_INHASHLIST) != 0) { 511db0ac6deSCy Schubert in_pcbrehash(inp); 512fe1274eeSMichael Tuexen } else { 513db0ac6deSCy Schubert in_pcbinshash(inp); 514fe1274eeSMichael Tuexen } 5152cb64cb2SGeorge V. 
Neville-Neil 51682cd038dSYoshinobu Inoue return (0); 51782cd038dSYoshinobu Inoue } 51882cd038dSYoshinobu Inoue 51982cd038dSYoshinobu Inoue void 5201272577eSXin LI in6_pcbdisconnect(struct inpcb *inp) 52182cd038dSYoshinobu Inoue { 52207385abdSRobert Watson 5238501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 524fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(inp->inp_pcbinfo); 525fdb987beSMark Johnston KASSERT(inp->inp_smr == SMR_SEQ_INVALID, 526fdb987beSMark Johnston ("%s: inp %p was already disconnected", __func__, inp)); 52707385abdSRobert Watson 528fdb987beSMark Johnston in_pcbremhash_locked(inp); 529fdb987beSMark Johnston 530fdb987beSMark Johnston /* See the comment in in_pcbinshash(). */ 531fdb987beSMark Johnston inp->inp_smr = smr_advance(inp->inp_pcbinfo->ipi_smr); 532fdb987beSMark Johnston 533fdb987beSMark Johnston /* XXX-MJ torn writes are visible to SMR lookup */ 5342589ec0fSMark Johnston memset(&inp->in6p_laddr, 0, sizeof(inp->in6p_laddr)); 5352589ec0fSMark Johnston memset(&inp->in6p_faddr, 0, sizeof(inp->in6p_faddr)); 53682cd038dSYoshinobu Inoue inp->inp_fport = 0; 53733841545SHajimu UMEMOTO /* clear flowinfo - draft-itojun-ipv6-flowlabel-api-00 */ 538fc384fa5SBjoern A. 
Zeeb inp->inp_flow &= ~IPV6_FLOWLABEL_MASK; 53982cd038dSYoshinobu Inoue } 54082cd038dSYoshinobu Inoue 54182cd038dSYoshinobu Inoue int 5420fac350cSGleb Smirnoff in6_getsockaddr(struct socket *so, struct sockaddr *sa) 54382cd038dSYoshinobu Inoue { 5443e85b721SEd Maste struct inpcb *inp; 54582cd038dSYoshinobu Inoue 54682cd038dSYoshinobu Inoue inp = sotoinpcb(so); 54754d642bbSRobert Watson KASSERT(inp != NULL, ("in6_getsockaddr: inp == NULL")); 54848477723SRobert Watson 5490fac350cSGleb Smirnoff *(struct sockaddr_in6 *)sa = (struct sockaddr_in6 ){ 5500fac350cSGleb Smirnoff .sin6_len = sizeof(struct sockaddr_in6), 5510fac350cSGleb Smirnoff .sin6_family = AF_INET6, 5520fac350cSGleb Smirnoff .sin6_port = inp->inp_lport, 5530fac350cSGleb Smirnoff .sin6_addr = inp->in6p_laddr, 5540fac350cSGleb Smirnoff }; 5550fac350cSGleb Smirnoff /* XXX: should catch errors */ 5560fac350cSGleb Smirnoff (void)sa6_recoverscope((struct sockaddr_in6 *)sa); 55782cd038dSYoshinobu Inoue 5580fac350cSGleb Smirnoff return (0); 55982cd038dSYoshinobu Inoue } 56082cd038dSYoshinobu Inoue 56182cd038dSYoshinobu Inoue int 5620fac350cSGleb Smirnoff in6_getpeeraddr(struct socket *so, struct sockaddr *sa) 56382cd038dSYoshinobu Inoue { 56482cd038dSYoshinobu Inoue struct inpcb *inp; 56582cd038dSYoshinobu Inoue 56682cd038dSYoshinobu Inoue inp = sotoinpcb(so); 56754d642bbSRobert Watson KASSERT(inp != NULL, ("in6_getpeeraddr: inp == NULL")); 56848477723SRobert Watson 5690fac350cSGleb Smirnoff *(struct sockaddr_in6 *)sa = (struct sockaddr_in6 ){ 5700fac350cSGleb Smirnoff .sin6_len = sizeof(struct sockaddr_in6), 5710fac350cSGleb Smirnoff .sin6_family = AF_INET6, 5720fac350cSGleb Smirnoff .sin6_port = inp->inp_fport, 5730fac350cSGleb Smirnoff .sin6_addr = inp->in6p_faddr, 5740fac350cSGleb Smirnoff }; 5750fac350cSGleb Smirnoff /* XXX: should catch errors */ 5760fac350cSGleb Smirnoff (void)sa6_recoverscope((struct sockaddr_in6 *)sa); 57782cd038dSYoshinobu Inoue 5780fac350cSGleb Smirnoff return (0); 
57982cd038dSYoshinobu Inoue } 58082cd038dSYoshinobu Inoue 58182cd038dSYoshinobu Inoue int 5820fac350cSGleb Smirnoff in6_mapped_sockaddr(struct socket *so, struct sockaddr *sa) 58382cd038dSYoshinobu Inoue { 58482cd038dSYoshinobu Inoue int error; 585042fb58dSLexi Winter #ifdef INET 586042fb58dSLexi Winter struct inpcb *inp; 58782cd038dSYoshinobu Inoue 58848477723SRobert Watson inp = sotoinpcb(so); 58948477723SRobert Watson KASSERT(inp != NULL, ("in6_mapped_sockaddr: inp == NULL")); 59048477723SRobert Watson 5915fac4178SHajimu UMEMOTO if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 5920fac350cSGleb Smirnoff struct sockaddr_in sin; 5930fac350cSGleb Smirnoff 5940fac350cSGleb Smirnoff error = in_getsockaddr(so, (struct sockaddr *)&sin); 595369dc8ceSEivind Eklund if (error == 0) 5960fac350cSGleb Smirnoff in6_sin_2_v4mapsin6(&sin, (struct sockaddr_in6 *)sa); 59767107f45SBjoern A. Zeeb } else 59867107f45SBjoern A. Zeeb #endif 59967107f45SBjoern A. Zeeb { 60054d642bbSRobert Watson /* scope issues will be handled in in6_getsockaddr(). 
*/ 6010fac350cSGleb Smirnoff error = in6_getsockaddr(so, sa); 6027efe5d92SHajimu UMEMOTO } 60382cd038dSYoshinobu Inoue 60482cd038dSYoshinobu Inoue return error; 60582cd038dSYoshinobu Inoue } 60682cd038dSYoshinobu Inoue 60782cd038dSYoshinobu Inoue int 6080fac350cSGleb Smirnoff in6_mapped_peeraddr(struct socket *so, struct sockaddr *sa) 60982cd038dSYoshinobu Inoue { 61082cd038dSYoshinobu Inoue int error; 611042fb58dSLexi Winter #ifdef INET 612042fb58dSLexi Winter struct inpcb *inp; 61382cd038dSYoshinobu Inoue 61448477723SRobert Watson inp = sotoinpcb(so); 61548477723SRobert Watson KASSERT(inp != NULL, ("in6_mapped_peeraddr: inp == NULL")); 61648477723SRobert Watson 6175fac4178SHajimu UMEMOTO if ((inp->inp_vflag & (INP_IPV4 | INP_IPV6)) == INP_IPV4) { 6180fac350cSGleb Smirnoff struct sockaddr_in sin; 6190fac350cSGleb Smirnoff 6200fac350cSGleb Smirnoff error = in_getpeeraddr(so, (struct sockaddr *)&sin); 621369dc8ceSEivind Eklund if (error == 0) 6220fac350cSGleb Smirnoff in6_sin_2_v4mapsin6(&sin, (struct sockaddr_in6 *)sa); 62382cd038dSYoshinobu Inoue } else 62467107f45SBjoern A. Zeeb #endif 625042fb58dSLexi Winter { 62654d642bbSRobert Watson /* scope issues will be handled in in6_getpeeraddr(). */ 6270fac350cSGleb Smirnoff error = in6_getpeeraddr(so, sa); 628042fb58dSLexi Winter } 62982cd038dSYoshinobu Inoue 63082cd038dSYoshinobu Inoue return error; 63182cd038dSYoshinobu Inoue } 63282cd038dSYoshinobu Inoue 63382cd038dSYoshinobu Inoue /* 63482cd038dSYoshinobu Inoue * Pass some notification to all connections of a protocol 63582cd038dSYoshinobu Inoue * associated with address dst. The local address and/or port numbers 63682cd038dSYoshinobu Inoue * may be specified to limit the search. The "usual action" will be 63782cd038dSYoshinobu Inoue * taken, depending on the ctlinput cmd. The caller must filter any 63882cd038dSYoshinobu Inoue * cmds that are uninteresting (e.g., no error in the map). 
63982cd038dSYoshinobu Inoue * Call the protocol specific routine (if any) to report 64082cd038dSYoshinobu Inoue * any errors for each matching socket. 64182cd038dSYoshinobu Inoue */ 642db0ac6deSCy Schubert static bool 643db0ac6deSCy Schubert inp_match6(const struct inpcb *inp, void *v __unused) 644db0ac6deSCy Schubert { 645db0ac6deSCy Schubert 646db0ac6deSCy Schubert return ((inp->inp_vflag & INP_IPV6) != 0); 647db0ac6deSCy Schubert } 648fcb3f813SGleb Smirnoff 64982cd038dSYoshinobu Inoue void 65043d39ca7SGleb Smirnoff in6_pcbnotify(struct inpcbinfo *pcbinfo, struct sockaddr_in6 *sa6_dst, 65143d39ca7SGleb Smirnoff u_int fport_arg, const struct sockaddr_in6 *src, u_int lport_arg, 652fcb3f813SGleb Smirnoff int errno, void *cmdarg, 6539233d8f3SDavid E. O'Brien struct inpcb *(*notify)(struct inpcb *, int)) 65482cd038dSYoshinobu Inoue { 655db0ac6deSCy Schubert struct inpcb_iterator inpi = INP_ITERATOR(pcbinfo, INPLOOKUP_WLOCKPCB, 656db0ac6deSCy Schubert inp_match6, NULL); 657db0ac6deSCy Schubert struct inpcb *inp; 65843d39ca7SGleb Smirnoff struct sockaddr_in6 sa6_src; 65982cd038dSYoshinobu Inoue u_short fport = fport_arg, lport = lport_arg; 66033841545SHajimu UMEMOTO u_int32_t flowinfo; 66133841545SHajimu UMEMOTO 66233841545SHajimu UMEMOTO if (IN6_IS_ADDR_UNSPECIFIED(&sa6_dst->sin6_addr)) 66382cd038dSYoshinobu Inoue return; 66482cd038dSYoshinobu Inoue 66582cd038dSYoshinobu Inoue /* 66633841545SHajimu UMEMOTO * note that src can be NULL when we get notify by local fragmentation. 66733841545SHajimu UMEMOTO */ 66843d39ca7SGleb Smirnoff sa6_src = (src == NULL) ? 
sa6_any : *src; 66933841545SHajimu UMEMOTO flowinfo = sa6_src.sin6_flowinfo; 67033841545SHajimu UMEMOTO 671db0ac6deSCy Schubert while ((inp = inp_next(&inpi)) != NULL) { 672db0ac6deSCy Schubert INP_WLOCK_ASSERT(inp); 673686cdd19SJun-ichiro itojun Hagino /* 674efddf5c6SHajimu UMEMOTO * If the error designates a new path MTU for a destination 675efddf5c6SHajimu UMEMOTO * and the application (associated with this socket) wanted to 6768f1beb88SAndrey V. Elsukov * know the value, notify. 677efddf5c6SHajimu UMEMOTO * XXX: should we avoid to notify the value to TCP sockets? 678efddf5c6SHajimu UMEMOTO */ 679fcb3f813SGleb Smirnoff if (errno == EMSGSIZE && cmdarg != NULL) 68043d39ca7SGleb Smirnoff ip6_notify_pmtu(inp, sa6_dst, *(uint32_t *)cmdarg); 681efddf5c6SHajimu UMEMOTO 682efddf5c6SHajimu UMEMOTO /* 68333841545SHajimu UMEMOTO * Detect if we should notify the error. If no source and 68404389c85SGordon Bergling * destination ports are specified, but non-zero flowinfo and 68533841545SHajimu UMEMOTO * local address match, notify the error. This is the case 68633841545SHajimu UMEMOTO * when the error is delivered with an encrypted buffer 68733841545SHajimu UMEMOTO * by ESP. Otherwise, just compare addresses and ports 68833841545SHajimu UMEMOTO * as usual. 689686cdd19SJun-ichiro itojun Hagino */ 69033841545SHajimu UMEMOTO if (lport == 0 && fport == 0 && flowinfo && 69133841545SHajimu UMEMOTO inp->inp_socket != NULL && 692fc384fa5SBjoern A. 
Zeeb flowinfo == (inp->inp_flow & IPV6_FLOWLABEL_MASK) && 69333841545SHajimu UMEMOTO IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, &sa6_src.sin6_addr)) 69433841545SHajimu UMEMOTO goto do_notify; 69533841545SHajimu UMEMOTO else if (!IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, 69633841545SHajimu UMEMOTO &sa6_dst->sin6_addr) || 69782cd038dSYoshinobu Inoue inp->inp_socket == 0 || 69882cd038dSYoshinobu Inoue (lport && inp->inp_lport != lport) || 69933841545SHajimu UMEMOTO (!IN6_IS_ADDR_UNSPECIFIED(&sa6_src.sin6_addr) && 70033841545SHajimu UMEMOTO !IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, 70133841545SHajimu UMEMOTO &sa6_src.sin6_addr)) || 702f31f65a7SRobert Watson (fport && inp->inp_fport != fport)) { 70382cd038dSYoshinobu Inoue continue; 704f31f65a7SRobert Watson } 705686cdd19SJun-ichiro itojun Hagino 70633841545SHajimu UMEMOTO do_notify: 707db0ac6deSCy Schubert if (notify) 708db0ac6deSCy Schubert (*notify)(inp, errno); 70982cd038dSYoshinobu Inoue } 71082cd038dSYoshinobu Inoue } 71182cd038dSYoshinobu Inoue 71282cd038dSYoshinobu Inoue /* 713fa046d87SRobert Watson * Lookup a PCB based on the local address and port. Caller must hold the 714fa046d87SRobert Watson * hash lock. No inpcb locks or references are acquired. 
71582cd038dSYoshinobu Inoue */ 71682cd038dSYoshinobu Inoue struct inpcb * 71752ef944bSMark Johnston in6_pcblookup_local(struct inpcbinfo *pcbinfo, const struct in6_addr *laddr, 71868e0d7e0SRobert Watson u_short lport, int lookupflags, struct ucred *cred) 71982cd038dSYoshinobu Inoue { 7203e85b721SEd Maste struct inpcb *inp; 72182cd038dSYoshinobu Inoue int matchwild = 3, wildcard; 72282cd038dSYoshinobu Inoue 72368e0d7e0SRobert Watson KASSERT((lookupflags & ~(INPLOOKUP_WILDCARD)) == 0, 72468e0d7e0SRobert Watson ("%s: invalid lookup flags %d", __func__, lookupflags)); 72568e0d7e0SRobert Watson 726c17cd08fSGleb Smirnoff INP_HASH_LOCK_ASSERT(pcbinfo); 7278deea4a8SRobert Watson 72868e0d7e0SRobert Watson if ((lookupflags & INPLOOKUP_WILDCARD) == 0) { 72982cd038dSYoshinobu Inoue struct inpcbhead *head; 73082cd038dSYoshinobu Inoue /* 73182cd038dSYoshinobu Inoue * Look for an unconnected (wildcard foreign addr) PCB that 73282cd038dSYoshinobu Inoue * matches the local address and port we're looking for. 73382cd038dSYoshinobu Inoue */ 734fdb987beSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 7351b44e5ffSAndrey V. Elsukov pcbinfo->ipi_hashmask)]; 736fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 737413628a7SBjoern A. Zeeb /* XXX inp locking */ 738369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV6) == 0) 73982cd038dSYoshinobu Inoue continue; 74082cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) && 74182cd038dSYoshinobu Inoue IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 74282cd038dSYoshinobu Inoue inp->inp_lport == lport) { 743413628a7SBjoern A. Zeeb /* Found. */ 744ac1750ddSMark Johnston if (prison_equal_ip6(cred->cr_prison, 7450304c731SJamie Gritton inp->inp_cred->cr_prison)) 74682cd038dSYoshinobu Inoue return (inp); 74782cd038dSYoshinobu Inoue } 74882cd038dSYoshinobu Inoue } 74982cd038dSYoshinobu Inoue /* 75082cd038dSYoshinobu Inoue * Not found. 
75182cd038dSYoshinobu Inoue */ 75282cd038dSYoshinobu Inoue return (NULL); 75382cd038dSYoshinobu Inoue } else { 75482cd038dSYoshinobu Inoue struct inpcbporthead *porthash; 75582cd038dSYoshinobu Inoue struct inpcbport *phd; 75682cd038dSYoshinobu Inoue struct inpcb *match = NULL; 75782cd038dSYoshinobu Inoue /* 75882cd038dSYoshinobu Inoue * Best fit PCB lookup. 75982cd038dSYoshinobu Inoue * 76082cd038dSYoshinobu Inoue * First see if this local port is in use by looking on the 76182cd038dSYoshinobu Inoue * port hash list. 76282cd038dSYoshinobu Inoue */ 763712fc218SRobert Watson porthash = &pcbinfo->ipi_porthashbase[INP_PCBPORTHASH(lport, 764712fc218SRobert Watson pcbinfo->ipi_porthashmask)]; 765b872626dSMatt Macy CK_LIST_FOREACH(phd, porthash, phd_hash) { 76682cd038dSYoshinobu Inoue if (phd->phd_port == lport) 76782cd038dSYoshinobu Inoue break; 76882cd038dSYoshinobu Inoue } 76982cd038dSYoshinobu Inoue if (phd != NULL) { 77082cd038dSYoshinobu Inoue /* 77182cd038dSYoshinobu Inoue * Port is in use by one or more PCBs. Look for best 77282cd038dSYoshinobu Inoue * fit. 77382cd038dSYoshinobu Inoue */ 774b872626dSMatt Macy CK_LIST_FOREACH(inp, &phd->phd_pcblist, inp_portlist) { 77582cd038dSYoshinobu Inoue wildcard = 0; 776ac1750ddSMark Johnston if (!prison_equal_ip6(cred->cr_prison, 7770304c731SJamie Gritton inp->inp_cred->cr_prison)) 778413628a7SBjoern A. Zeeb continue; 779413628a7SBjoern A. 
Zeeb /* XXX inp locking */ 780369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV6) == 0) 78182cd038dSYoshinobu Inoue continue; 78282cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr)) 78382cd038dSYoshinobu Inoue wildcard++; 78482cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED( 78582cd038dSYoshinobu Inoue &inp->in6p_laddr)) { 78682cd038dSYoshinobu Inoue if (IN6_IS_ADDR_UNSPECIFIED(laddr)) 78782cd038dSYoshinobu Inoue wildcard++; 78882cd038dSYoshinobu Inoue else if (!IN6_ARE_ADDR_EQUAL( 78982cd038dSYoshinobu Inoue &inp->in6p_laddr, laddr)) 79082cd038dSYoshinobu Inoue continue; 79182cd038dSYoshinobu Inoue } else { 79282cd038dSYoshinobu Inoue if (!IN6_IS_ADDR_UNSPECIFIED(laddr)) 79382cd038dSYoshinobu Inoue wildcard++; 79482cd038dSYoshinobu Inoue } 79582cd038dSYoshinobu Inoue if (wildcard < matchwild) { 79682cd038dSYoshinobu Inoue match = inp; 79782cd038dSYoshinobu Inoue matchwild = wildcard; 798413628a7SBjoern A. Zeeb if (matchwild == 0) 79982cd038dSYoshinobu Inoue break; 80082cd038dSYoshinobu Inoue } 80182cd038dSYoshinobu Inoue } 80282cd038dSYoshinobu Inoue } 80382cd038dSYoshinobu Inoue return (match); 80482cd038dSYoshinobu Inoue } 80582cd038dSYoshinobu Inoue } 80682cd038dSYoshinobu Inoue 807db0ac6deSCy Schubert static bool 808db0ac6deSCy Schubert in6_multi_match(const struct inpcb *inp, void *v __unused) 809db0ac6deSCy Schubert { 810db0ac6deSCy Schubert 811db0ac6deSCy Schubert if ((inp->inp_vflag & INP_IPV6) && inp->in6p_moptions != NULL) 812db0ac6deSCy Schubert return (true); 813db0ac6deSCy Schubert else 814db0ac6deSCy Schubert return (false); 815db0ac6deSCy Schubert } 816db0ac6deSCy Schubert 817e43cc4aeSHajimu UMEMOTO void 8181272577eSXin LI in6_pcbpurgeif0(struct inpcbinfo *pcbinfo, struct ifnet *ifp) 819e43cc4aeSHajimu UMEMOTO { 820db0ac6deSCy Schubert struct inpcb_iterator inpi = INP_ITERATOR(pcbinfo, INPLOOKUP_RLOCKPCB, 821db0ac6deSCy Schubert in6_multi_match, NULL); 8220ecd976eSBjoern A. 
Zeeb struct inpcb *inp; 82359854ecfSHans Petter Selasky struct in6_multi *inm; 82459854ecfSHans Petter Selasky struct in6_mfilter *imf; 825e43cc4aeSHajimu UMEMOTO struct ip6_moptions *im6o; 826e43cc4aeSHajimu UMEMOTO 827db0ac6deSCy Schubert IN6_MULTI_LOCK_ASSERT(); 828db0ac6deSCy Schubert 829db0ac6deSCy Schubert while ((inp = inp_next(&inpi)) != NULL) { 830db0ac6deSCy Schubert INP_RLOCK_ASSERT(inp); 831db0ac6deSCy Schubert 8320ecd976eSBjoern A. Zeeb im6o = inp->in6p_moptions; 833e43cc4aeSHajimu UMEMOTO /* 83433cde130SBruce M Simpson * Unselect the outgoing ifp for multicast if it 83533cde130SBruce M Simpson * is being detached. 836e43cc4aeSHajimu UMEMOTO */ 837e43cc4aeSHajimu UMEMOTO if (im6o->im6o_multicast_ifp == ifp) 838e43cc4aeSHajimu UMEMOTO im6o->im6o_multicast_ifp = NULL; 839e43cc4aeSHajimu UMEMOTO /* 840e43cc4aeSHajimu UMEMOTO * Drop multicast group membership if we joined 841e43cc4aeSHajimu UMEMOTO * through the interface being detached. 842e43cc4aeSHajimu UMEMOTO */ 84359854ecfSHans Petter Selasky restart: 84459854ecfSHans Petter Selasky IP6_MFILTER_FOREACH(imf, &im6o->im6o_head) { 84559854ecfSHans Petter Selasky if ((inm = imf->im6f_in6m) == NULL) 84659854ecfSHans Petter Selasky continue; 84759854ecfSHans Petter Selasky if (inm->in6m_ifp != ifp) 84859854ecfSHans Petter Selasky continue; 84959854ecfSHans Petter Selasky ip6_mfilter_remove(&im6o->im6o_head, imf); 85059854ecfSHans Petter Selasky in6_leavegroup_locked(inm, NULL); 85159854ecfSHans Petter Selasky ip6_mfilter_free(imf); 85259854ecfSHans Petter Selasky goto restart; 853e43cc4aeSHajimu UMEMOTO } 854e43cc4aeSHajimu UMEMOTO } 855e43cc4aeSHajimu UMEMOTO } 856e43cc4aeSHajimu UMEMOTO 85782cd038dSYoshinobu Inoue /* 85882cd038dSYoshinobu Inoue * Check for alternatives when higher level complains 85982cd038dSYoshinobu Inoue * about service problems. For now, invalidate cached 86082cd038dSYoshinobu Inoue * routing information. 
If the route was created dynamically 86182cd038dSYoshinobu Inoue * (by a redirect), time to try a default gateway again. 86282cd038dSYoshinobu Inoue */ 86382cd038dSYoshinobu Inoue void 864ec86402eSBjoern A. Zeeb in6_losing(struct inpcb *inp) 86582cd038dSYoshinobu Inoue { 8661272577eSXin LI 867ec86402eSBjoern A. Zeeb RO_INVALIDATE_CACHE(&inp->inp_route6); 86882cd038dSYoshinobu Inoue } 86982cd038dSYoshinobu Inoue 87082cd038dSYoshinobu Inoue /* 87182cd038dSYoshinobu Inoue * After a routing change, flush old routing 87282cd038dSYoshinobu Inoue * and allocate a (hopefully) better one. 87382cd038dSYoshinobu Inoue */ 8743ce144eaSJeffrey Hsu struct inpcb * 875ec86402eSBjoern A. Zeeb in6_rtchange(struct inpcb *inp, int errno __unused) 87682cd038dSYoshinobu Inoue { 87784cc0778SGeorge V. Neville-Neil 878ec86402eSBjoern A. Zeeb RO_INVALIDATE_CACHE(&inp->inp_route6); 8793ce144eaSJeffrey Hsu return inp; 88082cd038dSYoshinobu Inoue } 88182cd038dSYoshinobu Inoue 882d93ec8cbSMark Johnston static bool 883d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(const struct inpcblbgroup *grp, int domain) 884d93ec8cbSMark Johnston { 885d93ec8cbSMark Johnston return (domain == M_NODOM || domain == grp->il_numa_domain); 886d93ec8cbSMark Johnston } 887d93ec8cbSMark Johnston 8881a43cff9SSean Bruno static struct inpcb * 8891a43cff9SSean Bruno in6_pcblookup_lbgroup(const struct inpcbinfo *pcbinfo, 8904130ea61SMark Johnston const struct in6_addr *faddr, uint16_t fport, const struct in6_addr *laddr, 8914130ea61SMark Johnston uint16_t lport, uint8_t domain) 8921a43cff9SSean Bruno { 8931a43cff9SSean Bruno const struct inpcblbgrouphead *hdr; 8941a43cff9SSean Bruno struct inpcblbgroup *grp; 895d93ec8cbSMark Johnston struct inpcblbgroup *jail_exact, *jail_wild, *local_exact, *local_wild; 896*a600aabeSMark Johnston struct inpcb *inp; 897*a600aabeSMark Johnston u_int count; 8981a43cff9SSean Bruno 8991a43cff9SSean Bruno INP_HASH_LOCK_ASSERT(pcbinfo); 9001a43cff9SSean Bruno 9019d2877fcSMark Johnston hdr = 
&pcbinfo->ipi_lbgrouphashbase[ 9029d2877fcSMark Johnston INP_PCBPORTHASH(lport, pcbinfo->ipi_lbgrouphashmask)]; 9031a43cff9SSean Bruno 9041a43cff9SSean Bruno /* 905d93ec8cbSMark Johnston * Search for an LB group match based on the following criteria: 906d93ec8cbSMark Johnston * - prefer jailed groups to non-jailed groups 907d93ec8cbSMark Johnston * - prefer exact source address matches to wildcard matches 908d93ec8cbSMark Johnston * - prefer groups bound to the specified NUMA domain 9091a43cff9SSean Bruno */ 910d93ec8cbSMark Johnston jail_exact = jail_wild = local_exact = local_wild = NULL; 91154af3d0dSMark Johnston CK_LIST_FOREACH(grp, hdr, il_list) { 912d93ec8cbSMark Johnston bool injail; 913d93ec8cbSMark Johnston 9144b82a7b6SAndrew Gallatin #ifdef INET 9154b82a7b6SAndrew Gallatin if (!(grp->il_vflag & INP_IPV6)) 9164b82a7b6SAndrew Gallatin continue; 9174b82a7b6SAndrew Gallatin #endif 918d3a4b0daSMark Johnston if (grp->il_lport != lport) 919d3a4b0daSMark Johnston continue; 9201a43cff9SSean Bruno 921d93ec8cbSMark Johnston injail = prison_flag(grp->il_cred, PR_IP6) != 0; 922d93ec8cbSMark Johnston if (injail && prison_check_ip6_locked(grp->il_cred->cr_prison, 923d93ec8cbSMark Johnston laddr) != 0) 924d93ec8cbSMark Johnston continue; 925d93ec8cbSMark Johnston 926a034518aSAndrew Gallatin if (IN6_ARE_ADDR_EQUAL(&grp->il6_laddr, laddr)) { 927d93ec8cbSMark Johnston if (injail) { 928d93ec8cbSMark Johnston jail_exact = grp; 929d93ec8cbSMark Johnston if (in6_pcblookup_lb_numa_match(grp, domain)) 930d93ec8cbSMark Johnston /* This is a perfect match. 
*/ 931d93ec8cbSMark Johnston goto out; 932d93ec8cbSMark Johnston } else if (local_exact == NULL || 933d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) { 934d93ec8cbSMark Johnston local_exact = grp; 935a034518aSAndrew Gallatin } 9364130ea61SMark Johnston } else if (IN6_IS_ADDR_UNSPECIFIED(&grp->il6_laddr)) { 937d93ec8cbSMark Johnston if (injail) { 938d93ec8cbSMark Johnston if (jail_wild == NULL || 939d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) 940d93ec8cbSMark Johnston jail_wild = grp; 941d93ec8cbSMark Johnston } else if (local_wild == NULL || 942d93ec8cbSMark Johnston in6_pcblookup_lb_numa_match(grp, domain)) { 943d93ec8cbSMark Johnston local_wild = grp; 944d93ec8cbSMark Johnston } 945d93ec8cbSMark Johnston } 946d93ec8cbSMark Johnston } 947d93ec8cbSMark Johnston 948d93ec8cbSMark Johnston if (jail_exact != NULL) 949d93ec8cbSMark Johnston grp = jail_exact; 950d93ec8cbSMark Johnston else if (jail_wild != NULL) 951d93ec8cbSMark Johnston grp = jail_wild; 952d93ec8cbSMark Johnston else if (local_exact != NULL) 953d93ec8cbSMark Johnston grp = local_exact; 954a034518aSAndrew Gallatin else 955d93ec8cbSMark Johnston grp = local_wild; 956d93ec8cbSMark Johnston if (grp == NULL) 957d93ec8cbSMark Johnston return (NULL); 958d93ec8cbSMark Johnston out: 959*a600aabeSMark Johnston /* 960*a600aabeSMark Johnston * Synchronize with in_pcblbgroup_insert(). 
961*a600aabeSMark Johnston */ 962*a600aabeSMark Johnston count = atomic_load_acq_int(&grp->il_inpcnt); 963*a600aabeSMark Johnston if (count == 0) 964*a600aabeSMark Johnston return (NULL); 965*a600aabeSMark Johnston inp = grp->il_inp[INP6_PCBLBGROUP_PKTHASH(faddr, lport, fport) % count]; 966*a600aabeSMark Johnston KASSERT(inp != NULL, ("%s: inp == NULL", __func__)); 967*a600aabeSMark Johnston return (inp); 9681a43cff9SSean Bruno } 9691a43cff9SSean Bruno 9703e98dcb3SMark Johnston static bool 9713e98dcb3SMark Johnston in6_pcblookup_exact_match(const struct inpcb *inp, const struct in6_addr *faddr, 9723e98dcb3SMark Johnston u_short fport, const struct in6_addr *laddr, u_short lport) 9733e98dcb3SMark Johnston { 9743e98dcb3SMark Johnston /* XXX inp locking */ 9753e98dcb3SMark Johnston if ((inp->inp_vflag & INP_IPV6) == 0) 9763e98dcb3SMark Johnston return (false); 9773e98dcb3SMark Johnston if (IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, faddr) && 9783e98dcb3SMark Johnston IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr) && 9793e98dcb3SMark Johnston inp->inp_fport == fport && inp->inp_lport == lport) 9803e98dcb3SMark Johnston return (true); 9813e98dcb3SMark Johnston return (false); 9823e98dcb3SMark Johnston } 9833e98dcb3SMark Johnston 9844130ea61SMark Johnston static struct inpcb * 9857b92493aSMark Johnston in6_pcblookup_hash_exact(struct inpcbinfo *pcbinfo, 9867b92493aSMark Johnston const struct in6_addr *faddr, u_short fport, 9877b92493aSMark Johnston const struct in6_addr *laddr, u_short lport) 98882cd038dSYoshinobu Inoue { 98982cd038dSYoshinobu Inoue struct inpcbhead *head; 9903e98dcb3SMark Johnston struct inpcb *inp; 99168e0d7e0SRobert Watson 992fa046d87SRobert Watson INP_HASH_LOCK_ASSERT(pcbinfo); 9938deea4a8SRobert Watson 99482cd038dSYoshinobu Inoue /* 99582cd038dSYoshinobu Inoue * First look for an exact match. 
99682cd038dSYoshinobu Inoue */ 997fdb987beSMark Johnston head = &pcbinfo->ipi_hash_exact[INP6_PCBHASH(faddr, lport, fport, 998a0577692SGleb Smirnoff pcbinfo->ipi_hashmask)]; 999fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_exact) { 10003e98dcb3SMark Johnston if (in6_pcblookup_exact_match(inp, faddr, fport, laddr, lport)) 100182cd038dSYoshinobu Inoue return (inp); 100282cd038dSYoshinobu Inoue } 10033e98dcb3SMark Johnston return (NULL); 10043e98dcb3SMark Johnston } 10053e98dcb3SMark Johnston 10063e98dcb3SMark Johnston typedef enum { 10073e98dcb3SMark Johnston INPLOOKUP_MATCH_NONE = 0, 10083e98dcb3SMark Johnston INPLOOKUP_MATCH_WILD = 1, 10093e98dcb3SMark Johnston INPLOOKUP_MATCH_LADDR = 2, 10103e98dcb3SMark Johnston } inp_lookup_match_t; 10113e98dcb3SMark Johnston 10123e98dcb3SMark Johnston static inp_lookup_match_t 10133e98dcb3SMark Johnston in6_pcblookup_wild_match(const struct inpcb *inp, const struct in6_addr *laddr, 10143e98dcb3SMark Johnston u_short lport) 10153e98dcb3SMark Johnston { 10163e98dcb3SMark Johnston /* XXX inp locking */ 10173e98dcb3SMark Johnston if ((inp->inp_vflag & INP_IPV6) == 0) 10183e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 10193e98dcb3SMark Johnston if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) || 10203e98dcb3SMark Johnston inp->inp_lport != lport) 10213e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 10223e98dcb3SMark Johnston if (IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) 10233e98dcb3SMark Johnston return (INPLOOKUP_MATCH_WILD); 10243e98dcb3SMark Johnston if (IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, laddr)) 10253e98dcb3SMark Johnston return (INPLOOKUP_MATCH_LADDR); 10263e98dcb3SMark Johnston return (INPLOOKUP_MATCH_NONE); 10274130ea61SMark Johnston } 102882cd038dSYoshinobu Inoue 10297b92493aSMark Johnston #define INP_LOOKUP_AGAIN ((struct inpcb *)(uintptr_t)-1) 10307b92493aSMark Johnston 10317b92493aSMark Johnston static struct inpcb * 10327b92493aSMark Johnston in6_pcblookup_hash_wild_smr(struct inpcbinfo 
*pcbinfo, 103321d7ac8cSMark Johnston const struct in6_addr *laddr, u_short lport, const inp_lookup_t lockflags) 10347b92493aSMark Johnston { 10357b92493aSMark Johnston struct inpcbhead *head; 10367b92493aSMark Johnston struct inpcb *inp; 10377b92493aSMark Johnston 10387b92493aSMark Johnston KASSERT(SMR_ENTERED(pcbinfo->ipi_smr), 10397b92493aSMark Johnston ("%s: not in SMR read section", __func__)); 10407b92493aSMark Johnston 10417b92493aSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 10427b92493aSMark Johnston pcbinfo->ipi_hashmask)]; 10437b92493aSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 10447b92493aSMark Johnston inp_lookup_match_t match; 10457b92493aSMark Johnston 10467b92493aSMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 10477b92493aSMark Johnston if (match == INPLOOKUP_MATCH_NONE) 10487b92493aSMark Johnston continue; 10497b92493aSMark Johnston 10507b92493aSMark Johnston if (__predict_true(inp_smr_lock(inp, lockflags))) { 1051a306ed50SMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 1052a306ed50SMark Johnston if (match != INPLOOKUP_MATCH_NONE && 1053a306ed50SMark Johnston prison_check_ip6_locked(inp->inp_cred->cr_prison, 1054a306ed50SMark Johnston laddr) == 0) 10557b92493aSMark Johnston return (inp); 10567b92493aSMark Johnston inp_unlock(inp, lockflags); 10577b92493aSMark Johnston } 10587b92493aSMark Johnston 10597b92493aSMark Johnston /* 10607b92493aSMark Johnston * The matching socket disappeared out from under us. Fall back 10617b92493aSMark Johnston * to a serialized lookup. 
10627b92493aSMark Johnston */ 10637b92493aSMark Johnston return (INP_LOOKUP_AGAIN); 10647b92493aSMark Johnston } 10657b92493aSMark Johnston return (NULL); 10667b92493aSMark Johnston } 10677b92493aSMark Johnston 10684130ea61SMark Johnston static struct inpcb * 10694130ea61SMark Johnston in6_pcblookup_hash_wild_locked(struct inpcbinfo *pcbinfo, 107021d7ac8cSMark Johnston const struct in6_addr *laddr, u_short lport) 10714130ea61SMark Johnston { 10724130ea61SMark Johnston struct inpcbhead *head; 10734130ea61SMark Johnston struct inpcb *inp, *jail_wild, *local_exact, *local_wild; 1074d93ec8cbSMark Johnston 10753e98dcb3SMark Johnston INP_HASH_LOCK_ASSERT(pcbinfo); 10763e98dcb3SMark Johnston 1077d93ec8cbSMark Johnston /* 1078413628a7SBjoern A. Zeeb * Order of socket selection - we always prefer jails. 1079413628a7SBjoern A. Zeeb * 1. jailed, non-wild. 1080413628a7SBjoern A. Zeeb * 2. jailed, wild. 1081413628a7SBjoern A. Zeeb * 3. non-jailed, non-wild. 1082413628a7SBjoern A. Zeeb * 4. non-jailed, wild. 1083413628a7SBjoern A. Zeeb */ 1084fdb987beSMark Johnston head = &pcbinfo->ipi_hash_wild[INP_PCBHASH_WILD(lport, 10851b44e5ffSAndrey V. Elsukov pcbinfo->ipi_hashmask)]; 10864130ea61SMark Johnston local_wild = local_exact = jail_wild = NULL; 1087fdb987beSMark Johnston CK_LIST_FOREACH(inp, head, inp_hash_wild) { 10883e98dcb3SMark Johnston inp_lookup_match_t match; 10894130ea61SMark Johnston bool injail; 10904130ea61SMark Johnston 10913e98dcb3SMark Johnston match = in6_pcblookup_wild_match(inp, laddr, lport); 10923e98dcb3SMark Johnston if (match == INPLOOKUP_MATCH_NONE) 109382cd038dSYoshinobu Inoue continue; 1094413628a7SBjoern A. Zeeb 10954130ea61SMark Johnston injail = prison_flag(inp->inp_cred, PR_IP6) != 0; 1096413628a7SBjoern A. Zeeb if (injail) { 1097185e659cSGleb Smirnoff if (prison_check_ip6_locked( 1098185e659cSGleb Smirnoff inp->inp_cred->cr_prison, laddr) != 0) 1099413628a7SBjoern A. Zeeb continue; 1100413628a7SBjoern A. Zeeb } else { 1101413628a7SBjoern A. 
Zeeb if (local_exact != NULL) 1102413628a7SBjoern A. Zeeb continue; 1103413628a7SBjoern A. Zeeb } 1104413628a7SBjoern A. Zeeb 11053e98dcb3SMark Johnston if (match == INPLOOKUP_MATCH_LADDR) { 1106413628a7SBjoern A. Zeeb if (injail) 110782cd038dSYoshinobu Inoue return (inp); 1108413628a7SBjoern A. Zeeb else 1109413628a7SBjoern A. Zeeb local_exact = inp; 11103e98dcb3SMark Johnston } else { 1111413628a7SBjoern A. Zeeb if (injail) 1112413628a7SBjoern A. Zeeb jail_wild = inp; 1113413628a7SBjoern A. Zeeb else 111482cd038dSYoshinobu Inoue local_wild = inp; 111582cd038dSYoshinobu Inoue } 11164130ea61SMark Johnston } 1117413628a7SBjoern A. Zeeb 1118413628a7SBjoern A. Zeeb if (jail_wild != NULL) 1119413628a7SBjoern A. Zeeb return (jail_wild); 1120413628a7SBjoern A. Zeeb if (local_exact != NULL) 1121413628a7SBjoern A. Zeeb return (local_exact); 1122413628a7SBjoern A. Zeeb if (local_wild != NULL) 112382cd038dSYoshinobu Inoue return (local_wild); 112482cd038dSYoshinobu Inoue return (NULL); 112582cd038dSYoshinobu Inoue } 112682cd038dSYoshinobu Inoue 11274130ea61SMark Johnston struct inpcb * 11287b92493aSMark Johnston in6_pcblookup_hash_locked(struct inpcbinfo *pcbinfo, 11297b92493aSMark Johnston const struct in6_addr *faddr, u_int fport_arg, 11307b92493aSMark Johnston const struct in6_addr *laddr, u_int lport_arg, 11314130ea61SMark Johnston int lookupflags, uint8_t numa_domain) 11324130ea61SMark Johnston { 11334130ea61SMark Johnston struct inpcb *inp; 11344130ea61SMark Johnston u_short fport = fport_arg, lport = lport_arg; 11354130ea61SMark Johnston 11364130ea61SMark Johnston KASSERT((lookupflags & ~INPLOOKUP_WILDCARD) == 0, 11374130ea61SMark Johnston ("%s: invalid lookup flags %d", __func__, lookupflags)); 11384130ea61SMark Johnston KASSERT(!IN6_IS_ADDR_UNSPECIFIED(faddr), 11394130ea61SMark Johnston ("%s: invalid foreign address", __func__)); 11404130ea61SMark Johnston KASSERT(!IN6_IS_ADDR_UNSPECIFIED(laddr), 11414130ea61SMark Johnston ("%s: invalid local address", __func__)); 
11424130ea61SMark Johnston INP_HASH_LOCK_ASSERT(pcbinfo); 11434130ea61SMark Johnston 11444130ea61SMark Johnston inp = in6_pcblookup_hash_exact(pcbinfo, faddr, fport, laddr, lport); 11454130ea61SMark Johnston if (inp != NULL) 11464130ea61SMark Johnston return (inp); 11474130ea61SMark Johnston 11484130ea61SMark Johnston if ((lookupflags & INPLOOKUP_WILDCARD) != 0) { 11494130ea61SMark Johnston inp = in6_pcblookup_lbgroup(pcbinfo, faddr, fport, laddr, 11504130ea61SMark Johnston lport, numa_domain); 11514130ea61SMark Johnston if (inp == NULL) { 115221d7ac8cSMark Johnston inp = in6_pcblookup_hash_wild_locked(pcbinfo, 115321d7ac8cSMark Johnston laddr, lport); 11544130ea61SMark Johnston } 11554130ea61SMark Johnston } 11564130ea61SMark Johnston return (inp); 11574130ea61SMark Johnston } 11584130ea61SMark Johnston

/*
 * Look up an inpcb while holding the pcbinfo hash write lock and hand it
 * back locked as requested by the INPLOOKUP_RLOCKPCB/INPLOOKUP_WLOCKPCB bits
 * of lookupflags.  The lock bits are stripped before the flags are passed on
 * to in6_pcblookup_hash_locked().  Returns NULL when nothing matched, or
 * when in_pcbrele() reports nonzero after the pcb lock had to be waited for.
 */
static struct inpcb *
in6_pcblookup_hash(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr,
    u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags,
    uint8_t numa_domain)
{
	const inp_lookup_t lockreq = lookupflags & INPLOOKUP_LOCKMASK;
	struct inpcb *match;

	KASSERT((lookupflags & (INPLOOKUP_RLOCKPCB | INPLOOKUP_WLOCKPCB)) != 0,
	    ("%s: LOCKPCB not set", __func__));

	INP_HASH_WLOCK(pcbinfo);
	match = in6_pcblookup_hash_locked(pcbinfo, faddr, fport, laddr, lport,
	    lookupflags & ~INPLOOKUP_LOCKMASK, numa_domain);
	if (match == NULL || inp_trylock(match, lockreq)) {
		/* No match, or the pcb lock was obtained by the try-lock. */
		INP_HASH_WUNLOCK(pcbinfo);
		return (match);
	}

	/*
	 * The try-lock failed.  Take a reference while the hash lock is
	 * still held, drop the hash lock, and only then acquire the pcb lock
	 * through inp_lock().
	 */
	in_pcbref(match);
	INP_HASH_WUNLOCK(pcbinfo);
	inp_lock(match, lockreq);
	if (in_pcbrele(match, lockreq)) {
		/* XXX-MJ or retry until we get a negative match? */
		match = NULL;
	}
	return (match);
}

/*
 * Look up an inpcb from within an SMR read section rather than under the
 * hash lock.  A candidate is locked with inp_smr_lock() and then checked
 * again against the requested addresses and ports; if the lock attempt or
 * the re-check fails, the whole search is repeated via in6_pcblookup_hash().
 *
 * The ports arrive as u_int and are narrowed to u_short before use.
 *
 * NOTE(review): smr_exit() is only called here when the result is NULL;
 * presumably inp_smr_lock() and in6_pcblookup_hash_wild_smr() leave the SMR
 * section themselves on the other paths -- confirm against their
 * definitions.
 */
static struct inpcb *
in6_pcblookup_hash_smr(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr,
    u_int fport_arg, const struct in6_addr *laddr, u_int lport_arg,
    int lookupflags, uint8_t numa_domain)
{
	const u_short fport = fport_arg, lport = lport_arg;
	const inp_lookup_t lockreq = lookupflags & INPLOOKUP_LOCKMASK;
	struct inpcb *cand;

	KASSERT((lookupflags & ~INPLOOKUP_MASK) == 0,
	    ("%s: invalid lookup flags %d", __func__, lookupflags));
	KASSERT((lookupflags & (INPLOOKUP_RLOCKPCB | INPLOOKUP_WLOCKPCB)) != 0,
	    ("%s: LOCKPCB not set", __func__));

	smr_enter(pcbinfo->ipi_smr);

	/* First preference: an exact 4-tuple match. */
	cand = in6_pcblookup_hash_exact(pcbinfo, faddr, fport, laddr, lport);
	if (cand != NULL) {
		if (__predict_true(inp_smr_lock(cand, lockreq))) {
			if (__predict_true(in6_pcblookup_exact_match(cand,
			    faddr, fport, laddr, lport)))
				return (cand);
			inp_unlock(cand, lockreq);
		}
		/*
		 * Either the inpcb could not be locked or it no longer
		 * matches the 4-tuple; redo the search precisely.
		 */
		goto again;
	}

	if ((lookupflags & INPLOOKUP_WILDCARD) != 0) {
		/* Load-balancing groups are consulted before plain wildcards. */
		cand = in6_pcblookup_lbgroup(pcbinfo, faddr, fport,
		    laddr, lport, numa_domain);
		if (cand == NULL) {
			cand = in6_pcblookup_hash_wild_smr(pcbinfo, laddr,
			    lport, lockreq);
			if (cand == INP_LOOKUP_AGAIN)
				goto again;
		} else {
			if (__predict_true(inp_smr_lock(cand, lockreq))) {
				if (__predict_true(in6_pcblookup_wild_match(
				    cand, laddr, lport) !=
				    INPLOOKUP_MATCH_NONE))
					return (cand);
				inp_unlock(cand, lockreq);
			}
			goto again;
		}
	}

	if (cand == NULL)
		smr_exit(pcbinfo->ipi_smr);

	return (cand);

again:
	return (in6_pcblookup_hash(pcbinfo, faddr, fport, laddr, lport,
	    lookupflags, numa_domain));
}

/*
 * Public inpcb lookup routines.  Both take a 4-tuple plus lookup flags and
 * forward to in6_pcblookup_hash_smr(); the interface argument is unused.
 * They differ only in the NUMA domain passed down: in6_pcblookup() passes
 * M_NODOM, while in6_pcblookup_mbuf() passes the domain recorded in the
 * mbuf packet header.
 */
struct inpcb *
in6_pcblookup(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr,
    u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags,
    struct ifnet *ifp __unused)
{
	struct inpcb *inp;

	inp = in6_pcblookup_hash_smr(pcbinfo, faddr, fport, laddr, lport,
	    lookupflags, M_NODOM);
	return (inp);
}

struct inpcb *
in6_pcblookup_mbuf(struct inpcbinfo *pcbinfo, const struct in6_addr *faddr,
    u_int fport, const struct in6_addr *laddr, u_int lport, int lookupflags,
    struct ifnet *ifp __unused, struct mbuf *m)
{
	const uint8_t domain = m->m_pkthdr.numa_domain;

	return (in6_pcblookup_hash_smr(pcbinfo, faddr, fport, laddr, lport,
	    lookupflags, domain));
}

/*
 * Fill in *sin6 from the IPv6 header at the start of mbuf m: the
 * destination address when srcordst is nonzero, the source address
 * otherwise.  The structure is zeroed first, so every field not set here is
 * zero.  The return value of sa6_recoverscope() is deliberately ignored.
 */
void
init_sin6(struct sockaddr_in6 *sin6, struct mbuf *m, int srcordst)
{
	struct ip6_hdr *hdr = mtod(m, struct ip6_hdr *);

	bzero(sin6, sizeof(*sin6));
	sin6->sin6_family = AF_INET6;
	sin6->sin6_len = sizeof(*sin6);
	if (srcordst)
		sin6->sin6_addr = hdr->ip6_dst;
	else
		sin6->sin6_addr = hdr->ip6_src;

	/* XXX: should catch errors... */
	(void)sa6_recoverscope(sin6);
}