1c398230bSWarner Losh /*- 22469dd60SGarrett Wollman * Copyright (c) 1982, 1986, 1991, 1993, 1995 3df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 6df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 7df8bae1dSRodney W. Grimes * are met: 8df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 9df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 10df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 12df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 13df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 14df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 15df8bae1dSRodney W. Grimes * without specific prior written permission. 16df8bae1dSRodney W. Grimes * 17df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27df8bae1dSRodney W. Grimes * SUCH DAMAGE. 28df8bae1dSRodney W. Grimes * 292469dd60SGarrett Wollman * @(#)in_pcb.c 8.4 (Berkeley) 5/24/95 30c3aac50fSPeter Wemm * $FreeBSD$ 31df8bae1dSRodney W. Grimes */ 32df8bae1dSRodney W. Grimes 336a800098SYoshinobu Inoue #include "opt_ipsec.h" 34cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h" 35a557af22SRobert Watson #include "opt_mac.h" 36cfa1ca9dSYoshinobu Inoue 37df8bae1dSRodney W. Grimes #include <sys/param.h> 38df8bae1dSRodney W. Grimes #include <sys/systm.h> 39a557af22SRobert Watson #include <sys/mac.h> 40df8bae1dSRodney W. Grimes #include <sys/malloc.h> 41df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 42cfa1ca9dSYoshinobu Inoue #include <sys/domain.h> 43df8bae1dSRodney W. Grimes #include <sys/protosw.h> 44df8bae1dSRodney W. Grimes #include <sys/socket.h> 45df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 46df8bae1dSRodney W. Grimes #include <sys/proc.h> 4775c13541SPoul-Henning Kamp #include <sys/jail.h> 48101f9fc8SPeter Wemm #include <sys/kernel.h> 49101f9fc8SPeter Wemm #include <sys/sysctl.h> 508781d8e9SBruce Evans 5169c2d429SJeff Roberson #include <vm/uma.h> 52df8bae1dSRodney W. Grimes 53df8bae1dSRodney W. Grimes #include <net/if.h> 54cfa1ca9dSYoshinobu Inoue #include <net/if_types.h> 55df8bae1dSRodney W. Grimes #include <net/route.h> 56df8bae1dSRodney W. Grimes 57df8bae1dSRodney W. Grimes #include <netinet/in.h> 58df8bae1dSRodney W. Grimes #include <netinet/in_pcb.h> 59df8bae1dSRodney W. Grimes #include <netinet/in_var.h> 60df8bae1dSRodney W. Grimes #include <netinet/ip_var.h> 61340c35deSJonathan Lemon #include <netinet/tcp_var.h> 625f311da2SMike Silbersack #include <netinet/udp.h> 635f311da2SMike Silbersack #include <netinet/udp_var.h> 64cfa1ca9dSYoshinobu Inoue #ifdef INET6 65cfa1ca9dSYoshinobu Inoue #include <netinet/ip6.h> 66cfa1ca9dSYoshinobu Inoue #include <netinet6/ip6_var.h> 67cfa1ca9dSYoshinobu Inoue #endif /* INET6 */ 68cfa1ca9dSYoshinobu Inoue 69cfa1ca9dSYoshinobu Inoue #ifdef IPSEC 70cfa1ca9dSYoshinobu Inoue #include <netinet6/ipsec.h> 71cfa1ca9dSYoshinobu Inoue #include <netkey/key.h> 72cfa1ca9dSYoshinobu Inoue #endif /* IPSEC */ 73df8bae1dSRodney W. Grimes 74b9234fafSSam Leffler #ifdef FAST_IPSEC 75b9234fafSSam Leffler #if defined(IPSEC) || defined(IPSEC_ESP) 76b9234fafSSam Leffler #error "Bad idea: don't compile with both IPSEC and FAST_IPSEC!" 77b9234fafSSam Leffler #endif 78b9234fafSSam Leffler 79b9234fafSSam Leffler #include <netipsec/ipsec.h> 80b9234fafSSam Leffler #include <netipsec/key.h> 81b9234fafSSam Leffler #endif /* FAST_IPSEC */ 82b9234fafSSam Leffler 83101f9fc8SPeter Wemm /* 84101f9fc8SPeter Wemm * These configure the range of local port addresses assigned to 85101f9fc8SPeter Wemm * "unspecified" outgoing connections/packets/whatever. 86101f9fc8SPeter Wemm */ 8782cd038dSYoshinobu Inoue int ipport_lowfirstauto = IPPORT_RESERVED - 1; /* 1023 */ 8882cd038dSYoshinobu Inoue int ipport_lowlastauto = IPPORT_RESERVEDSTART; /* 600 */ 899e5a5ed4SMike Silbersack int ipport_firstauto = IPPORT_HIFIRSTAUTO; /* 49152 */ 909e5a5ed4SMike Silbersack int ipport_lastauto = IPPORT_HILASTAUTO; /* 65535 */ 9182cd038dSYoshinobu Inoue int ipport_hifirstauto = IPPORT_HIFIRSTAUTO; /* 49152 */ 9282cd038dSYoshinobu Inoue int ipport_hilastauto = IPPORT_HILASTAUTO; /* 65535 */ 93101f9fc8SPeter Wemm 94b0d22693SCrist J. Clark /* 95b0d22693SCrist J. Clark * Reserved ports accessible only to root. There are significant 96b0d22693SCrist J. Clark * security considerations that must be accounted for when changing these, 97b0d22693SCrist J. Clark * but the security benefits can be great. Please be careful. 98b0d22693SCrist J. Clark */ 99b0d22693SCrist J. Clark int ipport_reservedhigh = IPPORT_RESERVED - 1; /* 1023 */ 100b0d22693SCrist J. Clark int ipport_reservedlow = 0; 101b0d22693SCrist J. Clark 1025f311da2SMike Silbersack /* Variables dealing with random ephemeral port allocation. */ 1035f311da2SMike Silbersack int ipport_randomized = 1; /* user controlled via sysctl */ 1045f311da2SMike Silbersack int ipport_randomcps = 10; /* user controlled via sysctl */ 1055f311da2SMike Silbersack int ipport_randomtime = 45; /* user controlled via sysctl */ 1065f311da2SMike Silbersack int ipport_stoprandom = 0; /* toggled by ipport_tick */ 1075f311da2SMike Silbersack int ipport_tcpallocs; 1085f311da2SMike Silbersack int ipport_tcplastcount; 1096ac48b74SMike Silbersack 110bbd42ad0SPeter Wemm #define RANGECHK(var, min, max) \ 111bbd42ad0SPeter Wemm if ((var) < (min)) { (var) = (min); } \ 112bbd42ad0SPeter Wemm else if ((var) > (max)) { (var) = (max); } 113bbd42ad0SPeter Wemm 114bbd42ad0SPeter Wemm static int 11582d9ae4eSPoul-Henning Kamp sysctl_net_ipport_check(SYSCTL_HANDLER_ARGS) 116bbd42ad0SPeter Wemm { 11730a4ab08SBruce Evans int error; 11830a4ab08SBruce Evans 11930a4ab08SBruce Evans error = sysctl_handle_int(oidp, oidp->oid_arg1, oidp->oid_arg2, req); 12030a4ab08SBruce Evans if (error == 0) { 121bbd42ad0SPeter Wemm RANGECHK(ipport_lowfirstauto, 1, IPPORT_RESERVED - 1); 122bbd42ad0SPeter Wemm RANGECHK(ipport_lowlastauto, 1, IPPORT_RESERVED - 1); 12330a4ab08SBruce Evans RANGECHK(ipport_firstauto, IPPORT_RESERVED, IPPORT_MAX); 12430a4ab08SBruce Evans RANGECHK(ipport_lastauto, IPPORT_RESERVED, IPPORT_MAX); 12530a4ab08SBruce Evans RANGECHK(ipport_hifirstauto, IPPORT_RESERVED, IPPORT_MAX); 12630a4ab08SBruce Evans RANGECHK(ipport_hilastauto, IPPORT_RESERVED, IPPORT_MAX); 127bbd42ad0SPeter Wemm } 12830a4ab08SBruce Evans return (error); 129bbd42ad0SPeter Wemm } 130bbd42ad0SPeter Wemm 131bbd42ad0SPeter Wemm #undef RANGECHK 132bbd42ad0SPeter Wemm 13333b3ac06SPeter Wemm SYSCTL_NODE(_net_inet_ip, IPPROTO_IP, portrange, CTLFLAG_RW, 0, "IP Ports"); 13433b3ac06SPeter Wemm 135bbd42ad0SPeter Wemm SYSCTL_PROC(_net_inet_ip_portrange, OID_AUTO, lowfirst, CTLTYPE_INT|CTLFLAG_RW, 136bbd42ad0SPeter Wemm &ipport_lowfirstauto, 0, &sysctl_net_ipport_check, "I", ""); 137bbd42ad0SPeter Wemm SYSCTL_PROC(_net_inet_ip_portrange, OID_AUTO, lowlast, CTLTYPE_INT|CTLFLAG_RW, 138bbd42ad0SPeter Wemm &ipport_lowlastauto, 0, &sysctl_net_ipport_check, "I", ""); 139bbd42ad0SPeter Wemm SYSCTL_PROC(_net_inet_ip_portrange, OID_AUTO, first, CTLTYPE_INT|CTLFLAG_RW, 140bbd42ad0SPeter Wemm &ipport_firstauto, 0, &sysctl_net_ipport_check, "I", ""); 141bbd42ad0SPeter Wemm SYSCTL_PROC(_net_inet_ip_portrange, OID_AUTO, last, CTLTYPE_INT|CTLFLAG_RW, 142bbd42ad0SPeter Wemm &ipport_lastauto, 0, &sysctl_net_ipport_check, "I", ""); 143bbd42ad0SPeter Wemm SYSCTL_PROC(_net_inet_ip_portrange, OID_AUTO, hifirst, CTLTYPE_INT|CTLFLAG_RW, 144bbd42ad0SPeter Wemm &ipport_hifirstauto, 0, &sysctl_net_ipport_check, "I", ""); 145bbd42ad0SPeter Wemm SYSCTL_PROC(_net_inet_ip_portrange, OID_AUTO, hilast, CTLTYPE_INT|CTLFLAG_RW, 146bbd42ad0SPeter Wemm &ipport_hilastauto, 0, &sysctl_net_ipport_check, "I", ""); 147b0d22693SCrist J. Clark SYSCTL_INT(_net_inet_ip_portrange, OID_AUTO, reservedhigh, 148b0d22693SCrist J. Clark CTLFLAG_RW|CTLFLAG_SECURE, &ipport_reservedhigh, 0, ""); 149b0d22693SCrist J. Clark SYSCTL_INT(_net_inet_ip_portrange, OID_AUTO, reservedlow, 150b0d22693SCrist J. Clark CTLFLAG_RW|CTLFLAG_SECURE, &ipport_reservedlow, 0, ""); 1516ee79c59SMaxim Konovalov SYSCTL_INT(_net_inet_ip_portrange, OID_AUTO, randomized, CTLFLAG_RW, 1526ee79c59SMaxim Konovalov &ipport_randomized, 0, "Enable random port allocation"); 1536ee79c59SMaxim Konovalov SYSCTL_INT(_net_inet_ip_portrange, OID_AUTO, randomcps, CTLFLAG_RW, 1546ee79c59SMaxim Konovalov &ipport_randomcps, 0, "Maximum number of random port " 1556ee79c59SMaxim Konovalov "allocations before switching to a sequental one"); 1566ee79c59SMaxim Konovalov SYSCTL_INT(_net_inet_ip_portrange, OID_AUTO, randomtime, CTLFLAG_RW, 1576ee79c59SMaxim Konovalov &ipport_randomtime, 0, "Minimum time to keep sequental port " 1586ee79c59SMaxim Konovalov "allocation before switching to a random one"); 1590312fbe9SPoul-Henning Kamp 160c3229e05SDavid Greenman /* 161c3229e05SDavid Greenman * in_pcb.c: manage the Protocol Control Blocks. 162c3229e05SDavid Greenman * 163de35559fSRobert Watson * NOTE: It is assumed that most of these functions will be called with 164de35559fSRobert Watson * the pcbinfo lock held, and often, the inpcb lock held, as these utility 165de35559fSRobert Watson * functions often modify hash chains or addresses in pcbs. 166c3229e05SDavid Greenman */ 167c3229e05SDavid Greenman 168c3229e05SDavid Greenman /* 169c3229e05SDavid Greenman * Allocate a PCB and associate it with the socket. 170c3229e05SDavid Greenman */ 171df8bae1dSRodney W. Grimes int 172136d4f1cSRobert Watson in_pcballoc(struct socket *so, struct inpcbinfo *pcbinfo, const char *type) 173df8bae1dSRodney W. Grimes { 174136d4f1cSRobert Watson struct inpcb *inp; 17513cf67f3SHajimu UMEMOTO int error; 176a557af22SRobert Watson 17759daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 178a557af22SRobert Watson error = 0; 179d1dd20beSSam Leffler inp = uma_zalloc(pcbinfo->ipi_zone, M_NOWAIT | M_ZERO); 180df8bae1dSRodney W. Grimes if (inp == NULL) 181df8bae1dSRodney W. Grimes return (ENOBUFS); 1823d4d47f3SGarrett Wollman inp->inp_gencnt = ++pcbinfo->ipi_gencnt; 18315bd2b43SDavid Greenman inp->inp_pcbinfo = pcbinfo; 184df8bae1dSRodney W. Grimes inp->inp_socket = so; 185a557af22SRobert Watson #ifdef MAC 186a557af22SRobert Watson error = mac_init_inpcb(inp, M_NOWAIT); 187a557af22SRobert Watson if (error != 0) 188a557af22SRobert Watson goto out; 189310e7cebSRobert Watson SOCK_LOCK(so); 190a557af22SRobert Watson mac_create_inpcb_from_socket(so, inp); 191310e7cebSRobert Watson SOCK_UNLOCK(so); 192a557af22SRobert Watson #endif 1930f9ade71SHajimu UMEMOTO #if defined(IPSEC) || defined(FAST_IPSEC) 1940f9ade71SHajimu UMEMOTO #ifdef FAST_IPSEC 19513cf67f3SHajimu UMEMOTO error = ipsec_init_policy(so, &inp->inp_sp); 1960f9ade71SHajimu UMEMOTO #else 1970f9ade71SHajimu UMEMOTO error = ipsec_init_pcbpolicy(so, &inp->inp_sp); 1980f9ade71SHajimu UMEMOTO #endif 199a557af22SRobert Watson if (error != 0) 200a557af22SRobert Watson goto out; 20113cf67f3SHajimu UMEMOTO #endif /*IPSEC*/ 20275daea93SPaul Saab #if defined(INET6) 203340c35deSJonathan Lemon if (INP_SOCKAF(so) == AF_INET6) { 204340c35deSJonathan Lemon inp->inp_vflag |= INP_IPV6PROTO; 205340c35deSJonathan Lemon if (ip6_v6only) 20633841545SHajimu UMEMOTO inp->inp_flags |= IN6P_IPV6_V6ONLY; 207340c35deSJonathan Lemon } 20875daea93SPaul Saab #endif 20915bd2b43SDavid Greenman LIST_INSERT_HEAD(pcbinfo->listhead, inp, inp_list); 2103d4d47f3SGarrett Wollman pcbinfo->ipi_count++; 211df8bae1dSRodney W. Grimes so->so_pcb = (caddr_t)inp; 2125bd311a5SSam Leffler INP_LOCK_INIT(inp, "inp", type); 21333841545SHajimu UMEMOTO #ifdef INET6 21433841545SHajimu UMEMOTO if (ip6_auto_flowlabel) 21533841545SHajimu UMEMOTO inp->inp_flags |= IN6P_AUTOFLOWLABEL; 21633841545SHajimu UMEMOTO #endif 217a557af22SRobert Watson #if defined(IPSEC) || defined(FAST_IPSEC) || defined(MAC) 218a557af22SRobert Watson out: 219a557af22SRobert Watson if (error != 0) 220a557af22SRobert Watson uma_zfree(pcbinfo->ipi_zone, inp); 221a557af22SRobert Watson #endif 222a557af22SRobert Watson return (error); 223df8bae1dSRodney W. Grimes } 224df8bae1dSRodney W. Grimes 225df8bae1dSRodney W. Grimes int 226136d4f1cSRobert Watson in_pcbbind(struct inpcb *inp, struct sockaddr *nam, struct ucred *cred) 227df8bae1dSRodney W. Grimes { 2284b932371SIan Dowse int anonport, error; 2294b932371SIan Dowse 2301b73ca0bSSam Leffler INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 23159daba27SSam Leffler INP_LOCK_ASSERT(inp); 23259daba27SSam Leffler 2334b932371SIan Dowse if (inp->inp_lport != 0 || inp->inp_laddr.s_addr != INADDR_ANY) 2344b932371SIan Dowse return (EINVAL); 2354b932371SIan Dowse anonport = inp->inp_lport == 0 && (nam == NULL || 2364b932371SIan Dowse ((struct sockaddr_in *)nam)->sin_port == 0); 2374b932371SIan Dowse error = in_pcbbind_setup(inp, nam, &inp->inp_laddr.s_addr, 238b0330ed9SPawel Jakub Dawidek &inp->inp_lport, cred); 2394b932371SIan Dowse if (error) 2404b932371SIan Dowse return (error); 2414b932371SIan Dowse if (in_pcbinshash(inp) != 0) { 2424b932371SIan Dowse inp->inp_laddr.s_addr = INADDR_ANY; 2434b932371SIan Dowse inp->inp_lport = 0; 2444b932371SIan Dowse return (EAGAIN); 2454b932371SIan Dowse } 2464b932371SIan Dowse if (anonport) 2474b932371SIan Dowse inp->inp_flags |= INP_ANONPORT; 2484b932371SIan Dowse return (0); 2494b932371SIan Dowse } 2504b932371SIan Dowse 2514b932371SIan Dowse /* 2524b932371SIan Dowse * Set up a bind operation on a PCB, performing port allocation 2534b932371SIan Dowse * as required, but do not actually modify the PCB. Callers can 2544b932371SIan Dowse * either complete the bind by setting inp_laddr/inp_lport and 2554b932371SIan Dowse * calling in_pcbinshash(), or they can just use the resulting 2564b932371SIan Dowse * port and address to authorise the sending of a once-off packet. 2574b932371SIan Dowse * 2584b932371SIan Dowse * On error, the values of *laddrp and *lportp are not changed. 2594b932371SIan Dowse */ 2604b932371SIan Dowse int 261136d4f1cSRobert Watson in_pcbbind_setup(struct inpcb *inp, struct sockaddr *nam, in_addr_t *laddrp, 262136d4f1cSRobert Watson u_short *lportp, struct ucred *cred) 2634b932371SIan Dowse { 2644b932371SIan Dowse struct socket *so = inp->inp_socket; 26537bd2b30SPeter Wemm unsigned short *lastport; 26615bd2b43SDavid Greenman struct sockaddr_in *sin; 267c3229e05SDavid Greenman struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 2684b932371SIan Dowse struct in_addr laddr; 269df8bae1dSRodney W. Grimes u_short lport = 0; 2704cc20ab1SSeigo Tanimura int wild = 0, reuseport = (so->so_options & SO_REUSEPORT); 27175c13541SPoul-Henning Kamp int error, prison = 0; 2725f311da2SMike Silbersack int dorandom; 273df8bae1dSRodney W. Grimes 2741b73ca0bSSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 27559daba27SSam Leffler INP_LOCK_ASSERT(inp); 27659daba27SSam Leffler 27759562606SGarrett Wollman if (TAILQ_EMPTY(&in_ifaddrhead)) /* XXX broken! */ 278df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 2794b932371SIan Dowse laddr.s_addr = *laddrp; 2804b932371SIan Dowse if (nam != NULL && laddr.s_addr != INADDR_ANY) 281df8bae1dSRodney W. Grimes return (EINVAL); 282c3229e05SDavid Greenman if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0) 2836d6a026bSDavid Greenman wild = 1; 284df8bae1dSRodney W. Grimes if (nam) { 28557bf258eSGarrett Wollman sin = (struct sockaddr_in *)nam; 28657bf258eSGarrett Wollman if (nam->sa_len != sizeof (*sin)) 287df8bae1dSRodney W. Grimes return (EINVAL); 288df8bae1dSRodney W. Grimes #ifdef notdef 289df8bae1dSRodney W. Grimes /* 290df8bae1dSRodney W. Grimes * We should check the family, but old programs 291df8bae1dSRodney W. Grimes * incorrectly fail to initialize it. 292df8bae1dSRodney W. Grimes */ 293df8bae1dSRodney W. Grimes if (sin->sin_family != AF_INET) 294df8bae1dSRodney W. Grimes return (EAFNOSUPPORT); 295df8bae1dSRodney W. Grimes #endif 296e4bdf25dSPoul-Henning Kamp if (sin->sin_addr.s_addr != INADDR_ANY) 297b0330ed9SPawel Jakub Dawidek if (prison_ip(cred, 0, &sin->sin_addr.s_addr)) 29875c13541SPoul-Henning Kamp return(EINVAL); 2994b932371SIan Dowse if (sin->sin_port != *lportp) { 3004b932371SIan Dowse /* Don't allow the port to change. */ 3014b932371SIan Dowse if (*lportp != 0) 3024b932371SIan Dowse return (EINVAL); 303df8bae1dSRodney W. Grimes lport = sin->sin_port; 3044b932371SIan Dowse } 3054b932371SIan Dowse /* NB: lport is left as 0 if the port isn't being changed. */ 306df8bae1dSRodney W. Grimes if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr))) { 307df8bae1dSRodney W. Grimes /* 308df8bae1dSRodney W. Grimes * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 309df8bae1dSRodney W. Grimes * allow complete duplication of binding if 310df8bae1dSRodney W. Grimes * SO_REUSEPORT is set, or if SO_REUSEADDR is set 311df8bae1dSRodney W. Grimes * and a multicast address is bound on both 312df8bae1dSRodney W. Grimes * new and duplicated sockets. 313df8bae1dSRodney W. Grimes */ 314df8bae1dSRodney W. Grimes if (so->so_options & SO_REUSEADDR) 315df8bae1dSRodney W. Grimes reuseport = SO_REUSEADDR|SO_REUSEPORT; 316df8bae1dSRodney W. Grimes } else if (sin->sin_addr.s_addr != INADDR_ANY) { 317df8bae1dSRodney W. Grimes sin->sin_port = 0; /* yech... */ 31883103a73SAndrew R. Reiter bzero(&sin->sin_zero, sizeof(sin->sin_zero)); 319df8bae1dSRodney W. Grimes if (ifa_ifwithaddr((struct sockaddr *)sin) == 0) 320df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 321df8bae1dSRodney W. Grimes } 3224b932371SIan Dowse laddr = sin->sin_addr; 323df8bae1dSRodney W. Grimes if (lport) { 324df8bae1dSRodney W. Grimes struct inpcb *t; 325df8bae1dSRodney W. Grimes /* GROSS */ 326b0d22693SCrist J. Clark if (ntohs(lport) <= ipport_reservedhigh && 327b0d22693SCrist J. Clark ntohs(lport) >= ipport_reservedlow && 32856f21b9dSColin Percival suser_cred(cred, SUSER_ALLOWJAIL)) 3292469dd60SGarrett Wollman return (EACCES); 330b0330ed9SPawel Jakub Dawidek if (jailed(cred)) 33175c13541SPoul-Henning Kamp prison = 1; 3322f9a2132SBrian Feldman if (so->so_cred->cr_uid != 0 && 33352b65dbeSBill Fenner !IN_MULTICAST(ntohl(sin->sin_addr.s_addr))) { 3344049a042SGuido van Rooij t = in_pcblookup_local(inp->inp_pcbinfo, 33575c13541SPoul-Henning Kamp sin->sin_addr, lport, 33675c13541SPoul-Henning Kamp prison ? 0 : INPLOOKUP_WILDCARD); 337340c35deSJonathan Lemon /* 338340c35deSJonathan Lemon * XXX 339340c35deSJonathan Lemon * This entire block sorely needs a rewrite. 340340c35deSJonathan Lemon */ 3414cc20ab1SSeigo Tanimura if (t && 3424658dc83SYaroslav Tykhiy ((t->inp_vflag & INP_TIMEWAIT) == 0) && 3434658dc83SYaroslav Tykhiy (so->so_type != SOCK_STREAM || 3444658dc83SYaroslav Tykhiy ntohl(t->inp_faddr.s_addr) == INADDR_ANY) && 3454cc20ab1SSeigo Tanimura (ntohl(sin->sin_addr.s_addr) != INADDR_ANY || 34652b65dbeSBill Fenner ntohl(t->inp_laddr.s_addr) != INADDR_ANY || 34752b65dbeSBill Fenner (t->inp_socket->so_options & 34852b65dbeSBill Fenner SO_REUSEPORT) == 0) && 3492f9a2132SBrian Feldman (so->so_cred->cr_uid != 350a4eb4405SYaroslav Tykhiy t->inp_socket->so_cred->cr_uid)) 3514049a042SGuido van Rooij return (EADDRINUSE); 3524049a042SGuido van Rooij } 353b0330ed9SPawel Jakub Dawidek if (prison && prison_ip(cred, 0, &sin->sin_addr.s_addr)) 354970680faSPoul-Henning Kamp return (EADDRNOTAVAIL); 355c3229e05SDavid Greenman t = in_pcblookup_local(pcbinfo, sin->sin_addr, 35675c13541SPoul-Henning Kamp lport, prison ? 0 : wild); 357340c35deSJonathan Lemon if (t && (t->inp_vflag & INP_TIMEWAIT)) { 358340c35deSJonathan Lemon if ((reuseport & intotw(t)->tw_so_options) == 0) 359340c35deSJonathan Lemon return (EADDRINUSE); 360340c35deSJonathan Lemon } else 3614cc20ab1SSeigo Tanimura if (t && 3624cc20ab1SSeigo Tanimura (reuseport & t->inp_socket->so_options) == 0) { 363cfa1ca9dSYoshinobu Inoue #if defined(INET6) 36433841545SHajimu UMEMOTO if (ntohl(sin->sin_addr.s_addr) != 365cfa1ca9dSYoshinobu Inoue INADDR_ANY || 366cfa1ca9dSYoshinobu Inoue ntohl(t->inp_laddr.s_addr) != 367cfa1ca9dSYoshinobu Inoue INADDR_ANY || 368cfa1ca9dSYoshinobu Inoue INP_SOCKAF(so) == 369cfa1ca9dSYoshinobu Inoue INP_SOCKAF(t->inp_socket)) 370cfa1ca9dSYoshinobu Inoue #endif /* defined(INET6) */ 371df8bae1dSRodney W. Grimes return (EADDRINUSE); 372df8bae1dSRodney W. Grimes } 373cfa1ca9dSYoshinobu Inoue } 374df8bae1dSRodney W. Grimes } 3754b932371SIan Dowse if (*lportp != 0) 3764b932371SIan Dowse lport = *lportp; 37733b3ac06SPeter Wemm if (lport == 0) { 3786ac48b74SMike Silbersack u_short first, last; 379174624e0SMike Silbersack int count; 38033b3ac06SPeter Wemm 3814b932371SIan Dowse if (laddr.s_addr != INADDR_ANY) 382b0330ed9SPawel Jakub Dawidek if (prison_ip(cred, 0, &laddr.s_addr)) 38375c13541SPoul-Henning Kamp return (EINVAL); 384321a2846SPoul-Henning Kamp 38533b3ac06SPeter Wemm if (inp->inp_flags & INP_HIGHPORT) { 38633b3ac06SPeter Wemm first = ipport_hifirstauto; /* sysctl */ 38733b3ac06SPeter Wemm last = ipport_hilastauto; 388c3229e05SDavid Greenman lastport = &pcbinfo->lasthi; 38933b3ac06SPeter Wemm } else if (inp->inp_flags & INP_LOWPORT) { 39056f21b9dSColin Percival if ((error = suser_cred(cred, SUSER_ALLOWJAIL)) != 0) 391a29f300eSGarrett Wollman return error; 392bbd42ad0SPeter Wemm first = ipport_lowfirstauto; /* 1023 */ 393bbd42ad0SPeter Wemm last = ipport_lowlastauto; /* 600 */ 394c3229e05SDavid Greenman lastport = &pcbinfo->lastlow; 39533b3ac06SPeter Wemm } else { 39633b3ac06SPeter Wemm first = ipport_firstauto; /* sysctl */ 39733b3ac06SPeter Wemm last = ipport_lastauto; 398c3229e05SDavid Greenman lastport = &pcbinfo->lastport; 39933b3ac06SPeter Wemm } 40033b3ac06SPeter Wemm /* 4015f311da2SMike Silbersack * For UDP, use random port allocation as long as the user 4025f311da2SMike Silbersack * allows it. For TCP (and as of yet unknown) connections, 4035f311da2SMike Silbersack * use random port allocation only if the user allows it AND 40429f2a6ecSMaxim Konovalov * ipport_tick() allows it. 4055f311da2SMike Silbersack */ 4065f311da2SMike Silbersack if (ipport_randomized && 4075f311da2SMike Silbersack (!ipport_stoprandom || pcbinfo == &udbinfo)) 4085f311da2SMike Silbersack dorandom = 1; 4095f311da2SMike Silbersack else 4105f311da2SMike Silbersack dorandom = 0; 411e99971bfSMaxim Konovalov /* 412e99971bfSMaxim Konovalov * It makes no sense to do random port allocation if 413e99971bfSMaxim Konovalov * we have the only port available. 414e99971bfSMaxim Konovalov */ 415e99971bfSMaxim Konovalov if (first == last) 416e99971bfSMaxim Konovalov dorandom = 0; 4175f311da2SMike Silbersack /* Make sure to not include UDP packets in the count. */ 4185f311da2SMike Silbersack if (pcbinfo != &udbinfo) 4195f311da2SMike Silbersack ipport_tcpallocs++; 4205f311da2SMike Silbersack /* 42133b3ac06SPeter Wemm * Simple check to ensure all ports are not used up causing 42233b3ac06SPeter Wemm * a deadlock here. 42333b3ac06SPeter Wemm * 42433b3ac06SPeter Wemm * We split the two cases (up and down) so that the direction 42533b3ac06SPeter Wemm * is not being tested on each round of the loop. 42633b3ac06SPeter Wemm */ 42733b3ac06SPeter Wemm if (first > last) { 42833b3ac06SPeter Wemm /* 42933b3ac06SPeter Wemm * counting down 43033b3ac06SPeter Wemm */ 4315f311da2SMike Silbersack if (dorandom) 4326b2fc10bSMike Silbersack *lastport = first - 4336b2fc10bSMike Silbersack (arc4random() % (first - last)); 43433b3ac06SPeter Wemm count = first - last; 435174624e0SMike Silbersack 436df8bae1dSRodney W. Grimes do { 4376ac48b74SMike Silbersack if (count-- < 0) /* completely used? */ 438550b1518SWes Peters return (EADDRNOTAVAIL); 43933b3ac06SPeter Wemm --*lastport; 44033b3ac06SPeter Wemm if (*lastport > first || *lastport < last) 44133b3ac06SPeter Wemm *lastport = first; 44215bd2b43SDavid Greenman lport = htons(*lastport); 4434b932371SIan Dowse } while (in_pcblookup_local(pcbinfo, laddr, lport, 4444b932371SIan Dowse wild)); 44533b3ac06SPeter Wemm } else { 44633b3ac06SPeter Wemm /* 44733b3ac06SPeter Wemm * counting up 44833b3ac06SPeter Wemm */ 4495f311da2SMike Silbersack if (dorandom) 4506b2fc10bSMike Silbersack *lastport = first + 4516b2fc10bSMike Silbersack (arc4random() % (last - first)); 45233b3ac06SPeter Wemm count = last - first; 453174624e0SMike Silbersack 45433b3ac06SPeter Wemm do { 4556ac48b74SMike Silbersack if (count-- < 0) /* completely used? */ 456550b1518SWes Peters return (EADDRNOTAVAIL); 45733b3ac06SPeter Wemm ++*lastport; 45833b3ac06SPeter Wemm if (*lastport < first || *lastport > last) 45933b3ac06SPeter Wemm *lastport = first; 46033b3ac06SPeter Wemm lport = htons(*lastport); 4614b932371SIan Dowse } while (in_pcblookup_local(pcbinfo, laddr, lport, 4624b932371SIan Dowse wild)); 46333b3ac06SPeter Wemm } 46433b3ac06SPeter Wemm } 465b0330ed9SPawel Jakub Dawidek if (prison_ip(cred, 0, &laddr.s_addr)) 466e4bdf25dSPoul-Henning Kamp return (EINVAL); 4674b932371SIan Dowse *laddrp = laddr.s_addr; 4684b932371SIan Dowse *lportp = lport; 469df8bae1dSRodney W. Grimes return (0); 470df8bae1dSRodney W. Grimes } 471df8bae1dSRodney W. Grimes 472999f1343SGarrett Wollman /* 4735200e00eSIan Dowse * Connect from a socket to a specified address. 4745200e00eSIan Dowse * Both address and port must be specified in argument sin. 4755200e00eSIan Dowse * If don't have a local address for this socket yet, 4765200e00eSIan Dowse * then pick one. 477999f1343SGarrett Wollman */ 478999f1343SGarrett Wollman int 479136d4f1cSRobert Watson in_pcbconnect(struct inpcb *inp, struct sockaddr *nam, struct ucred *cred) 480999f1343SGarrett Wollman { 4815200e00eSIan Dowse u_short lport, fport; 4825200e00eSIan Dowse in_addr_t laddr, faddr; 4835200e00eSIan Dowse int anonport, error; 484df8bae1dSRodney W. Grimes 48527f74fd0SRobert Watson INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 48627f74fd0SRobert Watson INP_LOCK_ASSERT(inp); 48727f74fd0SRobert Watson 4885200e00eSIan Dowse lport = inp->inp_lport; 4895200e00eSIan Dowse laddr = inp->inp_laddr.s_addr; 4905200e00eSIan Dowse anonport = (lport == 0); 4915200e00eSIan Dowse error = in_pcbconnect_setup(inp, nam, &laddr, &lport, &faddr, &fport, 492b0330ed9SPawel Jakub Dawidek NULL, cred); 4935200e00eSIan Dowse if (error) 4945200e00eSIan Dowse return (error); 4955200e00eSIan Dowse 4965200e00eSIan Dowse /* Do the initial binding of the local address if required. */ 4975200e00eSIan Dowse if (inp->inp_laddr.s_addr == INADDR_ANY && inp->inp_lport == 0) { 4985200e00eSIan Dowse inp->inp_lport = lport; 4995200e00eSIan Dowse inp->inp_laddr.s_addr = laddr; 5005200e00eSIan Dowse if (in_pcbinshash(inp) != 0) { 5015200e00eSIan Dowse inp->inp_laddr.s_addr = INADDR_ANY; 5025200e00eSIan Dowse inp->inp_lport = 0; 5035200e00eSIan Dowse return (EAGAIN); 5045200e00eSIan Dowse } 5055200e00eSIan Dowse } 5065200e00eSIan Dowse 5075200e00eSIan Dowse /* Commit the remaining changes. */ 5085200e00eSIan Dowse inp->inp_lport = lport; 5095200e00eSIan Dowse inp->inp_laddr.s_addr = laddr; 5105200e00eSIan Dowse inp->inp_faddr.s_addr = faddr; 5115200e00eSIan Dowse inp->inp_fport = fport; 5125200e00eSIan Dowse in_pcbrehash(inp); 5130f9ade71SHajimu UMEMOTO #ifdef IPSEC 5140f9ade71SHajimu UMEMOTO if (inp->inp_socket->so_type == SOCK_STREAM) 5150f9ade71SHajimu UMEMOTO ipsec_pcbconn(inp->inp_sp); 5160f9ade71SHajimu UMEMOTO #endif 5175200e00eSIan Dowse if (anonport) 5185200e00eSIan Dowse inp->inp_flags |= INP_ANONPORT; 5195200e00eSIan Dowse return (0); 5205200e00eSIan Dowse } 5215200e00eSIan Dowse 5225200e00eSIan Dowse /* 5235200e00eSIan Dowse * Set up for a connect from a socket to the specified address. 5245200e00eSIan Dowse * On entry, *laddrp and *lportp should contain the current local 5255200e00eSIan Dowse * address and port for the PCB; these are updated to the values 5265200e00eSIan Dowse * that should be placed in inp_laddr and inp_lport to complete 5275200e00eSIan Dowse * the connect. 5285200e00eSIan Dowse * 5295200e00eSIan Dowse * On success, *faddrp and *fportp will be set to the remote address 5305200e00eSIan Dowse * and port. These are not updated in the error case. 5315200e00eSIan Dowse * 5325200e00eSIan Dowse * If the operation fails because the connection already exists, 5335200e00eSIan Dowse * *oinpp will be set to the PCB of that connection so that the 5345200e00eSIan Dowse * caller can decide to override it. In all other cases, *oinpp 5355200e00eSIan Dowse * is set to NULL. 5365200e00eSIan Dowse */ 5375200e00eSIan Dowse int 538136d4f1cSRobert Watson in_pcbconnect_setup(struct inpcb *inp, struct sockaddr *nam, 539136d4f1cSRobert Watson in_addr_t *laddrp, u_short *lportp, in_addr_t *faddrp, u_short *fportp, 540136d4f1cSRobert Watson struct inpcb **oinpp, struct ucred *cred) 5415200e00eSIan Dowse { 5425200e00eSIan Dowse struct sockaddr_in *sin = (struct sockaddr_in *)nam; 5435200e00eSIan Dowse struct in_ifaddr *ia; 5445200e00eSIan Dowse struct sockaddr_in sa; 545b0330ed9SPawel Jakub Dawidek struct ucred *socred; 5465200e00eSIan Dowse struct inpcb *oinp; 5475200e00eSIan Dowse struct in_addr laddr, faddr; 5485200e00eSIan Dowse u_short lport, fport; 5495200e00eSIan Dowse int error; 5505200e00eSIan Dowse 55127f74fd0SRobert Watson INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 55227f74fd0SRobert Watson INP_LOCK_ASSERT(inp); 55327f74fd0SRobert Watson 5545200e00eSIan Dowse if (oinpp != NULL) 5555200e00eSIan Dowse *oinpp = NULL; 55657bf258eSGarrett Wollman if (nam->sa_len != sizeof (*sin)) 557df8bae1dSRodney W. Grimes return (EINVAL); 558df8bae1dSRodney W. Grimes if (sin->sin_family != AF_INET) 559df8bae1dSRodney W. Grimes return (EAFNOSUPPORT); 560df8bae1dSRodney W. Grimes if (sin->sin_port == 0) 561df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 5625200e00eSIan Dowse laddr.s_addr = *laddrp; 5635200e00eSIan Dowse lport = *lportp; 5645200e00eSIan Dowse faddr = sin->sin_addr; 5655200e00eSIan Dowse fport = sin->sin_port; 566b0330ed9SPawel Jakub Dawidek socred = inp->inp_socket->so_cred; 567b0330ed9SPawel Jakub Dawidek if (laddr.s_addr == INADDR_ANY && jailed(socred)) { 5685200e00eSIan Dowse bzero(&sa, sizeof(sa)); 569b0330ed9SPawel Jakub Dawidek sa.sin_addr.s_addr = htonl(prison_getip(socred)); 5705200e00eSIan Dowse sa.sin_len = sizeof(sa); 5715200e00eSIan Dowse sa.sin_family = AF_INET; 5725200e00eSIan Dowse error = in_pcbbind_setup(inp, (struct sockaddr *)&sa, 573b0330ed9SPawel Jakub Dawidek &laddr.s_addr, &lport, cred); 5745200e00eSIan Dowse if (error) 5755200e00eSIan Dowse return (error); 5765200e00eSIan Dowse } 57759562606SGarrett Wollman if (!TAILQ_EMPTY(&in_ifaddrhead)) { 578df8bae1dSRodney W. Grimes /* 579df8bae1dSRodney W. Grimes * If the destination address is INADDR_ANY, 580df8bae1dSRodney W. Grimes * use the primary local address. 581df8bae1dSRodney W. Grimes * If the supplied address is INADDR_BROADCAST, 582df8bae1dSRodney W. Grimes * and the primary interface supports broadcast, 583df8bae1dSRodney W. Grimes * choose the broadcast address for that interface. 584df8bae1dSRodney W. Grimes */ 5855200e00eSIan Dowse if (faddr.s_addr == INADDR_ANY) 5865200e00eSIan Dowse faddr = IA_SIN(TAILQ_FIRST(&in_ifaddrhead))->sin_addr; 5875200e00eSIan Dowse else if (faddr.s_addr == (u_long)INADDR_BROADCAST && 5885200e00eSIan Dowse (TAILQ_FIRST(&in_ifaddrhead)->ia_ifp->if_flags & 5895200e00eSIan Dowse IFF_BROADCAST)) 5905200e00eSIan Dowse faddr = satosin(&TAILQ_FIRST( 5915200e00eSIan Dowse &in_ifaddrhead)->ia_broadaddr)->sin_addr; 592df8bae1dSRodney W. Grimes } 5935200e00eSIan Dowse if (laddr.s_addr == INADDR_ANY) { 594df8bae1dSRodney W. Grimes ia = (struct in_ifaddr *)0; 595df8bae1dSRodney W. Grimes /* 59697d8d152SAndre Oppermann * If route is known our src addr is taken from the i/f, 59797d8d152SAndre Oppermann * else punt. 598cf744713SAndre Oppermann * 599cf744713SAndre Oppermann * Find out route to destination 600df8bae1dSRodney W. Grimes */ 601cf744713SAndre Oppermann if ((inp->inp_socket->so_options & SO_DONTROUTE) == 0) 602cf744713SAndre Oppermann ia = ip_rtaddr(faddr); 603df8bae1dSRodney W. Grimes /* 604cf744713SAndre Oppermann * If we found a route, use the address corresponding to 605cf744713SAndre Oppermann * the outgoing interface. 606cf744713SAndre Oppermann * 607cf744713SAndre Oppermann * Otherwise assume faddr is reachable on a directly connected 608cf744713SAndre Oppermann * network and try to find a corresponding interface to take 609cf744713SAndre Oppermann * the source address from. 610df8bae1dSRodney W. Grimes */ 611df8bae1dSRodney W. Grimes if (ia == 0) { 6125200e00eSIan Dowse bzero(&sa, sizeof(sa)); 6135200e00eSIan Dowse sa.sin_addr = faddr; 6145200e00eSIan Dowse sa.sin_len = sizeof(sa); 6155200e00eSIan Dowse sa.sin_family = AF_INET; 616df8bae1dSRodney W. Grimes 6175200e00eSIan Dowse ia = ifatoia(ifa_ifwithdstaddr(sintosa(&sa))); 618df8bae1dSRodney W. Grimes if (ia == 0) 6195200e00eSIan Dowse ia = ifatoia(ifa_ifwithnet(sintosa(&sa))); 620df8bae1dSRodney W. Grimes if (ia == 0) 621ef14c369SMaxim Konovalov return (ENETUNREACH); 622df8bae1dSRodney W. Grimes } 623df8bae1dSRodney W. Grimes /* 624df8bae1dSRodney W. Grimes * If the destination address is multicast and an outgoing 625df8bae1dSRodney W. Grimes * interface has been set as a multicast option, use the 626df8bae1dSRodney W. Grimes * address of that interface as our source address. 627df8bae1dSRodney W. Grimes */ 6285200e00eSIan Dowse if (IN_MULTICAST(ntohl(faddr.s_addr)) && 629df8bae1dSRodney W. Grimes inp->inp_moptions != NULL) { 630df8bae1dSRodney W. Grimes struct ip_moptions *imo; 631df8bae1dSRodney W. Grimes struct ifnet *ifp; 632df8bae1dSRodney W. Grimes 633df8bae1dSRodney W. Grimes imo = inp->inp_moptions; 634df8bae1dSRodney W. Grimes if (imo->imo_multicast_ifp != NULL) { 635df8bae1dSRodney W. Grimes ifp = imo->imo_multicast_ifp; 63637d40066SPoul-Henning Kamp TAILQ_FOREACH(ia, &in_ifaddrhead, ia_link) 637df8bae1dSRodney W. Grimes if (ia->ia_ifp == ifp) 638df8bae1dSRodney W. Grimes break; 639df8bae1dSRodney W. Grimes if (ia == 0) 640df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 641df8bae1dSRodney W. Grimes } 642df8bae1dSRodney W. Grimes } 6435200e00eSIan Dowse laddr = ia->ia_addr.sin_addr; 644999f1343SGarrett Wollman } 645999f1343SGarrett Wollman 6465200e00eSIan Dowse oinp = in_pcblookup_hash(inp->inp_pcbinfo, faddr, fport, laddr, lport, 6475200e00eSIan Dowse 0, NULL); 6485200e00eSIan Dowse if (oinp != NULL) { 6495200e00eSIan Dowse if (oinpp != NULL) 6505200e00eSIan Dowse *oinpp = oinp; 651df8bae1dSRodney W. Grimes return (EADDRINUSE); 652c3229e05SDavid Greenman } 6535200e00eSIan Dowse if (lport == 0) { 654b0330ed9SPawel Jakub Dawidek error = in_pcbbind_setup(inp, NULL, &laddr.s_addr, &lport, 655b0330ed9SPawel Jakub Dawidek cred); 6565a903f8dSPierre Beyssac if (error) 6575a903f8dSPierre Beyssac return (error); 6585a903f8dSPierre Beyssac } 6595200e00eSIan Dowse *laddrp = laddr.s_addr; 6605200e00eSIan Dowse *lportp = lport; 6615200e00eSIan Dowse *faddrp = faddr.s_addr; 6625200e00eSIan Dowse *fportp = fport; 663df8bae1dSRodney W. Grimes return (0); 664df8bae1dSRodney W. Grimes } 665df8bae1dSRodney W. Grimes 66626f9a767SRodney W. Grimes void 667136d4f1cSRobert Watson in_pcbdisconnect(struct inpcb *inp) 668df8bae1dSRodney W. Grimes { 6696b348152SRobert Watson 670fe6bfc37SRobert Watson INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 67159daba27SSam Leffler INP_LOCK_ASSERT(inp); 672df8bae1dSRodney W. Grimes 673df8bae1dSRodney W. Grimes inp->inp_faddr.s_addr = INADDR_ANY; 674df8bae1dSRodney W. Grimes inp->inp_fport = 0; 67515bd2b43SDavid Greenman in_pcbrehash(inp); 6760f9ade71SHajimu UMEMOTO #ifdef IPSEC 6770f9ade71SHajimu UMEMOTO ipsec_pcbdisconn(inp->inp_sp); 6780f9ade71SHajimu UMEMOTO #endif 679df8bae1dSRodney W. Grimes } 680df8bae1dSRodney W. Grimes 6814c7c478dSRobert Watson /* 6824c7c478dSRobert Watson * In the old world order, in_pcbdetach() served two functions: to detach the 6834c7c478dSRobert Watson * pcb from the socket/potentially free the socket, and to free the pcb 6844c7c478dSRobert Watson * itself. In the new world order, the protocol code is responsible for 6854c7c478dSRobert Watson * managing the relationship with the socket, and this code simply frees the 6864c7c478dSRobert Watson * pcb. 6874c7c478dSRobert Watson */ 68826f9a767SRodney W. Grimes void 689136d4f1cSRobert Watson in_pcbdetach(struct inpcb *inp) 690df8bae1dSRodney W. Grimes { 6914c7c478dSRobert Watson 6924c7c478dSRobert Watson KASSERT(inp->inp_socket != NULL, ("in_pcbdetach: inp_socket == NULL")); 6934c7c478dSRobert Watson inp->inp_socket->so_pcb = NULL; 6944c7c478dSRobert Watson inp->inp_socket = NULL; 6954c7c478dSRobert Watson } 6964c7c478dSRobert Watson 6974c7c478dSRobert Watson void 6984c7c478dSRobert Watson in_pcbfree(struct inpcb *inp) 6994c7c478dSRobert Watson { 7003d4d47f3SGarrett Wollman struct inpcbinfo *ipi = inp->inp_pcbinfo; 701df8bae1dSRodney W. Grimes 7024c7c478dSRobert Watson KASSERT(inp->inp_socket == NULL, ("in_pcbfree: inp_socket != NULL")); 703fe6bfc37SRobert Watson INP_INFO_WLOCK_ASSERT(ipi); 70459daba27SSam Leffler INP_LOCK_ASSERT(inp); 70559daba27SSam Leffler 7060f9ade71SHajimu UMEMOTO #if defined(IPSEC) || defined(FAST_IPSEC) 707cfa1ca9dSYoshinobu Inoue ipsec4_delete_pcbpolicy(inp); 708cfa1ca9dSYoshinobu Inoue #endif /*IPSEC*/ 7093d4d47f3SGarrett Wollman inp->inp_gencnt = ++ipi->ipi_gencnt; 710c3229e05SDavid Greenman in_pcbremlists(inp); 711df8bae1dSRodney W. Grimes if (inp->inp_options) 712df8bae1dSRodney W. Grimes (void)m_free(inp->inp_options); 713df8bae1dSRodney W. Grimes ip_freemoptions(inp->inp_moptions); 714cfa1ca9dSYoshinobu Inoue inp->inp_vflag = 0; 715f76fcf6dSJeffrey Hsu INP_LOCK_DESTROY(inp); 716a557af22SRobert Watson #ifdef MAC 717a557af22SRobert Watson mac_destroy_inpcb(inp); 718a557af22SRobert Watson #endif 71969c2d429SJeff Roberson uma_zfree(ipi->ipi_zone, inp); 720df8bae1dSRodney W. Grimes } 721df8bae1dSRodney W. Grimes 72226ef6ac4SDon Lewis struct sockaddr * 723136d4f1cSRobert Watson in_sockaddr(in_port_t port, struct in_addr *addr_p) 72426ef6ac4SDon Lewis { 72526ef6ac4SDon Lewis struct sockaddr_in *sin; 72626ef6ac4SDon Lewis 72726ef6ac4SDon Lewis MALLOC(sin, struct sockaddr_in *, sizeof *sin, M_SONAME, 728a163d034SWarner Losh M_WAITOK | M_ZERO); 72926ef6ac4SDon Lewis sin->sin_family = AF_INET; 73026ef6ac4SDon Lewis sin->sin_len = sizeof(*sin); 73126ef6ac4SDon Lewis sin->sin_addr = *addr_p; 73226ef6ac4SDon Lewis sin->sin_port = port; 73326ef6ac4SDon Lewis 73426ef6ac4SDon Lewis return (struct sockaddr *)sin; 73526ef6ac4SDon Lewis } 73626ef6ac4SDon Lewis 737117bcae7SGarrett Wollman /* 738f76fcf6dSJeffrey Hsu * The wrapper function will pass down the pcbinfo for this function to lock. 739f76fcf6dSJeffrey Hsu * The socket must have a valid 740117bcae7SGarrett Wollman * (i.e., non-nil) PCB, but it should be impossible to get an invalid one 741117bcae7SGarrett Wollman * except through a kernel programming error, so it is acceptable to panic 74257bf258eSGarrett Wollman * (or in this case trap) if the PCB is invalid. (Actually, we don't trap 74357bf258eSGarrett Wollman * because there actually /is/ a programming error somewhere... XXX) 744117bcae7SGarrett Wollman */ 745117bcae7SGarrett Wollman int 746136d4f1cSRobert Watson in_setsockaddr(struct socket *so, struct sockaddr **nam, 747136d4f1cSRobert Watson struct inpcbinfo *pcbinfo) 748df8bae1dSRodney W. Grimes { 749136d4f1cSRobert Watson struct inpcb *inp; 75026ef6ac4SDon Lewis struct in_addr addr; 75126ef6ac4SDon Lewis in_port_t port; 75242fa505bSDavid Greenman 753f76fcf6dSJeffrey Hsu INP_INFO_RLOCK(pcbinfo); 754fdc984f7STor Egge inp = sotoinpcb(so); 7554c7c478dSRobert Watson KASSERT(inp != NULL, ("in_setsockaddr: so_pcb == NULL")); 756f76fcf6dSJeffrey Hsu INP_LOCK(inp); 75726ef6ac4SDon Lewis port = inp->inp_lport; 75826ef6ac4SDon Lewis addr = inp->inp_laddr; 759f76fcf6dSJeffrey Hsu INP_UNLOCK(inp); 760f76fcf6dSJeffrey Hsu INP_INFO_RUNLOCK(pcbinfo); 76142fa505bSDavid Greenman 76226ef6ac4SDon Lewis *nam = in_sockaddr(port, &addr); 763117bcae7SGarrett Wollman return 0; 764df8bae1dSRodney W. Grimes } 765df8bae1dSRodney W. Grimes 766f76fcf6dSJeffrey Hsu /* 767f76fcf6dSJeffrey Hsu * The wrapper function will pass down the pcbinfo for this function to lock. 768f76fcf6dSJeffrey Hsu */ 769117bcae7SGarrett Wollman int 770136d4f1cSRobert Watson in_setpeeraddr(struct socket *so, struct sockaddr **nam, 771136d4f1cSRobert Watson struct inpcbinfo *pcbinfo) 772df8bae1dSRodney W. Grimes { 773136d4f1cSRobert Watson struct inpcb *inp; 77426ef6ac4SDon Lewis struct in_addr addr; 77526ef6ac4SDon Lewis in_port_t port; 77642fa505bSDavid Greenman 777f76fcf6dSJeffrey Hsu INP_INFO_RLOCK(pcbinfo); 778fdc984f7STor Egge inp = sotoinpcb(so); 7794c7c478dSRobert Watson KASSERT(inp != NULL, ("in_setpeeraddr: so_pcb == NULL")); 780f76fcf6dSJeffrey Hsu INP_LOCK(inp); 78126ef6ac4SDon Lewis port = inp->inp_fport; 78226ef6ac4SDon Lewis addr = inp->inp_faddr; 783f76fcf6dSJeffrey Hsu INP_UNLOCK(inp); 784f76fcf6dSJeffrey Hsu INP_INFO_RUNLOCK(pcbinfo); 78542fa505bSDavid Greenman 78626ef6ac4SDon Lewis *nam = in_sockaddr(port, &addr); 787117bcae7SGarrett Wollman return 0; 788df8bae1dSRodney W. Grimes } 789df8bae1dSRodney W. Grimes 79026f9a767SRodney W. Grimes void 791136d4f1cSRobert Watson in_pcbnotifyall(struct inpcbinfo *pcbinfo, struct in_addr faddr, int errno, 792136d4f1cSRobert Watson struct inpcb *(*notify)(struct inpcb *, int)) 793d1c54148SJesper Skriver { 794c693a045SJonathan Lemon struct inpcb *inp, *ninp; 795f76fcf6dSJeffrey Hsu struct inpcbhead *head; 796d1c54148SJesper Skriver 7973dc7ebf9SJeffrey Hsu INP_INFO_WLOCK(pcbinfo); 798f76fcf6dSJeffrey Hsu head = pcbinfo->listhead; 799c693a045SJonathan Lemon for (inp = LIST_FIRST(head); inp != NULL; inp = ninp) { 800f76fcf6dSJeffrey Hsu INP_LOCK(inp); 801c693a045SJonathan Lemon ninp = LIST_NEXT(inp, inp_list); 802d1c54148SJesper Skriver #ifdef INET6 803f76fcf6dSJeffrey Hsu if ((inp->inp_vflag & INP_IPV4) == 0) { 804f76fcf6dSJeffrey Hsu INP_UNLOCK(inp); 805d1c54148SJesper Skriver continue; 806f76fcf6dSJeffrey Hsu } 807d1c54148SJesper Skriver #endif 808d1c54148SJesper Skriver if (inp->inp_faddr.s_addr != faddr.s_addr || 809f76fcf6dSJeffrey Hsu inp->inp_socket == NULL) { 810f76fcf6dSJeffrey Hsu INP_UNLOCK(inp); 811d1c54148SJesper Skriver continue; 812d1c54148SJesper Skriver } 8133dc7ebf9SJeffrey Hsu if ((*notify)(inp, errno)) 814f76fcf6dSJeffrey Hsu INP_UNLOCK(inp); 815f76fcf6dSJeffrey Hsu } 8163dc7ebf9SJeffrey Hsu INP_INFO_WUNLOCK(pcbinfo); 817d1c54148SJesper Skriver } 818d1c54148SJesper Skriver 819e43cc4aeSHajimu UMEMOTO void 820136d4f1cSRobert Watson in_pcbpurgeif0(struct inpcbinfo *pcbinfo, struct ifnet *ifp) 821e43cc4aeSHajimu UMEMOTO { 822e43cc4aeSHajimu UMEMOTO struct inpcb *inp; 823e43cc4aeSHajimu UMEMOTO struct ip_moptions *imo; 824e43cc4aeSHajimu UMEMOTO int i, gap; 825e43cc4aeSHajimu UMEMOTO 826f76fcf6dSJeffrey Hsu INP_INFO_RLOCK(pcbinfo); 8273cfcc388SJeffrey Hsu LIST_FOREACH(inp, pcbinfo->listhead, inp_list) { 828f76fcf6dSJeffrey Hsu INP_LOCK(inp); 829e43cc4aeSHajimu UMEMOTO imo = inp->inp_moptions; 830e43cc4aeSHajimu UMEMOTO if ((inp->inp_vflag & INP_IPV4) && 831e43cc4aeSHajimu UMEMOTO imo != NULL) { 832e43cc4aeSHajimu UMEMOTO /* 833e43cc4aeSHajimu UMEMOTO * Unselect the outgoing interface if it is being 834e43cc4aeSHajimu UMEMOTO * detached. 835e43cc4aeSHajimu UMEMOTO */ 836e43cc4aeSHajimu UMEMOTO if (imo->imo_multicast_ifp == ifp) 837e43cc4aeSHajimu UMEMOTO imo->imo_multicast_ifp = NULL; 838e43cc4aeSHajimu UMEMOTO 839e43cc4aeSHajimu UMEMOTO /* 840e43cc4aeSHajimu UMEMOTO * Drop multicast group membership if we joined 841e43cc4aeSHajimu UMEMOTO * through the interface being detached. 842e43cc4aeSHajimu UMEMOTO */ 843e43cc4aeSHajimu UMEMOTO for (i = 0, gap = 0; i < imo->imo_num_memberships; 844e43cc4aeSHajimu UMEMOTO i++) { 845e43cc4aeSHajimu UMEMOTO if (imo->imo_membership[i]->inm_ifp == ifp) { 846e43cc4aeSHajimu UMEMOTO in_delmulti(imo->imo_membership[i]); 847e43cc4aeSHajimu UMEMOTO gap++; 848e43cc4aeSHajimu UMEMOTO } else if (gap != 0) 849e43cc4aeSHajimu UMEMOTO imo->imo_membership[i - gap] = 850e43cc4aeSHajimu UMEMOTO imo->imo_membership[i]; 851e43cc4aeSHajimu UMEMOTO } 852e43cc4aeSHajimu UMEMOTO imo->imo_num_memberships -= gap; 853e43cc4aeSHajimu UMEMOTO } 854f76fcf6dSJeffrey Hsu INP_UNLOCK(inp); 855e43cc4aeSHajimu UMEMOTO } 8563cfcc388SJeffrey Hsu INP_INFO_RUNLOCK(pcbinfo); 857e43cc4aeSHajimu UMEMOTO } 858e43cc4aeSHajimu UMEMOTO 859df8bae1dSRodney W. Grimes /* 860c3229e05SDavid Greenman * Lookup a PCB based on the local address and port. 861c3229e05SDavid Greenman */ 862d5e8a67eSHajimu UMEMOTO #define INP_LOOKUP_MAPPED_PCB_COST 3 863df8bae1dSRodney W. Grimes struct inpcb * 864136d4f1cSRobert Watson in_pcblookup_local(struct inpcbinfo *pcbinfo, struct in_addr laddr, 865136d4f1cSRobert Watson u_int lport_arg, int wild_okay) 866df8bae1dSRodney W. Grimes { 867136d4f1cSRobert Watson struct inpcb *inp; 868d5e8a67eSHajimu UMEMOTO #ifdef INET6 869d5e8a67eSHajimu UMEMOTO int matchwild = 3 + INP_LOOKUP_MAPPED_PCB_COST; 870d5e8a67eSHajimu UMEMOTO #else 871d5e8a67eSHajimu UMEMOTO int matchwild = 3; 872d5e8a67eSHajimu UMEMOTO #endif 873d5e8a67eSHajimu UMEMOTO int wildcard; 874c3229e05SDavid Greenman u_short lport = lport_arg; 8757bc4aca7SDavid Greenman 8761b73ca0bSSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 8771b73ca0bSSam Leffler 878c3229e05SDavid Greenman if (!wild_okay) { 879c3229e05SDavid Greenman struct inpcbhead *head; 880c3229e05SDavid Greenman /* 881c3229e05SDavid Greenman * Look for an unconnected (wildcard foreign addr) PCB that 882c3229e05SDavid Greenman * matches the local address and port we're looking for. 883c3229e05SDavid Greenman */ 884c3229e05SDavid Greenman head = &pcbinfo->hashbase[INP_PCBHASH(INADDR_ANY, lport, 0, pcbinfo->hashmask)]; 885fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(inp, head, inp_hash) { 886cfa1ca9dSYoshinobu Inoue #ifdef INET6 887369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 888cfa1ca9dSYoshinobu Inoue continue; 889cfa1ca9dSYoshinobu Inoue #endif 890c3229e05SDavid Greenman if (inp->inp_faddr.s_addr == INADDR_ANY && 891c3229e05SDavid Greenman inp->inp_laddr.s_addr == laddr.s_addr && 892c3229e05SDavid Greenman inp->inp_lport == lport) { 893c3229e05SDavid Greenman /* 894c3229e05SDavid Greenman * Found. 895c3229e05SDavid Greenman */ 896c3229e05SDavid Greenman return (inp); 897df8bae1dSRodney W. Grimes } 898c3229e05SDavid Greenman } 899c3229e05SDavid Greenman /* 900c3229e05SDavid Greenman * Not found. 901c3229e05SDavid Greenman */ 902c3229e05SDavid Greenman return (NULL); 903c3229e05SDavid Greenman } else { 904c3229e05SDavid Greenman struct inpcbporthead *porthash; 905c3229e05SDavid Greenman struct inpcbport *phd; 906c3229e05SDavid Greenman struct inpcb *match = NULL; 907c3229e05SDavid Greenman /* 908c3229e05SDavid Greenman * Best fit PCB lookup. 909c3229e05SDavid Greenman * 910c3229e05SDavid Greenman * First see if this local port is in use by looking on the 911c3229e05SDavid Greenman * port hash list. 912c3229e05SDavid Greenman */ 91396af9ea5SMike Silbersack retrylookup: 914c3229e05SDavid Greenman porthash = &pcbinfo->porthashbase[INP_PCBPORTHASH(lport, 915c3229e05SDavid Greenman pcbinfo->porthashmask)]; 916fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(phd, porthash, phd_hash) { 917c3229e05SDavid Greenman if (phd->phd_port == lport) 918c3229e05SDavid Greenman break; 919c3229e05SDavid Greenman } 920c3229e05SDavid Greenman if (phd != NULL) { 921c3229e05SDavid Greenman /* 922c3229e05SDavid Greenman * Port is in use by one or more PCBs. Look for best 923c3229e05SDavid Greenman * fit. 924c3229e05SDavid Greenman */ 92537d40066SPoul-Henning Kamp LIST_FOREACH(inp, &phd->phd_pcblist, inp_portlist) { 926c3229e05SDavid Greenman wildcard = 0; 927cfa1ca9dSYoshinobu Inoue #ifdef INET6 928369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 929cfa1ca9dSYoshinobu Inoue continue; 930d5e8a67eSHajimu UMEMOTO /* 931d5e8a67eSHajimu UMEMOTO * We never select the PCB that has 932d5e8a67eSHajimu UMEMOTO * INP_IPV6 flag and is bound to :: if 933d5e8a67eSHajimu UMEMOTO * we have another PCB which is bound 934d5e8a67eSHajimu UMEMOTO * to 0.0.0.0. If a PCB has the 935d5e8a67eSHajimu UMEMOTO * INP_IPV6 flag, then we set its cost 936d5e8a67eSHajimu UMEMOTO * higher than IPv4 only PCBs. 937d5e8a67eSHajimu UMEMOTO * 938d5e8a67eSHajimu UMEMOTO * Note that the case only happens 939d5e8a67eSHajimu UMEMOTO * when a socket is bound to ::, under 940d5e8a67eSHajimu UMEMOTO * the condition that the use of the 941d5e8a67eSHajimu UMEMOTO * mapped address is allowed. 942d5e8a67eSHajimu UMEMOTO */ 943d5e8a67eSHajimu UMEMOTO if ((inp->inp_vflag & INP_IPV6) != 0) 944d5e8a67eSHajimu UMEMOTO wildcard += INP_LOOKUP_MAPPED_PCB_COST; 945cfa1ca9dSYoshinobu Inoue #endif 94696af9ea5SMike Silbersack /* 94796af9ea5SMike Silbersack * Clean out old time_wait sockets if they 94896af9ea5SMike Silbersack * are clogging up needed local ports. 94996af9ea5SMike Silbersack */ 95096af9ea5SMike Silbersack if ((inp->inp_vflag & INP_TIMEWAIT) != 0) { 95196af9ea5SMike Silbersack if (tcp_twrecycleable((struct tcptw *)inp->inp_ppcb)) { 952f7bbe2c0SSam Leffler INP_LOCK(inp); 95396af9ea5SMike Silbersack tcp_twclose((struct tcptw *)inp->inp_ppcb, 0); 95496af9ea5SMike Silbersack match = NULL; 95596af9ea5SMike Silbersack goto retrylookup; 95696af9ea5SMike Silbersack } 95796af9ea5SMike Silbersack } 958c3229e05SDavid Greenman if (inp->inp_faddr.s_addr != INADDR_ANY) 959c3229e05SDavid Greenman wildcard++; 96015bd2b43SDavid Greenman if (inp->inp_laddr.s_addr != INADDR_ANY) { 96115bd2b43SDavid Greenman if (laddr.s_addr == INADDR_ANY) 96215bd2b43SDavid Greenman wildcard++; 96315bd2b43SDavid Greenman else if (inp->inp_laddr.s_addr != laddr.s_addr) 96415bd2b43SDavid Greenman continue; 96515bd2b43SDavid Greenman } else { 96615bd2b43SDavid Greenman if (laddr.s_addr != INADDR_ANY) 96715bd2b43SDavid Greenman wildcard++; 96815bd2b43SDavid Greenman } 969df8bae1dSRodney W. Grimes if (wildcard < matchwild) { 970df8bae1dSRodney W. Grimes match = inp; 971df8bae1dSRodney W. Grimes matchwild = wildcard; 9723dbdc25cSDavid Greenman if (matchwild == 0) { 973df8bae1dSRodney W. Grimes break; 974df8bae1dSRodney W. Grimes } 975df8bae1dSRodney W. Grimes } 9763dbdc25cSDavid Greenman } 977c3229e05SDavid Greenman } 978df8bae1dSRodney W. Grimes return (match); 979df8bae1dSRodney W. Grimes } 980c3229e05SDavid Greenman } 981d5e8a67eSHajimu UMEMOTO #undef INP_LOOKUP_MAPPED_PCB_COST 98215bd2b43SDavid Greenman 98315bd2b43SDavid Greenman /* 98415bd2b43SDavid Greenman * Lookup PCB in hash list. 98515bd2b43SDavid Greenman */ 98615bd2b43SDavid Greenman struct inpcb * 987136d4f1cSRobert Watson in_pcblookup_hash(struct inpcbinfo *pcbinfo, struct in_addr faddr, 988136d4f1cSRobert Watson u_int fport_arg, struct in_addr laddr, u_int lport_arg, int wildcard, 989136d4f1cSRobert Watson struct ifnet *ifp) 99015bd2b43SDavid Greenman { 99115bd2b43SDavid Greenman struct inpcbhead *head; 992136d4f1cSRobert Watson struct inpcb *inp; 99315bd2b43SDavid Greenman u_short fport = fport_arg, lport = lport_arg; 99415bd2b43SDavid Greenman 99559daba27SSam Leffler INP_INFO_RLOCK_ASSERT(pcbinfo); 99615bd2b43SDavid Greenman /* 99715bd2b43SDavid Greenman * First look for an exact match. 99815bd2b43SDavid Greenman */ 999ddd79a97SDavid Greenman head = &pcbinfo->hashbase[INP_PCBHASH(faddr.s_addr, lport, fport, pcbinfo->hashmask)]; 1000fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(inp, head, inp_hash) { 1001cfa1ca9dSYoshinobu Inoue #ifdef INET6 1002369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 1003cfa1ca9dSYoshinobu Inoue continue; 1004cfa1ca9dSYoshinobu Inoue #endif 10056d6a026bSDavid Greenman if (inp->inp_faddr.s_addr == faddr.s_addr && 1006ca98b82cSDavid Greenman inp->inp_laddr.s_addr == laddr.s_addr && 1007ca98b82cSDavid Greenman inp->inp_fport == fport && 1008c3229e05SDavid Greenman inp->inp_lport == lport) { 1009c3229e05SDavid Greenman /* 1010c3229e05SDavid Greenman * Found. 1011c3229e05SDavid Greenman */ 1012c3229e05SDavid Greenman return (inp); 1013c3229e05SDavid Greenman } 10146d6a026bSDavid Greenman } 10156d6a026bSDavid Greenman if (wildcard) { 10166d6a026bSDavid Greenman struct inpcb *local_wild = NULL; 1017cfa1ca9dSYoshinobu Inoue #if defined(INET6) 1018cfa1ca9dSYoshinobu Inoue struct inpcb *local_wild_mapped = NULL; 1019cfa1ca9dSYoshinobu Inoue #endif /* defined(INET6) */ 10206d6a026bSDavid Greenman 1021ddd79a97SDavid Greenman head = &pcbinfo->hashbase[INP_PCBHASH(INADDR_ANY, lport, 0, pcbinfo->hashmask)]; 1022fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(inp, head, inp_hash) { 1023cfa1ca9dSYoshinobu Inoue #ifdef INET6 1024369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 1025cfa1ca9dSYoshinobu Inoue continue; 1026cfa1ca9dSYoshinobu Inoue #endif 10276d6a026bSDavid Greenman if (inp->inp_faddr.s_addr == INADDR_ANY && 1028c3229e05SDavid Greenman inp->inp_lport == lport) { 1029cfa1ca9dSYoshinobu Inoue if (ifp && ifp->if_type == IFT_FAITH && 1030cfa1ca9dSYoshinobu Inoue (inp->inp_flags & INP_FAITH) == 0) 1031cfa1ca9dSYoshinobu Inoue continue; 10326d6a026bSDavid Greenman if (inp->inp_laddr.s_addr == laddr.s_addr) 1033c3229e05SDavid Greenman return (inp); 1034cfa1ca9dSYoshinobu Inoue else if (inp->inp_laddr.s_addr == INADDR_ANY) { 1035cfa1ca9dSYoshinobu Inoue #if defined(INET6) 1036cfa1ca9dSYoshinobu Inoue if (INP_CHECK_SOCKAF(inp->inp_socket, 1037cfa1ca9dSYoshinobu Inoue AF_INET6)) 1038cfa1ca9dSYoshinobu Inoue local_wild_mapped = inp; 1039cfa1ca9dSYoshinobu Inoue else 1040cfa1ca9dSYoshinobu Inoue #endif /* defined(INET6) */ 10416d6a026bSDavid Greenman local_wild = inp; 10426d6a026bSDavid Greenman } 10436d6a026bSDavid Greenman } 1044cfa1ca9dSYoshinobu Inoue } 1045cfa1ca9dSYoshinobu Inoue #if defined(INET6) 1046cfa1ca9dSYoshinobu Inoue if (local_wild == NULL) 1047cfa1ca9dSYoshinobu Inoue return (local_wild_mapped); 1048cfa1ca9dSYoshinobu Inoue #endif /* defined(INET6) */ 1049c3229e05SDavid Greenman return (local_wild); 10506d6a026bSDavid Greenman } 1051c3229e05SDavid Greenman 1052c3229e05SDavid Greenman /* 1053c3229e05SDavid Greenman * Not found. 1054c3229e05SDavid Greenman */ 10556d6a026bSDavid Greenman return (NULL); 105615bd2b43SDavid Greenman } 105715bd2b43SDavid Greenman 10587bc4aca7SDavid Greenman /* 1059c3229e05SDavid Greenman * Insert PCB onto various hash lists. 10607bc4aca7SDavid Greenman */ 1061c3229e05SDavid Greenman int 1062136d4f1cSRobert Watson in_pcbinshash(struct inpcb *inp) 106315bd2b43SDavid Greenman { 1064c3229e05SDavid Greenman struct inpcbhead *pcbhash; 1065c3229e05SDavid Greenman struct inpcbporthead *pcbporthash; 1066c3229e05SDavid Greenman struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 1067c3229e05SDavid Greenman struct inpcbport *phd; 1068cfa1ca9dSYoshinobu Inoue u_int32_t hashkey_faddr; 106915bd2b43SDavid Greenman 107059daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 1071cfa1ca9dSYoshinobu Inoue #ifdef INET6 1072cfa1ca9dSYoshinobu Inoue if (inp->inp_vflag & INP_IPV6) 1073cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->in6p_faddr.s6_addr32[3] /* XXX */; 1074cfa1ca9dSYoshinobu Inoue else 1075cfa1ca9dSYoshinobu Inoue #endif /* INET6 */ 1076cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->inp_faddr.s_addr; 1077cfa1ca9dSYoshinobu Inoue 1078cfa1ca9dSYoshinobu Inoue pcbhash = &pcbinfo->hashbase[INP_PCBHASH(hashkey_faddr, 1079c3229e05SDavid Greenman inp->inp_lport, inp->inp_fport, pcbinfo->hashmask)]; 108015bd2b43SDavid Greenman 1081c3229e05SDavid Greenman pcbporthash = &pcbinfo->porthashbase[INP_PCBPORTHASH(inp->inp_lport, 1082c3229e05SDavid Greenman pcbinfo->porthashmask)]; 1083c3229e05SDavid Greenman 1084c3229e05SDavid Greenman /* 1085c3229e05SDavid Greenman * Go through port list and look for a head for this lport. 1086c3229e05SDavid Greenman */ 1087fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(phd, pcbporthash, phd_hash) { 1088c3229e05SDavid Greenman if (phd->phd_port == inp->inp_lport) 1089c3229e05SDavid Greenman break; 1090c3229e05SDavid Greenman } 1091c3229e05SDavid Greenman /* 1092c3229e05SDavid Greenman * If none exists, malloc one and tack it on. 1093c3229e05SDavid Greenman */ 1094c3229e05SDavid Greenman if (phd == NULL) { 1095c3229e05SDavid Greenman MALLOC(phd, struct inpcbport *, sizeof(struct inpcbport), M_PCB, M_NOWAIT); 1096c3229e05SDavid Greenman if (phd == NULL) { 1097c3229e05SDavid Greenman return (ENOBUFS); /* XXX */ 1098c3229e05SDavid Greenman } 1099c3229e05SDavid Greenman phd->phd_port = inp->inp_lport; 1100c3229e05SDavid Greenman LIST_INIT(&phd->phd_pcblist); 1101c3229e05SDavid Greenman LIST_INSERT_HEAD(pcbporthash, phd, phd_hash); 1102c3229e05SDavid Greenman } 1103c3229e05SDavid Greenman inp->inp_phd = phd; 1104c3229e05SDavid Greenman LIST_INSERT_HEAD(&phd->phd_pcblist, inp, inp_portlist); 1105c3229e05SDavid Greenman LIST_INSERT_HEAD(pcbhash, inp, inp_hash); 1106c3229e05SDavid Greenman return (0); 110715bd2b43SDavid Greenman } 110815bd2b43SDavid Greenman 1109c3229e05SDavid Greenman /* 1110c3229e05SDavid Greenman * Move PCB to the proper hash bucket when { faddr, fport } have been 1111c3229e05SDavid Greenman * changed. NOTE: This does not handle the case of the lport changing (the 1112c3229e05SDavid Greenman * hashed port list would have to be updated as well), so the lport must 1113c3229e05SDavid Greenman * not change after in_pcbinshash() has been called. 1114c3229e05SDavid Greenman */ 111515bd2b43SDavid Greenman void 1116136d4f1cSRobert Watson in_pcbrehash(struct inpcb *inp) 111715bd2b43SDavid Greenman { 111859daba27SSam Leffler struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 111915bd2b43SDavid Greenman struct inpcbhead *head; 1120cfa1ca9dSYoshinobu Inoue u_int32_t hashkey_faddr; 112115bd2b43SDavid Greenman 112259daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 11234c2bb15aSRobert Watson INP_LOCK_ASSERT(inp); 1124cfa1ca9dSYoshinobu Inoue #ifdef INET6 1125cfa1ca9dSYoshinobu Inoue if (inp->inp_vflag & INP_IPV6) 1126cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->in6p_faddr.s6_addr32[3] /* XXX */; 1127cfa1ca9dSYoshinobu Inoue else 1128cfa1ca9dSYoshinobu Inoue #endif /* INET6 */ 1129cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->inp_faddr.s_addr; 1130cfa1ca9dSYoshinobu Inoue 113159daba27SSam Leffler head = &pcbinfo->hashbase[INP_PCBHASH(hashkey_faddr, 113259daba27SSam Leffler inp->inp_lport, inp->inp_fport, pcbinfo->hashmask)]; 113315bd2b43SDavid Greenman 1134c3229e05SDavid Greenman LIST_REMOVE(inp, inp_hash); 113515bd2b43SDavid Greenman LIST_INSERT_HEAD(head, inp, inp_hash); 1136c3229e05SDavid Greenman } 1137c3229e05SDavid Greenman 1138c3229e05SDavid Greenman /* 1139c3229e05SDavid Greenman * Remove PCB from various lists. 1140c3229e05SDavid Greenman */ 114176429de4SYoshinobu Inoue void 1142136d4f1cSRobert Watson in_pcbremlists(struct inpcb *inp) 1143c3229e05SDavid Greenman { 114459daba27SSam Leffler struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 114559daba27SSam Leffler 114659daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 114759daba27SSam Leffler INP_LOCK_ASSERT(inp); 114859daba27SSam Leffler 114959daba27SSam Leffler inp->inp_gencnt = ++pcbinfo->ipi_gencnt; 1150c3229e05SDavid Greenman if (inp->inp_lport) { 1151c3229e05SDavid Greenman struct inpcbport *phd = inp->inp_phd; 1152c3229e05SDavid Greenman 1153c3229e05SDavid Greenman LIST_REMOVE(inp, inp_hash); 1154c3229e05SDavid Greenman LIST_REMOVE(inp, inp_portlist); 1155fc2ffbe6SPoul-Henning Kamp if (LIST_FIRST(&phd->phd_pcblist) == NULL) { 1156c3229e05SDavid Greenman LIST_REMOVE(phd, phd_hash); 1157c3229e05SDavid Greenman free(phd, M_PCB); 1158c3229e05SDavid Greenman } 1159c3229e05SDavid Greenman } 1160c3229e05SDavid Greenman LIST_REMOVE(inp, inp_list); 116159daba27SSam Leffler pcbinfo->ipi_count--; 116215bd2b43SDavid Greenman } 116375c13541SPoul-Henning Kamp 1164a557af22SRobert Watson /* 1165a557af22SRobert Watson * A set label operation has occurred at the socket layer, propagate the 1166a557af22SRobert Watson * label change into the in_pcb for the socket. 1167a557af22SRobert Watson */ 1168a557af22SRobert Watson void 1169136d4f1cSRobert Watson in_pcbsosetlabel(struct socket *so) 1170a557af22SRobert Watson { 1171a557af22SRobert Watson #ifdef MAC 1172a557af22SRobert Watson struct inpcb *inp; 1173a557af22SRobert Watson 11744c7c478dSRobert Watson inp = sotoinpcb(so); 11754c7c478dSRobert Watson KASSERT(inp != NULL, ("in_pcbsosetlabel: so->so_pcb == NULL")); 1176a557af22SRobert Watson INP_LOCK(inp); 1177310e7cebSRobert Watson SOCK_LOCK(so); 1178a557af22SRobert Watson mac_inpcb_sosetlabel(so, inp); 1179310e7cebSRobert Watson SOCK_UNLOCK(so); 1180a557af22SRobert Watson INP_UNLOCK(inp); 1181a557af22SRobert Watson #endif 1182a557af22SRobert Watson } 11835f311da2SMike Silbersack 11845f311da2SMike Silbersack /* 11855f311da2SMike Silbersack * ipport_tick runs once per second, determining if random port 11865f311da2SMike Silbersack * allocation should be continued. If more than ipport_randomcps 11875f311da2SMike Silbersack * ports have been allocated in the last second, then we return to 11885f311da2SMike Silbersack * sequential port allocation. We return to random allocation only 11896ee79c59SMaxim Konovalov * once we drop below ipport_randomcps for at least ipport_randomtime 11906ee79c59SMaxim Konovalov * seconds. 11915f311da2SMike Silbersack */ 11925f311da2SMike Silbersack 11935f311da2SMike Silbersack void 1194136d4f1cSRobert Watson ipport_tick(void *xtp) 11955f311da2SMike Silbersack { 11965f311da2SMike Silbersack if (ipport_tcpallocs > ipport_tcplastcount + ipport_randomcps) { 11975f311da2SMike Silbersack ipport_stoprandom = ipport_randomtime; 11985f311da2SMike Silbersack } else { 11995f311da2SMike Silbersack if (ipport_stoprandom > 0) 12005f311da2SMike Silbersack ipport_stoprandom--; 12015f311da2SMike Silbersack } 12025f311da2SMike Silbersack ipport_tcplastcount = ipport_tcpallocs; 12035f311da2SMike Silbersack callout_reset(&ipport_tick_callout, hz, ipport_tick, NULL); 12045f311da2SMike Silbersack } 1205