1c398230bSWarner Losh /*- 22469dd60SGarrett Wollman * Copyright (c) 1982, 1986, 1991, 1993, 1995 3497057eeSRobert Watson * The Regents of the University of California. 4111d57a6SRobert Watson * Copyright (c) 2007-2009 Robert N. M. Watson 5497057eeSRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 312469dd60SGarrett Wollman * @(#)in_pcb.c 8.4 (Berkeley) 5/24/95 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 344b421e2dSMike Silbersack #include <sys/cdefs.h> 354b421e2dSMike Silbersack __FBSDID("$FreeBSD$"); 364b421e2dSMike Silbersack 37497057eeSRobert Watson #include "opt_ddb.h" 386a800098SYoshinobu Inoue #include "opt_ipsec.h" 39cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h" 40cfa1ca9dSYoshinobu Inoue 41df8bae1dSRodney W. Grimes #include <sys/param.h> 42df8bae1dSRodney W. Grimes #include <sys/systm.h> 43df8bae1dSRodney W. Grimes #include <sys/malloc.h> 44df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 45cfa1ca9dSYoshinobu Inoue #include <sys/domain.h> 46df8bae1dSRodney W. Grimes #include <sys/protosw.h> 47df8bae1dSRodney W. Grimes #include <sys/socket.h> 48df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 49acd3428bSRobert Watson #include <sys/priv.h> 50df8bae1dSRodney W. Grimes #include <sys/proc.h> 5175c13541SPoul-Henning Kamp #include <sys/jail.h> 52101f9fc8SPeter Wemm #include <sys/kernel.h> 53101f9fc8SPeter Wemm #include <sys/sysctl.h> 548781d8e9SBruce Evans 55497057eeSRobert Watson #ifdef DDB 56497057eeSRobert Watson #include <ddb/ddb.h> 57497057eeSRobert Watson #endif 58497057eeSRobert Watson 5969c2d429SJeff Roberson #include <vm/uma.h> 60df8bae1dSRodney W. Grimes 61df8bae1dSRodney W. Grimes #include <net/if.h> 62cfa1ca9dSYoshinobu Inoue #include <net/if_types.h> 63df8bae1dSRodney W. Grimes #include <net/route.h> 64530c0060SRobert Watson #include <net/vnet.h> 65df8bae1dSRodney W. Grimes 66df8bae1dSRodney W. Grimes #include <netinet/in.h> 67df8bae1dSRodney W. Grimes #include <netinet/in_pcb.h> 68df8bae1dSRodney W. Grimes #include <netinet/in_var.h> 69df8bae1dSRodney W. Grimes #include <netinet/ip_var.h> 70340c35deSJonathan Lemon #include <netinet/tcp_var.h> 715f311da2SMike Silbersack #include <netinet/udp.h> 725f311da2SMike Silbersack #include <netinet/udp_var.h> 73cfa1ca9dSYoshinobu Inoue #ifdef INET6 74cfa1ca9dSYoshinobu Inoue #include <netinet/ip6.h> 75cfa1ca9dSYoshinobu Inoue #include <netinet6/ip6_var.h> 76cfa1ca9dSYoshinobu Inoue #endif /* INET6 */ 77cfa1ca9dSYoshinobu Inoue 78df8bae1dSRodney W. Grimes 79b2630c29SGeorge V. Neville-Neil #ifdef IPSEC 80b9234fafSSam Leffler #include <netipsec/ipsec.h> 81b9234fafSSam Leffler #include <netipsec/key.h> 82b2630c29SGeorge V. Neville-Neil #endif /* IPSEC */ 83b9234fafSSam Leffler 84aed55708SRobert Watson #include <security/mac/mac_framework.h> 85aed55708SRobert Watson 86101f9fc8SPeter Wemm /* 87101f9fc8SPeter Wemm * These configure the range of local port addresses assigned to 88101f9fc8SPeter Wemm * "unspecified" outgoing connections/packets/whatever. 89101f9fc8SPeter Wemm */ 90eddfbb76SRobert Watson VNET_DEFINE(int, ipport_lowfirstauto) = IPPORT_RESERVED - 1; /* 1023 */ 91eddfbb76SRobert Watson VNET_DEFINE(int, ipport_lowlastauto) = IPPORT_RESERVEDSTART; /* 600 */ 92eddfbb76SRobert Watson VNET_DEFINE(int, ipport_firstauto) = IPPORT_EPHEMERALFIRST; /* 10000 */ 93eddfbb76SRobert Watson VNET_DEFINE(int, ipport_lastauto) = IPPORT_EPHEMERALLAST; /* 65535 */ 94eddfbb76SRobert Watson VNET_DEFINE(int, ipport_hifirstauto) = IPPORT_HIFIRSTAUTO; /* 49152 */ 95eddfbb76SRobert Watson VNET_DEFINE(int, ipport_hilastauto) = IPPORT_HILASTAUTO; /* 65535 */ 96101f9fc8SPeter Wemm 97b0d22693SCrist J. Clark /* 98b0d22693SCrist J. Clark * Reserved ports accessible only to root. There are significant 99b0d22693SCrist J. Clark * security considerations that must be accounted for when changing these, 100b0d22693SCrist J. Clark * but the security benefits can be great. Please be careful. 101b0d22693SCrist J. Clark */ 102eddfbb76SRobert Watson VNET_DEFINE(int, ipport_reservedhigh) = IPPORT_RESERVED - 1; /* 1023 */ 103eddfbb76SRobert Watson VNET_DEFINE(int, ipport_reservedlow); 104b0d22693SCrist J. Clark 1055f311da2SMike Silbersack /* Variables dealing with random ephemeral port allocation. */ 106eddfbb76SRobert Watson VNET_DEFINE(int, ipport_randomized) = 1; /* user controlled via sysctl */ 107eddfbb76SRobert Watson VNET_DEFINE(int, ipport_randomcps) = 10; /* user controlled via sysctl */ 108eddfbb76SRobert Watson VNET_DEFINE(int, ipport_randomtime) = 45; /* user controlled via sysctl */ 109eddfbb76SRobert Watson VNET_DEFINE(int, ipport_stoprandom); /* toggled by ipport_tick */ 110eddfbb76SRobert Watson VNET_DEFINE(int, ipport_tcpallocs); 111eddfbb76SRobert Watson static VNET_DEFINE(int, ipport_tcplastcount); 112eddfbb76SRobert Watson 1131e77c105SRobert Watson #define V_ipport_tcplastcount VNET(ipport_tcplastcount) 1146ac48b74SMike Silbersack 115bbd42ad0SPeter Wemm #define RANGECHK(var, min, max) \ 116bbd42ad0SPeter Wemm if ((var) < (min)) { (var) = (min); } \ 117bbd42ad0SPeter Wemm else if ((var) > (max)) { (var) = (max); } 118bbd42ad0SPeter Wemm 1196d888973SRobert Watson static void in_pcbremlists(struct inpcb *inp); 1206d888973SRobert Watson 121bbd42ad0SPeter Wemm static int 12282d9ae4eSPoul-Henning Kamp sysctl_net_ipport_check(SYSCTL_HANDLER_ARGS) 123bbd42ad0SPeter Wemm { 12430a4ab08SBruce Evans int error; 12530a4ab08SBruce Evans 126eddfbb76SRobert Watson #ifdef VIMAGE 127eddfbb76SRobert Watson error = vnet_sysctl_handle_int(oidp, arg1, arg2, req); 128eddfbb76SRobert Watson #else 129f6dfe47aSMarko Zec error = sysctl_handle_int(oidp, arg1, arg2, req); 130eddfbb76SRobert Watson #endif 13130a4ab08SBruce Evans if (error == 0) { 132603724d3SBjoern A. Zeeb RANGECHK(V_ipport_lowfirstauto, 1, IPPORT_RESERVED - 1); 133603724d3SBjoern A. Zeeb RANGECHK(V_ipport_lowlastauto, 1, IPPORT_RESERVED - 1); 134603724d3SBjoern A. Zeeb RANGECHK(V_ipport_firstauto, IPPORT_RESERVED, IPPORT_MAX); 135603724d3SBjoern A. Zeeb RANGECHK(V_ipport_lastauto, IPPORT_RESERVED, IPPORT_MAX); 136603724d3SBjoern A. Zeeb RANGECHK(V_ipport_hifirstauto, IPPORT_RESERVED, IPPORT_MAX); 137603724d3SBjoern A. Zeeb RANGECHK(V_ipport_hilastauto, IPPORT_RESERVED, IPPORT_MAX); 138bbd42ad0SPeter Wemm } 13930a4ab08SBruce Evans return (error); 140bbd42ad0SPeter Wemm } 141bbd42ad0SPeter Wemm 142bbd42ad0SPeter Wemm #undef RANGECHK 143bbd42ad0SPeter Wemm 14433b3ac06SPeter Wemm SYSCTL_NODE(_net_inet_ip, IPPROTO_IP, portrange, CTLFLAG_RW, 0, "IP Ports"); 14533b3ac06SPeter Wemm 146eddfbb76SRobert Watson SYSCTL_VNET_PROC(_net_inet_ip_portrange, OID_AUTO, lowfirst, 147eddfbb76SRobert Watson CTLTYPE_INT|CTLFLAG_RW, &VNET_NAME(ipport_lowfirstauto), 0, 1488b615593SMarko Zec &sysctl_net_ipport_check, "I", ""); 149eddfbb76SRobert Watson SYSCTL_VNET_PROC(_net_inet_ip_portrange, OID_AUTO, lowlast, 150eddfbb76SRobert Watson CTLTYPE_INT|CTLFLAG_RW, &VNET_NAME(ipport_lowlastauto), 0, 1518b615593SMarko Zec &sysctl_net_ipport_check, "I", ""); 152eddfbb76SRobert Watson SYSCTL_VNET_PROC(_net_inet_ip_portrange, OID_AUTO, first, 153eddfbb76SRobert Watson CTLTYPE_INT|CTLFLAG_RW, &VNET_NAME(ipport_firstauto), 0, 1548b615593SMarko Zec &sysctl_net_ipport_check, "I", ""); 155eddfbb76SRobert Watson SYSCTL_VNET_PROC(_net_inet_ip_portrange, OID_AUTO, last, 156eddfbb76SRobert Watson CTLTYPE_INT|CTLFLAG_RW, &VNET_NAME(ipport_lastauto), 0, 1578b615593SMarko Zec &sysctl_net_ipport_check, "I", ""); 158eddfbb76SRobert Watson SYSCTL_VNET_PROC(_net_inet_ip_portrange, OID_AUTO, hifirst, 159eddfbb76SRobert Watson CTLTYPE_INT|CTLFLAG_RW, &VNET_NAME(ipport_hifirstauto), 0, 1608b615593SMarko Zec &sysctl_net_ipport_check, "I", ""); 161eddfbb76SRobert Watson SYSCTL_VNET_PROC(_net_inet_ip_portrange, OID_AUTO, hilast, 162eddfbb76SRobert Watson CTLTYPE_INT|CTLFLAG_RW, &VNET_NAME(ipport_hilastauto), 0, 1638b615593SMarko Zec &sysctl_net_ipport_check, "I", ""); 164eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_ip_portrange, OID_AUTO, reservedhigh, 165eddfbb76SRobert Watson CTLFLAG_RW|CTLFLAG_SECURE, &VNET_NAME(ipport_reservedhigh), 0, ""); 166eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_ip_portrange, OID_AUTO, reservedlow, 167eddfbb76SRobert Watson CTLFLAG_RW|CTLFLAG_SECURE, &VNET_NAME(ipport_reservedlow), 0, ""); 168eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_ip_portrange, OID_AUTO, randomized, CTLFLAG_RW, 169eddfbb76SRobert Watson &VNET_NAME(ipport_randomized), 0, "Enable random port allocation"); 170eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_ip_portrange, OID_AUTO, randomcps, CTLFLAG_RW, 171eddfbb76SRobert Watson &VNET_NAME(ipport_randomcps), 0, "Maximum number of random port " 1726ee79c59SMaxim Konovalov "allocations before switching to a sequental one"); 173eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_ip_portrange, OID_AUTO, randomtime, CTLFLAG_RW, 174eddfbb76SRobert Watson &VNET_NAME(ipport_randomtime), 0, 1758b615593SMarko Zec "Minimum time to keep sequental port " 1766ee79c59SMaxim Konovalov "allocation before switching to a random one"); 1770312fbe9SPoul-Henning Kamp 178c3229e05SDavid Greenman /* 179c3229e05SDavid Greenman * in_pcb.c: manage the Protocol Control Blocks. 180c3229e05SDavid Greenman * 181de35559fSRobert Watson * NOTE: It is assumed that most of these functions will be called with 182de35559fSRobert Watson * the pcbinfo lock held, and often, the inpcb lock held, as these utility 183de35559fSRobert Watson * functions often modify hash chains or addresses in pcbs. 184c3229e05SDavid Greenman */ 185c3229e05SDavid Greenman 186c3229e05SDavid Greenman /* 1879bcd427bSRobert Watson * Initialize an inpcbinfo -- we should be able to reduce the number of 1889bcd427bSRobert Watson * arguments in time. 1899bcd427bSRobert Watson */ 1909bcd427bSRobert Watson void 1919bcd427bSRobert Watson in_pcbinfo_init(struct inpcbinfo *pcbinfo, const char *name, 1929bcd427bSRobert Watson struct inpcbhead *listhead, int hash_nelements, int porthash_nelements, 1939bcd427bSRobert Watson char *inpcbzone_name, uma_init inpcbzone_init, uma_fini inpcbzone_fini, 1949bcd427bSRobert Watson uint32_t inpcbzone_flags) 1959bcd427bSRobert Watson { 1969bcd427bSRobert Watson 1979bcd427bSRobert Watson INP_INFO_LOCK_INIT(pcbinfo, name); 1989bcd427bSRobert Watson #ifdef VIMAGE 1999bcd427bSRobert Watson pcbinfo->ipi_vnet = curvnet; 2009bcd427bSRobert Watson #endif 2019bcd427bSRobert Watson pcbinfo->ipi_listhead = listhead; 2029bcd427bSRobert Watson LIST_INIT(pcbinfo->ipi_listhead); 2039bcd427bSRobert Watson pcbinfo->ipi_hashbase = hashinit(hash_nelements, M_PCB, 2049bcd427bSRobert Watson &pcbinfo->ipi_hashmask); 2059bcd427bSRobert Watson pcbinfo->ipi_porthashbase = hashinit(porthash_nelements, M_PCB, 2069bcd427bSRobert Watson &pcbinfo->ipi_porthashmask); 2079bcd427bSRobert Watson pcbinfo->ipi_zone = uma_zcreate(inpcbzone_name, sizeof(struct inpcb), 2089bcd427bSRobert Watson NULL, NULL, inpcbzone_init, inpcbzone_fini, UMA_ALIGN_PTR, 2099bcd427bSRobert Watson inpcbzone_flags); 2109bcd427bSRobert Watson uma_zone_set_max(pcbinfo->ipi_zone, maxsockets); 2119bcd427bSRobert Watson } 2129bcd427bSRobert Watson 2139bcd427bSRobert Watson /* 2149bcd427bSRobert Watson * Destroy an inpcbinfo. 2159bcd427bSRobert Watson */ 2169bcd427bSRobert Watson void 2179bcd427bSRobert Watson in_pcbinfo_destroy(struct inpcbinfo *pcbinfo) 2189bcd427bSRobert Watson { 2199bcd427bSRobert Watson 2209bcd427bSRobert Watson hashdestroy(pcbinfo->ipi_hashbase, M_PCB, pcbinfo->ipi_hashmask); 2219bcd427bSRobert Watson hashdestroy(pcbinfo->ipi_porthashbase, M_PCB, 2229bcd427bSRobert Watson pcbinfo->ipi_porthashmask); 2239bcd427bSRobert Watson uma_zdestroy(pcbinfo->ipi_zone); 2249bcd427bSRobert Watson INP_INFO_LOCK_DESTROY(pcbinfo); 2259bcd427bSRobert Watson } 2269bcd427bSRobert Watson 2279bcd427bSRobert Watson /* 228c3229e05SDavid Greenman * Allocate a PCB and associate it with the socket. 229d915b280SStephan Uphoff * On success return with the PCB locked. 230c3229e05SDavid Greenman */ 231df8bae1dSRodney W. Grimes int 232d915b280SStephan Uphoff in_pcballoc(struct socket *so, struct inpcbinfo *pcbinfo) 233df8bae1dSRodney W. Grimes { 234136d4f1cSRobert Watson struct inpcb *inp; 23513cf67f3SHajimu UMEMOTO int error; 236a557af22SRobert Watson 23759daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 238a557af22SRobert Watson error = 0; 239d915b280SStephan Uphoff inp = uma_zalloc(pcbinfo->ipi_zone, M_NOWAIT); 240df8bae1dSRodney W. Grimes if (inp == NULL) 241df8bae1dSRodney W. Grimes return (ENOBUFS); 242d915b280SStephan Uphoff bzero(inp, inp_zero_size); 24315bd2b43SDavid Greenman inp->inp_pcbinfo = pcbinfo; 244df8bae1dSRodney W. Grimes inp->inp_socket = so; 24586d02c5cSBjoern A. Zeeb inp->inp_cred = crhold(so->so_cred); 2468b07e49aSJulian Elischer inp->inp_inc.inc_fibnum = so->so_fibnum; 247a557af22SRobert Watson #ifdef MAC 24830d239bcSRobert Watson error = mac_inpcb_init(inp, M_NOWAIT); 249a557af22SRobert Watson if (error != 0) 250a557af22SRobert Watson goto out; 25130d239bcSRobert Watson mac_inpcb_create(so, inp); 252a557af22SRobert Watson #endif 253b2630c29SGeorge V. Neville-Neil #ifdef IPSEC 25413cf67f3SHajimu UMEMOTO error = ipsec_init_policy(so, &inp->inp_sp); 2550bffde27SRobert Watson if (error != 0) { 2560bffde27SRobert Watson #ifdef MAC 2570bffde27SRobert Watson mac_inpcb_destroy(inp); 2580bffde27SRobert Watson #endif 259a557af22SRobert Watson goto out; 2600bffde27SRobert Watson } 261b2630c29SGeorge V. Neville-Neil #endif /*IPSEC*/ 262e3fd5ffdSRobert Watson #ifdef INET6 263340c35deSJonathan Lemon if (INP_SOCKAF(so) == AF_INET6) { 264340c35deSJonathan Lemon inp->inp_vflag |= INP_IPV6PROTO; 265603724d3SBjoern A. Zeeb if (V_ip6_v6only) 26633841545SHajimu UMEMOTO inp->inp_flags |= IN6P_IPV6_V6ONLY; 267340c35deSJonathan Lemon } 26875daea93SPaul Saab #endif 269712fc218SRobert Watson LIST_INSERT_HEAD(pcbinfo->ipi_listhead, inp, inp_list); 2703d4d47f3SGarrett Wollman pcbinfo->ipi_count++; 271df8bae1dSRodney W. Grimes so->so_pcb = (caddr_t)inp; 27233841545SHajimu UMEMOTO #ifdef INET6 273603724d3SBjoern A. Zeeb if (V_ip6_auto_flowlabel) 27433841545SHajimu UMEMOTO inp->inp_flags |= IN6P_AUTOFLOWLABEL; 27533841545SHajimu UMEMOTO #endif 2768501a69cSRobert Watson INP_WLOCK(inp); 277d915b280SStephan Uphoff inp->inp_gencnt = ++pcbinfo->ipi_gencnt; 27828696211SRobert Watson inp->inp_refcount = 1; /* Reference from the inpcbinfo */ 279b2630c29SGeorge V. Neville-Neil #if defined(IPSEC) || defined(MAC) 280a557af22SRobert Watson out: 28186d02c5cSBjoern A. Zeeb if (error != 0) { 28286d02c5cSBjoern A. Zeeb crfree(inp->inp_cred); 283a557af22SRobert Watson uma_zfree(pcbinfo->ipi_zone, inp); 28486d02c5cSBjoern A. Zeeb } 285a557af22SRobert Watson #endif 286a557af22SRobert Watson return (error); 287df8bae1dSRodney W. Grimes } 288df8bae1dSRodney W. Grimes 289df8bae1dSRodney W. Grimes int 290136d4f1cSRobert Watson in_pcbbind(struct inpcb *inp, struct sockaddr *nam, struct ucred *cred) 291df8bae1dSRodney W. Grimes { 2924b932371SIan Dowse int anonport, error; 2934b932371SIan Dowse 2941b73ca0bSSam Leffler INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 2958501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 29659daba27SSam Leffler 2974b932371SIan Dowse if (inp->inp_lport != 0 || inp->inp_laddr.s_addr != INADDR_ANY) 2984b932371SIan Dowse return (EINVAL); 2994b932371SIan Dowse anonport = inp->inp_lport == 0 && (nam == NULL || 3004b932371SIan Dowse ((struct sockaddr_in *)nam)->sin_port == 0); 3014b932371SIan Dowse error = in_pcbbind_setup(inp, nam, &inp->inp_laddr.s_addr, 302b0330ed9SPawel Jakub Dawidek &inp->inp_lport, cred); 3034b932371SIan Dowse if (error) 3044b932371SIan Dowse return (error); 3054b932371SIan Dowse if (in_pcbinshash(inp) != 0) { 3064b932371SIan Dowse inp->inp_laddr.s_addr = INADDR_ANY; 3074b932371SIan Dowse inp->inp_lport = 0; 3084b932371SIan Dowse return (EAGAIN); 3094b932371SIan Dowse } 3104b932371SIan Dowse if (anonport) 3114b932371SIan Dowse inp->inp_flags |= INP_ANONPORT; 3124b932371SIan Dowse return (0); 3134b932371SIan Dowse } 3144b932371SIan Dowse 3154b932371SIan Dowse /* 3164b932371SIan Dowse * Set up a bind operation on a PCB, performing port allocation 3174b932371SIan Dowse * as required, but do not actually modify the PCB. Callers can 3184b932371SIan Dowse * either complete the bind by setting inp_laddr/inp_lport and 3194b932371SIan Dowse * calling in_pcbinshash(), or they can just use the resulting 3204b932371SIan Dowse * port and address to authorise the sending of a once-off packet. 3214b932371SIan Dowse * 3224b932371SIan Dowse * On error, the values of *laddrp and *lportp are not changed. 3234b932371SIan Dowse */ 3244b932371SIan Dowse int 325136d4f1cSRobert Watson in_pcbbind_setup(struct inpcb *inp, struct sockaddr *nam, in_addr_t *laddrp, 326136d4f1cSRobert Watson u_short *lportp, struct ucred *cred) 3274b932371SIan Dowse { 3284b932371SIan Dowse struct socket *so = inp->inp_socket; 32937bd2b30SPeter Wemm unsigned short *lastport; 33015bd2b43SDavid Greenman struct sockaddr_in *sin; 331c3229e05SDavid Greenman struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 3324b932371SIan Dowse struct in_addr laddr; 333df8bae1dSRodney W. Grimes u_short lport = 0; 3344cc20ab1SSeigo Tanimura int wild = 0, reuseport = (so->so_options & SO_REUSEPORT); 335413628a7SBjoern A. Zeeb int error; 3365f311da2SMike Silbersack int dorandom; 337df8bae1dSRodney W. Grimes 3388501a69cSRobert Watson /* 33972bed082SRobert Watson * Because no actual state changes occur here, a global write lock on 34072bed082SRobert Watson * the pcbinfo isn't required. 3418501a69cSRobert Watson */ 3428501a69cSRobert Watson INP_INFO_LOCK_ASSERT(pcbinfo); 34359daba27SSam Leffler INP_LOCK_ASSERT(inp); 34459daba27SSam Leffler 345603724d3SBjoern A. Zeeb if (TAILQ_EMPTY(&V_in_ifaddrhead)) /* XXX broken! */ 346df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 3474b932371SIan Dowse laddr.s_addr = *laddrp; 3484b932371SIan Dowse if (nam != NULL && laddr.s_addr != INADDR_ANY) 349df8bae1dSRodney W. Grimes return (EINVAL); 350c3229e05SDavid Greenman if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0) 351421d8aa6SBjoern A. Zeeb wild = INPLOOKUP_WILDCARD; 3527c2f3cb9SJamie Gritton if (nam == NULL) { 3537c2f3cb9SJamie Gritton if ((error = prison_local_ip4(cred, &laddr)) != 0) 3547c2f3cb9SJamie Gritton return (error); 3557c2f3cb9SJamie Gritton } else { 35657bf258eSGarrett Wollman sin = (struct sockaddr_in *)nam; 35757bf258eSGarrett Wollman if (nam->sa_len != sizeof (*sin)) 358df8bae1dSRodney W. Grimes return (EINVAL); 359df8bae1dSRodney W. Grimes #ifdef notdef 360df8bae1dSRodney W. Grimes /* 361df8bae1dSRodney W. Grimes * We should check the family, but old programs 362df8bae1dSRodney W. Grimes * incorrectly fail to initialize it. 363df8bae1dSRodney W. Grimes */ 364df8bae1dSRodney W. Grimes if (sin->sin_family != AF_INET) 365df8bae1dSRodney W. Grimes return (EAFNOSUPPORT); 366df8bae1dSRodney W. Grimes #endif 367b89e82ddSJamie Gritton error = prison_local_ip4(cred, &sin->sin_addr); 368b89e82ddSJamie Gritton if (error) 369b89e82ddSJamie Gritton return (error); 3704b932371SIan Dowse if (sin->sin_port != *lportp) { 3714b932371SIan Dowse /* Don't allow the port to change. */ 3724b932371SIan Dowse if (*lportp != 0) 3734b932371SIan Dowse return (EINVAL); 374df8bae1dSRodney W. Grimes lport = sin->sin_port; 3754b932371SIan Dowse } 3764b932371SIan Dowse /* NB: lport is left as 0 if the port isn't being changed. */ 377df8bae1dSRodney W. Grimes if (IN_MULTICAST(ntohl(sin->sin_addr.s_addr))) { 378df8bae1dSRodney W. Grimes /* 379df8bae1dSRodney W. Grimes * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 380df8bae1dSRodney W. Grimes * allow complete duplication of binding if 381df8bae1dSRodney W. Grimes * SO_REUSEPORT is set, or if SO_REUSEADDR is set 382df8bae1dSRodney W. Grimes * and a multicast address is bound on both 383df8bae1dSRodney W. Grimes * new and duplicated sockets. 384df8bae1dSRodney W. Grimes */ 385df8bae1dSRodney W. Grimes if (so->so_options & SO_REUSEADDR) 386df8bae1dSRodney W. Grimes reuseport = SO_REUSEADDR|SO_REUSEPORT; 387df8bae1dSRodney W. Grimes } else if (sin->sin_addr.s_addr != INADDR_ANY) { 388df8bae1dSRodney W. Grimes sin->sin_port = 0; /* yech... */ 38983103a73SAndrew R. Reiter bzero(&sin->sin_zero, sizeof(sin->sin_zero)); 3904209e01aSAdrian Chadd /* 3914209e01aSAdrian Chadd * Is the address a local IP address? 392f44270e7SPawel Jakub Dawidek * If INP_BINDANY is set, then the socket may be bound 3938696873dSAdrian Chadd * to any endpoint address, local or not. 3944209e01aSAdrian Chadd */ 395f44270e7SPawel Jakub Dawidek if ((inp->inp_flags & INP_BINDANY) == 0 && 3968896f83aSRobert Watson ifa_ifwithaddr_check((struct sockaddr *)sin) == 0) 397df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 398df8bae1dSRodney W. Grimes } 3994b932371SIan Dowse laddr = sin->sin_addr; 400df8bae1dSRodney W. Grimes if (lport) { 401df8bae1dSRodney W. Grimes struct inpcb *t; 402ae0e7143SRobert Watson struct tcptw *tw; 403ae0e7143SRobert Watson 404df8bae1dSRodney W. Grimes /* GROSS */ 405603724d3SBjoern A. Zeeb if (ntohs(lport) <= V_ipport_reservedhigh && 406603724d3SBjoern A. Zeeb ntohs(lport) >= V_ipport_reservedlow && 407acd3428bSRobert Watson priv_check_cred(cred, PRIV_NETINET_RESERVEDPORT, 40832f9753cSRobert Watson 0)) 4092469dd60SGarrett Wollman return (EACCES); 410835d4b89SPawel Jakub Dawidek if (!IN_MULTICAST(ntohl(sin->sin_addr.s_addr)) && 41186d02c5cSBjoern A. Zeeb priv_check_cred(inp->inp_cred, 41232f9753cSRobert Watson PRIV_NETINET_REUSEPORT, 0) != 0) { 413078b7042SBjoern A. Zeeb t = in_pcblookup_local(pcbinfo, sin->sin_addr, 414413628a7SBjoern A. Zeeb lport, INPLOOKUP_WILDCARD, cred); 415340c35deSJonathan Lemon /* 416340c35deSJonathan Lemon * XXX 417340c35deSJonathan Lemon * This entire block sorely needs a rewrite. 418340c35deSJonathan Lemon */ 4194cc20ab1SSeigo Tanimura if (t && 420ad71fe3cSRobert Watson ((t->inp_flags & INP_TIMEWAIT) == 0) && 4214658dc83SYaroslav Tykhiy (so->so_type != SOCK_STREAM || 4224658dc83SYaroslav Tykhiy ntohl(t->inp_faddr.s_addr) == INADDR_ANY) && 4234cc20ab1SSeigo Tanimura (ntohl(sin->sin_addr.s_addr) != INADDR_ANY || 42452b65dbeSBill Fenner ntohl(t->inp_laddr.s_addr) != INADDR_ANY || 42552b65dbeSBill Fenner (t->inp_socket->so_options & 42652b65dbeSBill Fenner SO_REUSEPORT) == 0) && 42786d02c5cSBjoern A. Zeeb (inp->inp_cred->cr_uid != 42886d02c5cSBjoern A. Zeeb t->inp_cred->cr_uid)) 4294049a042SGuido van Rooij return (EADDRINUSE); 4304049a042SGuido van Rooij } 431c3229e05SDavid Greenman t = in_pcblookup_local(pcbinfo, sin->sin_addr, 432413628a7SBjoern A. Zeeb lport, wild, cred); 433ad71fe3cSRobert Watson if (t && (t->inp_flags & INP_TIMEWAIT)) { 434ae0e7143SRobert Watson /* 435ae0e7143SRobert Watson * XXXRW: If an incpb has had its timewait 436ae0e7143SRobert Watson * state recycled, we treat the address as 437ae0e7143SRobert Watson * being in use (for now). This is better 438ae0e7143SRobert Watson * than a panic, but not desirable. 439ae0e7143SRobert Watson */ 440ae0e7143SRobert Watson tw = intotw(inp); 441ae0e7143SRobert Watson if (tw == NULL || 442ae0e7143SRobert Watson (reuseport & tw->tw_so_options) == 0) 443340c35deSJonathan Lemon return (EADDRINUSE); 444ae0e7143SRobert Watson } else if (t && 4454cc20ab1SSeigo Tanimura (reuseport & t->inp_socket->so_options) == 0) { 446e3fd5ffdSRobert Watson #ifdef INET6 44733841545SHajimu UMEMOTO if (ntohl(sin->sin_addr.s_addr) != 448cfa1ca9dSYoshinobu Inoue INADDR_ANY || 449cfa1ca9dSYoshinobu Inoue ntohl(t->inp_laddr.s_addr) != 450cfa1ca9dSYoshinobu Inoue INADDR_ANY || 451cfa1ca9dSYoshinobu Inoue INP_SOCKAF(so) == 452cfa1ca9dSYoshinobu Inoue INP_SOCKAF(t->inp_socket)) 453e3fd5ffdSRobert Watson #endif 454df8bae1dSRodney W. Grimes return (EADDRINUSE); 455df8bae1dSRodney W. Grimes } 456cfa1ca9dSYoshinobu Inoue } 457df8bae1dSRodney W. Grimes } 4584b932371SIan Dowse if (*lportp != 0) 4594b932371SIan Dowse lport = *lportp; 46033b3ac06SPeter Wemm if (lport == 0) { 4611cf6e4f5SRui Paulo u_short first, last, aux; 462174624e0SMike Silbersack int count; 46333b3ac06SPeter Wemm 46433b3ac06SPeter Wemm if (inp->inp_flags & INP_HIGHPORT) { 465603724d3SBjoern A. Zeeb first = V_ipport_hifirstauto; /* sysctl */ 466603724d3SBjoern A. Zeeb last = V_ipport_hilastauto; 467712fc218SRobert Watson lastport = &pcbinfo->ipi_lasthi; 46833b3ac06SPeter Wemm } else if (inp->inp_flags & INP_LOWPORT) { 469acd3428bSRobert Watson error = priv_check_cred(cred, 47032f9753cSRobert Watson PRIV_NETINET_RESERVEDPORT, 0); 471acd3428bSRobert Watson if (error) 472a29f300eSGarrett Wollman return error; 473603724d3SBjoern A. Zeeb first = V_ipport_lowfirstauto; /* 1023 */ 474603724d3SBjoern A. Zeeb last = V_ipport_lowlastauto; /* 600 */ 475712fc218SRobert Watson lastport = &pcbinfo->ipi_lastlow; 47633b3ac06SPeter Wemm } else { 477603724d3SBjoern A. Zeeb first = V_ipport_firstauto; /* sysctl */ 478603724d3SBjoern A. Zeeb last = V_ipport_lastauto; 479712fc218SRobert Watson lastport = &pcbinfo->ipi_lastport; 48033b3ac06SPeter Wemm } 48133b3ac06SPeter Wemm /* 4825f311da2SMike Silbersack * For UDP, use random port allocation as long as the user 4835f311da2SMike Silbersack * allows it. For TCP (and as of yet unknown) connections, 4845f311da2SMike Silbersack * use random port allocation only if the user allows it AND 48529f2a6ecSMaxim Konovalov * ipport_tick() allows it. 4865f311da2SMike Silbersack */ 487603724d3SBjoern A. Zeeb if (V_ipport_randomized && 488603724d3SBjoern A. Zeeb (!V_ipport_stoprandom || pcbinfo == &V_udbinfo)) 4895f311da2SMike Silbersack dorandom = 1; 4905f311da2SMike Silbersack else 4915f311da2SMike Silbersack dorandom = 0; 492e99971bfSMaxim Konovalov /* 493e99971bfSMaxim Konovalov * It makes no sense to do random port allocation if 494e99971bfSMaxim Konovalov * we have the only port available. 495e99971bfSMaxim Konovalov */ 496e99971bfSMaxim Konovalov if (first == last) 497e99971bfSMaxim Konovalov dorandom = 0; 4985f311da2SMike Silbersack /* Make sure to not include UDP packets in the count. */ 499603724d3SBjoern A. Zeeb if (pcbinfo != &V_udbinfo) 500603724d3SBjoern A. Zeeb V_ipport_tcpallocs++; 5015f311da2SMike Silbersack /* 5027e1bc272SBjoern A. Zeeb * Instead of having two loops further down counting up or down 5037e1bc272SBjoern A. Zeeb * make sure that first is always <= last and go with only one 5047e1bc272SBjoern A. Zeeb * code path implementing all logic. 50533b3ac06SPeter Wemm */ 50633b3ac06SPeter Wemm if (first > last) { 5071cf6e4f5SRui Paulo aux = first; 5081cf6e4f5SRui Paulo first = last; 5091cf6e4f5SRui Paulo last = aux; 5101cf6e4f5SRui Paulo } 511174624e0SMike Silbersack 5125f311da2SMike Silbersack if (dorandom) 5136b2fc10bSMike Silbersack *lastport = first + 5146b2fc10bSMike Silbersack (arc4random() % (last - first)); 5151cf6e4f5SRui Paulo 51633b3ac06SPeter Wemm count = last - first; 517174624e0SMike Silbersack 51833b3ac06SPeter Wemm do { 5196ac48b74SMike Silbersack if (count-- < 0) /* completely used? */ 520550b1518SWes Peters return (EADDRNOTAVAIL); 52133b3ac06SPeter Wemm ++*lastport; 52233b3ac06SPeter Wemm if (*lastport < first || *lastport > last) 52333b3ac06SPeter Wemm *lastport = first; 52433b3ac06SPeter Wemm lport = htons(*lastport); 525078b7042SBjoern A. Zeeb } while (in_pcblookup_local(pcbinfo, laddr, 526078b7042SBjoern A. Zeeb lport, wild, cred)); 52733b3ac06SPeter Wemm } 5284b932371SIan Dowse *laddrp = laddr.s_addr; 5294b932371SIan Dowse *lportp = lport; 530df8bae1dSRodney W. Grimes return (0); 531df8bae1dSRodney W. Grimes } 532df8bae1dSRodney W. Grimes 533999f1343SGarrett Wollman /* 5345200e00eSIan Dowse * Connect from a socket to a specified address. 5355200e00eSIan Dowse * Both address and port must be specified in argument sin. 5365200e00eSIan Dowse * If don't have a local address for this socket yet, 5375200e00eSIan Dowse * then pick one. 538999f1343SGarrett Wollman */ 539999f1343SGarrett Wollman int 540136d4f1cSRobert Watson in_pcbconnect(struct inpcb *inp, struct sockaddr *nam, struct ucred *cred) 541999f1343SGarrett Wollman { 5425200e00eSIan Dowse u_short lport, fport; 5435200e00eSIan Dowse in_addr_t laddr, faddr; 5445200e00eSIan Dowse int anonport, error; 545df8bae1dSRodney W. Grimes 54627f74fd0SRobert Watson INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 5478501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 54827f74fd0SRobert Watson 5495200e00eSIan Dowse lport = inp->inp_lport; 5505200e00eSIan Dowse laddr = inp->inp_laddr.s_addr; 5515200e00eSIan Dowse anonport = (lport == 0); 5525200e00eSIan Dowse error = in_pcbconnect_setup(inp, nam, &laddr, &lport, &faddr, &fport, 553b0330ed9SPawel Jakub Dawidek NULL, cred); 5545200e00eSIan Dowse if (error) 5555200e00eSIan Dowse return (error); 5565200e00eSIan Dowse 5575200e00eSIan Dowse /* Do the initial binding of the local address if required. */ 5585200e00eSIan Dowse if (inp->inp_laddr.s_addr == INADDR_ANY && inp->inp_lport == 0) { 5595200e00eSIan Dowse inp->inp_lport = lport; 5605200e00eSIan Dowse inp->inp_laddr.s_addr = laddr; 5615200e00eSIan Dowse if (in_pcbinshash(inp) != 0) { 5625200e00eSIan Dowse inp->inp_laddr.s_addr = INADDR_ANY; 5635200e00eSIan Dowse inp->inp_lport = 0; 5645200e00eSIan Dowse return (EAGAIN); 5655200e00eSIan Dowse } 5665200e00eSIan Dowse } 5675200e00eSIan Dowse 5685200e00eSIan Dowse /* Commit the remaining changes. */ 5695200e00eSIan Dowse inp->inp_lport = lport; 5705200e00eSIan Dowse inp->inp_laddr.s_addr = laddr; 5715200e00eSIan Dowse inp->inp_faddr.s_addr = faddr; 5725200e00eSIan Dowse inp->inp_fport = fport; 5735200e00eSIan Dowse in_pcbrehash(inp); 5742cb64cb2SGeorge V. Neville-Neil 5755200e00eSIan Dowse if (anonport) 5765200e00eSIan Dowse inp->inp_flags |= INP_ANONPORT; 5775200e00eSIan Dowse return (0); 5785200e00eSIan Dowse } 5795200e00eSIan Dowse 5805200e00eSIan Dowse /* 5810895aec3SBjoern A. Zeeb * Do proper source address selection on an unbound socket in case 5820895aec3SBjoern A. Zeeb * of connect. Take jails into account as well. 5830895aec3SBjoern A. Zeeb */ 5840895aec3SBjoern A. Zeeb static int 5850895aec3SBjoern A. Zeeb in_pcbladdr(struct inpcb *inp, struct in_addr *faddr, struct in_addr *laddr, 5860895aec3SBjoern A. Zeeb struct ucred *cred) 5870895aec3SBjoern A. Zeeb { 5880895aec3SBjoern A. Zeeb struct ifaddr *ifa; 5890895aec3SBjoern A. Zeeb struct sockaddr *sa; 5900895aec3SBjoern A. Zeeb struct sockaddr_in *sin; 5910895aec3SBjoern A. Zeeb struct route sro; 5920895aec3SBjoern A. Zeeb int error; 5930895aec3SBjoern A. Zeeb 594413628a7SBjoern A. Zeeb KASSERT(laddr != NULL, ("%s: laddr NULL", __func__)); 5950895aec3SBjoern A. Zeeb 596592bcae8SBjoern A. Zeeb /* 597592bcae8SBjoern A. Zeeb * Bypass source address selection and use the primary jail IP 598592bcae8SBjoern A. Zeeb * if requested. 599592bcae8SBjoern A. Zeeb */ 600592bcae8SBjoern A. Zeeb if (cred != NULL && !prison_saddrsel_ip4(cred, laddr)) 601592bcae8SBjoern A. Zeeb return (0); 602592bcae8SBjoern A. Zeeb 6030895aec3SBjoern A. Zeeb error = 0; 6040895aec3SBjoern A. Zeeb bzero(&sro, sizeof(sro)); 6050895aec3SBjoern A. Zeeb 6060895aec3SBjoern A. Zeeb sin = (struct sockaddr_in *)&sro.ro_dst; 6070895aec3SBjoern A. Zeeb sin->sin_family = AF_INET; 6080895aec3SBjoern A. Zeeb sin->sin_len = sizeof(struct sockaddr_in); 6090895aec3SBjoern A. Zeeb sin->sin_addr.s_addr = faddr->s_addr; 6100895aec3SBjoern A. Zeeb 6110895aec3SBjoern A. Zeeb /* 6120895aec3SBjoern A. Zeeb * If route is known our src addr is taken from the i/f, 6130895aec3SBjoern A. Zeeb * else punt. 6140895aec3SBjoern A. Zeeb * 6150895aec3SBjoern A. Zeeb * Find out route to destination. 6160895aec3SBjoern A. Zeeb */ 6170895aec3SBjoern A. Zeeb if ((inp->inp_socket->so_options & SO_DONTROUTE) == 0) 6186e6b3f7cSQing Li in_rtalloc_ign(&sro, 0, inp->inp_inc.inc_fibnum); 6190895aec3SBjoern A. Zeeb 6200895aec3SBjoern A. Zeeb /* 6210895aec3SBjoern A. Zeeb * If we found a route, use the address corresponding to 6220895aec3SBjoern A. Zeeb * the outgoing interface. 6230895aec3SBjoern A. Zeeb * 6240895aec3SBjoern A. Zeeb * Otherwise assume faddr is reachable on a directly connected 6250895aec3SBjoern A. Zeeb * network and try to find a corresponding interface to take 6260895aec3SBjoern A. Zeeb * the source address from. 6270895aec3SBjoern A. Zeeb */ 6280895aec3SBjoern A. Zeeb if (sro.ro_rt == NULL || sro.ro_rt->rt_ifp == NULL) { 6298c0fec80SRobert Watson struct in_ifaddr *ia; 6300895aec3SBjoern A. Zeeb struct ifnet *ifp; 6310895aec3SBjoern A. Zeeb 6320895aec3SBjoern A. Zeeb ia = ifatoia(ifa_ifwithdstaddr((struct sockaddr *)sin)); 6330895aec3SBjoern A. Zeeb if (ia == NULL) 6340895aec3SBjoern A. Zeeb ia = ifatoia(ifa_ifwithnet((struct sockaddr *)sin)); 6350895aec3SBjoern A. Zeeb if (ia == NULL) { 6360895aec3SBjoern A. Zeeb error = ENETUNREACH; 6370895aec3SBjoern A. Zeeb goto done; 6380895aec3SBjoern A. Zeeb } 6390895aec3SBjoern A. Zeeb 6400304c731SJamie Gritton if (cred == NULL || !prison_flag(cred, PR_IP4)) { 6410895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 6428c0fec80SRobert Watson ifa_free(&ia->ia_ifa); 6430895aec3SBjoern A. Zeeb goto done; 6440895aec3SBjoern A. Zeeb } 6450895aec3SBjoern A. Zeeb 6460895aec3SBjoern A. Zeeb ifp = ia->ia_ifp; 6478c0fec80SRobert Watson ifa_free(&ia->ia_ifa); 6480895aec3SBjoern A. Zeeb ia = NULL; 6499317b04eSRobert Watson IF_ADDR_LOCK(ifp); 6500895aec3SBjoern A. Zeeb TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 6510895aec3SBjoern A. Zeeb 6520895aec3SBjoern A. Zeeb sa = ifa->ifa_addr; 6530895aec3SBjoern A. Zeeb if (sa->sa_family != AF_INET) 6540895aec3SBjoern A. Zeeb continue; 6550895aec3SBjoern A. Zeeb sin = (struct sockaddr_in *)sa; 656b89e82ddSJamie Gritton if (prison_check_ip4(cred, &sin->sin_addr) == 0) { 6570895aec3SBjoern A. Zeeb ia = (struct in_ifaddr *)ifa; 6580895aec3SBjoern A. Zeeb break; 6590895aec3SBjoern A. Zeeb } 6600895aec3SBjoern A. Zeeb } 6610895aec3SBjoern A. Zeeb if (ia != NULL) { 6620895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 6639317b04eSRobert Watson IF_ADDR_UNLOCK(ifp); 6640895aec3SBjoern A. Zeeb goto done; 6650895aec3SBjoern A. Zeeb } 6669317b04eSRobert Watson IF_ADDR_UNLOCK(ifp); 6670895aec3SBjoern A. Zeeb 6680895aec3SBjoern A. Zeeb /* 3. As a last resort return the 'default' jail address. */ 669b89e82ddSJamie Gritton error = prison_get_ip4(cred, laddr); 6700895aec3SBjoern A. Zeeb goto done; 6710895aec3SBjoern A. Zeeb } 6720895aec3SBjoern A. Zeeb 6730895aec3SBjoern A. Zeeb /* 6740895aec3SBjoern A. Zeeb * If the outgoing interface on the route found is not 6750895aec3SBjoern A. Zeeb * a loopback interface, use the address from that interface. 6760895aec3SBjoern A. Zeeb * In case of jails do those three steps: 6770895aec3SBjoern A. Zeeb * 1. check if the interface address belongs to the jail. If so use it. 6780895aec3SBjoern A. Zeeb * 2. check if we have any address on the outgoing interface 6790895aec3SBjoern A. Zeeb * belonging to this jail. If so use it. 6800895aec3SBjoern A. Zeeb * 3. as a last resort return the 'default' jail address. 6810895aec3SBjoern A. Zeeb */ 6820895aec3SBjoern A. Zeeb if ((sro.ro_rt->rt_ifp->if_flags & IFF_LOOPBACK) == 0) { 6838c0fec80SRobert Watson struct in_ifaddr *ia; 6849317b04eSRobert Watson struct ifnet *ifp; 6850895aec3SBjoern A. Zeeb 6860895aec3SBjoern A. Zeeb /* If not jailed, use the default returned. */ 6870304c731SJamie Gritton if (cred == NULL || !prison_flag(cred, PR_IP4)) { 6880895aec3SBjoern A. Zeeb ia = (struct in_ifaddr *)sro.ro_rt->rt_ifa; 6890895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 6900895aec3SBjoern A. Zeeb goto done; 6910895aec3SBjoern A. Zeeb } 6920895aec3SBjoern A. Zeeb 6930895aec3SBjoern A. Zeeb /* Jailed. */ 6940895aec3SBjoern A. Zeeb /* 1. Check if the iface address belongs to the jail. */ 6950895aec3SBjoern A. Zeeb sin = (struct sockaddr_in *)sro.ro_rt->rt_ifa->ifa_addr; 696b89e82ddSJamie Gritton if (prison_check_ip4(cred, &sin->sin_addr) == 0) { 6970895aec3SBjoern A. Zeeb ia = (struct in_ifaddr *)sro.ro_rt->rt_ifa; 6980895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 6990895aec3SBjoern A. Zeeb goto done; 7000895aec3SBjoern A. Zeeb } 7010895aec3SBjoern A. Zeeb 7020895aec3SBjoern A. Zeeb /* 7030895aec3SBjoern A. Zeeb * 2. Check if we have any address on the outgoing interface 7040895aec3SBjoern A. Zeeb * belonging to this jail. 7050895aec3SBjoern A. Zeeb */ 7068c0fec80SRobert Watson ia = NULL; 7079317b04eSRobert Watson ifp = sro.ro_rt->rt_ifp; 7089317b04eSRobert Watson IF_ADDR_LOCK(ifp); 7099317b04eSRobert Watson TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 7100895aec3SBjoern A. Zeeb sa = ifa->ifa_addr; 7110895aec3SBjoern A. Zeeb if (sa->sa_family != AF_INET) 7120895aec3SBjoern A. Zeeb continue; 7130895aec3SBjoern A. Zeeb sin = (struct sockaddr_in *)sa; 714b89e82ddSJamie Gritton if (prison_check_ip4(cred, &sin->sin_addr) == 0) { 7150895aec3SBjoern A. Zeeb ia = (struct in_ifaddr *)ifa; 7160895aec3SBjoern A. Zeeb break; 7170895aec3SBjoern A. Zeeb } 7180895aec3SBjoern A. Zeeb } 7190895aec3SBjoern A. Zeeb if (ia != NULL) { 7200895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 7219317b04eSRobert Watson IF_ADDR_UNLOCK(ifp); 7220895aec3SBjoern A. Zeeb goto done; 7230895aec3SBjoern A. Zeeb } 7249317b04eSRobert Watson IF_ADDR_UNLOCK(ifp); 7250895aec3SBjoern A. Zeeb 7260895aec3SBjoern A. Zeeb /* 3. As a last resort return the 'default' jail address. */ 727b89e82ddSJamie Gritton error = prison_get_ip4(cred, laddr); 7280895aec3SBjoern A. Zeeb goto done; 7290895aec3SBjoern A. Zeeb } 7300895aec3SBjoern A. Zeeb 7310895aec3SBjoern A. Zeeb /* 7320895aec3SBjoern A. Zeeb * The outgoing interface is marked with 'loopback net', so a route 7330895aec3SBjoern A. Zeeb * to ourselves is here. 7340895aec3SBjoern A. Zeeb * Try to find the interface of the destination address and then 7350895aec3SBjoern A. Zeeb * take the address from there. That interface is not necessarily 7360895aec3SBjoern A. Zeeb * a loopback interface. 7370895aec3SBjoern A. Zeeb * In case of jails, check that it is an address of the jail 7380895aec3SBjoern A. Zeeb * and if we cannot find, fall back to the 'default' jail address. 7390895aec3SBjoern A. Zeeb */ 7400895aec3SBjoern A. Zeeb if ((sro.ro_rt->rt_ifp->if_flags & IFF_LOOPBACK) != 0) { 7410895aec3SBjoern A. Zeeb struct sockaddr_in sain; 7428c0fec80SRobert Watson struct in_ifaddr *ia; 7430895aec3SBjoern A. Zeeb 7440895aec3SBjoern A. Zeeb bzero(&sain, sizeof(struct sockaddr_in)); 7450895aec3SBjoern A. Zeeb sain.sin_family = AF_INET; 7460895aec3SBjoern A. Zeeb sain.sin_len = sizeof(struct sockaddr_in); 7470895aec3SBjoern A. Zeeb sain.sin_addr.s_addr = faddr->s_addr; 7480895aec3SBjoern A. Zeeb 7490895aec3SBjoern A. Zeeb ia = ifatoia(ifa_ifwithdstaddr(sintosa(&sain))); 7500895aec3SBjoern A. Zeeb if (ia == NULL) 7510895aec3SBjoern A. Zeeb ia = ifatoia(ifa_ifwithnet(sintosa(&sain))); 752f0bb05fcSQing Li if (ia == NULL) 753f0bb05fcSQing Li ia = ifatoia(ifa_ifwithaddr(sintosa(&sain))); 7540895aec3SBjoern A. Zeeb 7550304c731SJamie Gritton if (cred == NULL || !prison_flag(cred, PR_IP4)) { 7560895aec3SBjoern A. Zeeb if (ia == NULL) { 7570895aec3SBjoern A. Zeeb error = ENETUNREACH; 7580895aec3SBjoern A. Zeeb goto done; 7590895aec3SBjoern A. Zeeb } 7600895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 7618c0fec80SRobert Watson ifa_free(&ia->ia_ifa); 7620895aec3SBjoern A. Zeeb goto done; 7630895aec3SBjoern A. Zeeb } 7640895aec3SBjoern A. Zeeb 7650895aec3SBjoern A. Zeeb /* Jailed. */ 7660895aec3SBjoern A. Zeeb if (ia != NULL) { 7670895aec3SBjoern A. Zeeb struct ifnet *ifp; 7680895aec3SBjoern A. Zeeb 7690895aec3SBjoern A. Zeeb ifp = ia->ia_ifp; 7708c0fec80SRobert Watson ifa_free(&ia->ia_ifa); 7710895aec3SBjoern A. Zeeb ia = NULL; 7729317b04eSRobert Watson IF_ADDR_LOCK(ifp); 7730895aec3SBjoern A. Zeeb TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) { 7740895aec3SBjoern A. Zeeb 7750895aec3SBjoern A. Zeeb sa = ifa->ifa_addr; 7760895aec3SBjoern A. Zeeb if (sa->sa_family != AF_INET) 7770895aec3SBjoern A. Zeeb continue; 7780895aec3SBjoern A. Zeeb sin = (struct sockaddr_in *)sa; 779b89e82ddSJamie Gritton if (prison_check_ip4(cred, 780b89e82ddSJamie Gritton &sin->sin_addr) == 0) { 7810895aec3SBjoern A. Zeeb ia = (struct in_ifaddr *)ifa; 7820895aec3SBjoern A. Zeeb break; 7830895aec3SBjoern A. Zeeb } 7840895aec3SBjoern A. Zeeb } 7850895aec3SBjoern A. Zeeb if (ia != NULL) { 7860895aec3SBjoern A. Zeeb laddr->s_addr = ia->ia_addr.sin_addr.s_addr; 7879317b04eSRobert Watson IF_ADDR_UNLOCK(ifp); 7880895aec3SBjoern A. Zeeb goto done; 7890895aec3SBjoern A. Zeeb } 7909317b04eSRobert Watson IF_ADDR_UNLOCK(ifp); 7910895aec3SBjoern A. Zeeb } 7920895aec3SBjoern A. Zeeb 7930895aec3SBjoern A. Zeeb /* 3. As a last resort return the 'default' jail address. */ 794b89e82ddSJamie Gritton error = prison_get_ip4(cred, laddr); 7950895aec3SBjoern A. Zeeb goto done; 7960895aec3SBjoern A. Zeeb } 7970895aec3SBjoern A. Zeeb 7980895aec3SBjoern A. Zeeb done: 7990895aec3SBjoern A. Zeeb if (sro.ro_rt != NULL) 8000895aec3SBjoern A. Zeeb RTFREE(sro.ro_rt); 8010895aec3SBjoern A. Zeeb return (error); 8020895aec3SBjoern A. Zeeb } 8030895aec3SBjoern A. Zeeb 8040895aec3SBjoern A. Zeeb /* 8055200e00eSIan Dowse * Set up for a connect from a socket to the specified address. 8065200e00eSIan Dowse * On entry, *laddrp and *lportp should contain the current local 8075200e00eSIan Dowse * address and port for the PCB; these are updated to the values 8085200e00eSIan Dowse * that should be placed in inp_laddr and inp_lport to complete 8095200e00eSIan Dowse * the connect. 8105200e00eSIan Dowse * 8115200e00eSIan Dowse * On success, *faddrp and *fportp will be set to the remote address 8125200e00eSIan Dowse * and port. These are not updated in the error case. 8135200e00eSIan Dowse * 8145200e00eSIan Dowse * If the operation fails because the connection already exists, 8155200e00eSIan Dowse * *oinpp will be set to the PCB of that connection so that the 8165200e00eSIan Dowse * caller can decide to override it. In all other cases, *oinpp 8175200e00eSIan Dowse * is set to NULL. 8185200e00eSIan Dowse */ 8195200e00eSIan Dowse int 820136d4f1cSRobert Watson in_pcbconnect_setup(struct inpcb *inp, struct sockaddr *nam, 821136d4f1cSRobert Watson in_addr_t *laddrp, u_short *lportp, in_addr_t *faddrp, u_short *fportp, 822136d4f1cSRobert Watson struct inpcb **oinpp, struct ucred *cred) 8235200e00eSIan Dowse { 8245200e00eSIan Dowse struct sockaddr_in *sin = (struct sockaddr_in *)nam; 8255200e00eSIan Dowse struct in_ifaddr *ia; 8265200e00eSIan Dowse struct inpcb *oinp; 827b89e82ddSJamie Gritton struct in_addr laddr, faddr; 8285200e00eSIan Dowse u_short lport, fport; 8295200e00eSIan Dowse int error; 8305200e00eSIan Dowse 8318501a69cSRobert Watson /* 8328501a69cSRobert Watson * Because a global state change doesn't actually occur here, a read 8338501a69cSRobert Watson * lock is sufficient. 8348501a69cSRobert Watson */ 8358501a69cSRobert Watson INP_INFO_LOCK_ASSERT(inp->inp_pcbinfo); 83627f74fd0SRobert Watson INP_LOCK_ASSERT(inp); 83727f74fd0SRobert Watson 8385200e00eSIan Dowse if (oinpp != NULL) 8395200e00eSIan Dowse *oinpp = NULL; 84057bf258eSGarrett Wollman if (nam->sa_len != sizeof (*sin)) 841df8bae1dSRodney W. Grimes return (EINVAL); 842df8bae1dSRodney W. Grimes if (sin->sin_family != AF_INET) 843df8bae1dSRodney W. Grimes return (EAFNOSUPPORT); 844df8bae1dSRodney W. Grimes if (sin->sin_port == 0) 845df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 8465200e00eSIan Dowse laddr.s_addr = *laddrp; 8475200e00eSIan Dowse lport = *lportp; 8485200e00eSIan Dowse faddr = sin->sin_addr; 8495200e00eSIan Dowse fport = sin->sin_port; 8500895aec3SBjoern A. Zeeb 851603724d3SBjoern A. Zeeb if (!TAILQ_EMPTY(&V_in_ifaddrhead)) { 852df8bae1dSRodney W. Grimes /* 853df8bae1dSRodney W. Grimes * If the destination address is INADDR_ANY, 854df8bae1dSRodney W. Grimes * use the primary local address. 855df8bae1dSRodney W. Grimes * If the supplied address is INADDR_BROADCAST, 856df8bae1dSRodney W. Grimes * and the primary interface supports broadcast, 857df8bae1dSRodney W. Grimes * choose the broadcast address for that interface. 858df8bae1dSRodney W. Grimes */ 859413628a7SBjoern A. Zeeb if (faddr.s_addr == INADDR_ANY) { 8602d9cfabaSRobert Watson IN_IFADDR_RLOCK(); 861413628a7SBjoern A. Zeeb faddr = 862b89e82ddSJamie Gritton IA_SIN(TAILQ_FIRST(&V_in_ifaddrhead))->sin_addr; 8632d9cfabaSRobert Watson IN_IFADDR_RUNLOCK(); 864b89e82ddSJamie Gritton if (cred != NULL && 865b89e82ddSJamie Gritton (error = prison_get_ip4(cred, &faddr)) != 0) 866b89e82ddSJamie Gritton return (error); 8672d9cfabaSRobert Watson } else if (faddr.s_addr == (u_long)INADDR_BROADCAST) { 8682d9cfabaSRobert Watson IN_IFADDR_RLOCK(); 8692d9cfabaSRobert Watson if (TAILQ_FIRST(&V_in_ifaddrhead)->ia_ifp->if_flags & 8702d9cfabaSRobert Watson IFF_BROADCAST) 8715200e00eSIan Dowse faddr = satosin(&TAILQ_FIRST( 872603724d3SBjoern A. Zeeb &V_in_ifaddrhead)->ia_broadaddr)->sin_addr; 8732d9cfabaSRobert Watson IN_IFADDR_RUNLOCK(); 8742d9cfabaSRobert Watson } 875df8bae1dSRodney W. Grimes } 8765200e00eSIan Dowse if (laddr.s_addr == INADDR_ANY) { 8770895aec3SBjoern A. Zeeb error = in_pcbladdr(inp, &faddr, &laddr, cred); 8780895aec3SBjoern A. Zeeb if (error) 8790895aec3SBjoern A. Zeeb return (error); 880df8bae1dSRodney W. Grimes 881df8bae1dSRodney W. Grimes /* 882df8bae1dSRodney W. Grimes * If the destination address is multicast and an outgoing 883df8bae1dSRodney W. Grimes * interface has been set as a multicast option, use the 884df8bae1dSRodney W. Grimes * address of that interface as our source address. 885df8bae1dSRodney W. Grimes */ 8865200e00eSIan Dowse if (IN_MULTICAST(ntohl(faddr.s_addr)) && 887df8bae1dSRodney W. Grimes inp->inp_moptions != NULL) { 888df8bae1dSRodney W. Grimes struct ip_moptions *imo; 889df8bae1dSRodney W. Grimes struct ifnet *ifp; 890df8bae1dSRodney W. Grimes 891df8bae1dSRodney W. Grimes imo = inp->inp_moptions; 892df8bae1dSRodney W. Grimes if (imo->imo_multicast_ifp != NULL) { 893df8bae1dSRodney W. Grimes ifp = imo->imo_multicast_ifp; 8942d9cfabaSRobert Watson IN_IFADDR_RLOCK(); 895603724d3SBjoern A. Zeeb TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) 896df8bae1dSRodney W. Grimes if (ia->ia_ifp == ifp) 897df8bae1dSRodney W. Grimes break; 8982d9cfabaSRobert Watson if (ia == NULL) { 8992d9cfabaSRobert Watson IN_IFADDR_RUNLOCK(); 900df8bae1dSRodney W. Grimes return (EADDRNOTAVAIL); 9012d9cfabaSRobert Watson } 9025200e00eSIan Dowse laddr = ia->ia_addr.sin_addr; 9032d9cfabaSRobert Watson IN_IFADDR_RUNLOCK(); 904999f1343SGarrett Wollman } 9050895aec3SBjoern A. Zeeb } 9060895aec3SBjoern A. Zeeb } 907999f1343SGarrett Wollman 9085200e00eSIan Dowse oinp = in_pcblookup_hash(inp->inp_pcbinfo, faddr, fport, laddr, lport, 9095200e00eSIan Dowse 0, NULL); 9105200e00eSIan Dowse if (oinp != NULL) { 9115200e00eSIan Dowse if (oinpp != NULL) 9125200e00eSIan Dowse *oinpp = oinp; 913df8bae1dSRodney W. Grimes return (EADDRINUSE); 914c3229e05SDavid Greenman } 9155200e00eSIan Dowse if (lport == 0) { 916b0330ed9SPawel Jakub Dawidek error = in_pcbbind_setup(inp, NULL, &laddr.s_addr, &lport, 917b0330ed9SPawel Jakub Dawidek cred); 9185a903f8dSPierre Beyssac if (error) 9195a903f8dSPierre Beyssac return (error); 9205a903f8dSPierre Beyssac } 9215200e00eSIan Dowse *laddrp = laddr.s_addr; 9225200e00eSIan Dowse *lportp = lport; 9235200e00eSIan Dowse *faddrp = faddr.s_addr; 9245200e00eSIan Dowse *fportp = fport; 925df8bae1dSRodney W. Grimes return (0); 926df8bae1dSRodney W. Grimes } 927df8bae1dSRodney W. Grimes 92826f9a767SRodney W. Grimes void 929136d4f1cSRobert Watson in_pcbdisconnect(struct inpcb *inp) 930df8bae1dSRodney W. Grimes { 9316b348152SRobert Watson 932fe6bfc37SRobert Watson INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 9338501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 934df8bae1dSRodney W. Grimes 935df8bae1dSRodney W. Grimes inp->inp_faddr.s_addr = INADDR_ANY; 936df8bae1dSRodney W. Grimes inp->inp_fport = 0; 93715bd2b43SDavid Greenman in_pcbrehash(inp); 938df8bae1dSRodney W. Grimes } 939df8bae1dSRodney W. Grimes 9404c7c478dSRobert Watson /* 94128696211SRobert Watson * in_pcbdetach() is responsibe for disassociating a socket from an inpcb. 942c0a211c5SRobert Watson * For most protocols, this will be invoked immediately prior to calling 94328696211SRobert Watson * in_pcbfree(). However, with TCP the inpcb may significantly outlive the 94428696211SRobert Watson * socket, in which case in_pcbfree() is deferred. 9454c7c478dSRobert Watson */ 94626f9a767SRodney W. Grimes void 947136d4f1cSRobert Watson in_pcbdetach(struct inpcb *inp) 948df8bae1dSRodney W. Grimes { 9494c7c478dSRobert Watson 950a7df09e8SBjoern A. Zeeb KASSERT(inp->inp_socket != NULL, ("%s: inp_socket == NULL", __func__)); 951c0a211c5SRobert Watson 9524c7c478dSRobert Watson inp->inp_socket->so_pcb = NULL; 9534c7c478dSRobert Watson inp->inp_socket = NULL; 9544c7c478dSRobert Watson } 9554c7c478dSRobert Watson 956c0a211c5SRobert Watson /* 95728696211SRobert Watson * in_pcbfree_internal() frees an inpcb that has been detached from its 95828696211SRobert Watson * socket, and whose reference count has reached 0. It will also remove the 95928696211SRobert Watson * inpcb from any global lists it might remain on. 960c0a211c5SRobert Watson */ 96128696211SRobert Watson static void 96228696211SRobert Watson in_pcbfree_internal(struct inpcb *inp) 9634c7c478dSRobert Watson { 9643d4d47f3SGarrett Wollman struct inpcbinfo *ipi = inp->inp_pcbinfo; 965df8bae1dSRodney W. Grimes 966a7df09e8SBjoern A. Zeeb KASSERT(inp->inp_socket == NULL, ("%s: inp_socket != NULL", __func__)); 96728696211SRobert Watson KASSERT(inp->inp_refcount == 0, ("%s: refcount !0", __func__)); 9688501a69cSRobert Watson 969fe6bfc37SRobert Watson INP_INFO_WLOCK_ASSERT(ipi); 9708501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 97159daba27SSam Leffler 972b2630c29SGeorge V. Neville-Neil #ifdef IPSEC 9736aee2fc5SBjoern A. Zeeb if (inp->inp_sp != NULL) 9746974bd9eSBjoern A. Zeeb ipsec_delete_pcbpolicy(inp); 975b2630c29SGeorge V. Neville-Neil #endif /* IPSEC */ 9763d4d47f3SGarrett Wollman inp->inp_gencnt = ++ipi->ipi_gencnt; 977c3229e05SDavid Greenman in_pcbremlists(inp); 9786aee2fc5SBjoern A. Zeeb #ifdef INET6 9796aee2fc5SBjoern A. Zeeb if (inp->inp_vflag & INP_IPV6PROTO) { 9806aee2fc5SBjoern A. Zeeb ip6_freepcbopts(inp->in6p_outputopts); 9811096332aSBruce M Simpson if (inp->in6p_moptions != NULL) 9826aee2fc5SBjoern A. Zeeb ip6_freemoptions(inp->in6p_moptions); 9836aee2fc5SBjoern A. Zeeb } 9846aee2fc5SBjoern A. Zeeb #endif 985df8bae1dSRodney W. Grimes if (inp->inp_options) 986df8bae1dSRodney W. Grimes (void)m_free(inp->inp_options); 98771498f30SBruce M Simpson if (inp->inp_moptions != NULL) 98871498f30SBruce M Simpson inp_freemoptions(inp->inp_moptions); 989cfa1ca9dSYoshinobu Inoue inp->inp_vflag = 0; 99086d02c5cSBjoern A. Zeeb crfree(inp->inp_cred); 991d915b280SStephan Uphoff 992a557af22SRobert Watson #ifdef MAC 99330d239bcSRobert Watson mac_inpcb_destroy(inp); 994a557af22SRobert Watson #endif 9958501a69cSRobert Watson INP_WUNLOCK(inp); 99669c2d429SJeff Roberson uma_zfree(ipi->ipi_zone, inp); 997df8bae1dSRodney W. Grimes } 998df8bae1dSRodney W. Grimes 99910702a28SRobert Watson /* 100028696211SRobert Watson * in_pcbref() bumps the reference count on an inpcb in order to maintain 100128696211SRobert Watson * stability of an inpcb pointer despite the inpcb lock being released. This 100228696211SRobert Watson * is used in TCP when the inpcbinfo lock needs to be acquired or upgraded, 100328696211SRobert Watson * but where the inpcb lock is already held. 100428696211SRobert Watson * 100528696211SRobert Watson * While the inpcb will not be freed, releasing the inpcb lock means that the 100628696211SRobert Watson * connection's state may change, so the caller should be careful to 100728696211SRobert Watson * revalidate any cached state on reacquiring the lock. Drop the reference 100828696211SRobert Watson * using in_pcbrele(). 100928696211SRobert Watson */ 101028696211SRobert Watson void 101128696211SRobert Watson in_pcbref(struct inpcb *inp) 101228696211SRobert Watson { 101328696211SRobert Watson 101428696211SRobert Watson INP_WLOCK_ASSERT(inp); 101528696211SRobert Watson 101628696211SRobert Watson KASSERT(inp->inp_refcount > 0, ("%s: refcount 0", __func__)); 101728696211SRobert Watson 101828696211SRobert Watson inp->inp_refcount++; 101928696211SRobert Watson } 102028696211SRobert Watson 102128696211SRobert Watson /* 102228696211SRobert Watson * Drop a refcount on an inpcb elevated using in_pcbref(); because a call to 102328696211SRobert Watson * in_pcbfree() may have been made between in_pcbref() and in_pcbrele(), we 102428696211SRobert Watson * return a flag indicating whether or not the inpcb remains valid. If it is 102528696211SRobert Watson * valid, we return with the inpcb lock held. 102628696211SRobert Watson */ 102728696211SRobert Watson int 102828696211SRobert Watson in_pcbrele(struct inpcb *inp) 102928696211SRobert Watson { 103028696211SRobert Watson #ifdef INVARIANTS 103128696211SRobert Watson struct inpcbinfo *ipi = inp->inp_pcbinfo; 103228696211SRobert Watson #endif 103328696211SRobert Watson 103428696211SRobert Watson KASSERT(inp->inp_refcount > 0, ("%s: refcount 0", __func__)); 103528696211SRobert Watson 103628696211SRobert Watson INP_INFO_WLOCK_ASSERT(ipi); 103728696211SRobert Watson INP_WLOCK_ASSERT(inp); 103828696211SRobert Watson 103928696211SRobert Watson inp->inp_refcount--; 104028696211SRobert Watson if (inp->inp_refcount > 0) 104128696211SRobert Watson return (0); 104228696211SRobert Watson in_pcbfree_internal(inp); 104328696211SRobert Watson return (1); 104428696211SRobert Watson } 104528696211SRobert Watson 104628696211SRobert Watson /* 104728696211SRobert Watson * Unconditionally schedule an inpcb to be freed by decrementing its 104828696211SRobert Watson * reference count, which should occur only after the inpcb has been detached 104928696211SRobert Watson * from its socket. If another thread holds a temporary reference (acquired 105028696211SRobert Watson * using in_pcbref()) then the free is deferred until that reference is 105128696211SRobert Watson * released using in_pcbrele(), but the inpcb is still unlocked. 105228696211SRobert Watson */ 105328696211SRobert Watson void 105428696211SRobert Watson in_pcbfree(struct inpcb *inp) 105528696211SRobert Watson { 105628696211SRobert Watson #ifdef INVARIANTS 105728696211SRobert Watson struct inpcbinfo *ipi = inp->inp_pcbinfo; 105828696211SRobert Watson #endif 105928696211SRobert Watson 106028696211SRobert Watson KASSERT(inp->inp_socket == NULL, ("%s: inp_socket != NULL", 106128696211SRobert Watson __func__)); 106228696211SRobert Watson 106328696211SRobert Watson INP_INFO_WLOCK_ASSERT(ipi); 106428696211SRobert Watson INP_WLOCK_ASSERT(inp); 106528696211SRobert Watson 106628696211SRobert Watson if (!in_pcbrele(inp)) 106728696211SRobert Watson INP_WUNLOCK(inp); 106828696211SRobert Watson } 106928696211SRobert Watson 107028696211SRobert Watson /* 1071c0a211c5SRobert Watson * in_pcbdrop() removes an inpcb from hashed lists, releasing its address and 1072c0a211c5SRobert Watson * port reservation, and preventing it from being returned by inpcb lookups. 1073c0a211c5SRobert Watson * 1074c0a211c5SRobert Watson * It is used by TCP to mark an inpcb as unused and avoid future packet 1075c0a211c5SRobert Watson * delivery or event notification when a socket remains open but TCP has 1076c0a211c5SRobert Watson * closed. This might occur as a result of a shutdown()-initiated TCP close 1077c0a211c5SRobert Watson * or a RST on the wire, and allows the port binding to be reused while still 1078c0a211c5SRobert Watson * maintaining the invariant that so_pcb always points to a valid inpcb until 1079c0a211c5SRobert Watson * in_pcbdetach(). 1080c0a211c5SRobert Watson * 1081c0a211c5SRobert Watson * XXXRW: An inp_lport of 0 is used to indicate that the inpcb is not on hash 1082c0a211c5SRobert Watson * lists, but can lead to confusing netstat output, as open sockets with 1083c0a211c5SRobert Watson * closed TCP connections will no longer appear to have their bound port 1084c0a211c5SRobert Watson * number. An explicit flag would be better, as it would allow us to leave 1085c0a211c5SRobert Watson * the port number intact after the connection is dropped. 1086c0a211c5SRobert Watson * 1087c0a211c5SRobert Watson * XXXRW: Possibly in_pcbdrop() should also prevent future notifications by 1088c0a211c5SRobert Watson * in_pcbnotifyall() and in_pcbpurgeif0()? 108910702a28SRobert Watson */ 109010702a28SRobert Watson void 109110702a28SRobert Watson in_pcbdrop(struct inpcb *inp) 109210702a28SRobert Watson { 109310702a28SRobert Watson 10947c5a8ab2SMarcel Moolenaar INP_INFO_WLOCK_ASSERT(inp->inp_pcbinfo); 10958501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 109610702a28SRobert Watson 1097ad71fe3cSRobert Watson inp->inp_flags |= INP_DROPPED; 1098111d57a6SRobert Watson if (inp->inp_flags & INP_INHASHLIST) { 109910702a28SRobert Watson struct inpcbport *phd = inp->inp_phd; 110010702a28SRobert Watson 110110702a28SRobert Watson LIST_REMOVE(inp, inp_hash); 110210702a28SRobert Watson LIST_REMOVE(inp, inp_portlist); 110310702a28SRobert Watson if (LIST_FIRST(&phd->phd_pcblist) == NULL) { 110410702a28SRobert Watson LIST_REMOVE(phd, phd_hash); 110510702a28SRobert Watson free(phd, M_PCB); 110610702a28SRobert Watson } 1107111d57a6SRobert Watson inp->inp_flags &= ~INP_INHASHLIST; 110810702a28SRobert Watson } 110910702a28SRobert Watson } 111010702a28SRobert Watson 111154d642bbSRobert Watson /* 111254d642bbSRobert Watson * Common routines to return the socket addresses associated with inpcbs. 111354d642bbSRobert Watson */ 111426ef6ac4SDon Lewis struct sockaddr * 1115136d4f1cSRobert Watson in_sockaddr(in_port_t port, struct in_addr *addr_p) 111626ef6ac4SDon Lewis { 111726ef6ac4SDon Lewis struct sockaddr_in *sin; 111826ef6ac4SDon Lewis 11191ede983cSDag-Erling Smørgrav sin = malloc(sizeof *sin, M_SONAME, 1120a163d034SWarner Losh M_WAITOK | M_ZERO); 112126ef6ac4SDon Lewis sin->sin_family = AF_INET; 112226ef6ac4SDon Lewis sin->sin_len = sizeof(*sin); 112326ef6ac4SDon Lewis sin->sin_addr = *addr_p; 112426ef6ac4SDon Lewis sin->sin_port = port; 112526ef6ac4SDon Lewis 112626ef6ac4SDon Lewis return (struct sockaddr *)sin; 112726ef6ac4SDon Lewis } 112826ef6ac4SDon Lewis 1129117bcae7SGarrett Wollman int 113054d642bbSRobert Watson in_getsockaddr(struct socket *so, struct sockaddr **nam) 1131df8bae1dSRodney W. Grimes { 1132136d4f1cSRobert Watson struct inpcb *inp; 113326ef6ac4SDon Lewis struct in_addr addr; 113426ef6ac4SDon Lewis in_port_t port; 113542fa505bSDavid Greenman 1136fdc984f7STor Egge inp = sotoinpcb(so); 113754d642bbSRobert Watson KASSERT(inp != NULL, ("in_getsockaddr: inp == NULL")); 11386466b28aSRobert Watson 1139a69042a5SRobert Watson INP_RLOCK(inp); 114026ef6ac4SDon Lewis port = inp->inp_lport; 114126ef6ac4SDon Lewis addr = inp->inp_laddr; 1142a69042a5SRobert Watson INP_RUNLOCK(inp); 114342fa505bSDavid Greenman 114426ef6ac4SDon Lewis *nam = in_sockaddr(port, &addr); 1145117bcae7SGarrett Wollman return 0; 1146df8bae1dSRodney W. Grimes } 1147df8bae1dSRodney W. Grimes 1148117bcae7SGarrett Wollman int 114954d642bbSRobert Watson in_getpeeraddr(struct socket *so, struct sockaddr **nam) 1150df8bae1dSRodney W. Grimes { 1151136d4f1cSRobert Watson struct inpcb *inp; 115226ef6ac4SDon Lewis struct in_addr addr; 115326ef6ac4SDon Lewis in_port_t port; 115442fa505bSDavid Greenman 1155fdc984f7STor Egge inp = sotoinpcb(so); 115654d642bbSRobert Watson KASSERT(inp != NULL, ("in_getpeeraddr: inp == NULL")); 11576466b28aSRobert Watson 1158a69042a5SRobert Watson INP_RLOCK(inp); 115926ef6ac4SDon Lewis port = inp->inp_fport; 116026ef6ac4SDon Lewis addr = inp->inp_faddr; 1161a69042a5SRobert Watson INP_RUNLOCK(inp); 116242fa505bSDavid Greenman 116326ef6ac4SDon Lewis *nam = in_sockaddr(port, &addr); 1164117bcae7SGarrett Wollman return 0; 1165df8bae1dSRodney W. Grimes } 1166df8bae1dSRodney W. Grimes 116726f9a767SRodney W. Grimes void 1168136d4f1cSRobert Watson in_pcbnotifyall(struct inpcbinfo *pcbinfo, struct in_addr faddr, int errno, 1169136d4f1cSRobert Watson struct inpcb *(*notify)(struct inpcb *, int)) 1170d1c54148SJesper Skriver { 1171f457d580SRobert Watson struct inpcb *inp, *inp_temp; 1172d1c54148SJesper Skriver 11733dc7ebf9SJeffrey Hsu INP_INFO_WLOCK(pcbinfo); 1174f457d580SRobert Watson LIST_FOREACH_SAFE(inp, pcbinfo->ipi_listhead, inp_list, inp_temp) { 11758501a69cSRobert Watson INP_WLOCK(inp); 1176d1c54148SJesper Skriver #ifdef INET6 1177f76fcf6dSJeffrey Hsu if ((inp->inp_vflag & INP_IPV4) == 0) { 11788501a69cSRobert Watson INP_WUNLOCK(inp); 1179d1c54148SJesper Skriver continue; 1180f76fcf6dSJeffrey Hsu } 1181d1c54148SJesper Skriver #endif 1182d1c54148SJesper Skriver if (inp->inp_faddr.s_addr != faddr.s_addr || 1183f76fcf6dSJeffrey Hsu inp->inp_socket == NULL) { 11848501a69cSRobert Watson INP_WUNLOCK(inp); 1185d1c54148SJesper Skriver continue; 1186d1c54148SJesper Skriver } 11873dc7ebf9SJeffrey Hsu if ((*notify)(inp, errno)) 11888501a69cSRobert Watson INP_WUNLOCK(inp); 1189f76fcf6dSJeffrey Hsu } 11903dc7ebf9SJeffrey Hsu INP_INFO_WUNLOCK(pcbinfo); 1191d1c54148SJesper Skriver } 1192d1c54148SJesper Skriver 1193e43cc4aeSHajimu UMEMOTO void 1194136d4f1cSRobert Watson in_pcbpurgeif0(struct inpcbinfo *pcbinfo, struct ifnet *ifp) 1195e43cc4aeSHajimu UMEMOTO { 1196e43cc4aeSHajimu UMEMOTO struct inpcb *inp; 1197e43cc4aeSHajimu UMEMOTO struct ip_moptions *imo; 1198e43cc4aeSHajimu UMEMOTO int i, gap; 1199e43cc4aeSHajimu UMEMOTO 1200f76fcf6dSJeffrey Hsu INP_INFO_RLOCK(pcbinfo); 1201712fc218SRobert Watson LIST_FOREACH(inp, pcbinfo->ipi_listhead, inp_list) { 12028501a69cSRobert Watson INP_WLOCK(inp); 1203e43cc4aeSHajimu UMEMOTO imo = inp->inp_moptions; 1204e43cc4aeSHajimu UMEMOTO if ((inp->inp_vflag & INP_IPV4) && 1205e43cc4aeSHajimu UMEMOTO imo != NULL) { 1206e43cc4aeSHajimu UMEMOTO /* 1207e43cc4aeSHajimu UMEMOTO * Unselect the outgoing interface if it is being 1208e43cc4aeSHajimu UMEMOTO * detached. 1209e43cc4aeSHajimu UMEMOTO */ 1210e43cc4aeSHajimu UMEMOTO if (imo->imo_multicast_ifp == ifp) 1211e43cc4aeSHajimu UMEMOTO imo->imo_multicast_ifp = NULL; 1212e43cc4aeSHajimu UMEMOTO 1213e43cc4aeSHajimu UMEMOTO /* 1214e43cc4aeSHajimu UMEMOTO * Drop multicast group membership if we joined 1215e43cc4aeSHajimu UMEMOTO * through the interface being detached. 1216e43cc4aeSHajimu UMEMOTO */ 1217e43cc4aeSHajimu UMEMOTO for (i = 0, gap = 0; i < imo->imo_num_memberships; 1218e43cc4aeSHajimu UMEMOTO i++) { 1219e43cc4aeSHajimu UMEMOTO if (imo->imo_membership[i]->inm_ifp == ifp) { 1220e43cc4aeSHajimu UMEMOTO in_delmulti(imo->imo_membership[i]); 1221e43cc4aeSHajimu UMEMOTO gap++; 1222e43cc4aeSHajimu UMEMOTO } else if (gap != 0) 1223e43cc4aeSHajimu UMEMOTO imo->imo_membership[i - gap] = 1224e43cc4aeSHajimu UMEMOTO imo->imo_membership[i]; 1225e43cc4aeSHajimu UMEMOTO } 1226e43cc4aeSHajimu UMEMOTO imo->imo_num_memberships -= gap; 1227e43cc4aeSHajimu UMEMOTO } 12288501a69cSRobert Watson INP_WUNLOCK(inp); 1229e43cc4aeSHajimu UMEMOTO } 12303cfcc388SJeffrey Hsu INP_INFO_RUNLOCK(pcbinfo); 1231e43cc4aeSHajimu UMEMOTO } 1232e43cc4aeSHajimu UMEMOTO 1233df8bae1dSRodney W. Grimes /* 1234c3229e05SDavid Greenman * Lookup a PCB based on the local address and port. 1235c3229e05SDavid Greenman */ 1236d5e8a67eSHajimu UMEMOTO #define INP_LOOKUP_MAPPED_PCB_COST 3 1237df8bae1dSRodney W. Grimes struct inpcb * 1238136d4f1cSRobert Watson in_pcblookup_local(struct inpcbinfo *pcbinfo, struct in_addr laddr, 1239078b7042SBjoern A. Zeeb u_short lport, int wild_okay, struct ucred *cred) 1240df8bae1dSRodney W. Grimes { 1241136d4f1cSRobert Watson struct inpcb *inp; 1242d5e8a67eSHajimu UMEMOTO #ifdef INET6 1243d5e8a67eSHajimu UMEMOTO int matchwild = 3 + INP_LOOKUP_MAPPED_PCB_COST; 1244d5e8a67eSHajimu UMEMOTO #else 1245d5e8a67eSHajimu UMEMOTO int matchwild = 3; 1246d5e8a67eSHajimu UMEMOTO #endif 1247d5e8a67eSHajimu UMEMOTO int wildcard; 12487bc4aca7SDavid Greenman 12498501a69cSRobert Watson INP_INFO_LOCK_ASSERT(pcbinfo); 12501b73ca0bSSam Leffler 1251c3229e05SDavid Greenman if (!wild_okay) { 1252c3229e05SDavid Greenman struct inpcbhead *head; 1253c3229e05SDavid Greenman /* 1254c3229e05SDavid Greenman * Look for an unconnected (wildcard foreign addr) PCB that 1255c3229e05SDavid Greenman * matches the local address and port we're looking for. 1256c3229e05SDavid Greenman */ 1257712fc218SRobert Watson head = &pcbinfo->ipi_hashbase[INP_PCBHASH(INADDR_ANY, lport, 1258712fc218SRobert Watson 0, pcbinfo->ipi_hashmask)]; 1259fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(inp, head, inp_hash) { 1260cfa1ca9dSYoshinobu Inoue #ifdef INET6 1261413628a7SBjoern A. Zeeb /* XXX inp locking */ 1262369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 1263cfa1ca9dSYoshinobu Inoue continue; 1264cfa1ca9dSYoshinobu Inoue #endif 1265c3229e05SDavid Greenman if (inp->inp_faddr.s_addr == INADDR_ANY && 1266c3229e05SDavid Greenman inp->inp_laddr.s_addr == laddr.s_addr && 1267c3229e05SDavid Greenman inp->inp_lport == lport) { 1268c3229e05SDavid Greenman /* 1269413628a7SBjoern A. Zeeb * Found? 1270c3229e05SDavid Greenman */ 1271413628a7SBjoern A. Zeeb if (cred == NULL || 12720304c731SJamie Gritton prison_equal_ip4(cred->cr_prison, 12730304c731SJamie Gritton inp->inp_cred->cr_prison)) 1274c3229e05SDavid Greenman return (inp); 1275df8bae1dSRodney W. Grimes } 1276c3229e05SDavid Greenman } 1277c3229e05SDavid Greenman /* 1278c3229e05SDavid Greenman * Not found. 1279c3229e05SDavid Greenman */ 1280c3229e05SDavid Greenman return (NULL); 1281c3229e05SDavid Greenman } else { 1282c3229e05SDavid Greenman struct inpcbporthead *porthash; 1283c3229e05SDavid Greenman struct inpcbport *phd; 1284c3229e05SDavid Greenman struct inpcb *match = NULL; 1285c3229e05SDavid Greenman /* 1286c3229e05SDavid Greenman * Best fit PCB lookup. 1287c3229e05SDavid Greenman * 1288c3229e05SDavid Greenman * First see if this local port is in use by looking on the 1289c3229e05SDavid Greenman * port hash list. 1290c3229e05SDavid Greenman */ 1291712fc218SRobert Watson porthash = &pcbinfo->ipi_porthashbase[INP_PCBPORTHASH(lport, 1292712fc218SRobert Watson pcbinfo->ipi_porthashmask)]; 1293fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(phd, porthash, phd_hash) { 1294c3229e05SDavid Greenman if (phd->phd_port == lport) 1295c3229e05SDavid Greenman break; 1296c3229e05SDavid Greenman } 1297c3229e05SDavid Greenman if (phd != NULL) { 1298c3229e05SDavid Greenman /* 1299c3229e05SDavid Greenman * Port is in use by one or more PCBs. Look for best 1300c3229e05SDavid Greenman * fit. 1301c3229e05SDavid Greenman */ 130237d40066SPoul-Henning Kamp LIST_FOREACH(inp, &phd->phd_pcblist, inp_portlist) { 1303c3229e05SDavid Greenman wildcard = 0; 1304413628a7SBjoern A. Zeeb if (cred != NULL && 13050304c731SJamie Gritton !prison_equal_ip4(inp->inp_cred->cr_prison, 13060304c731SJamie Gritton cred->cr_prison)) 1307413628a7SBjoern A. Zeeb continue; 1308cfa1ca9dSYoshinobu Inoue #ifdef INET6 1309413628a7SBjoern A. Zeeb /* XXX inp locking */ 1310369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 1311cfa1ca9dSYoshinobu Inoue continue; 1312d5e8a67eSHajimu UMEMOTO /* 1313d5e8a67eSHajimu UMEMOTO * We never select the PCB that has 1314d5e8a67eSHajimu UMEMOTO * INP_IPV6 flag and is bound to :: if 1315d5e8a67eSHajimu UMEMOTO * we have another PCB which is bound 1316d5e8a67eSHajimu UMEMOTO * to 0.0.0.0. If a PCB has the 1317d5e8a67eSHajimu UMEMOTO * INP_IPV6 flag, then we set its cost 1318d5e8a67eSHajimu UMEMOTO * higher than IPv4 only PCBs. 1319d5e8a67eSHajimu UMEMOTO * 1320d5e8a67eSHajimu UMEMOTO * Note that the case only happens 1321d5e8a67eSHajimu UMEMOTO * when a socket is bound to ::, under 1322d5e8a67eSHajimu UMEMOTO * the condition that the use of the 1323d5e8a67eSHajimu UMEMOTO * mapped address is allowed. 1324d5e8a67eSHajimu UMEMOTO */ 1325d5e8a67eSHajimu UMEMOTO if ((inp->inp_vflag & INP_IPV6) != 0) 1326d5e8a67eSHajimu UMEMOTO wildcard += INP_LOOKUP_MAPPED_PCB_COST; 1327cfa1ca9dSYoshinobu Inoue #endif 1328c3229e05SDavid Greenman if (inp->inp_faddr.s_addr != INADDR_ANY) 1329c3229e05SDavid Greenman wildcard++; 133015bd2b43SDavid Greenman if (inp->inp_laddr.s_addr != INADDR_ANY) { 133115bd2b43SDavid Greenman if (laddr.s_addr == INADDR_ANY) 133215bd2b43SDavid Greenman wildcard++; 133315bd2b43SDavid Greenman else if (inp->inp_laddr.s_addr != laddr.s_addr) 133415bd2b43SDavid Greenman continue; 133515bd2b43SDavid Greenman } else { 133615bd2b43SDavid Greenman if (laddr.s_addr != INADDR_ANY) 133715bd2b43SDavid Greenman wildcard++; 133815bd2b43SDavid Greenman } 1339df8bae1dSRodney W. Grimes if (wildcard < matchwild) { 1340df8bae1dSRodney W. Grimes match = inp; 1341df8bae1dSRodney W. Grimes matchwild = wildcard; 1342413628a7SBjoern A. Zeeb if (matchwild == 0) 1343df8bae1dSRodney W. Grimes break; 1344df8bae1dSRodney W. Grimes } 1345df8bae1dSRodney W. Grimes } 13463dbdc25cSDavid Greenman } 1347df8bae1dSRodney W. Grimes return (match); 1348df8bae1dSRodney W. Grimes } 1349c3229e05SDavid Greenman } 1350d5e8a67eSHajimu UMEMOTO #undef INP_LOOKUP_MAPPED_PCB_COST 135115bd2b43SDavid Greenman 135215bd2b43SDavid Greenman /* 135315bd2b43SDavid Greenman * Lookup PCB in hash list. 135415bd2b43SDavid Greenman */ 135515bd2b43SDavid Greenman struct inpcb * 1356136d4f1cSRobert Watson in_pcblookup_hash(struct inpcbinfo *pcbinfo, struct in_addr faddr, 1357136d4f1cSRobert Watson u_int fport_arg, struct in_addr laddr, u_int lport_arg, int wildcard, 1358136d4f1cSRobert Watson struct ifnet *ifp) 135915bd2b43SDavid Greenman { 136015bd2b43SDavid Greenman struct inpcbhead *head; 1361413628a7SBjoern A. Zeeb struct inpcb *inp, *tmpinp; 136215bd2b43SDavid Greenman u_short fport = fport_arg, lport = lport_arg; 136315bd2b43SDavid Greenman 13648501a69cSRobert Watson INP_INFO_LOCK_ASSERT(pcbinfo); 1365602cc7f1SRobert Watson 136615bd2b43SDavid Greenman /* 136715bd2b43SDavid Greenman * First look for an exact match. 136815bd2b43SDavid Greenman */ 1369413628a7SBjoern A. Zeeb tmpinp = NULL; 1370712fc218SRobert Watson head = &pcbinfo->ipi_hashbase[INP_PCBHASH(faddr.s_addr, lport, fport, 1371712fc218SRobert Watson pcbinfo->ipi_hashmask)]; 1372fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(inp, head, inp_hash) { 1373cfa1ca9dSYoshinobu Inoue #ifdef INET6 1374413628a7SBjoern A. Zeeb /* XXX inp locking */ 1375369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 1376cfa1ca9dSYoshinobu Inoue continue; 1377cfa1ca9dSYoshinobu Inoue #endif 13786d6a026bSDavid Greenman if (inp->inp_faddr.s_addr == faddr.s_addr && 1379ca98b82cSDavid Greenman inp->inp_laddr.s_addr == laddr.s_addr && 1380ca98b82cSDavid Greenman inp->inp_fport == fport && 1381413628a7SBjoern A. Zeeb inp->inp_lport == lport) { 1382413628a7SBjoern A. Zeeb /* 1383413628a7SBjoern A. Zeeb * XXX We should be able to directly return 1384413628a7SBjoern A. Zeeb * the inp here, without any checks. 1385413628a7SBjoern A. Zeeb * Well unless both bound with SO_REUSEPORT? 1386413628a7SBjoern A. Zeeb */ 13870304c731SJamie Gritton if (prison_flag(inp->inp_cred, PR_IP4)) 1388c3229e05SDavid Greenman return (inp); 1389413628a7SBjoern A. Zeeb if (tmpinp == NULL) 1390413628a7SBjoern A. Zeeb tmpinp = inp; 1391c3229e05SDavid Greenman } 1392413628a7SBjoern A. Zeeb } 1393413628a7SBjoern A. Zeeb if (tmpinp != NULL) 1394413628a7SBjoern A. Zeeb return (tmpinp); 1395e3fd5ffdSRobert Watson 1396e3fd5ffdSRobert Watson /* 1397e3fd5ffdSRobert Watson * Then look for a wildcard match, if requested. 1398e3fd5ffdSRobert Watson */ 1399413628a7SBjoern A. Zeeb if (wildcard == INPLOOKUP_WILDCARD) { 1400413628a7SBjoern A. Zeeb struct inpcb *local_wild = NULL, *local_exact = NULL; 1401e3fd5ffdSRobert Watson #ifdef INET6 1402cfa1ca9dSYoshinobu Inoue struct inpcb *local_wild_mapped = NULL; 1403e3fd5ffdSRobert Watson #endif 1404413628a7SBjoern A. Zeeb struct inpcb *jail_wild = NULL; 1405413628a7SBjoern A. Zeeb int injail; 1406413628a7SBjoern A. Zeeb 1407413628a7SBjoern A. Zeeb /* 1408413628a7SBjoern A. Zeeb * Order of socket selection - we always prefer jails. 1409413628a7SBjoern A. Zeeb * 1. jailed, non-wild. 1410413628a7SBjoern A. Zeeb * 2. jailed, wild. 1411413628a7SBjoern A. Zeeb * 3. non-jailed, non-wild. 1412413628a7SBjoern A. Zeeb * 4. non-jailed, wild. 1413413628a7SBjoern A. Zeeb */ 14146d6a026bSDavid Greenman 1415712fc218SRobert Watson head = &pcbinfo->ipi_hashbase[INP_PCBHASH(INADDR_ANY, lport, 1416712fc218SRobert Watson 0, pcbinfo->ipi_hashmask)]; 1417fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(inp, head, inp_hash) { 1418cfa1ca9dSYoshinobu Inoue #ifdef INET6 1419413628a7SBjoern A. Zeeb /* XXX inp locking */ 1420369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 1421cfa1ca9dSYoshinobu Inoue continue; 1422cfa1ca9dSYoshinobu Inoue #endif 1423413628a7SBjoern A. Zeeb if (inp->inp_faddr.s_addr != INADDR_ANY || 1424413628a7SBjoern A. Zeeb inp->inp_lport != lport) 1425413628a7SBjoern A. Zeeb continue; 1426413628a7SBjoern A. Zeeb 1427413628a7SBjoern A. Zeeb /* XXX inp locking */ 1428cfa1ca9dSYoshinobu Inoue if (ifp && ifp->if_type == IFT_FAITH && 1429cfa1ca9dSYoshinobu Inoue (inp->inp_flags & INP_FAITH) == 0) 1430cfa1ca9dSYoshinobu Inoue continue; 1431413628a7SBjoern A. Zeeb 14320304c731SJamie Gritton injail = prison_flag(inp->inp_cred, PR_IP4); 1433413628a7SBjoern A. Zeeb if (injail) { 1434b89e82ddSJamie Gritton if (prison_check_ip4(inp->inp_cred, 1435b89e82ddSJamie Gritton &laddr) != 0) 1436413628a7SBjoern A. Zeeb continue; 1437413628a7SBjoern A. Zeeb } else { 1438413628a7SBjoern A. Zeeb if (local_exact != NULL) 1439413628a7SBjoern A. Zeeb continue; 1440413628a7SBjoern A. Zeeb } 1441413628a7SBjoern A. Zeeb 1442413628a7SBjoern A. Zeeb if (inp->inp_laddr.s_addr == laddr.s_addr) { 1443413628a7SBjoern A. Zeeb if (injail) 1444c3229e05SDavid Greenman return (inp); 1445413628a7SBjoern A. Zeeb else 1446413628a7SBjoern A. Zeeb local_exact = inp; 1447413628a7SBjoern A. Zeeb } else if (inp->inp_laddr.s_addr == INADDR_ANY) { 1448e3fd5ffdSRobert Watson #ifdef INET6 1449413628a7SBjoern A. Zeeb /* XXX inp locking, NULL check */ 14505cd54324SBjoern A. Zeeb if (inp->inp_vflag & INP_IPV6PROTO) 1451cfa1ca9dSYoshinobu Inoue local_wild_mapped = inp; 1452cfa1ca9dSYoshinobu Inoue else 1453413628a7SBjoern A. Zeeb #endif /* INET6 */ 1454413628a7SBjoern A. Zeeb if (injail) 1455413628a7SBjoern A. Zeeb jail_wild = inp; 1456413628a7SBjoern A. Zeeb else 14576d6a026bSDavid Greenman local_wild = inp; 14586d6a026bSDavid Greenman } 1459413628a7SBjoern A. Zeeb } /* LIST_FOREACH */ 1460413628a7SBjoern A. Zeeb if (jail_wild != NULL) 1461413628a7SBjoern A. Zeeb return (jail_wild); 1462413628a7SBjoern A. Zeeb if (local_exact != NULL) 1463413628a7SBjoern A. Zeeb return (local_exact); 1464413628a7SBjoern A. Zeeb if (local_wild != NULL) 1465c3229e05SDavid Greenman return (local_wild); 1466413628a7SBjoern A. Zeeb #ifdef INET6 1467413628a7SBjoern A. Zeeb if (local_wild_mapped != NULL) 1468413628a7SBjoern A. Zeeb return (local_wild_mapped); 1469413628a7SBjoern A. Zeeb #endif /* defined(INET6) */ 1470413628a7SBjoern A. Zeeb } /* if (wildcard == INPLOOKUP_WILDCARD) */ 1471413628a7SBjoern A. Zeeb 14726d6a026bSDavid Greenman return (NULL); 147315bd2b43SDavid Greenman } 147415bd2b43SDavid Greenman 14757bc4aca7SDavid Greenman /* 1476c3229e05SDavid Greenman * Insert PCB onto various hash lists. 14777bc4aca7SDavid Greenman */ 1478c3229e05SDavid Greenman int 1479136d4f1cSRobert Watson in_pcbinshash(struct inpcb *inp) 148015bd2b43SDavid Greenman { 1481c3229e05SDavid Greenman struct inpcbhead *pcbhash; 1482c3229e05SDavid Greenman struct inpcbporthead *pcbporthash; 1483c3229e05SDavid Greenman struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 1484c3229e05SDavid Greenman struct inpcbport *phd; 1485cfa1ca9dSYoshinobu Inoue u_int32_t hashkey_faddr; 148615bd2b43SDavid Greenman 148759daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 14888501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 1489111d57a6SRobert Watson KASSERT((inp->inp_flags & INP_INHASHLIST) == 0, 1490111d57a6SRobert Watson ("in_pcbinshash: INP_INHASHLIST")); 1491602cc7f1SRobert Watson 1492cfa1ca9dSYoshinobu Inoue #ifdef INET6 1493cfa1ca9dSYoshinobu Inoue if (inp->inp_vflag & INP_IPV6) 1494cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->in6p_faddr.s6_addr32[3] /* XXX */; 1495cfa1ca9dSYoshinobu Inoue else 1496cfa1ca9dSYoshinobu Inoue #endif /* INET6 */ 1497cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->inp_faddr.s_addr; 1498cfa1ca9dSYoshinobu Inoue 1499712fc218SRobert Watson pcbhash = &pcbinfo->ipi_hashbase[INP_PCBHASH(hashkey_faddr, 1500712fc218SRobert Watson inp->inp_lport, inp->inp_fport, pcbinfo->ipi_hashmask)]; 150115bd2b43SDavid Greenman 1502712fc218SRobert Watson pcbporthash = &pcbinfo->ipi_porthashbase[ 1503712fc218SRobert Watson INP_PCBPORTHASH(inp->inp_lport, pcbinfo->ipi_porthashmask)]; 1504c3229e05SDavid Greenman 1505c3229e05SDavid Greenman /* 1506c3229e05SDavid Greenman * Go through port list and look for a head for this lport. 1507c3229e05SDavid Greenman */ 1508fc2ffbe6SPoul-Henning Kamp LIST_FOREACH(phd, pcbporthash, phd_hash) { 1509c3229e05SDavid Greenman if (phd->phd_port == inp->inp_lport) 1510c3229e05SDavid Greenman break; 1511c3229e05SDavid Greenman } 1512c3229e05SDavid Greenman /* 1513c3229e05SDavid Greenman * If none exists, malloc one and tack it on. 1514c3229e05SDavid Greenman */ 1515c3229e05SDavid Greenman if (phd == NULL) { 15161ede983cSDag-Erling Smørgrav phd = malloc(sizeof(struct inpcbport), M_PCB, M_NOWAIT); 1517c3229e05SDavid Greenman if (phd == NULL) { 1518c3229e05SDavid Greenman return (ENOBUFS); /* XXX */ 1519c3229e05SDavid Greenman } 1520c3229e05SDavid Greenman phd->phd_port = inp->inp_lport; 1521c3229e05SDavid Greenman LIST_INIT(&phd->phd_pcblist); 1522c3229e05SDavid Greenman LIST_INSERT_HEAD(pcbporthash, phd, phd_hash); 1523c3229e05SDavid Greenman } 1524c3229e05SDavid Greenman inp->inp_phd = phd; 1525c3229e05SDavid Greenman LIST_INSERT_HEAD(&phd->phd_pcblist, inp, inp_portlist); 1526c3229e05SDavid Greenman LIST_INSERT_HEAD(pcbhash, inp, inp_hash); 1527111d57a6SRobert Watson inp->inp_flags |= INP_INHASHLIST; 1528c3229e05SDavid Greenman return (0); 152915bd2b43SDavid Greenman } 153015bd2b43SDavid Greenman 1531c3229e05SDavid Greenman /* 1532c3229e05SDavid Greenman * Move PCB to the proper hash bucket when { faddr, fport } have been 1533c3229e05SDavid Greenman * changed. NOTE: This does not handle the case of the lport changing (the 1534c3229e05SDavid Greenman * hashed port list would have to be updated as well), so the lport must 1535c3229e05SDavid Greenman * not change after in_pcbinshash() has been called. 1536c3229e05SDavid Greenman */ 153715bd2b43SDavid Greenman void 1538136d4f1cSRobert Watson in_pcbrehash(struct inpcb *inp) 153915bd2b43SDavid Greenman { 154059daba27SSam Leffler struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 154115bd2b43SDavid Greenman struct inpcbhead *head; 1542cfa1ca9dSYoshinobu Inoue u_int32_t hashkey_faddr; 154315bd2b43SDavid Greenman 154459daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 15458501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 1546111d57a6SRobert Watson KASSERT(inp->inp_flags & INP_INHASHLIST, 1547111d57a6SRobert Watson ("in_pcbrehash: !INP_INHASHLIST")); 1548602cc7f1SRobert Watson 1549cfa1ca9dSYoshinobu Inoue #ifdef INET6 1550cfa1ca9dSYoshinobu Inoue if (inp->inp_vflag & INP_IPV6) 1551cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->in6p_faddr.s6_addr32[3] /* XXX */; 1552cfa1ca9dSYoshinobu Inoue else 1553cfa1ca9dSYoshinobu Inoue #endif /* INET6 */ 1554cfa1ca9dSYoshinobu Inoue hashkey_faddr = inp->inp_faddr.s_addr; 1555cfa1ca9dSYoshinobu Inoue 1556712fc218SRobert Watson head = &pcbinfo->ipi_hashbase[INP_PCBHASH(hashkey_faddr, 1557712fc218SRobert Watson inp->inp_lport, inp->inp_fport, pcbinfo->ipi_hashmask)]; 155815bd2b43SDavid Greenman 1559c3229e05SDavid Greenman LIST_REMOVE(inp, inp_hash); 156015bd2b43SDavid Greenman LIST_INSERT_HEAD(head, inp, inp_hash); 1561c3229e05SDavid Greenman } 1562c3229e05SDavid Greenman 1563c3229e05SDavid Greenman /* 1564c3229e05SDavid Greenman * Remove PCB from various lists. 1565c3229e05SDavid Greenman */ 15666d888973SRobert Watson static void 1567136d4f1cSRobert Watson in_pcbremlists(struct inpcb *inp) 1568c3229e05SDavid Greenman { 156959daba27SSam Leffler struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 157059daba27SSam Leffler 157159daba27SSam Leffler INP_INFO_WLOCK_ASSERT(pcbinfo); 15728501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 157359daba27SSam Leffler 157459daba27SSam Leffler inp->inp_gencnt = ++pcbinfo->ipi_gencnt; 1575111d57a6SRobert Watson if (inp->inp_flags & INP_INHASHLIST) { 1576c3229e05SDavid Greenman struct inpcbport *phd = inp->inp_phd; 1577c3229e05SDavid Greenman 1578c3229e05SDavid Greenman LIST_REMOVE(inp, inp_hash); 1579c3229e05SDavid Greenman LIST_REMOVE(inp, inp_portlist); 1580fc2ffbe6SPoul-Henning Kamp if (LIST_FIRST(&phd->phd_pcblist) == NULL) { 1581c3229e05SDavid Greenman LIST_REMOVE(phd, phd_hash); 1582c3229e05SDavid Greenman free(phd, M_PCB); 1583c3229e05SDavid Greenman } 1584111d57a6SRobert Watson inp->inp_flags &= ~INP_INHASHLIST; 1585c3229e05SDavid Greenman } 1586c3229e05SDavid Greenman LIST_REMOVE(inp, inp_list); 158759daba27SSam Leffler pcbinfo->ipi_count--; 158815bd2b43SDavid Greenman } 158975c13541SPoul-Henning Kamp 1590a557af22SRobert Watson /* 1591a557af22SRobert Watson * A set label operation has occurred at the socket layer, propagate the 1592a557af22SRobert Watson * label change into the in_pcb for the socket. 1593a557af22SRobert Watson */ 1594a557af22SRobert Watson void 1595136d4f1cSRobert Watson in_pcbsosetlabel(struct socket *so) 1596a557af22SRobert Watson { 1597a557af22SRobert Watson #ifdef MAC 1598a557af22SRobert Watson struct inpcb *inp; 1599a557af22SRobert Watson 16004c7c478dSRobert Watson inp = sotoinpcb(so); 16014c7c478dSRobert Watson KASSERT(inp != NULL, ("in_pcbsosetlabel: so->so_pcb == NULL")); 1602602cc7f1SRobert Watson 16038501a69cSRobert Watson INP_WLOCK(inp); 1604310e7cebSRobert Watson SOCK_LOCK(so); 1605a557af22SRobert Watson mac_inpcb_sosetlabel(so, inp); 1606310e7cebSRobert Watson SOCK_UNLOCK(so); 16078501a69cSRobert Watson INP_WUNLOCK(inp); 1608a557af22SRobert Watson #endif 1609a557af22SRobert Watson } 16105f311da2SMike Silbersack 16115f311da2SMike Silbersack /* 1612ad3a630fSRobert Watson * ipport_tick runs once per second, determining if random port allocation 1613ad3a630fSRobert Watson * should be continued. If more than ipport_randomcps ports have been 1614ad3a630fSRobert Watson * allocated in the last second, then we return to sequential port 1615ad3a630fSRobert Watson * allocation. We return to random allocation only once we drop below 1616ad3a630fSRobert Watson * ipport_randomcps for at least ipport_randomtime seconds. 16175f311da2SMike Silbersack */ 16185f311da2SMike Silbersack void 1619136d4f1cSRobert Watson ipport_tick(void *xtp) 16205f311da2SMike Silbersack { 16218b615593SMarko Zec VNET_ITERATOR_DECL(vnet_iter); 1622ad3a630fSRobert Watson 16235ee847d3SRobert Watson VNET_LIST_RLOCK_NOSLEEP(); 16248b615593SMarko Zec VNET_FOREACH(vnet_iter) { 16258b615593SMarko Zec CURVNET_SET(vnet_iter); /* XXX appease INVARIANTS here */ 16268b615593SMarko Zec if (V_ipport_tcpallocs <= 16278b615593SMarko Zec V_ipport_tcplastcount + V_ipport_randomcps) { 1628603724d3SBjoern A. Zeeb if (V_ipport_stoprandom > 0) 1629603724d3SBjoern A. Zeeb V_ipport_stoprandom--; 1630ad3a630fSRobert Watson } else 1631603724d3SBjoern A. Zeeb V_ipport_stoprandom = V_ipport_randomtime; 1632603724d3SBjoern A. Zeeb V_ipport_tcplastcount = V_ipport_tcpallocs; 16338b615593SMarko Zec CURVNET_RESTORE(); 16348b615593SMarko Zec } 16355ee847d3SRobert Watson VNET_LIST_RUNLOCK_NOSLEEP(); 16365f311da2SMike Silbersack callout_reset(&ipport_tick_callout, hz, ipport_tick, NULL); 16375f311da2SMike Silbersack } 1638497057eeSRobert Watson 16393d585327SKip Macy void 16403d585327SKip Macy inp_wlock(struct inpcb *inp) 16413d585327SKip Macy { 16423d585327SKip Macy 16438501a69cSRobert Watson INP_WLOCK(inp); 16443d585327SKip Macy } 16453d585327SKip Macy 16463d585327SKip Macy void 16473d585327SKip Macy inp_wunlock(struct inpcb *inp) 16483d585327SKip Macy { 16493d585327SKip Macy 16508501a69cSRobert Watson INP_WUNLOCK(inp); 16513d585327SKip Macy } 16523d585327SKip Macy 16533d585327SKip Macy void 16543d585327SKip Macy inp_rlock(struct inpcb *inp) 16553d585327SKip Macy { 16563d585327SKip Macy 1657a69042a5SRobert Watson INP_RLOCK(inp); 16583d585327SKip Macy } 16593d585327SKip Macy 16603d585327SKip Macy void 16613d585327SKip Macy inp_runlock(struct inpcb *inp) 16623d585327SKip Macy { 16633d585327SKip Macy 1664a69042a5SRobert Watson INP_RUNLOCK(inp); 16653d585327SKip Macy } 16663d585327SKip Macy 16673d585327SKip Macy #ifdef INVARIANTS 16683d585327SKip Macy void 1669e79dd20dSKip Macy inp_lock_assert(struct inpcb *inp) 16703d585327SKip Macy { 16713d585327SKip Macy 16728501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 16733d585327SKip Macy } 16743d585327SKip Macy 16753d585327SKip Macy void 1676e79dd20dSKip Macy inp_unlock_assert(struct inpcb *inp) 16773d585327SKip Macy { 16783d585327SKip Macy 16793d585327SKip Macy INP_UNLOCK_ASSERT(inp); 16803d585327SKip Macy } 16813d585327SKip Macy #endif 16823d585327SKip Macy 16839378e437SKip Macy void 16849378e437SKip Macy inp_apply_all(void (*func)(struct inpcb *, void *), void *arg) 16859378e437SKip Macy { 16869378e437SKip Macy struct inpcb *inp; 16879378e437SKip Macy 1688603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_tcbinfo); 168997021c24SMarko Zec LIST_FOREACH(inp, V_tcbinfo.ipi_listhead, inp_list) { 16909378e437SKip Macy INP_WLOCK(inp); 16919378e437SKip Macy func(inp, arg); 16929378e437SKip Macy INP_WUNLOCK(inp); 16939378e437SKip Macy } 1694603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_tcbinfo); 16959378e437SKip Macy } 16969378e437SKip Macy 16979378e437SKip Macy struct socket * 16989378e437SKip Macy inp_inpcbtosocket(struct inpcb *inp) 16999378e437SKip Macy { 17009378e437SKip Macy 17019378e437SKip Macy INP_WLOCK_ASSERT(inp); 17029378e437SKip Macy return (inp->inp_socket); 17039378e437SKip Macy } 17049378e437SKip Macy 17059378e437SKip Macy struct tcpcb * 17069378e437SKip Macy inp_inpcbtotcpcb(struct inpcb *inp) 17079378e437SKip Macy { 17089378e437SKip Macy 17099378e437SKip Macy INP_WLOCK_ASSERT(inp); 17109378e437SKip Macy return ((struct tcpcb *)inp->inp_ppcb); 17119378e437SKip Macy } 17129378e437SKip Macy 17139378e437SKip Macy int 17149378e437SKip Macy inp_ip_tos_get(const struct inpcb *inp) 17159378e437SKip Macy { 17169378e437SKip Macy 17179378e437SKip Macy return (inp->inp_ip_tos); 17189378e437SKip Macy } 17199378e437SKip Macy 17209378e437SKip Macy void 17219378e437SKip Macy inp_ip_tos_set(struct inpcb *inp, int val) 17229378e437SKip Macy { 17239378e437SKip Macy 17249378e437SKip Macy inp->inp_ip_tos = val; 17259378e437SKip Macy } 17269378e437SKip Macy 17279378e437SKip Macy void 1728df9cf830STai-hwa Liang inp_4tuple_get(struct inpcb *inp, uint32_t *laddr, uint16_t *lp, 17299d29c635SKip Macy uint32_t *faddr, uint16_t *fp) 17309378e437SKip Macy { 17319378e437SKip Macy 17329d29c635SKip Macy INP_LOCK_ASSERT(inp); 1733df9cf830STai-hwa Liang *laddr = inp->inp_laddr.s_addr; 1734df9cf830STai-hwa Liang *faddr = inp->inp_faddr.s_addr; 17359378e437SKip Macy *lp = inp->inp_lport; 17369378e437SKip Macy *fp = inp->inp_fport; 17379378e437SKip Macy } 17389378e437SKip Macy 1739dd0e6c38SKip Macy struct inpcb * 1740dd0e6c38SKip Macy so_sotoinpcb(struct socket *so) 1741dd0e6c38SKip Macy { 1742dd0e6c38SKip Macy 1743dd0e6c38SKip Macy return (sotoinpcb(so)); 1744dd0e6c38SKip Macy } 1745dd0e6c38SKip Macy 1746dd0e6c38SKip Macy struct tcpcb * 1747dd0e6c38SKip Macy so_sototcpcb(struct socket *so) 1748dd0e6c38SKip Macy { 1749dd0e6c38SKip Macy 1750dd0e6c38SKip Macy return (sototcpcb(so)); 1751dd0e6c38SKip Macy } 1752dd0e6c38SKip Macy 1753497057eeSRobert Watson #ifdef DDB 1754497057eeSRobert Watson static void 1755497057eeSRobert Watson db_print_indent(int indent) 1756497057eeSRobert Watson { 1757497057eeSRobert Watson int i; 1758497057eeSRobert Watson 1759497057eeSRobert Watson for (i = 0; i < indent; i++) 1760497057eeSRobert Watson db_printf(" "); 1761497057eeSRobert Watson } 1762497057eeSRobert Watson 1763497057eeSRobert Watson static void 1764497057eeSRobert Watson db_print_inconninfo(struct in_conninfo *inc, const char *name, int indent) 1765497057eeSRobert Watson { 1766497057eeSRobert Watson char faddr_str[48], laddr_str[48]; 1767497057eeSRobert Watson 1768497057eeSRobert Watson db_print_indent(indent); 1769497057eeSRobert Watson db_printf("%s at %p\n", name, inc); 1770497057eeSRobert Watson 1771497057eeSRobert Watson indent += 2; 1772497057eeSRobert Watson 177303dc38a4SRobert Watson #ifdef INET6 1774dcdb4371SBjoern A. Zeeb if (inc->inc_flags & INC_ISIPV6) { 1775497057eeSRobert Watson /* IPv6. */ 1776497057eeSRobert Watson ip6_sprintf(laddr_str, &inc->inc6_laddr); 1777497057eeSRobert Watson ip6_sprintf(faddr_str, &inc->inc6_faddr); 1778497057eeSRobert Watson } else { 177903dc38a4SRobert Watson #endif 1780497057eeSRobert Watson /* IPv4. */ 1781497057eeSRobert Watson inet_ntoa_r(inc->inc_laddr, laddr_str); 1782497057eeSRobert Watson inet_ntoa_r(inc->inc_faddr, faddr_str); 178303dc38a4SRobert Watson #ifdef INET6 1784497057eeSRobert Watson } 178503dc38a4SRobert Watson #endif 1786497057eeSRobert Watson db_print_indent(indent); 1787497057eeSRobert Watson db_printf("inc_laddr %s inc_lport %u\n", laddr_str, 1788497057eeSRobert Watson ntohs(inc->inc_lport)); 1789497057eeSRobert Watson db_print_indent(indent); 1790497057eeSRobert Watson db_printf("inc_faddr %s inc_fport %u\n", faddr_str, 1791497057eeSRobert Watson ntohs(inc->inc_fport)); 1792497057eeSRobert Watson } 1793497057eeSRobert Watson 1794497057eeSRobert Watson static void 1795497057eeSRobert Watson db_print_inpflags(int inp_flags) 1796497057eeSRobert Watson { 1797497057eeSRobert Watson int comma; 1798497057eeSRobert Watson 1799497057eeSRobert Watson comma = 0; 1800497057eeSRobert Watson if (inp_flags & INP_RECVOPTS) { 1801497057eeSRobert Watson db_printf("%sINP_RECVOPTS", comma ? ", " : ""); 1802497057eeSRobert Watson comma = 1; 1803497057eeSRobert Watson } 1804497057eeSRobert Watson if (inp_flags & INP_RECVRETOPTS) { 1805497057eeSRobert Watson db_printf("%sINP_RECVRETOPTS", comma ? ", " : ""); 1806497057eeSRobert Watson comma = 1; 1807497057eeSRobert Watson } 1808497057eeSRobert Watson if (inp_flags & INP_RECVDSTADDR) { 1809497057eeSRobert Watson db_printf("%sINP_RECVDSTADDR", comma ? ", " : ""); 1810497057eeSRobert Watson comma = 1; 1811497057eeSRobert Watson } 1812497057eeSRobert Watson if (inp_flags & INP_HDRINCL) { 1813497057eeSRobert Watson db_printf("%sINP_HDRINCL", comma ? ", " : ""); 1814497057eeSRobert Watson comma = 1; 1815497057eeSRobert Watson } 1816497057eeSRobert Watson if (inp_flags & INP_HIGHPORT) { 1817497057eeSRobert Watson db_printf("%sINP_HIGHPORT", comma ? ", " : ""); 1818497057eeSRobert Watson comma = 1; 1819497057eeSRobert Watson } 1820497057eeSRobert Watson if (inp_flags & INP_LOWPORT) { 1821497057eeSRobert Watson db_printf("%sINP_LOWPORT", comma ? ", " : ""); 1822497057eeSRobert Watson comma = 1; 1823497057eeSRobert Watson } 1824497057eeSRobert Watson if (inp_flags & INP_ANONPORT) { 1825497057eeSRobert Watson db_printf("%sINP_ANONPORT", comma ? ", " : ""); 1826497057eeSRobert Watson comma = 1; 1827497057eeSRobert Watson } 1828497057eeSRobert Watson if (inp_flags & INP_RECVIF) { 1829497057eeSRobert Watson db_printf("%sINP_RECVIF", comma ? ", " : ""); 1830497057eeSRobert Watson comma = 1; 1831497057eeSRobert Watson } 1832497057eeSRobert Watson if (inp_flags & INP_MTUDISC) { 1833497057eeSRobert Watson db_printf("%sINP_MTUDISC", comma ? ", " : ""); 1834497057eeSRobert Watson comma = 1; 1835497057eeSRobert Watson } 1836497057eeSRobert Watson if (inp_flags & INP_FAITH) { 1837497057eeSRobert Watson db_printf("%sINP_FAITH", comma ? ", " : ""); 1838497057eeSRobert Watson comma = 1; 1839497057eeSRobert Watson } 1840497057eeSRobert Watson if (inp_flags & INP_RECVTTL) { 1841497057eeSRobert Watson db_printf("%sINP_RECVTTL", comma ? ", " : ""); 1842497057eeSRobert Watson comma = 1; 1843497057eeSRobert Watson } 1844497057eeSRobert Watson if (inp_flags & INP_DONTFRAG) { 1845497057eeSRobert Watson db_printf("%sINP_DONTFRAG", comma ? ", " : ""); 1846497057eeSRobert Watson comma = 1; 1847497057eeSRobert Watson } 1848497057eeSRobert Watson if (inp_flags & IN6P_IPV6_V6ONLY) { 1849497057eeSRobert Watson db_printf("%sIN6P_IPV6_V6ONLY", comma ? ", " : ""); 1850497057eeSRobert Watson comma = 1; 1851497057eeSRobert Watson } 1852497057eeSRobert Watson if (inp_flags & IN6P_PKTINFO) { 1853497057eeSRobert Watson db_printf("%sIN6P_PKTINFO", comma ? ", " : ""); 1854497057eeSRobert Watson comma = 1; 1855497057eeSRobert Watson } 1856497057eeSRobert Watson if (inp_flags & IN6P_HOPLIMIT) { 1857497057eeSRobert Watson db_printf("%sIN6P_HOPLIMIT", comma ? ", " : ""); 1858497057eeSRobert Watson comma = 1; 1859497057eeSRobert Watson } 1860497057eeSRobert Watson if (inp_flags & IN6P_HOPOPTS) { 1861497057eeSRobert Watson db_printf("%sIN6P_HOPOPTS", comma ? ", " : ""); 1862497057eeSRobert Watson comma = 1; 1863497057eeSRobert Watson } 1864497057eeSRobert Watson if (inp_flags & IN6P_DSTOPTS) { 1865497057eeSRobert Watson db_printf("%sIN6P_DSTOPTS", comma ? ", " : ""); 1866497057eeSRobert Watson comma = 1; 1867497057eeSRobert Watson } 1868497057eeSRobert Watson if (inp_flags & IN6P_RTHDR) { 1869497057eeSRobert Watson db_printf("%sIN6P_RTHDR", comma ? ", " : ""); 1870497057eeSRobert Watson comma = 1; 1871497057eeSRobert Watson } 1872497057eeSRobert Watson if (inp_flags & IN6P_RTHDRDSTOPTS) { 1873497057eeSRobert Watson db_printf("%sIN6P_RTHDRDSTOPTS", comma ? ", " : ""); 1874497057eeSRobert Watson comma = 1; 1875497057eeSRobert Watson } 1876497057eeSRobert Watson if (inp_flags & IN6P_TCLASS) { 1877497057eeSRobert Watson db_printf("%sIN6P_TCLASS", comma ? ", " : ""); 1878497057eeSRobert Watson comma = 1; 1879497057eeSRobert Watson } 1880497057eeSRobert Watson if (inp_flags & IN6P_AUTOFLOWLABEL) { 1881497057eeSRobert Watson db_printf("%sIN6P_AUTOFLOWLABEL", comma ? ", " : ""); 1882497057eeSRobert Watson comma = 1; 1883497057eeSRobert Watson } 1884ad71fe3cSRobert Watson if (inp_flags & INP_TIMEWAIT) { 1885ad71fe3cSRobert Watson db_printf("%sINP_TIMEWAIT", comma ? ", " : ""); 1886ad71fe3cSRobert Watson comma = 1; 1887ad71fe3cSRobert Watson } 1888ad71fe3cSRobert Watson if (inp_flags & INP_ONESBCAST) { 1889ad71fe3cSRobert Watson db_printf("%sINP_ONESBCAST", comma ? ", " : ""); 1890ad71fe3cSRobert Watson comma = 1; 1891ad71fe3cSRobert Watson } 1892ad71fe3cSRobert Watson if (inp_flags & INP_DROPPED) { 1893ad71fe3cSRobert Watson db_printf("%sINP_DROPPED", comma ? ", " : ""); 1894ad71fe3cSRobert Watson comma = 1; 1895ad71fe3cSRobert Watson } 1896ad71fe3cSRobert Watson if (inp_flags & INP_SOCKREF) { 1897ad71fe3cSRobert Watson db_printf("%sINP_SOCKREF", comma ? ", " : ""); 1898ad71fe3cSRobert Watson comma = 1; 1899ad71fe3cSRobert Watson } 1900497057eeSRobert Watson if (inp_flags & IN6P_RFC2292) { 1901497057eeSRobert Watson db_printf("%sIN6P_RFC2292", comma ? ", " : ""); 1902497057eeSRobert Watson comma = 1; 1903497057eeSRobert Watson } 1904497057eeSRobert Watson if (inp_flags & IN6P_MTU) { 1905497057eeSRobert Watson db_printf("IN6P_MTU%s", comma ? ", " : ""); 1906497057eeSRobert Watson comma = 1; 1907497057eeSRobert Watson } 1908497057eeSRobert Watson } 1909497057eeSRobert Watson 1910497057eeSRobert Watson static void 1911497057eeSRobert Watson db_print_inpvflag(u_char inp_vflag) 1912497057eeSRobert Watson { 1913497057eeSRobert Watson int comma; 1914497057eeSRobert Watson 1915497057eeSRobert Watson comma = 0; 1916497057eeSRobert Watson if (inp_vflag & INP_IPV4) { 1917497057eeSRobert Watson db_printf("%sINP_IPV4", comma ? ", " : ""); 1918497057eeSRobert Watson comma = 1; 1919497057eeSRobert Watson } 1920497057eeSRobert Watson if (inp_vflag & INP_IPV6) { 1921497057eeSRobert Watson db_printf("%sINP_IPV6", comma ? ", " : ""); 1922497057eeSRobert Watson comma = 1; 1923497057eeSRobert Watson } 1924497057eeSRobert Watson if (inp_vflag & INP_IPV6PROTO) { 1925497057eeSRobert Watson db_printf("%sINP_IPV6PROTO", comma ? ", " : ""); 1926497057eeSRobert Watson comma = 1; 1927497057eeSRobert Watson } 1928497057eeSRobert Watson } 1929497057eeSRobert Watson 19306d888973SRobert Watson static void 1931497057eeSRobert Watson db_print_inpcb(struct inpcb *inp, const char *name, int indent) 1932497057eeSRobert Watson { 1933497057eeSRobert Watson 1934497057eeSRobert Watson db_print_indent(indent); 1935497057eeSRobert Watson db_printf("%s at %p\n", name, inp); 1936497057eeSRobert Watson 1937497057eeSRobert Watson indent += 2; 1938497057eeSRobert Watson 1939497057eeSRobert Watson db_print_indent(indent); 1940497057eeSRobert Watson db_printf("inp_flow: 0x%x\n", inp->inp_flow); 1941497057eeSRobert Watson 1942497057eeSRobert Watson db_print_inconninfo(&inp->inp_inc, "inp_conninfo", indent); 1943497057eeSRobert Watson 1944497057eeSRobert Watson db_print_indent(indent); 1945497057eeSRobert Watson db_printf("inp_ppcb: %p inp_pcbinfo: %p inp_socket: %p\n", 1946497057eeSRobert Watson inp->inp_ppcb, inp->inp_pcbinfo, inp->inp_socket); 1947497057eeSRobert Watson 1948497057eeSRobert Watson db_print_indent(indent); 1949497057eeSRobert Watson db_printf("inp_label: %p inp_flags: 0x%x (", 1950497057eeSRobert Watson inp->inp_label, inp->inp_flags); 1951497057eeSRobert Watson db_print_inpflags(inp->inp_flags); 1952497057eeSRobert Watson db_printf(")\n"); 1953497057eeSRobert Watson 1954497057eeSRobert Watson db_print_indent(indent); 1955497057eeSRobert Watson db_printf("inp_sp: %p inp_vflag: 0x%x (", inp->inp_sp, 1956497057eeSRobert Watson inp->inp_vflag); 1957497057eeSRobert Watson db_print_inpvflag(inp->inp_vflag); 1958497057eeSRobert Watson db_printf(")\n"); 1959497057eeSRobert Watson 1960497057eeSRobert Watson db_print_indent(indent); 1961497057eeSRobert Watson db_printf("inp_ip_ttl: %d inp_ip_p: %d inp_ip_minttl: %d\n", 1962497057eeSRobert Watson inp->inp_ip_ttl, inp->inp_ip_p, inp->inp_ip_minttl); 1963497057eeSRobert Watson 1964497057eeSRobert Watson db_print_indent(indent); 1965497057eeSRobert Watson #ifdef INET6 1966497057eeSRobert Watson if (inp->inp_vflag & INP_IPV6) { 1967497057eeSRobert Watson db_printf("in6p_options: %p in6p_outputopts: %p " 1968497057eeSRobert Watson "in6p_moptions: %p\n", inp->in6p_options, 1969497057eeSRobert Watson inp->in6p_outputopts, inp->in6p_moptions); 1970497057eeSRobert Watson db_printf("in6p_icmp6filt: %p in6p_cksum %d " 1971497057eeSRobert Watson "in6p_hops %u\n", inp->in6p_icmp6filt, inp->in6p_cksum, 1972497057eeSRobert Watson inp->in6p_hops); 1973497057eeSRobert Watson } else 1974497057eeSRobert Watson #endif 1975497057eeSRobert Watson { 1976497057eeSRobert Watson db_printf("inp_ip_tos: %d inp_ip_options: %p " 1977497057eeSRobert Watson "inp_ip_moptions: %p\n", inp->inp_ip_tos, 1978497057eeSRobert Watson inp->inp_options, inp->inp_moptions); 1979497057eeSRobert Watson } 1980497057eeSRobert Watson 1981497057eeSRobert Watson db_print_indent(indent); 1982497057eeSRobert Watson db_printf("inp_phd: %p inp_gencnt: %ju\n", inp->inp_phd, 1983497057eeSRobert Watson (uintmax_t)inp->inp_gencnt); 1984497057eeSRobert Watson } 1985497057eeSRobert Watson 1986497057eeSRobert Watson DB_SHOW_COMMAND(inpcb, db_show_inpcb) 1987497057eeSRobert Watson { 1988497057eeSRobert Watson struct inpcb *inp; 1989497057eeSRobert Watson 1990497057eeSRobert Watson if (!have_addr) { 1991497057eeSRobert Watson db_printf("usage: show inpcb <addr>\n"); 1992497057eeSRobert Watson return; 1993497057eeSRobert Watson } 1994497057eeSRobert Watson inp = (struct inpcb *)addr; 1995497057eeSRobert Watson 1996497057eeSRobert Watson db_print_inpcb(inp, "inpcb", 0); 1997497057eeSRobert Watson } 1998497057eeSRobert Watson #endif 1999