1c398230bSWarner Losh /*- 26dfab5b1SGarrett Wollman * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995 33329b236SRobert Watson * The Regents of the University of California. 43144b7d3SRobert Watson * Copyright (c) 2008 Robert N. M. Watson 53329b236SRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 316dfab5b1SGarrett Wollman * @(#)udp_usrreq.c 8.6 (Berkeley) 5/23/95 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 344b421e2dSMike Silbersack #include <sys/cdefs.h> 354b421e2dSMike Silbersack __FBSDID("$FreeBSD$"); 364b421e2dSMike Silbersack 370b4ae859SGleb Smirnoff #include "opt_ipfw.h" 38cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h" 39f5514f08SRobert Watson #include "opt_ipsec.h" 40cfa1ca9dSYoshinobu Inoue 41df8bae1dSRodney W. Grimes #include <sys/param.h> 42960ed29cSSeigo Tanimura #include <sys/domain.h> 434f590175SPaul Saab #include <sys/eventhandler.h> 44960ed29cSSeigo Tanimura #include <sys/jail.h> 45b110a8a2SGarrett Wollman #include <sys/kernel.h> 46960ed29cSSeigo Tanimura #include <sys/lock.h> 47df8bae1dSRodney W. Grimes #include <sys/malloc.h> 48df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 49acd3428bSRobert Watson #include <sys/priv.h> 50490d50b6SBrian Feldman #include <sys/proc.h> 51df8bae1dSRodney W. Grimes #include <sys/protosw.h> 52960ed29cSSeigo Tanimura #include <sys/signalvar.h> 53df8bae1dSRodney W. Grimes #include <sys/socket.h> 54df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 55960ed29cSSeigo Tanimura #include <sys/sx.h> 56b5e8ce9fSBruce Evans #include <sys/sysctl.h> 57816a3d83SPoul-Henning Kamp #include <sys/syslog.h> 58f5514f08SRobert Watson #include <sys/systm.h> 598781d8e9SBruce Evans 6069c2d429SJeff Roberson #include <vm/uma.h> 61df8bae1dSRodney W. Grimes 62df8bae1dSRodney W. Grimes #include <net/if.h> 63df8bae1dSRodney W. Grimes #include <net/route.h> 64df8bae1dSRodney W. Grimes 65df8bae1dSRodney W. Grimes #include <netinet/in.h> 66960ed29cSSeigo Tanimura #include <netinet/in_pcb.h> 67f5514f08SRobert Watson #include <netinet/in_systm.h> 68960ed29cSSeigo Tanimura #include <netinet/in_var.h> 69df8bae1dSRodney W. Grimes #include <netinet/ip.h> 70cfa1ca9dSYoshinobu Inoue #ifdef INET6 71cfa1ca9dSYoshinobu Inoue #include <netinet/ip6.h> 72cfa1ca9dSYoshinobu Inoue #endif 73960ed29cSSeigo Tanimura #include <netinet/ip_icmp.h> 74960ed29cSSeigo Tanimura #include <netinet/icmp_var.h> 75df8bae1dSRodney W. Grimes #include <netinet/ip_var.h> 76ef39adf0SAndre Oppermann #include <netinet/ip_options.h> 77cfa1ca9dSYoshinobu Inoue #ifdef INET6 78cfa1ca9dSYoshinobu Inoue #include <netinet6/ip6_var.h> 79cfa1ca9dSYoshinobu Inoue #endif 80df8bae1dSRodney W. Grimes #include <netinet/udp.h> 81df8bae1dSRodney W. Grimes #include <netinet/udp_var.h> 82df8bae1dSRodney W. Grimes 83b2630c29SGeorge V. Neville-Neil #ifdef IPSEC 84b9234fafSSam Leffler #include <netipsec/ipsec.h> 857b495c44SVANHULLEBUS Yvan #include <netipsec/esp.h> 863329b236SRobert Watson #endif 87b9234fafSSam Leffler 88db4f9cc7SJonathan Lemon #include <machine/in_cksum.h> 89db4f9cc7SJonathan Lemon 90aed55708SRobert Watson #include <security/mac/mac_framework.h> 91aed55708SRobert Watson 92df8bae1dSRodney W. Grimes /* 93df8bae1dSRodney W. Grimes * UDP protocol implementation. 94df8bae1dSRodney W. Grimes * Per RFC 768, August, 1980. 95df8bae1dSRodney W. Grimes */ 9674eb3236SWarner Losh 9774eb3236SWarner Losh /* 983329b236SRobert Watson * BSD 4.2 defaulted the udp checksum to be off. Turning off udp checksums 993329b236SRobert Watson * removes the only data integrity mechanism for packets and malformed 100f5514f08SRobert Watson * packets that would otherwise be discarded due to bad checksums, and may 101f5514f08SRobert Watson * cause problems (especially for NFS data blocks). 10274eb3236SWarner Losh */ 103f5514f08SRobert Watson static int udp_cksum = 1; 104f5514f08SRobert Watson SYSCTL_INT(_net_inet_udp, UDPCTL_CHECKSUM, checksum, CTLFLAG_RW, &udp_cksum, 10541698ebfSTom Rhodes 0, "compute udp checksum"); 106df8bae1dSRodney W. Grimes 107afdb4274SRobert Watson int udp_log_in_vain = 0; 108816a3d83SPoul-Henning Kamp SYSCTL_INT(_net_inet_udp, OID_AUTO, log_in_vain, CTLFLAG_RW, 109afdb4274SRobert Watson &udp_log_in_vain, 0, "Log all incoming UDP packets"); 110816a3d83SPoul-Henning Kamp 11182cea7e6SBjoern A. Zeeb VNET_DEFINE(int, udp_blackhole) = 0; 112eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_udp, OID_AUTO, blackhole, CTLFLAG_RW, 113eddfbb76SRobert Watson &VNET_NAME(udp_blackhole), 0, 1143329b236SRobert Watson "Do not send port unreachables for refused connects"); 11516f7f31fSGeoff Rehmet 11643bbb6aaSRobert Watson u_long udp_sendspace = 9216; /* really max datagram size */ 11743bbb6aaSRobert Watson /* 40 1K datagrams */ 11843bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_MAXDGRAM, maxdgram, CTLFLAG_RW, 11943bbb6aaSRobert Watson &udp_sendspace, 0, "Maximum outgoing UDP datagram size"); 12043bbb6aaSRobert Watson 12143bbb6aaSRobert Watson u_long udp_recvspace = 40 * (1024 + 12243bbb6aaSRobert Watson #ifdef INET6 12343bbb6aaSRobert Watson sizeof(struct sockaddr_in6) 12443bbb6aaSRobert Watson #else 12543bbb6aaSRobert Watson sizeof(struct sockaddr_in) 12643bbb6aaSRobert Watson #endif 12743bbb6aaSRobert Watson ); 12843bbb6aaSRobert Watson 12943bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_RECVSPACE, recvspace, CTLFLAG_RW, 13043bbb6aaSRobert Watson &udp_recvspace, 0, "Maximum space for incoming UDP datagrams"); 13143bbb6aaSRobert Watson 132eddfbb76SRobert Watson VNET_DEFINE(struct inpcbhead, udb); /* from udp_var.h */ 133eddfbb76SRobert Watson VNET_DEFINE(struct inpcbinfo, udbinfo); 1343e288e62SDimitry Andric static VNET_DEFINE(uma_zone_t, udpcb_zone); 1351e77c105SRobert Watson #define V_udpcb_zone VNET(udpcb_zone) 13615bd2b43SDavid Greenman 13715bd2b43SDavid Greenman #ifndef UDBHASHSIZE 138e2ed8f35SAlexander Motin #define UDBHASHSIZE 128 13915bd2b43SDavid Greenman #endif 14015bd2b43SDavid Greenman 14182cea7e6SBjoern A. Zeeb VNET_DEFINE(struct udpstat, udpstat); /* from udp_var.h */ 142eddfbb76SRobert Watson SYSCTL_VNET_STRUCT(_net_inet_udp, UDPCTL_STATS, stats, CTLFLAG_RW, 143eddfbb76SRobert Watson &VNET_NAME(udpstat), udpstat, 1448b615593SMarko Zec "UDP statistics (struct udpstat, netinet/udp_var.h)"); 145f2ea20e6SGarrett Wollman 146bc725eafSRobert Watson static void udp_detach(struct socket *so); 1474d77a549SAlfred Perlstein static int udp_output(struct inpcb *, struct mbuf *, struct sockaddr *, 1484d77a549SAlfred Perlstein struct mbuf *, struct thread *); 1497b495c44SVANHULLEBUS Yvan #ifdef IPSEC 1507b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 1517b495c44SVANHULLEBUS Yvan #define UF_ESPINUDP_ALL (UF_ESPINUDP_NON_IKE|UF_ESPINUDP) 1527b495c44SVANHULLEBUS Yvan #ifdef INET 1537b495c44SVANHULLEBUS Yvan static struct mbuf *udp4_espdecap(struct inpcb *, struct mbuf *, int); 1547b495c44SVANHULLEBUS Yvan #endif 1557b495c44SVANHULLEBUS Yvan #endif /* IPSEC_NAT_T */ 1567b495c44SVANHULLEBUS Yvan #endif /* IPSEC */ 157df8bae1dSRodney W. Grimes 1584f590175SPaul Saab static void 1594f590175SPaul Saab udp_zone_change(void *tag) 1604f590175SPaul Saab { 1614f590175SPaul Saab 162603724d3SBjoern A. Zeeb uma_zone_set_max(V_udbinfo.ipi_zone, maxsockets); 1636a9148feSBjoern A. Zeeb uma_zone_set_max(V_udpcb_zone, maxsockets); 1644f590175SPaul Saab } 1654f590175SPaul Saab 166d915b280SStephan Uphoff static int 167d915b280SStephan Uphoff udp_inpcb_init(void *mem, int size, int flags) 168d915b280SStephan Uphoff { 169af1ee11dSRobert Watson struct inpcb *inp; 17008651e1fSJohn Baldwin 171af1ee11dSRobert Watson inp = mem; 172d915b280SStephan Uphoff INP_LOCK_INIT(inp, "inp", "udpinp"); 173d915b280SStephan Uphoff return (0); 174d915b280SStephan Uphoff } 175d915b280SStephan Uphoff 176df8bae1dSRodney W. Grimes void 177af1ee11dSRobert Watson udp_init(void) 178df8bae1dSRodney W. Grimes { 179af1ee11dSRobert Watson 1809bcd427bSRobert Watson in_pcbinfo_init(&V_udbinfo, "udp", &V_udb, UDBHASHSIZE, UDBHASHSIZE, 1819bcd427bSRobert Watson "udp_inpcb", udp_inpcb_init, NULL, UMA_ZONE_NOFREE); 1826a9148feSBjoern A. Zeeb V_udpcb_zone = uma_zcreate("udpcb", sizeof(struct udpcb), 1836a9148feSBjoern A. Zeeb NULL, NULL, NULL, NULL, UMA_ALIGN_PTR, UMA_ZONE_NOFREE); 1846a9148feSBjoern A. Zeeb uma_zone_set_max(V_udpcb_zone, maxsockets); 1854f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, udp_zone_change, NULL, 1864f590175SPaul Saab EVENTHANDLER_PRI_ANY); 187df8bae1dSRodney W. Grimes } 188df8bae1dSRodney W. Grimes 189315e3e38SRobert Watson /* 190315e3e38SRobert Watson * Kernel module interface for updating udpstat. The argument is an index 191315e3e38SRobert Watson * into udpstat treated as an array of u_long. While this encodes the 192315e3e38SRobert Watson * general layout of udpstat into the caller, it doesn't encode its location, 193315e3e38SRobert Watson * so that future changes to add, for example, per-CPU stats support won't 194315e3e38SRobert Watson * cause binary compatibility problems for kernel modules. 195315e3e38SRobert Watson */ 196315e3e38SRobert Watson void 197315e3e38SRobert Watson kmod_udpstat_inc(int statnum) 198315e3e38SRobert Watson { 199315e3e38SRobert Watson 200315e3e38SRobert Watson (*((u_long *)&V_udpstat + statnum))++; 201315e3e38SRobert Watson } 202315e3e38SRobert Watson 2036a9148feSBjoern A. Zeeb int 2046a9148feSBjoern A. Zeeb udp_newudpcb(struct inpcb *inp) 2056a9148feSBjoern A. Zeeb { 2066a9148feSBjoern A. Zeeb struct udpcb *up; 2076a9148feSBjoern A. Zeeb 2086a9148feSBjoern A. Zeeb up = uma_zalloc(V_udpcb_zone, M_NOWAIT | M_ZERO); 2096a9148feSBjoern A. Zeeb if (up == NULL) 2106a9148feSBjoern A. Zeeb return (ENOBUFS); 2116a9148feSBjoern A. Zeeb inp->inp_ppcb = up; 2126a9148feSBjoern A. Zeeb return (0); 2136a9148feSBjoern A. Zeeb } 2146a9148feSBjoern A. Zeeb 2156a9148feSBjoern A. Zeeb void 2166a9148feSBjoern A. Zeeb udp_discardcb(struct udpcb *up) 2176a9148feSBjoern A. Zeeb { 2186a9148feSBjoern A. Zeeb 2196a9148feSBjoern A. Zeeb uma_zfree(V_udpcb_zone, up); 2206a9148feSBjoern A. Zeeb } 2216a9148feSBjoern A. Zeeb 222bc29160dSMarko Zec #ifdef VIMAGE 223bc29160dSMarko Zec void 224bc29160dSMarko Zec udp_destroy(void) 225bc29160dSMarko Zec { 226bc29160dSMarko Zec 2279bcd427bSRobert Watson in_pcbinfo_destroy(&V_udbinfo); 228391dab1cSBjoern A. Zeeb uma_zdestroy(V_udpcb_zone); 229bc29160dSMarko Zec } 230bc29160dSMarko Zec #endif 231bc29160dSMarko Zec 23243bbb6aaSRobert Watson /* 23343bbb6aaSRobert Watson * Subroutine of udp_input(), which appends the provided mbuf chain to the 23443bbb6aaSRobert Watson * passed pcb/socket. The caller must provide a sockaddr_in via udp_in that 23543bbb6aaSRobert Watson * contains the source address. If the socket ends up being an IPv6 socket, 23643bbb6aaSRobert Watson * udp_append() will convert to a sockaddr_in6 before passing the address 23743bbb6aaSRobert Watson * into the socket code. 23843bbb6aaSRobert Watson */ 23943bbb6aaSRobert Watson static void 24043bbb6aaSRobert Watson udp_append(struct inpcb *inp, struct ip *ip, struct mbuf *n, int off, 24143bbb6aaSRobert Watson struct sockaddr_in *udp_in) 24243bbb6aaSRobert Watson { 24343bbb6aaSRobert Watson struct sockaddr *append_sa; 24443bbb6aaSRobert Watson struct socket *so; 24543bbb6aaSRobert Watson struct mbuf *opts = 0; 24643bbb6aaSRobert Watson #ifdef INET6 24743bbb6aaSRobert Watson struct sockaddr_in6 udp_in6; 24843bbb6aaSRobert Watson #endif 2497b495c44SVANHULLEBUS Yvan struct udpcb *up; 25043bbb6aaSRobert Watson 251119d85f6SRobert Watson INP_RLOCK_ASSERT(inp); 25243bbb6aaSRobert Watson 253*79bb84fbSEdward Tomasz Napierala /* 254*79bb84fbSEdward Tomasz Napierala * Engage the tunneling protocol. 255*79bb84fbSEdward Tomasz Napierala */ 256*79bb84fbSEdward Tomasz Napierala up = intoudpcb(inp); 257*79bb84fbSEdward Tomasz Napierala if (up->u_tun_func != NULL) { 258*79bb84fbSEdward Tomasz Napierala (*up->u_tun_func)(n, off, inp); 259*79bb84fbSEdward Tomasz Napierala return; 260*79bb84fbSEdward Tomasz Napierala } 261*79bb84fbSEdward Tomasz Napierala 262*79bb84fbSEdward Tomasz Napierala if (n == NULL) 263*79bb84fbSEdward Tomasz Napierala return; 264*79bb84fbSEdward Tomasz Napierala 265*79bb84fbSEdward Tomasz Napierala off += sizeof(struct udphdr); 266*79bb84fbSEdward Tomasz Napierala 26743bbb6aaSRobert Watson #ifdef IPSEC 26843bbb6aaSRobert Watson /* Check AH/ESP integrity. */ 26943bbb6aaSRobert Watson if (ipsec4_in_reject(n, inp)) { 27043bbb6aaSRobert Watson m_freem(n); 271603724d3SBjoern A. Zeeb V_ipsec4stat.in_polvio++; 27243bbb6aaSRobert Watson return; 27343bbb6aaSRobert Watson } 2747b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 2757b495c44SVANHULLEBUS Yvan #ifdef INET 2767b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 2777b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: udpcb NULL", __func__)); 2787b495c44SVANHULLEBUS Yvan if (up->u_flags & UF_ESPINUDP_ALL) { /* IPSec UDP encaps. */ 2797b495c44SVANHULLEBUS Yvan n = udp4_espdecap(inp, n, off); 2807b495c44SVANHULLEBUS Yvan if (n == NULL) /* Consumed. */ 2817b495c44SVANHULLEBUS Yvan return; 2827b495c44SVANHULLEBUS Yvan } 2837b495c44SVANHULLEBUS Yvan #endif /* INET */ 2847b495c44SVANHULLEBUS Yvan #endif /* IPSEC_NAT_T */ 28543bbb6aaSRobert Watson #endif /* IPSEC */ 28643bbb6aaSRobert Watson #ifdef MAC 28730d239bcSRobert Watson if (mac_inpcb_check_deliver(inp, n) != 0) { 28843bbb6aaSRobert Watson m_freem(n); 28943bbb6aaSRobert Watson return; 29043bbb6aaSRobert Watson } 29143bbb6aaSRobert Watson #endif 29243bbb6aaSRobert Watson if (inp->inp_flags & INP_CONTROLOPTS || 29343bbb6aaSRobert Watson inp->inp_socket->so_options & (SO_TIMESTAMP | SO_BINTIME)) { 29443bbb6aaSRobert Watson #ifdef INET6 2959a38ba81SBjoern A. Zeeb if (inp->inp_vflag & INP_IPV6) 29648d48eb9SBjoern A. Zeeb (void)ip6_savecontrol_v4(inp, n, &opts, NULL); 2979a38ba81SBjoern A. Zeeb else 29843bbb6aaSRobert Watson #endif 29943bbb6aaSRobert Watson ip_savecontrol(inp, &opts, ip, n); 30043bbb6aaSRobert Watson } 30143bbb6aaSRobert Watson #ifdef INET6 30243bbb6aaSRobert Watson if (inp->inp_vflag & INP_IPV6) { 30343bbb6aaSRobert Watson bzero(&udp_in6, sizeof(udp_in6)); 30443bbb6aaSRobert Watson udp_in6.sin6_len = sizeof(udp_in6); 30543bbb6aaSRobert Watson udp_in6.sin6_family = AF_INET6; 30643bbb6aaSRobert Watson in6_sin_2_v4mapsin6(udp_in, &udp_in6); 30743bbb6aaSRobert Watson append_sa = (struct sockaddr *)&udp_in6; 30843bbb6aaSRobert Watson } else 30943bbb6aaSRobert Watson #endif 31043bbb6aaSRobert Watson append_sa = (struct sockaddr *)udp_in; 31143bbb6aaSRobert Watson m_adj(n, off); 31243bbb6aaSRobert Watson 31343bbb6aaSRobert Watson so = inp->inp_socket; 31443bbb6aaSRobert Watson SOCKBUF_LOCK(&so->so_rcv); 31543bbb6aaSRobert Watson if (sbappendaddr_locked(&so->so_rcv, append_sa, n, opts) == 0) { 31643bbb6aaSRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 31743bbb6aaSRobert Watson m_freem(n); 31843bbb6aaSRobert Watson if (opts) 31943bbb6aaSRobert Watson m_freem(opts); 320026decb8SRobert Watson UDPSTAT_INC(udps_fullsock); 32143bbb6aaSRobert Watson } else 32243bbb6aaSRobert Watson sorwakeup_locked(so); 32343bbb6aaSRobert Watson } 32443bbb6aaSRobert Watson 325df8bae1dSRodney W. Grimes void 3263329b236SRobert Watson udp_input(struct mbuf *m, int off) 327df8bae1dSRodney W. Grimes { 328cfa1ca9dSYoshinobu Inoue int iphlen = off; 3293329b236SRobert Watson struct ip *ip; 3303329b236SRobert Watson struct udphdr *uh; 33171498f30SBruce M Simpson struct ifnet *ifp; 3323329b236SRobert Watson struct inpcb *inp; 333df8bae1dSRodney W. Grimes int len; 334df8bae1dSRodney W. Grimes struct ip save_ip; 335d4b509bdSRobert Watson struct sockaddr_in udp_in; 3360b4ae859SGleb Smirnoff #ifdef IPFIREWALL_FORWARD 3370b4ae859SGleb Smirnoff struct m_tag *fwd_tag; 3380b4ae859SGleb Smirnoff #endif 339df8bae1dSRodney W. Grimes 34071498f30SBruce M Simpson ifp = m->m_pkthdr.rcvif; 341026decb8SRobert Watson UDPSTAT_INC(udps_ipackets); 342df8bae1dSRodney W. Grimes 343df8bae1dSRodney W. Grimes /* 3443329b236SRobert Watson * Strip IP options, if any; should skip this, make available to 3453329b236SRobert Watson * user, and use on returned packets, but we don't yet have a way to 3463329b236SRobert Watson * check the checksum with options still present. 347df8bae1dSRodney W. Grimes */ 348df8bae1dSRodney W. Grimes if (iphlen > sizeof (struct ip)) { 349df8bae1dSRodney W. Grimes ip_stripoptions(m, (struct mbuf *)0); 350df8bae1dSRodney W. Grimes iphlen = sizeof(struct ip); 351df8bae1dSRodney W. Grimes } 352df8bae1dSRodney W. Grimes 353df8bae1dSRodney W. Grimes /* 354df8bae1dSRodney W. Grimes * Get IP and UDP header together in first mbuf. 355df8bae1dSRodney W. Grimes */ 356df8bae1dSRodney W. Grimes ip = mtod(m, struct ip *); 357df8bae1dSRodney W. Grimes if (m->m_len < iphlen + sizeof(struct udphdr)) { 358df8bae1dSRodney W. Grimes if ((m = m_pullup(m, iphlen + sizeof(struct udphdr))) == 0) { 359026decb8SRobert Watson UDPSTAT_INC(udps_hdrops); 360df8bae1dSRodney W. Grimes return; 361df8bae1dSRodney W. Grimes } 362df8bae1dSRodney W. Grimes ip = mtod(m, struct ip *); 363df8bae1dSRodney W. Grimes } 364df8bae1dSRodney W. Grimes uh = (struct udphdr *)((caddr_t)ip + iphlen); 365df8bae1dSRodney W. Grimes 3663329b236SRobert Watson /* 3673329b236SRobert Watson * Destination port of 0 is illegal, based on RFC768. 3683329b236SRobert Watson */ 369686cdd19SJun-ichiro itojun Hagino if (uh->uh_dport == 0) 370f76fcf6dSJeffrey Hsu goto badunlocked; 371686cdd19SJun-ichiro itojun Hagino 372df8bae1dSRodney W. Grimes /* 3733329b236SRobert Watson * Construct sockaddr format source address. Stuff source address 3743329b236SRobert Watson * and datagram in user buffer. 375b9234fafSSam Leffler */ 376d4b509bdSRobert Watson bzero(&udp_in, sizeof(udp_in)); 377d4b509bdSRobert Watson udp_in.sin_len = sizeof(udp_in); 378d4b509bdSRobert Watson udp_in.sin_family = AF_INET; 379b9234fafSSam Leffler udp_in.sin_port = uh->uh_sport; 380b9234fafSSam Leffler udp_in.sin_addr = ip->ip_src; 381b9234fafSSam Leffler 382b9234fafSSam Leffler /* 383af1ee11dSRobert Watson * Make mbuf data length reflect UDP length. If not enough data to 384af1ee11dSRobert Watson * reflect UDP length, drop. 385df8bae1dSRodney W. Grimes */ 386df8bae1dSRodney W. Grimes len = ntohs((u_short)uh->uh_ulen); 387df8bae1dSRodney W. Grimes if (ip->ip_len != len) { 3887eb7a449SAndras Olah if (len > ip->ip_len || len < sizeof(struct udphdr)) { 389026decb8SRobert Watson UDPSTAT_INC(udps_badlen); 390f76fcf6dSJeffrey Hsu goto badunlocked; 391df8bae1dSRodney W. Grimes } 392df8bae1dSRodney W. Grimes m_adj(m, len - ip->ip_len); 393df8bae1dSRodney W. Grimes /* ip->ip_len = len; */ 394df8bae1dSRodney W. Grimes } 3953329b236SRobert Watson 396df8bae1dSRodney W. Grimes /* 3973329b236SRobert Watson * Save a copy of the IP header in case we want restore it for 3983329b236SRobert Watson * sending an ICMP error message in response. 399df8bae1dSRodney W. Grimes */ 400603724d3SBjoern A. Zeeb if (!V_udp_blackhole) 401df8bae1dSRodney W. Grimes save_ip = *ip; 402cce418d3SMatt Jacob else 403cce418d3SMatt Jacob memset(&save_ip, 0, sizeof(save_ip)); 404df8bae1dSRodney W. Grimes 405df8bae1dSRodney W. Grimes /* 406df8bae1dSRodney W. Grimes * Checksum extended UDP header and data. 407df8bae1dSRodney W. Grimes */ 4086dfab5b1SGarrett Wollman if (uh->uh_sum) { 40939629c92SDavid Malone u_short uh_sum; 41039629c92SDavid Malone 411db4f9cc7SJonathan Lemon if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) { 412db4f9cc7SJonathan Lemon if (m->m_pkthdr.csum_flags & CSUM_PSEUDO_HDR) 41339629c92SDavid Malone uh_sum = m->m_pkthdr.csum_data; 414db4f9cc7SJonathan Lemon else 41539629c92SDavid Malone uh_sum = in_pseudo(ip->ip_src.s_addr, 416506f4949SRuslan Ermilov ip->ip_dst.s_addr, htonl((u_short)len + 417db4f9cc7SJonathan Lemon m->m_pkthdr.csum_data + IPPROTO_UDP)); 41839629c92SDavid Malone uh_sum ^= 0xffff; 419db4f9cc7SJonathan Lemon } else { 420cb342100SHajimu UMEMOTO char b[9]; 421af1ee11dSRobert Watson 422cb342100SHajimu UMEMOTO bcopy(((struct ipovly *)ip)->ih_x1, b, 9); 4236effc713SDoug Rabson bzero(((struct ipovly *)ip)->ih_x1, 9); 424df8bae1dSRodney W. Grimes ((struct ipovly *)ip)->ih_len = uh->uh_ulen; 42539629c92SDavid Malone uh_sum = in_cksum(m, len + sizeof (struct ip)); 426cb342100SHajimu UMEMOTO bcopy(b, ((struct ipovly *)ip)->ih_x1, 9); 427db4f9cc7SJonathan Lemon } 42839629c92SDavid Malone if (uh_sum) { 429026decb8SRobert Watson UDPSTAT_INC(udps_badsum); 430df8bae1dSRodney W. Grimes m_freem(m); 431df8bae1dSRodney W. Grimes return; 432df8bae1dSRodney W. Grimes } 433fb9aaba0SRuslan Ermilov } else 434026decb8SRobert Watson UDPSTAT_INC(udps_nosum); 435df8bae1dSRodney W. Grimes 4360b4ae859SGleb Smirnoff #ifdef IPFIREWALL_FORWARD 4373329b236SRobert Watson /* 4383329b236SRobert Watson * Grab info from PACKET_TAG_IPFORWARD tag prepended to the chain. 4393329b236SRobert Watson */ 4400b4ae859SGleb Smirnoff fwd_tag = m_tag_find(m, PACKET_TAG_IPFORWARD, NULL); 4410b4ae859SGleb Smirnoff if (fwd_tag != NULL) { 4420b4ae859SGleb Smirnoff struct sockaddr_in *next_hop; 4430b4ae859SGleb Smirnoff 4443329b236SRobert Watson /* 4453329b236SRobert Watson * Do the hack. 4463329b236SRobert Watson */ 4470b4ae859SGleb Smirnoff next_hop = (struct sockaddr_in *)(fwd_tag + 1); 4480b4ae859SGleb Smirnoff ip->ip_dst = next_hop->sin_addr; 4490b4ae859SGleb Smirnoff uh->uh_dport = ntohs(next_hop->sin_port); 4503329b236SRobert Watson 4513329b236SRobert Watson /* 4523329b236SRobert Watson * Remove the tag from the packet. We don't need it anymore. 4533329b236SRobert Watson */ 4540b4ae859SGleb Smirnoff m_tag_delete(m, fwd_tag); 4550b4ae859SGleb Smirnoff } 4560b4ae859SGleb Smirnoff #endif 4570b4ae859SGleb Smirnoff 458603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 459df8bae1dSRodney W. Grimes if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) || 46071498f30SBruce M Simpson in_broadcast(ip->ip_dst, ifp)) { 46182c23ebaSBill Fenner struct inpcb *last; 46271498f30SBruce M Simpson struct ip_moptions *imo; 4633329b236SRobert Watson 464df8bae1dSRodney W. Grimes last = NULL; 465603724d3SBjoern A. Zeeb LIST_FOREACH(inp, &V_udb, inp_list) { 4669c1df695SRobert Watson if (inp->inp_lport != uh->uh_dport) 467f76fcf6dSJeffrey Hsu continue; 468cfa1ca9dSYoshinobu Inoue #ifdef INET6 469369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 4709c1df695SRobert Watson continue; 471cfa1ca9dSYoshinobu Inoue #endif 47271498f30SBruce M Simpson if (inp->inp_laddr.s_addr != INADDR_ANY && 47371498f30SBruce M Simpson inp->inp_laddr.s_addr != ip->ip_dst.s_addr) 4749c1df695SRobert Watson continue; 47571498f30SBruce M Simpson if (inp->inp_faddr.s_addr != INADDR_ANY && 47671498f30SBruce M Simpson inp->inp_faddr.s_addr != ip->ip_src.s_addr) 47771498f30SBruce M Simpson continue; 47871498f30SBruce M Simpson if (inp->inp_fport != 0 && 479df8bae1dSRodney W. Grimes inp->inp_fport != uh->uh_sport) 4809c1df695SRobert Watson continue; 48171498f30SBruce M Simpson 482119d85f6SRobert Watson INP_RLOCK(inp); 483df8bae1dSRodney W. Grimes 48483453a06SBruce M Simpson /* 48571498f30SBruce M Simpson * Handle socket delivery policy for any-source 48671498f30SBruce M Simpson * and source-specific multicast. [RFC3678] 48783453a06SBruce M Simpson */ 48871498f30SBruce M Simpson imo = inp->inp_moptions; 489a38b1c8cSRandall Stewart if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr))) { 490d10910e6SBruce M Simpson struct sockaddr_in group; 491d10910e6SBruce M Simpson int blocked; 492a38b1c8cSRandall Stewart if (imo == NULL) { 493a38b1c8cSRandall Stewart INP_RUNLOCK(inp); 494a38b1c8cSRandall Stewart continue; 495a38b1c8cSRandall Stewart } 496d10910e6SBruce M Simpson bzero(&group, sizeof(struct sockaddr_in)); 497d10910e6SBruce M Simpson group.sin_len = sizeof(struct sockaddr_in); 498d10910e6SBruce M Simpson group.sin_family = AF_INET; 499d10910e6SBruce M Simpson group.sin_addr = ip->ip_dst; 50071498f30SBruce M Simpson 501d10910e6SBruce M Simpson blocked = imo_multi_filter(imo, ifp, 502d10910e6SBruce M Simpson (struct sockaddr *)&group, 50371498f30SBruce M Simpson (struct sockaddr *)&udp_in); 504d10910e6SBruce M Simpson if (blocked != MCAST_PASS) { 505d10910e6SBruce M Simpson if (blocked == MCAST_NOTGMEMBER) 50686425c62SRobert Watson IPSTAT_INC(ips_notmember); 507d10910e6SBruce M Simpson if (blocked == MCAST_NOTSMEMBER || 508d10910e6SBruce M Simpson blocked == MCAST_MUTED) 509026decb8SRobert Watson UDPSTAT_INC(udps_filtermcast); 510119d85f6SRobert Watson INP_RUNLOCK(inp); 5119c1df695SRobert Watson continue; 5129c1df695SRobert Watson } 51383453a06SBruce M Simpson } 514df8bae1dSRodney W. Grimes if (last != NULL) { 515df8bae1dSRodney W. Grimes struct mbuf *n; 516df8bae1dSRodney W. Grimes 517032dcc76SLuigi Rizzo n = m_copy(m, 0, M_COPYALL); 518*79bb84fbSEdward Tomasz Napierala udp_append(last, ip, n, iphlen, &udp_in); 5196a9148feSBjoern A. Zeeb INP_RUNLOCK(last); 520df8bae1dSRodney W. Grimes } 52182c23ebaSBill Fenner last = inp; 522df8bae1dSRodney W. Grimes /* 523df8bae1dSRodney W. Grimes * Don't look for additional matches if this one does 524df8bae1dSRodney W. Grimes * not have either the SO_REUSEPORT or SO_REUSEADDR 5253329b236SRobert Watson * socket options set. This heuristic avoids 5263329b236SRobert Watson * searching through all pcbs in the common case of a 5273329b236SRobert Watson * non-shared port. It assumes that an application 5283329b236SRobert Watson * will never clear these options after setting them. 529df8bae1dSRodney W. Grimes */ 5303329b236SRobert Watson if ((last->inp_socket->so_options & 5313329b236SRobert Watson (SO_REUSEPORT|SO_REUSEADDR)) == 0) 532df8bae1dSRodney W. Grimes break; 533df8bae1dSRodney W. Grimes } 534df8bae1dSRodney W. Grimes 535df8bae1dSRodney W. Grimes if (last == NULL) { 536df8bae1dSRodney W. Grimes /* 5373329b236SRobert Watson * No matching pcb found; discard datagram. (No need 5383329b236SRobert Watson * to send an ICMP Port Unreachable for a broadcast 5393329b236SRobert Watson * or multicast datgram.) 540df8bae1dSRodney W. Grimes */ 541026decb8SRobert Watson UDPSTAT_INC(udps_noportbcast); 54261ffc0b1SJeffrey Hsu goto badheadlocked; 543df8bae1dSRodney W. Grimes } 544*79bb84fbSEdward Tomasz Napierala udp_append(last, ip, m, iphlen, &udp_in); 545c7c7ea4bSRandall Stewart INP_RUNLOCK(last); 546c7c7ea4bSRandall Stewart INP_INFO_RUNLOCK(&V_udbinfo); 547df8bae1dSRodney W. Grimes return; 548df8bae1dSRodney W. Grimes } 5493329b236SRobert Watson 550df8bae1dSRodney W. Grimes /* 5516d6a026bSDavid Greenman * Locate pcb for datagram. 552df8bae1dSRodney W. Grimes */ 553603724d3SBjoern A. Zeeb inp = in_pcblookup_hash(&V_udbinfo, ip->ip_src, uh->uh_sport, 55471498f30SBruce M Simpson ip->ip_dst, uh->uh_dport, 1, ifp); 55515bd2b43SDavid Greenman if (inp == NULL) { 556afdb4274SRobert Watson if (udp_log_in_vain) { 557df5c0b8aSBill Fenner char buf[4*sizeof "123"]; 55875cfc95fSAndrey A. Chernov 55975cfc95fSAndrey A. Chernov strcpy(buf, inet_ntoa(ip->ip_dst)); 560592071e8SBruce Evans log(LOG_INFO, 561592071e8SBruce Evans "Connection attempt to UDP %s:%d from %s:%d\n", 562592071e8SBruce Evans buf, ntohs(uh->uh_dport), inet_ntoa(ip->ip_src), 563592071e8SBruce Evans ntohs(uh->uh_sport)); 56475cfc95fSAndrey A. Chernov } 565026decb8SRobert Watson UDPSTAT_INC(udps_noport); 566df8bae1dSRodney W. Grimes if (m->m_flags & (M_BCAST | M_MCAST)) { 567026decb8SRobert Watson UDPSTAT_INC(udps_noportbcast); 56861ffc0b1SJeffrey Hsu goto badheadlocked; 569df8bae1dSRodney W. Grimes } 570603724d3SBjoern A. Zeeb if (V_udp_blackhole) 57161ffc0b1SJeffrey Hsu goto badheadlocked; 5721cbd978eSLuigi Rizzo if (badport_bandlim(BANDLIM_ICMP_UNREACH) < 0) 5731cbd978eSLuigi Rizzo goto badheadlocked; 57404287599SRuslan Ermilov *ip = save_ip; 57504287599SRuslan Ermilov ip->ip_len += iphlen; 576582a7760SBruce Evans icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_PORT, 0, 0); 577603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 578df8bae1dSRodney W. Grimes return; 579df8bae1dSRodney W. Grimes } 5803329b236SRobert Watson 5813329b236SRobert Watson /* 5823329b236SRobert Watson * Check the minimum TTL for socket. 5833329b236SRobert Watson */ 584119d85f6SRobert Watson INP_RLOCK(inp); 585603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 58610cc62b7SRobert Watson if (inp->inp_ip_minttl && inp->inp_ip_minttl > ip->ip_ttl) { 58710cc62b7SRobert Watson INP_RUNLOCK(inp); 58810cc62b7SRobert Watson goto badunlocked; 58910cc62b7SRobert Watson } 590*79bb84fbSEdward Tomasz Napierala udp_append(inp, ip, m, iphlen, &udp_in); 591119d85f6SRobert Watson INP_RUNLOCK(inp); 592df8bae1dSRodney W. Grimes return; 59361ffc0b1SJeffrey Hsu 59461ffc0b1SJeffrey Hsu badheadlocked: 595f76fcf6dSJeffrey Hsu if (inp) 596119d85f6SRobert Watson INP_RUNLOCK(inp); 597603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 598f76fcf6dSJeffrey Hsu badunlocked: 599df8bae1dSRodney W. Grimes m_freem(m); 600cfa1ca9dSYoshinobu Inoue } 601cfa1ca9dSYoshinobu Inoue 602cfa1ca9dSYoshinobu Inoue /* 6033329b236SRobert Watson * Notify a udp user of an asynchronous error; just wake up so that they can 6043329b236SRobert Watson * collect error status. 605df8bae1dSRodney W. Grimes */ 6063ce144eaSJeffrey Hsu struct inpcb * 6073329b236SRobert Watson udp_notify(struct inpcb *inp, int errno) 608df8bae1dSRodney W. Grimes { 6093329b236SRobert Watson 610ac9ae279SRobert Watson /* 611ac9ae279SRobert Watson * While udp_ctlinput() always calls udp_notify() with a read lock 612ac9ae279SRobert Watson * when invoking it directly, in_pcbnotifyall() currently uses write 613ac9ae279SRobert Watson * locks due to sharing code with TCP. For now, accept either a read 614ac9ae279SRobert Watson * or a write lock, but a read lock is sufficient. 615ac9ae279SRobert Watson */ 616ac9ae279SRobert Watson INP_LOCK_ASSERT(inp); 6178501a69cSRobert Watson 618df8bae1dSRodney W. Grimes inp->inp_socket->so_error = errno; 619df8bae1dSRodney W. Grimes sorwakeup(inp->inp_socket); 620df8bae1dSRodney W. Grimes sowwakeup(inp->inp_socket); 6213329b236SRobert Watson return (inp); 622df8bae1dSRodney W. Grimes } 623df8bae1dSRodney W. Grimes 624df8bae1dSRodney W. Grimes void 6253329b236SRobert Watson udp_ctlinput(int cmd, struct sockaddr *sa, void *vip) 626df8bae1dSRodney W. Grimes { 627c693a045SJonathan Lemon struct ip *ip = vip; 628c693a045SJonathan Lemon struct udphdr *uh; 629c693a045SJonathan Lemon struct in_addr faddr; 630c693a045SJonathan Lemon struct inpcb *inp; 631c693a045SJonathan Lemon 632c693a045SJonathan Lemon faddr = ((struct sockaddr_in *)sa)->sin_addr; 633c693a045SJonathan Lemon if (sa->sa_family != AF_INET || faddr.s_addr == INADDR_ANY) 634c693a045SJonathan Lemon return; 635df8bae1dSRodney W. Grimes 63697d8d152SAndre Oppermann /* 63797d8d152SAndre Oppermann * Redirects don't need to be handled up here. 63897d8d152SAndre Oppermann */ 63997d8d152SAndre Oppermann if (PRC_IS_REDIRECT(cmd)) 64097d8d152SAndre Oppermann return; 6413329b236SRobert Watson 64297d8d152SAndre Oppermann /* 64397d8d152SAndre Oppermann * Hostdead is ugly because it goes linearly through all PCBs. 6443329b236SRobert Watson * 6453329b236SRobert Watson * XXX: We never get this from ICMP, otherwise it makes an excellent 6463329b236SRobert Watson * DoS attack on machines with many connections. 64797d8d152SAndre Oppermann */ 64897d8d152SAndre Oppermann if (cmd == PRC_HOSTDEAD) 649af1ee11dSRobert Watson ip = NULL; 650d1c54148SJesper Skriver else if ((unsigned)cmd >= PRC_NCMDS || inetctlerrmap[cmd] == 0) 651df8bae1dSRodney W. Grimes return; 652af1ee11dSRobert Watson if (ip != NULL) { 653df8bae1dSRodney W. Grimes uh = (struct udphdr *)((caddr_t)ip + (ip->ip_hl << 2)); 654603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 655603724d3SBjoern A. Zeeb inp = in_pcblookup_hash(&V_udbinfo, faddr, uh->uh_dport, 656c693a045SJonathan Lemon ip->ip_src, uh->uh_sport, 0, NULL); 657f76fcf6dSJeffrey Hsu if (inp != NULL) { 658ac9ae279SRobert Watson INP_RLOCK(inp); 659f76fcf6dSJeffrey Hsu if (inp->inp_socket != NULL) { 660f5514f08SRobert Watson udp_notify(inp, inetctlerrmap[cmd]); 661f76fcf6dSJeffrey Hsu } 662ac9ae279SRobert Watson INP_RUNLOCK(inp); 663f76fcf6dSJeffrey Hsu } 664603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 665df8bae1dSRodney W. Grimes } else 666603724d3SBjoern A. Zeeb in_pcbnotifyall(&V_udbinfo, faddr, inetctlerrmap[cmd], 667f5514f08SRobert Watson udp_notify); 668df8bae1dSRodney W. Grimes } 669df8bae1dSRodney W. Grimes 6700312fbe9SPoul-Henning Kamp static int 67182d9ae4eSPoul-Henning Kamp udp_pcblist(SYSCTL_HANDLER_ARGS) 67298271db4SGarrett Wollman { 673277afaffSRobert Watson int error, i, n; 67498271db4SGarrett Wollman struct inpcb *inp, **inp_list; 67598271db4SGarrett Wollman inp_gen_t gencnt; 67698271db4SGarrett Wollman struct xinpgen xig; 67798271db4SGarrett Wollman 67898271db4SGarrett Wollman /* 679f5514f08SRobert Watson * The process of preparing the PCB list is too time-consuming and 68098271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 68198271db4SGarrett Wollman */ 68298271db4SGarrett Wollman if (req->oldptr == 0) { 683603724d3SBjoern A. Zeeb n = V_udbinfo.ipi_count; 684c007b96aSJohn Baldwin n += imax(n / 8, 10); 685c007b96aSJohn Baldwin req->oldidx = 2 * (sizeof xig) + n * sizeof(struct xinpcb); 6863329b236SRobert Watson return (0); 68798271db4SGarrett Wollman } 68898271db4SGarrett Wollman 68998271db4SGarrett Wollman if (req->newptr != 0) 6903329b236SRobert Watson return (EPERM); 69198271db4SGarrett Wollman 69298271db4SGarrett Wollman /* 69398271db4SGarrett Wollman * OK, now we're committed to doing something. 69498271db4SGarrett Wollman */ 695603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 696603724d3SBjoern A. Zeeb gencnt = V_udbinfo.ipi_gencnt; 697603724d3SBjoern A. Zeeb n = V_udbinfo.ipi_count; 698603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 69998271db4SGarrett Wollman 70047934cefSDon Lewis error = sysctl_wire_old_buffer(req, 2 * (sizeof xig) 7015c38b6dbSDon Lewis + n * sizeof(struct xinpcb)); 70247934cefSDon Lewis if (error != 0) 70347934cefSDon Lewis return (error); 7045c38b6dbSDon Lewis 70598271db4SGarrett Wollman xig.xig_len = sizeof xig; 70698271db4SGarrett Wollman xig.xig_count = n; 70798271db4SGarrett Wollman xig.xig_gen = gencnt; 70898271db4SGarrett Wollman xig.xig_sogen = so_gencnt; 70998271db4SGarrett Wollman error = SYSCTL_OUT(req, &xig, sizeof xig); 71098271db4SGarrett Wollman if (error) 7113329b236SRobert Watson return (error); 71298271db4SGarrett Wollman 713a163d034SWarner Losh inp_list = malloc(n * sizeof *inp_list, M_TEMP, M_WAITOK); 71498271db4SGarrett Wollman if (inp_list == 0) 7153329b236SRobert Watson return (ENOMEM); 71698271db4SGarrett Wollman 717603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 718603724d3SBjoern A. Zeeb for (inp = LIST_FIRST(V_udbinfo.ipi_listhead), i = 0; inp && i < n; 719fc2ffbe6SPoul-Henning Kamp inp = LIST_NEXT(inp, inp_list)) { 720d0e157f6SBjoern A. Zeeb INP_WLOCK(inp); 7212ded288cSJeffrey Hsu if (inp->inp_gencnt <= gencnt && 722d0e157f6SBjoern A. Zeeb cr_canseeinpcb(req->td->td_ucred, inp) == 0) { 723d0e157f6SBjoern A. Zeeb in_pcbref(inp); 72498271db4SGarrett Wollman inp_list[i++] = inp; 725d0e157f6SBjoern A. Zeeb } 726d0e157f6SBjoern A. Zeeb INP_WUNLOCK(inp); 7274787fd37SPaul Saab } 728603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 72998271db4SGarrett Wollman n = i; 73098271db4SGarrett Wollman 73198271db4SGarrett Wollman error = 0; 73298271db4SGarrett Wollman for (i = 0; i < n; i++) { 73398271db4SGarrett Wollman inp = inp_list[i]; 7349622e84fSRobert Watson INP_RLOCK(inp); 73598271db4SGarrett Wollman if (inp->inp_gencnt <= gencnt) { 73698271db4SGarrett Wollman struct xinpcb xi; 737d0e157f6SBjoern A. Zeeb 738fd94099eSColin Percival bzero(&xi, sizeof(xi)); 73998271db4SGarrett Wollman xi.xi_len = sizeof xi; 74098271db4SGarrett Wollman /* XXX should avoid extra copy */ 74198271db4SGarrett Wollman bcopy(inp, &xi.xi_inp, sizeof *inp); 74298271db4SGarrett Wollman if (inp->inp_socket) 74398271db4SGarrett Wollman sotoxsocket(inp->inp_socket, &xi.xi_socket); 7444b40c56cSJeffrey Hsu xi.xi_inp.inp_gencnt = inp->inp_gencnt; 7459622e84fSRobert Watson INP_RUNLOCK(inp); 74698271db4SGarrett Wollman error = SYSCTL_OUT(req, &xi, sizeof xi); 747d915b280SStephan Uphoff } else 7489622e84fSRobert Watson INP_RUNLOCK(inp); 74998271db4SGarrett Wollman } 750d0e157f6SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 751d0e157f6SBjoern A. Zeeb for (i = 0; i < n; i++) { 752d0e157f6SBjoern A. Zeeb inp = inp_list[i]; 753d0e157f6SBjoern A. Zeeb INP_WLOCK(inp); 754d0e157f6SBjoern A. Zeeb if (!in_pcbrele(inp)) 755d0e157f6SBjoern A. Zeeb INP_WUNLOCK(inp); 756d0e157f6SBjoern A. Zeeb } 757d0e157f6SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 758d0e157f6SBjoern A. Zeeb 75998271db4SGarrett Wollman if (!error) { 76098271db4SGarrett Wollman /* 7613329b236SRobert Watson * Give the user an updated idea of our state. If the 7623329b236SRobert Watson * generation differs from what we told her before, she knows 7633329b236SRobert Watson * that something happened while we were processing this 7643329b236SRobert Watson * request, and it might be necessary to retry. 76598271db4SGarrett Wollman */ 766603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 767603724d3SBjoern A. Zeeb xig.xig_gen = V_udbinfo.ipi_gencnt; 76898271db4SGarrett Wollman xig.xig_sogen = so_gencnt; 769603724d3SBjoern A. Zeeb xig.xig_count = V_udbinfo.ipi_count; 770603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 77198271db4SGarrett Wollman error = SYSCTL_OUT(req, &xig, sizeof xig); 77298271db4SGarrett Wollman } 77398271db4SGarrett Wollman free(inp_list, M_TEMP); 7743329b236SRobert Watson return (error); 77598271db4SGarrett Wollman } 77698271db4SGarrett Wollman 77779c3d51bSMatthew D Fleming SYSCTL_PROC(_net_inet_udp, UDPCTL_PCBLIST, pcblist, 77879c3d51bSMatthew D Fleming CTLTYPE_OPAQUE | CTLFLAG_RD, NULL, 0, 77998271db4SGarrett Wollman udp_pcblist, "S,xinpcb", "List of active UDP sockets"); 78098271db4SGarrett Wollman 78198271db4SGarrett Wollman static int 78282d9ae4eSPoul-Henning Kamp udp_getcred(SYSCTL_HANDLER_ARGS) 783490d50b6SBrian Feldman { 784c0511d3bSBrian Feldman struct xucred xuc; 785490d50b6SBrian Feldman struct sockaddr_in addrs[2]; 786490d50b6SBrian Feldman struct inpcb *inp; 787277afaffSRobert Watson int error; 788490d50b6SBrian Feldman 78932f9753cSRobert Watson error = priv_check(req->td, PRIV_NETINET_GETCRED); 790490d50b6SBrian Feldman if (error) 791490d50b6SBrian Feldman return (error); 792490d50b6SBrian Feldman error = SYSCTL_IN(req, addrs, sizeof(addrs)); 793490d50b6SBrian Feldman if (error) 794490d50b6SBrian Feldman return (error); 795603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 796603724d3SBjoern A. Zeeb inp = in_pcblookup_hash(&V_udbinfo, addrs[1].sin_addr, addrs[1].sin_port, 797cfa1ca9dSYoshinobu Inoue addrs[0].sin_addr, addrs[0].sin_port, 1, NULL); 7989622e84fSRobert Watson if (inp != NULL) { 7999622e84fSRobert Watson INP_RLOCK(inp); 800603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 8019622e84fSRobert Watson if (inp->inp_socket == NULL) 8029622e84fSRobert Watson error = ENOENT; 8039622e84fSRobert Watson if (error == 0) 804f08ef6c5SBjoern A. Zeeb error = cr_canseeinpcb(req->td->td_ucred, inp); 8059622e84fSRobert Watson if (error == 0) 80686d02c5cSBjoern A. Zeeb cru2x(inp->inp_cred, &xuc); 8079622e84fSRobert Watson INP_RUNLOCK(inp); 8089622e84fSRobert Watson } else { 809603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 8109622e84fSRobert Watson error = ENOENT; 8119622e84fSRobert Watson } 8120e1eebb8SDon Lewis if (error == 0) 8130e1eebb8SDon Lewis error = SYSCTL_OUT(req, &xuc, sizeof(struct xucred)); 814490d50b6SBrian Feldman return (error); 815490d50b6SBrian Feldman } 816490d50b6SBrian Feldman 8177ce87f12SDavid Malone SYSCTL_PROC(_net_inet_udp, OID_AUTO, getcred, 8187ce87f12SDavid Malone CTLTYPE_OPAQUE|CTLFLAG_RW|CTLFLAG_PRISON, 0, 0, 8197ce87f12SDavid Malone udp_getcred, "S,xucred", "Get the xucred of a UDP connection"); 820490d50b6SBrian Feldman 8217b495c44SVANHULLEBUS Yvan int 8227b495c44SVANHULLEBUS Yvan udp_ctloutput(struct socket *so, struct sockopt *sopt) 8237b495c44SVANHULLEBUS Yvan { 8247b495c44SVANHULLEBUS Yvan int error = 0, optval; 8257b495c44SVANHULLEBUS Yvan struct inpcb *inp; 8267b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8277b495c44SVANHULLEBUS Yvan struct udpcb *up; 8287b495c44SVANHULLEBUS Yvan #endif 8297b495c44SVANHULLEBUS Yvan 8307b495c44SVANHULLEBUS Yvan inp = sotoinpcb(so); 8317b495c44SVANHULLEBUS Yvan KASSERT(inp != NULL, ("%s: inp == NULL", __func__)); 8327b495c44SVANHULLEBUS Yvan INP_WLOCK(inp); 8337b495c44SVANHULLEBUS Yvan if (sopt->sopt_level != IPPROTO_UDP) { 8347b495c44SVANHULLEBUS Yvan #ifdef INET6 8357b495c44SVANHULLEBUS Yvan if (INP_CHECK_SOCKAF(so, AF_INET6)) { 8367b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8377b495c44SVANHULLEBUS Yvan error = ip6_ctloutput(so, sopt); 8387b495c44SVANHULLEBUS Yvan } else { 8397b495c44SVANHULLEBUS Yvan #endif 8407b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8417b495c44SVANHULLEBUS Yvan error = ip_ctloutput(so, sopt); 8427b495c44SVANHULLEBUS Yvan #ifdef INET6 8437b495c44SVANHULLEBUS Yvan } 8447b495c44SVANHULLEBUS Yvan #endif 8457b495c44SVANHULLEBUS Yvan return (error); 8467b495c44SVANHULLEBUS Yvan } 8477b495c44SVANHULLEBUS Yvan 8487b495c44SVANHULLEBUS Yvan switch (sopt->sopt_dir) { 8497b495c44SVANHULLEBUS Yvan case SOPT_SET: 8507b495c44SVANHULLEBUS Yvan switch (sopt->sopt_name) { 8517b495c44SVANHULLEBUS Yvan case UDP_ENCAP: 8527b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8537b495c44SVANHULLEBUS Yvan error = sooptcopyin(sopt, &optval, sizeof optval, 8547b495c44SVANHULLEBUS Yvan sizeof optval); 8557b495c44SVANHULLEBUS Yvan if (error) 8567b495c44SVANHULLEBUS Yvan break; 8577b495c44SVANHULLEBUS Yvan inp = sotoinpcb(so); 8587b495c44SVANHULLEBUS Yvan KASSERT(inp != NULL, ("%s: inp == NULL", __func__)); 8597b495c44SVANHULLEBUS Yvan INP_WLOCK(inp); 8607b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8617b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 8627b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: up == NULL", __func__)); 8637b495c44SVANHULLEBUS Yvan #endif 8647b495c44SVANHULLEBUS Yvan switch (optval) { 8657b495c44SVANHULLEBUS Yvan case 0: 8667b495c44SVANHULLEBUS Yvan /* Clear all UDP encap. */ 8677b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8687b495c44SVANHULLEBUS Yvan up->u_flags &= ~UF_ESPINUDP_ALL; 8697b495c44SVANHULLEBUS Yvan #endif 8707b495c44SVANHULLEBUS Yvan break; 8717b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8727b495c44SVANHULLEBUS Yvan case UDP_ENCAP_ESPINUDP: 8737b495c44SVANHULLEBUS Yvan case UDP_ENCAP_ESPINUDP_NON_IKE: 8747b495c44SVANHULLEBUS Yvan up->u_flags &= ~UF_ESPINUDP_ALL; 8757b495c44SVANHULLEBUS Yvan if (optval == UDP_ENCAP_ESPINUDP) 8767b495c44SVANHULLEBUS Yvan up->u_flags |= UF_ESPINUDP; 8777b495c44SVANHULLEBUS Yvan else if (optval == UDP_ENCAP_ESPINUDP_NON_IKE) 8787b495c44SVANHULLEBUS Yvan up->u_flags |= UF_ESPINUDP_NON_IKE; 8797b495c44SVANHULLEBUS Yvan break; 8807b495c44SVANHULLEBUS Yvan #endif 8817b495c44SVANHULLEBUS Yvan default: 8827b495c44SVANHULLEBUS Yvan error = EINVAL; 8837b495c44SVANHULLEBUS Yvan break; 8847b495c44SVANHULLEBUS Yvan } 8857b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8867b495c44SVANHULLEBUS Yvan break; 8877b495c44SVANHULLEBUS Yvan default: 8887b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8897b495c44SVANHULLEBUS Yvan error = ENOPROTOOPT; 8907b495c44SVANHULLEBUS Yvan break; 8917b495c44SVANHULLEBUS Yvan } 8927b495c44SVANHULLEBUS Yvan break; 8937b495c44SVANHULLEBUS Yvan case SOPT_GET: 8947b495c44SVANHULLEBUS Yvan switch (sopt->sopt_name) { 8957b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8967b495c44SVANHULLEBUS Yvan case UDP_ENCAP: 8977b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 8987b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: up == NULL", __func__)); 8997b495c44SVANHULLEBUS Yvan optval = up->u_flags & UF_ESPINUDP_ALL; 9007b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 9017b495c44SVANHULLEBUS Yvan error = sooptcopyout(sopt, &optval, sizeof optval); 9027b495c44SVANHULLEBUS Yvan break; 9037b495c44SVANHULLEBUS Yvan #endif 9047b495c44SVANHULLEBUS Yvan default: 9057b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 9067b495c44SVANHULLEBUS Yvan error = ENOPROTOOPT; 9077b495c44SVANHULLEBUS Yvan break; 9087b495c44SVANHULLEBUS Yvan } 9097b495c44SVANHULLEBUS Yvan break; 9107b495c44SVANHULLEBUS Yvan } 9117b495c44SVANHULLEBUS Yvan return (error); 9127b495c44SVANHULLEBUS Yvan } 9137b495c44SVANHULLEBUS Yvan 914490d50b6SBrian Feldman static int 9153329b236SRobert Watson udp_output(struct inpcb *inp, struct mbuf *m, struct sockaddr *addr, 9163329b236SRobert Watson struct mbuf *control, struct thread *td) 917df8bae1dSRodney W. Grimes { 9183329b236SRobert Watson struct udpiphdr *ui; 9193329b236SRobert Watson int len = m->m_pkthdr.len; 92090162a4eSIan Dowse struct in_addr faddr, laddr; 921c557ae16SIan Dowse struct cmsghdr *cm; 922c557ae16SIan Dowse struct sockaddr_in *sin, src; 92390162a4eSIan Dowse int error = 0; 9248afa2304SBruce M Simpson int ipflags; 92590162a4eSIan Dowse u_short fport, lport; 9265c32ea65SRobert Watson int unlock_udbinfo; 927df8bae1dSRodney W. Grimes 9285c32ea65SRobert Watson /* 9295c32ea65SRobert Watson * udp_output() may need to temporarily bind or connect the current 930f5514f08SRobert Watson * inpcb. As such, we don't know up front whether we will need the 931f5514f08SRobert Watson * pcbinfo lock or not. Do any work to decide what is needed up 932f5514f08SRobert Watson * front before acquiring any locks. 9335c32ea65SRobert Watson */ 934430d30d8SBill Fenner if (len + sizeof(struct udpiphdr) > IP_MAXPACKET) { 935c557ae16SIan Dowse if (control) 936c557ae16SIan Dowse m_freem(control); 9375c32ea65SRobert Watson m_freem(m); 9383329b236SRobert Watson return (EMSGSIZE); 939430d30d8SBill Fenner } 940430d30d8SBill Fenner 9411b7f0384SBruce M Simpson src.sin_family = 0; 942c557ae16SIan Dowse if (control != NULL) { 943c557ae16SIan Dowse /* 9443329b236SRobert Watson * XXX: Currently, we assume all the optional information is 9453329b236SRobert Watson * stored in a single mbuf. 946c557ae16SIan Dowse */ 947c557ae16SIan Dowse if (control->m_next) { 948c557ae16SIan Dowse m_freem(control); 9495c32ea65SRobert Watson m_freem(m); 9503329b236SRobert Watson return (EINVAL); 951c557ae16SIan Dowse } 952c557ae16SIan Dowse for (; control->m_len > 0; 953c557ae16SIan Dowse control->m_data += CMSG_ALIGN(cm->cmsg_len), 954c557ae16SIan Dowse control->m_len -= CMSG_ALIGN(cm->cmsg_len)) { 955c557ae16SIan Dowse cm = mtod(control, struct cmsghdr *); 956af1ee11dSRobert Watson if (control->m_len < sizeof(*cm) || cm->cmsg_len == 0 957af1ee11dSRobert Watson || cm->cmsg_len > control->m_len) { 958c557ae16SIan Dowse error = EINVAL; 959c557ae16SIan Dowse break; 960c557ae16SIan Dowse } 961c557ae16SIan Dowse if (cm->cmsg_level != IPPROTO_IP) 962c557ae16SIan Dowse continue; 963c557ae16SIan Dowse 964c557ae16SIan Dowse switch (cm->cmsg_type) { 965c557ae16SIan Dowse case IP_SENDSRCADDR: 966c557ae16SIan Dowse if (cm->cmsg_len != 967c557ae16SIan Dowse CMSG_LEN(sizeof(struct in_addr))) { 968c557ae16SIan Dowse error = EINVAL; 969c557ae16SIan Dowse break; 970c557ae16SIan Dowse } 971c557ae16SIan Dowse bzero(&src, sizeof(src)); 972c557ae16SIan Dowse src.sin_family = AF_INET; 973c557ae16SIan Dowse src.sin_len = sizeof(src); 974c557ae16SIan Dowse src.sin_port = inp->inp_lport; 975af1ee11dSRobert Watson src.sin_addr = 976af1ee11dSRobert Watson *(struct in_addr *)CMSG_DATA(cm); 977c557ae16SIan Dowse break; 978af1ee11dSRobert Watson 979c557ae16SIan Dowse default: 980c557ae16SIan Dowse error = ENOPROTOOPT; 981c557ae16SIan Dowse break; 982c557ae16SIan Dowse } 983c557ae16SIan Dowse if (error) 984c557ae16SIan Dowse break; 985c557ae16SIan Dowse } 986c557ae16SIan Dowse m_freem(control); 987c557ae16SIan Dowse } 9885c32ea65SRobert Watson if (error) { 9895c32ea65SRobert Watson m_freem(m); 9903329b236SRobert Watson return (error); 9915c32ea65SRobert Watson } 9925c32ea65SRobert Watson 99343cc0bc1SRobert Watson /* 99443cc0bc1SRobert Watson * Depending on whether or not the application has bound or connected 995ca528788SRobert Watson * the socket, we may have to do varying levels of work. The optimal 996ca528788SRobert Watson * case is for a connected UDP socket, as a global lock isn't 997ca528788SRobert Watson * required at all. 99843cc0bc1SRobert Watson * 99943cc0bc1SRobert Watson * In order to decide which we need, we require stability of the 100043cc0bc1SRobert Watson * inpcb binding, which we ensure by acquiring a read lock on the 100143cc0bc1SRobert Watson * inpcb. This doesn't strictly follow the lock order, so we play 100243cc0bc1SRobert Watson * the trylock and retry game; note that we may end up with more 100343cc0bc1SRobert Watson * conservative locks than required the second time around, so later 100443cc0bc1SRobert Watson * assertions have to accept that. Further analysis of the number of 100543cc0bc1SRobert Watson * misses under contention is required. 100643cc0bc1SRobert Watson */ 100743cc0bc1SRobert Watson sin = (struct sockaddr_in *)addr; 100843cc0bc1SRobert Watson INP_RLOCK(inp); 100943cc0bc1SRobert Watson if (sin != NULL && 101043cc0bc1SRobert Watson (inp->inp_laddr.s_addr == INADDR_ANY && inp->inp_lport == 0)) { 101143cc0bc1SRobert Watson INP_RUNLOCK(inp); 1012603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 10138501a69cSRobert Watson INP_WLOCK(inp); 101443cc0bc1SRobert Watson unlock_udbinfo = 2; 101543cc0bc1SRobert Watson } else if ((sin != NULL && ( 101643cc0bc1SRobert Watson (sin->sin_addr.s_addr == INADDR_ANY) || 101743cc0bc1SRobert Watson (sin->sin_addr.s_addr == INADDR_BROADCAST) || 101843cc0bc1SRobert Watson (inp->inp_laddr.s_addr == INADDR_ANY) || 101943cc0bc1SRobert Watson (inp->inp_lport == 0))) || 102043cc0bc1SRobert Watson (src.sin_family == AF_INET)) { 1021603724d3SBjoern A. Zeeb if (!INP_INFO_TRY_RLOCK(&V_udbinfo)) { 102243cc0bc1SRobert Watson INP_RUNLOCK(inp); 1023603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 1024948d0fc9SRobert Watson INP_RLOCK(inp); 1025948d0fc9SRobert Watson } 102643cc0bc1SRobert Watson unlock_udbinfo = 1; 102743cc0bc1SRobert Watson } else 102843cc0bc1SRobert Watson unlock_udbinfo = 0; 10295c32ea65SRobert Watson 10301b7f0384SBruce M Simpson /* 10311b7f0384SBruce M Simpson * If the IP_SENDSRCADDR control message was specified, override the 10321b7f0384SBruce M Simpson * source address for this datagram. Its use is invalidated if the 10331b7f0384SBruce M Simpson * address thus specified is incomplete or clobbers other inpcbs. 10341b7f0384SBruce M Simpson */ 103590162a4eSIan Dowse laddr = inp->inp_laddr; 103690162a4eSIan Dowse lport = inp->inp_lport; 10371b7f0384SBruce M Simpson if (src.sin_family == AF_INET) { 1038603724d3SBjoern A. Zeeb INP_INFO_LOCK_ASSERT(&V_udbinfo); 10391b7f0384SBruce M Simpson if ((lport == 0) || 10401b7f0384SBruce M Simpson (laddr.s_addr == INADDR_ANY && 10411b7f0384SBruce M Simpson src.sin_addr.s_addr == INADDR_ANY)) { 1042c557ae16SIan Dowse error = EINVAL; 1043c557ae16SIan Dowse goto release; 1044c557ae16SIan Dowse } 1045c557ae16SIan Dowse error = in_pcbbind_setup(inp, (struct sockaddr *)&src, 1046b0330ed9SPawel Jakub Dawidek &laddr.s_addr, &lport, td->td_ucred); 1047c557ae16SIan Dowse if (error) 1048c557ae16SIan Dowse goto release; 1049c557ae16SIan Dowse } 1050c557ae16SIan Dowse 10513144b7d3SRobert Watson /* 10523144b7d3SRobert Watson * If a UDP socket has been connected, then a local address/port will 10533144b7d3SRobert Watson * have been selected and bound. 10543144b7d3SRobert Watson * 105543cc0bc1SRobert Watson * If a UDP socket has not been connected to, then an explicit 10563144b7d3SRobert Watson * destination address must be used, in which case a local 10573144b7d3SRobert Watson * address/port may not have been selected and bound. 10583144b7d3SRobert Watson */ 105943cc0bc1SRobert Watson if (sin != NULL) { 1060c4d585aeSRobert Watson INP_LOCK_ASSERT(inp); 1061df8bae1dSRodney W. Grimes if (inp->inp_faddr.s_addr != INADDR_ANY) { 1062df8bae1dSRodney W. Grimes error = EISCONN; 1063df8bae1dSRodney W. Grimes goto release; 1064df8bae1dSRodney W. Grimes } 10653144b7d3SRobert Watson 10663144b7d3SRobert Watson /* 10673144b7d3SRobert Watson * Jail may rewrite the destination address, so let it do 10683144b7d3SRobert Watson * that before we use it. 10693144b7d3SRobert Watson */ 1070b89e82ddSJamie Gritton error = prison_remote_ip4(td->td_ucred, &sin->sin_addr); 1071b89e82ddSJamie Gritton if (error) 1072413628a7SBjoern A. Zeeb goto release; 10733144b7d3SRobert Watson 10743144b7d3SRobert Watson /* 107543cc0bc1SRobert Watson * If a local address or port hasn't yet been selected, or if 107643cc0bc1SRobert Watson * the destination address needs to be rewritten due to using 107743cc0bc1SRobert Watson * a special INADDR_ constant, invoke in_pcbconnect_setup() 107843cc0bc1SRobert Watson * to do the heavy lifting. Once a port is selected, we 107943cc0bc1SRobert Watson * commit the binding back to the socket; we also commit the 108043cc0bc1SRobert Watson * binding of the address if in jail. 108143cc0bc1SRobert Watson * 108243cc0bc1SRobert Watson * If we already have a valid binding and we're not 108343cc0bc1SRobert Watson * requesting a destination address rewrite, use a fast path. 10843144b7d3SRobert Watson */ 108543cc0bc1SRobert Watson if (inp->inp_laddr.s_addr == INADDR_ANY || 108643cc0bc1SRobert Watson inp->inp_lport == 0 || 108743cc0bc1SRobert Watson sin->sin_addr.s_addr == INADDR_ANY || 108843cc0bc1SRobert Watson sin->sin_addr.s_addr == INADDR_BROADCAST) { 1089603724d3SBjoern A. Zeeb INP_INFO_LOCK_ASSERT(&V_udbinfo); 109043cc0bc1SRobert Watson error = in_pcbconnect_setup(inp, addr, &laddr.s_addr, 109143cc0bc1SRobert Watson &lport, &faddr.s_addr, &fport, NULL, 109243cc0bc1SRobert Watson td->td_ucred); 109390162a4eSIan Dowse if (error) 109490162a4eSIan Dowse goto release; 109590162a4eSIan Dowse 109643cc0bc1SRobert Watson /* 109743cc0bc1SRobert Watson * XXXRW: Why not commit the port if the address is 109843cc0bc1SRobert Watson * !INADDR_ANY? 109943cc0bc1SRobert Watson */ 110090162a4eSIan Dowse /* Commit the local port if newly assigned. */ 110190162a4eSIan Dowse if (inp->inp_laddr.s_addr == INADDR_ANY && 110290162a4eSIan Dowse inp->inp_lport == 0) { 1103603724d3SBjoern A. Zeeb INP_INFO_WLOCK_ASSERT(&V_udbinfo); 1104c4d585aeSRobert Watson INP_WLOCK_ASSERT(inp); 11053a1757b9SGleb Smirnoff /* 110643cc0bc1SRobert Watson * Remember addr if jailed, to prevent 110743cc0bc1SRobert Watson * rebinding. 11083a1757b9SGleb Smirnoff */ 11090304c731SJamie Gritton if (prison_flag(td->td_ucred, PR_IP4)) 11103a1757b9SGleb Smirnoff inp->inp_laddr = laddr; 111190162a4eSIan Dowse inp->inp_lport = lport; 111290162a4eSIan Dowse if (in_pcbinshash(inp) != 0) { 111390162a4eSIan Dowse inp->inp_lport = 0; 111490162a4eSIan Dowse error = EAGAIN; 1115df8bae1dSRodney W. Grimes goto release; 1116df8bae1dSRodney W. Grimes } 111790162a4eSIan Dowse inp->inp_flags |= INP_ANONPORT; 111890162a4eSIan Dowse } 1119df8bae1dSRodney W. Grimes } else { 112043cc0bc1SRobert Watson faddr = sin->sin_addr; 112143cc0bc1SRobert Watson fport = sin->sin_port; 112243cc0bc1SRobert Watson } 112343cc0bc1SRobert Watson } else { 1124c4d585aeSRobert Watson INP_LOCK_ASSERT(inp); 112590162a4eSIan Dowse faddr = inp->inp_faddr; 112690162a4eSIan Dowse fport = inp->inp_fport; 112790162a4eSIan Dowse if (faddr.s_addr == INADDR_ANY) { 1128df8bae1dSRodney W. Grimes error = ENOTCONN; 1129df8bae1dSRodney W. Grimes goto release; 1130df8bae1dSRodney W. Grimes } 1131df8bae1dSRodney W. Grimes } 1132e6ccd709SRobert Watson 1133df8bae1dSRodney W. Grimes /* 1134e6ccd709SRobert Watson * Calculate data length and get a mbuf for UDP, IP, and possible 1135392e8407SRobert Watson * link-layer headers. Immediate slide the data pointer back forward 1136392e8407SRobert Watson * since we won't use that space at this layer. 1137df8bae1dSRodney W. Grimes */ 1138e6ccd709SRobert Watson M_PREPEND(m, sizeof(struct udpiphdr) + max_linkhdr, M_DONTWAIT); 1139e6ccd709SRobert Watson if (m == NULL) { 1140df8bae1dSRodney W. Grimes error = ENOBUFS; 114149b19bfcSBruce M Simpson goto release; 1142df8bae1dSRodney W. Grimes } 1143e6ccd709SRobert Watson m->m_data += max_linkhdr; 1144e6ccd709SRobert Watson m->m_len -= max_linkhdr; 1145392e8407SRobert Watson m->m_pkthdr.len -= max_linkhdr; 1146df8bae1dSRodney W. Grimes 1147df8bae1dSRodney W. Grimes /* 11483329b236SRobert Watson * Fill in mbuf with extended UDP header and addresses and length put 11493329b236SRobert Watson * into network format. 1150df8bae1dSRodney W. Grimes */ 1151df8bae1dSRodney W. Grimes ui = mtod(m, struct udpiphdr *); 1152db4f9cc7SJonathan Lemon bzero(ui->ui_x1, sizeof(ui->ui_x1)); /* XXX still needed? */ 1153df8bae1dSRodney W. Grimes ui->ui_pr = IPPROTO_UDP; 115490162a4eSIan Dowse ui->ui_src = laddr; 115590162a4eSIan Dowse ui->ui_dst = faddr; 115690162a4eSIan Dowse ui->ui_sport = lport; 115790162a4eSIan Dowse ui->ui_dport = fport; 1158db4f9cc7SJonathan Lemon ui->ui_ulen = htons((u_short)len + sizeof(struct udphdr)); 1159df8bae1dSRodney W. Grimes 1160b2828ad2SAndre Oppermann /* 1161b2828ad2SAndre Oppermann * Set the Don't Fragment bit in the IP header. 1162b2828ad2SAndre Oppermann */ 1163b2828ad2SAndre Oppermann if (inp->inp_flags & INP_DONTFRAG) { 1164b2828ad2SAndre Oppermann struct ip *ip; 11653329b236SRobert Watson 1166b2828ad2SAndre Oppermann ip = (struct ip *)&ui->ui_i; 1167b2828ad2SAndre Oppermann ip->ip_off |= IP_DF; 1168b2828ad2SAndre Oppermann } 1169b2828ad2SAndre Oppermann 1170b5d47ff5SJohn-Mark Gurney ipflags = 0; 1171b5d47ff5SJohn-Mark Gurney if (inp->inp_socket->so_options & SO_DONTROUTE) 1172b5d47ff5SJohn-Mark Gurney ipflags |= IP_ROUTETOIF; 1173b5d47ff5SJohn-Mark Gurney if (inp->inp_socket->so_options & SO_BROADCAST) 1174b5d47ff5SJohn-Mark Gurney ipflags |= IP_ALLOWBROADCAST; 11756fbfd582SAndre Oppermann if (inp->inp_flags & INP_ONESBCAST) 11768afa2304SBruce M Simpson ipflags |= IP_SENDONES; 11778afa2304SBruce M Simpson 11781175d9d5SRobert Watson #ifdef MAC 11791175d9d5SRobert Watson mac_inpcb_create_mbuf(inp, m); 11801175d9d5SRobert Watson #endif 11811175d9d5SRobert Watson 1182df8bae1dSRodney W. Grimes /* 1183db4f9cc7SJonathan Lemon * Set up checksum and output datagram. 1184df8bae1dSRodney W. Grimes */ 1185f5514f08SRobert Watson if (udp_cksum) { 11866fbfd582SAndre Oppermann if (inp->inp_flags & INP_ONESBCAST) 11878a538743SBruce M Simpson faddr.s_addr = INADDR_BROADCAST; 11888a538743SBruce M Simpson ui->ui_sum = in_pseudo(ui->ui_src.s_addr, faddr.s_addr, 1189db4f9cc7SJonathan Lemon htons((u_short)len + sizeof(struct udphdr) + IPPROTO_UDP)); 1190db4f9cc7SJonathan Lemon m->m_pkthdr.csum_flags = CSUM_UDP; 1191db4f9cc7SJonathan Lemon m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum); 11923329b236SRobert Watson } else 1193db4f9cc7SJonathan Lemon ui->ui_sum = 0; 1194df8bae1dSRodney W. Grimes ((struct ip *)ui)->ip_len = sizeof (struct udpiphdr) + len; 1195ca98b82cSDavid Greenman ((struct ip *)ui)->ip_ttl = inp->inp_ip_ttl; /* XXX */ 1196ca98b82cSDavid Greenman ((struct ip *)ui)->ip_tos = inp->inp_ip_tos; /* XXX */ 1197026decb8SRobert Watson UDPSTAT_INC(udps_opackets); 1198cfa1ca9dSYoshinobu Inoue 119943cc0bc1SRobert Watson if (unlock_udbinfo == 2) 1200603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 120143cc0bc1SRobert Watson else if (unlock_udbinfo == 1) 1202603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 120397d8d152SAndre Oppermann error = ip_output(m, inp->inp_options, NULL, ipflags, 12045d846453SSam Leffler inp->inp_moptions, inp); 120543cc0bc1SRobert Watson if (unlock_udbinfo == 2) 12068501a69cSRobert Watson INP_WUNLOCK(inp); 1207948d0fc9SRobert Watson else 1208948d0fc9SRobert Watson INP_RUNLOCK(inp); 1209df8bae1dSRodney W. Grimes return (error); 1210df8bae1dSRodney W. Grimes 1211df8bae1dSRodney W. Grimes release: 121243cc0bc1SRobert Watson if (unlock_udbinfo == 2) { 1213948d0fc9SRobert Watson INP_WUNLOCK(inp); 1214603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 121543cc0bc1SRobert Watson } else if (unlock_udbinfo == 1) { 121643cc0bc1SRobert Watson INP_RUNLOCK(inp); 1217603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 1218948d0fc9SRobert Watson } else 1219948d0fc9SRobert Watson INP_RUNLOCK(inp); 1220df8bae1dSRodney W. Grimes m_freem(m); 1221df8bae1dSRodney W. Grimes return (error); 1222df8bae1dSRodney W. Grimes } 1223df8bae1dSRodney W. Grimes 12247b495c44SVANHULLEBUS Yvan 12257b495c44SVANHULLEBUS Yvan #if defined(IPSEC) && defined(IPSEC_NAT_T) 12267b495c44SVANHULLEBUS Yvan #ifdef INET 12277b495c44SVANHULLEBUS Yvan /* 12287b495c44SVANHULLEBUS Yvan * Potentially decap ESP in UDP frame. Check for an ESP header 12297b495c44SVANHULLEBUS Yvan * and optional marker; if present, strip the UDP header and 12307b495c44SVANHULLEBUS Yvan * push the result through IPSec. 12317b495c44SVANHULLEBUS Yvan * 12327b495c44SVANHULLEBUS Yvan * Returns mbuf to be processed (potentially re-allocated) or 12337b495c44SVANHULLEBUS Yvan * NULL if consumed and/or processed. 12347b495c44SVANHULLEBUS Yvan */ 12357b495c44SVANHULLEBUS Yvan static struct mbuf * 12367b495c44SVANHULLEBUS Yvan udp4_espdecap(struct inpcb *inp, struct mbuf *m, int off) 12377b495c44SVANHULLEBUS Yvan { 12387b495c44SVANHULLEBUS Yvan size_t minlen, payload, skip, iphlen; 12397b495c44SVANHULLEBUS Yvan caddr_t data; 12407b495c44SVANHULLEBUS Yvan struct udpcb *up; 12417b495c44SVANHULLEBUS Yvan struct m_tag *tag; 12427b495c44SVANHULLEBUS Yvan struct udphdr *udphdr; 12437b495c44SVANHULLEBUS Yvan struct ip *ip; 12447b495c44SVANHULLEBUS Yvan 12457b495c44SVANHULLEBUS Yvan INP_RLOCK_ASSERT(inp); 12467b495c44SVANHULLEBUS Yvan 12477b495c44SVANHULLEBUS Yvan /* 12487b495c44SVANHULLEBUS Yvan * Pull up data so the longest case is contiguous: 12497b495c44SVANHULLEBUS Yvan * IP/UDP hdr + non ESP marker + ESP hdr. 12507b495c44SVANHULLEBUS Yvan */ 12517b495c44SVANHULLEBUS Yvan minlen = off + sizeof(uint64_t) + sizeof(struct esp); 12527b495c44SVANHULLEBUS Yvan if (minlen > m->m_pkthdr.len) 12537b495c44SVANHULLEBUS Yvan minlen = m->m_pkthdr.len; 12547b495c44SVANHULLEBUS Yvan if ((m = m_pullup(m, minlen)) == NULL) { 12557b495c44SVANHULLEBUS Yvan V_ipsec4stat.in_inval++; 12567b495c44SVANHULLEBUS Yvan return (NULL); /* Bypass caller processing. */ 12577b495c44SVANHULLEBUS Yvan } 12587b495c44SVANHULLEBUS Yvan data = mtod(m, caddr_t); /* Points to ip header. */ 12597b495c44SVANHULLEBUS Yvan payload = m->m_len - off; /* Size of payload. */ 12607b495c44SVANHULLEBUS Yvan 12617b495c44SVANHULLEBUS Yvan if (payload == 1 && data[off] == '\xff') 12627b495c44SVANHULLEBUS Yvan return (m); /* NB: keepalive packet, no decap. */ 12637b495c44SVANHULLEBUS Yvan 12647b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 12657b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: udpcb NULL", __func__)); 12667b495c44SVANHULLEBUS Yvan KASSERT((up->u_flags & UF_ESPINUDP_ALL) != 0, 12677b495c44SVANHULLEBUS Yvan ("u_flags 0x%x", up->u_flags)); 12687b495c44SVANHULLEBUS Yvan 12697b495c44SVANHULLEBUS Yvan /* 12707b495c44SVANHULLEBUS Yvan * Check that the payload is large enough to hold an 12717b495c44SVANHULLEBUS Yvan * ESP header and compute the amount of data to remove. 12727b495c44SVANHULLEBUS Yvan * 12737b495c44SVANHULLEBUS Yvan * NB: the caller has already done a pullup for us. 12747b495c44SVANHULLEBUS Yvan * XXX can we assume alignment and eliminate bcopys? 12757b495c44SVANHULLEBUS Yvan */ 12767b495c44SVANHULLEBUS Yvan if (up->u_flags & UF_ESPINUDP_NON_IKE) { 12777b495c44SVANHULLEBUS Yvan /* 12787b495c44SVANHULLEBUS Yvan * draft-ietf-ipsec-nat-t-ike-0[01].txt and 12797b495c44SVANHULLEBUS Yvan * draft-ietf-ipsec-udp-encaps-(00/)01.txt, ignoring 12807b495c44SVANHULLEBUS Yvan * possible AH mode non-IKE marker+non-ESP marker 12817b495c44SVANHULLEBUS Yvan * from draft-ietf-ipsec-udp-encaps-00.txt. 12827b495c44SVANHULLEBUS Yvan */ 12837b495c44SVANHULLEBUS Yvan uint64_t marker; 12847b495c44SVANHULLEBUS Yvan 12857b495c44SVANHULLEBUS Yvan if (payload <= sizeof(uint64_t) + sizeof(struct esp)) 12867b495c44SVANHULLEBUS Yvan return (m); /* NB: no decap. */ 12877b495c44SVANHULLEBUS Yvan bcopy(data + off, &marker, sizeof(uint64_t)); 12887b495c44SVANHULLEBUS Yvan if (marker != 0) /* Non-IKE marker. */ 12897b495c44SVANHULLEBUS Yvan return (m); /* NB: no decap. */ 12907b495c44SVANHULLEBUS Yvan skip = sizeof(uint64_t) + sizeof(struct udphdr); 12917b495c44SVANHULLEBUS Yvan } else { 12927b495c44SVANHULLEBUS Yvan uint32_t spi; 12937b495c44SVANHULLEBUS Yvan 12947b495c44SVANHULLEBUS Yvan if (payload <= sizeof(struct esp)) { 12957b495c44SVANHULLEBUS Yvan V_ipsec4stat.in_inval++; 12967b495c44SVANHULLEBUS Yvan m_freem(m); 12977b495c44SVANHULLEBUS Yvan return (NULL); /* Discard. */ 12987b495c44SVANHULLEBUS Yvan } 12997b495c44SVANHULLEBUS Yvan bcopy(data + off, &spi, sizeof(uint32_t)); 13007b495c44SVANHULLEBUS Yvan if (spi == 0) /* Non-ESP marker. */ 13017b495c44SVANHULLEBUS Yvan return (m); /* NB: no decap. */ 13027b495c44SVANHULLEBUS Yvan skip = sizeof(struct udphdr); 13037b495c44SVANHULLEBUS Yvan } 13047b495c44SVANHULLEBUS Yvan 13057b495c44SVANHULLEBUS Yvan /* 13067b495c44SVANHULLEBUS Yvan * Setup a PACKET_TAG_IPSEC_NAT_T_PORT tag to remember 13077b495c44SVANHULLEBUS Yvan * the UDP ports. This is required if we want to select 13087b495c44SVANHULLEBUS Yvan * the right SPD for multiple hosts behind same NAT. 13097b495c44SVANHULLEBUS Yvan * 13107b495c44SVANHULLEBUS Yvan * NB: ports are maintained in network byte order everywhere 13117b495c44SVANHULLEBUS Yvan * in the NAT-T code. 13127b495c44SVANHULLEBUS Yvan */ 13137b495c44SVANHULLEBUS Yvan tag = m_tag_get(PACKET_TAG_IPSEC_NAT_T_PORTS, 13147b495c44SVANHULLEBUS Yvan 2 * sizeof(uint16_t), M_NOWAIT); 13157b495c44SVANHULLEBUS Yvan if (tag == NULL) { 13167b495c44SVANHULLEBUS Yvan V_ipsec4stat.in_nomem++; 13177b495c44SVANHULLEBUS Yvan m_freem(m); 13187b495c44SVANHULLEBUS Yvan return (NULL); /* Discard. */ 13197b495c44SVANHULLEBUS Yvan } 13207b495c44SVANHULLEBUS Yvan iphlen = off - sizeof(struct udphdr); 13217b495c44SVANHULLEBUS Yvan udphdr = (struct udphdr *)(data + iphlen); 13227b495c44SVANHULLEBUS Yvan ((uint16_t *)(tag + 1))[0] = udphdr->uh_sport; 13237b495c44SVANHULLEBUS Yvan ((uint16_t *)(tag + 1))[1] = udphdr->uh_dport; 13247b495c44SVANHULLEBUS Yvan m_tag_prepend(m, tag); 13257b495c44SVANHULLEBUS Yvan 13267b495c44SVANHULLEBUS Yvan /* 13277b495c44SVANHULLEBUS Yvan * Remove the UDP header (and possibly the non ESP marker) 13287b495c44SVANHULLEBUS Yvan * IP header length is iphlen 13297b495c44SVANHULLEBUS Yvan * Before: 13307b495c44SVANHULLEBUS Yvan * <--- off ---> 13317b495c44SVANHULLEBUS Yvan * +----+------+-----+ 13327b495c44SVANHULLEBUS Yvan * | IP | UDP | ESP | 13337b495c44SVANHULLEBUS Yvan * +----+------+-----+ 13347b495c44SVANHULLEBUS Yvan * <-skip-> 13357b495c44SVANHULLEBUS Yvan * After: 13367b495c44SVANHULLEBUS Yvan * +----+-----+ 13377b495c44SVANHULLEBUS Yvan * | IP | ESP | 13387b495c44SVANHULLEBUS Yvan * +----+-----+ 13397b495c44SVANHULLEBUS Yvan * <-skip-> 13407b495c44SVANHULLEBUS Yvan */ 13417b495c44SVANHULLEBUS Yvan ovbcopy(data, data + skip, iphlen); 13427b495c44SVANHULLEBUS Yvan m_adj(m, skip); 13437b495c44SVANHULLEBUS Yvan 13447b495c44SVANHULLEBUS Yvan ip = mtod(m, struct ip *); 13457b495c44SVANHULLEBUS Yvan ip->ip_len -= skip; 13467b495c44SVANHULLEBUS Yvan ip->ip_p = IPPROTO_ESP; 13477b495c44SVANHULLEBUS Yvan 13487b495c44SVANHULLEBUS Yvan /* 13497b495c44SVANHULLEBUS Yvan * We cannot yet update the cksums so clear any 13507b495c44SVANHULLEBUS Yvan * h/w cksum flags as they are no longer valid. 13517b495c44SVANHULLEBUS Yvan */ 13527b495c44SVANHULLEBUS Yvan if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) 13537b495c44SVANHULLEBUS Yvan m->m_pkthdr.csum_flags &= ~(CSUM_DATA_VALID|CSUM_PSEUDO_HDR); 13547b495c44SVANHULLEBUS Yvan 13557b495c44SVANHULLEBUS Yvan (void) ipsec4_common_input(m, iphlen, ip->ip_p); 13567b495c44SVANHULLEBUS Yvan return (NULL); /* NB: consumed, bypass processing. */ 13577b495c44SVANHULLEBUS Yvan } 13587b495c44SVANHULLEBUS Yvan #endif /* INET */ 13597b495c44SVANHULLEBUS Yvan #endif /* defined(IPSEC) && defined(IPSEC_NAT_T) */ 13607b495c44SVANHULLEBUS Yvan 1361ac45e92fSRobert Watson static void 1362d0390e05SGarrett Wollman udp_abort(struct socket *so) 1363df8bae1dSRodney W. Grimes { 1364d0390e05SGarrett Wollman struct inpcb *inp; 1365df8bae1dSRodney W. Grimes 1366d0390e05SGarrett Wollman inp = sotoinpcb(so); 136714ba8addSRobert Watson KASSERT(inp != NULL, ("udp_abort: inp == NULL")); 1368603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 13698501a69cSRobert Watson INP_WLOCK(inp); 1370a152f8a3SRobert Watson if (inp->inp_faddr.s_addr != INADDR_ANY) { 1371a152f8a3SRobert Watson in_pcbdisconnect(inp); 1372a152f8a3SRobert Watson inp->inp_laddr.s_addr = INADDR_ANY; 1373d0390e05SGarrett Wollman soisdisconnected(so); 1374a152f8a3SRobert Watson } 13758501a69cSRobert Watson INP_WUNLOCK(inp); 1376603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1377df8bae1dSRodney W. Grimes } 1378df8bae1dSRodney W. Grimes 1379d0390e05SGarrett Wollman static int 1380b40ce416SJulian Elischer udp_attach(struct socket *so, int proto, struct thread *td) 1381d0390e05SGarrett Wollman { 1382d0390e05SGarrett Wollman struct inpcb *inp; 1383277afaffSRobert Watson int error; 1384d0390e05SGarrett Wollman 1385d0390e05SGarrett Wollman inp = sotoinpcb(so); 138614ba8addSRobert Watson KASSERT(inp == NULL, ("udp_attach: inp != NULL")); 1387cfa1ca9dSYoshinobu Inoue error = soreserve(so, udp_sendspace, udp_recvspace); 1388f24618aaSRobert Watson if (error) 13893329b236SRobert Watson return (error); 1390603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 1391603724d3SBjoern A. Zeeb error = in_pcballoc(so, &V_udbinfo); 139253b57cd1SSam Leffler if (error) { 1393603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 13943329b236SRobert Watson return (error); 139553b57cd1SSam Leffler } 1396cfa1ca9dSYoshinobu Inoue 139768b5629bSRobert Watson inp = sotoinpcb(so); 1398cfa1ca9dSYoshinobu Inoue inp->inp_vflag |= INP_IPV4; 1399603724d3SBjoern A. Zeeb inp->inp_ip_ttl = V_ip_defttl; 14006a9148feSBjoern A. Zeeb 14016a9148feSBjoern A. Zeeb error = udp_newudpcb(inp); 14026a9148feSBjoern A. Zeeb if (error) { 14036a9148feSBjoern A. Zeeb in_pcbdetach(inp); 14046a9148feSBjoern A. Zeeb in_pcbfree(inp); 14056a9148feSBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 14066a9148feSBjoern A. Zeeb return (error); 14076a9148feSBjoern A. Zeeb } 14086a9148feSBjoern A. Zeeb 1409c7c7ea4bSRandall Stewart INP_WUNLOCK(inp); 14106a9148feSBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1411c7c7ea4bSRandall Stewart return (0); 1412c7c7ea4bSRandall Stewart } 1413c7c7ea4bSRandall Stewart 1414c7c7ea4bSRandall Stewart int 1415c7c7ea4bSRandall Stewart udp_set_kernel_tunneling(struct socket *so, udp_tun_func_t f) 1416c7c7ea4bSRandall Stewart { 1417c7c7ea4bSRandall Stewart struct inpcb *inp; 14186a9148feSBjoern A. Zeeb struct udpcb *up; 1419c7c7ea4bSRandall Stewart 142068b5629bSRobert Watson KASSERT(so->so_type == SOCK_DGRAM, 142168b5629bSRobert Watson ("udp_set_kernel_tunneling: !dgram")); 142268b5629bSRobert Watson inp = sotoinpcb(so); 142368b5629bSRobert Watson KASSERT(inp != NULL, ("udp_set_kernel_tunneling: inp == NULL")); 1424c7c7ea4bSRandall Stewart INP_WLOCK(inp); 14256a9148feSBjoern A. Zeeb up = intoudpcb(inp); 14266a9148feSBjoern A. Zeeb if (up->u_tun_func != NULL) { 1427bbb0e3d9SRandall Stewart INP_WUNLOCK(inp); 1428bbb0e3d9SRandall Stewart return (EBUSY); 1429bbb0e3d9SRandall Stewart } 14306a9148feSBjoern A. Zeeb up->u_tun_func = f; 14318501a69cSRobert Watson INP_WUNLOCK(inp); 14323329b236SRobert Watson return (0); 1433df8bae1dSRodney W. Grimes } 1434d0390e05SGarrett Wollman 1435d0390e05SGarrett Wollman static int 1436b40ce416SJulian Elischer udp_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 1437d0390e05SGarrett Wollman { 1438d0390e05SGarrett Wollman struct inpcb *inp; 1439277afaffSRobert Watson int error; 1440d0390e05SGarrett Wollman 1441d0390e05SGarrett Wollman inp = sotoinpcb(so); 144214ba8addSRobert Watson KASSERT(inp != NULL, ("udp_bind: inp == NULL")); 1443603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 14448501a69cSRobert Watson INP_WLOCK(inp); 1445b0330ed9SPawel Jakub Dawidek error = in_pcbbind(inp, nam, td->td_ucred); 14468501a69cSRobert Watson INP_WUNLOCK(inp); 1447603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 14483329b236SRobert Watson return (error); 1449d0390e05SGarrett Wollman } 1450d0390e05SGarrett Wollman 1451a152f8a3SRobert Watson static void 1452a152f8a3SRobert Watson udp_close(struct socket *so) 1453a152f8a3SRobert Watson { 1454a152f8a3SRobert Watson struct inpcb *inp; 1455a152f8a3SRobert Watson 1456a152f8a3SRobert Watson inp = sotoinpcb(so); 1457a152f8a3SRobert Watson KASSERT(inp != NULL, ("udp_close: inp == NULL")); 1458603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 14598501a69cSRobert Watson INP_WLOCK(inp); 1460a152f8a3SRobert Watson if (inp->inp_faddr.s_addr != INADDR_ANY) { 1461a152f8a3SRobert Watson in_pcbdisconnect(inp); 1462a152f8a3SRobert Watson inp->inp_laddr.s_addr = INADDR_ANY; 1463a152f8a3SRobert Watson soisdisconnected(so); 1464a152f8a3SRobert Watson } 14658501a69cSRobert Watson INP_WUNLOCK(inp); 1466603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1467a152f8a3SRobert Watson } 1468a152f8a3SRobert Watson 1469d0390e05SGarrett Wollman static int 1470b40ce416SJulian Elischer udp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 1471d0390e05SGarrett Wollman { 1472d0390e05SGarrett Wollman struct inpcb *inp; 1473277afaffSRobert Watson int error; 147475c13541SPoul-Henning Kamp struct sockaddr_in *sin; 1475d0390e05SGarrett Wollman 1476d0390e05SGarrett Wollman inp = sotoinpcb(so); 147714ba8addSRobert Watson KASSERT(inp != NULL, ("udp_connect: inp == NULL")); 1478603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 14798501a69cSRobert Watson INP_WLOCK(inp); 1480f76fcf6dSJeffrey Hsu if (inp->inp_faddr.s_addr != INADDR_ANY) { 14818501a69cSRobert Watson INP_WUNLOCK(inp); 1482603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 14833329b236SRobert Watson return (EISCONN); 1484f76fcf6dSJeffrey Hsu } 148575c13541SPoul-Henning Kamp sin = (struct sockaddr_in *)nam; 1486b89e82ddSJamie Gritton error = prison_remote_ip4(td->td_ucred, &sin->sin_addr); 1487b89e82ddSJamie Gritton if (error != 0) { 1488413628a7SBjoern A. Zeeb INP_WUNLOCK(inp); 1489385195c0SMarko Zec INP_INFO_WUNLOCK(&V_udbinfo); 1490b89e82ddSJamie Gritton return (error); 1491413628a7SBjoern A. Zeeb } 1492b0330ed9SPawel Jakub Dawidek error = in_pcbconnect(inp, nam, td->td_ucred); 14934cc20ab1SSeigo Tanimura if (error == 0) 1494df8bae1dSRodney W. Grimes soisconnected(so); 14958501a69cSRobert Watson INP_WUNLOCK(inp); 1496603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 14973329b236SRobert Watson return (error); 1498df8bae1dSRodney W. Grimes } 1499d0390e05SGarrett Wollman 1500bc725eafSRobert Watson static void 1501d0390e05SGarrett Wollman udp_detach(struct socket *so) 1502d0390e05SGarrett Wollman { 1503d0390e05SGarrett Wollman struct inpcb *inp; 15046a9148feSBjoern A. Zeeb struct udpcb *up; 1505d0390e05SGarrett Wollman 1506d0390e05SGarrett Wollman inp = sotoinpcb(so); 150714ba8addSRobert Watson KASSERT(inp != NULL, ("udp_detach: inp == NULL")); 1508a152f8a3SRobert Watson KASSERT(inp->inp_faddr.s_addr == INADDR_ANY, 1509a152f8a3SRobert Watson ("udp_detach: not disconnected")); 1510603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 15118501a69cSRobert Watson INP_WLOCK(inp); 15126a9148feSBjoern A. Zeeb up = intoudpcb(inp); 15136a9148feSBjoern A. Zeeb KASSERT(up != NULL, ("%s: up == NULL", __func__)); 15146a9148feSBjoern A. Zeeb inp->inp_ppcb = NULL; 1515d0390e05SGarrett Wollman in_pcbdetach(inp); 151614ba8addSRobert Watson in_pcbfree(inp); 1517603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 15186a9148feSBjoern A. Zeeb udp_discardcb(up); 1519d0390e05SGarrett Wollman } 1520d0390e05SGarrett Wollman 1521d0390e05SGarrett Wollman static int 1522d0390e05SGarrett Wollman udp_disconnect(struct socket *so) 1523d0390e05SGarrett Wollman { 1524d0390e05SGarrett Wollman struct inpcb *inp; 1525d0390e05SGarrett Wollman 1526d0390e05SGarrett Wollman inp = sotoinpcb(so); 152714ba8addSRobert Watson KASSERT(inp != NULL, ("udp_disconnect: inp == NULL")); 1528603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 15298501a69cSRobert Watson INP_WLOCK(inp); 1530f76fcf6dSJeffrey Hsu if (inp->inp_faddr.s_addr == INADDR_ANY) { 15318501a69cSRobert Watson INP_WUNLOCK(inp); 1532603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 15333329b236SRobert Watson return (ENOTCONN); 1534f76fcf6dSJeffrey Hsu } 1535d0390e05SGarrett Wollman 1536df8bae1dSRodney W. Grimes in_pcbdisconnect(inp); 1537df8bae1dSRodney W. Grimes inp->inp_laddr.s_addr = INADDR_ANY; 1538d45e4f99SMaxim Konovalov SOCK_LOCK(so); 1539d45e4f99SMaxim Konovalov so->so_state &= ~SS_ISCONNECTED; /* XXX */ 1540d45e4f99SMaxim Konovalov SOCK_UNLOCK(so); 15418501a69cSRobert Watson INP_WUNLOCK(inp); 1542603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 15433329b236SRobert Watson return (0); 1544df8bae1dSRodney W. Grimes } 1545df8bae1dSRodney W. Grimes 1546d0390e05SGarrett Wollman static int 154757bf258eSGarrett Wollman udp_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *addr, 1548b40ce416SJulian Elischer struct mbuf *control, struct thread *td) 1549d0390e05SGarrett Wollman { 1550d0390e05SGarrett Wollman struct inpcb *inp; 1551d0390e05SGarrett Wollman 1552d0390e05SGarrett Wollman inp = sotoinpcb(so); 155314ba8addSRobert Watson KASSERT(inp != NULL, ("udp_send: inp == NULL")); 15543329b236SRobert Watson return (udp_output(inp, m, addr, control, td)); 1555d0390e05SGarrett Wollman } 1556d0390e05SGarrett Wollman 155776429de4SYoshinobu Inoue int 1558d0390e05SGarrett Wollman udp_shutdown(struct socket *so) 1559d0390e05SGarrett Wollman { 1560d0390e05SGarrett Wollman struct inpcb *inp; 1561d0390e05SGarrett Wollman 1562d0390e05SGarrett Wollman inp = sotoinpcb(so); 156314ba8addSRobert Watson KASSERT(inp != NULL, ("udp_shutdown: inp == NULL")); 15648501a69cSRobert Watson INP_WLOCK(inp); 1565d0390e05SGarrett Wollman socantsendmore(so); 15668501a69cSRobert Watson INP_WUNLOCK(inp); 15673329b236SRobert Watson return (0); 1568d0390e05SGarrett Wollman } 1569d0390e05SGarrett Wollman 1570d0390e05SGarrett Wollman struct pr_usrreqs udp_usrreqs = { 1571756d52a1SPoul-Henning Kamp .pru_abort = udp_abort, 1572756d52a1SPoul-Henning Kamp .pru_attach = udp_attach, 1573756d52a1SPoul-Henning Kamp .pru_bind = udp_bind, 1574756d52a1SPoul-Henning Kamp .pru_connect = udp_connect, 1575756d52a1SPoul-Henning Kamp .pru_control = in_control, 1576756d52a1SPoul-Henning Kamp .pru_detach = udp_detach, 1577756d52a1SPoul-Henning Kamp .pru_disconnect = udp_disconnect, 157854d642bbSRobert Watson .pru_peeraddr = in_getpeeraddr, 1579756d52a1SPoul-Henning Kamp .pru_send = udp_send, 15805df3e839SRobert Watson .pru_soreceive = soreceive_dgram, 158159b8854eSRobert Watson .pru_sosend = sosend_dgram, 1582756d52a1SPoul-Henning Kamp .pru_shutdown = udp_shutdown, 158354d642bbSRobert Watson .pru_sockaddr = in_getsockaddr, 1584a152f8a3SRobert Watson .pru_sosetlabel = in_pcbsosetlabel, 1585a152f8a3SRobert Watson .pru_close = udp_close, 1586d0390e05SGarrett Wollman }; 1587