1c398230bSWarner Losh /*- 26dfab5b1SGarrett Wollman * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995 33329b236SRobert Watson * The Regents of the University of California. 43144b7d3SRobert Watson * Copyright (c) 2008 Robert N. M. Watson 5fa046d87SRobert Watson * Copyright (c) 2010-2011 Juniper Networks, Inc. 63329b236SRobert Watson * All rights reserved. 7df8bae1dSRodney W. Grimes * 8fa046d87SRobert Watson * Portions of this software were developed by Robert N. M. Watson under 9fa046d87SRobert Watson * contract to Juniper Networks, Inc. 10fa046d87SRobert Watson * 11df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 12df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 13df8bae1dSRodney W. Grimes * are met: 14df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 15df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 16df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 17df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 18df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 19df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 20df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 21df8bae1dSRodney W. Grimes * without specific prior written permission. 22df8bae1dSRodney W. Grimes * 23df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 24df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 25df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 26df8bae1dSRodney W. Grimes * ARE DISCLAIMED. 
IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 27df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 28df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 29df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 30df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 31df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 32df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 33df8bae1dSRodney W. Grimes * SUCH DAMAGE. 34df8bae1dSRodney W. Grimes * 356dfab5b1SGarrett Wollman * @(#)udp_usrreq.c 8.6 (Berkeley) 5/23/95 36df8bae1dSRodney W. Grimes */ 37df8bae1dSRodney W. Grimes 384b421e2dSMike Silbersack #include <sys/cdefs.h> 394b421e2dSMike Silbersack __FBSDID("$FreeBSD$"); 404b421e2dSMike Silbersack 410b4ae859SGleb Smirnoff #include "opt_ipfw.h" 4279288c11SBjoern A. Zeeb #include "opt_inet.h" 43cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h" 44f5514f08SRobert Watson #include "opt_ipsec.h" 4557f60867SMark Johnston #include "opt_kdtrace.h" 46cfa1ca9dSYoshinobu Inoue 47df8bae1dSRodney W. Grimes #include <sys/param.h> 48960ed29cSSeigo Tanimura #include <sys/domain.h> 494f590175SPaul Saab #include <sys/eventhandler.h> 50960ed29cSSeigo Tanimura #include <sys/jail.h> 51b110a8a2SGarrett Wollman #include <sys/kernel.h> 52960ed29cSSeigo Tanimura #include <sys/lock.h> 53df8bae1dSRodney W. Grimes #include <sys/malloc.h> 54df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 55acd3428bSRobert Watson #include <sys/priv.h> 56490d50b6SBrian Feldman #include <sys/proc.h> 57df8bae1dSRodney W. Grimes #include <sys/protosw.h> 5857f60867SMark Johnston #include <sys/sdt.h> 59960ed29cSSeigo Tanimura #include <sys/signalvar.h> 60df8bae1dSRodney W. Grimes #include <sys/socket.h> 61df8bae1dSRodney W. 
Grimes #include <sys/socketvar.h> 62960ed29cSSeigo Tanimura #include <sys/sx.h> 63b5e8ce9fSBruce Evans #include <sys/sysctl.h> 64816a3d83SPoul-Henning Kamp #include <sys/syslog.h> 65f5514f08SRobert Watson #include <sys/systm.h> 668781d8e9SBruce Evans 6769c2d429SJeff Roberson #include <vm/uma.h> 68df8bae1dSRodney W. Grimes 69df8bae1dSRodney W. Grimes #include <net/if.h> 70*76039bc8SGleb Smirnoff #include <net/if_var.h> 71df8bae1dSRodney W. Grimes #include <net/route.h> 72df8bae1dSRodney W. Grimes 73df8bae1dSRodney W. Grimes #include <netinet/in.h> 7457f60867SMark Johnston #include <netinet/in_kdtrace.h> 75960ed29cSSeigo Tanimura #include <netinet/in_pcb.h> 76f5514f08SRobert Watson #include <netinet/in_systm.h> 77960ed29cSSeigo Tanimura #include <netinet/in_var.h> 78df8bae1dSRodney W. Grimes #include <netinet/ip.h> 79cfa1ca9dSYoshinobu Inoue #ifdef INET6 80cfa1ca9dSYoshinobu Inoue #include <netinet/ip6.h> 81cfa1ca9dSYoshinobu Inoue #endif 82960ed29cSSeigo Tanimura #include <netinet/ip_icmp.h> 83960ed29cSSeigo Tanimura #include <netinet/icmp_var.h> 84df8bae1dSRodney W. Grimes #include <netinet/ip_var.h> 85ef39adf0SAndre Oppermann #include <netinet/ip_options.h> 86cfa1ca9dSYoshinobu Inoue #ifdef INET6 87cfa1ca9dSYoshinobu Inoue #include <netinet6/ip6_var.h> 88cfa1ca9dSYoshinobu Inoue #endif 89df8bae1dSRodney W. Grimes #include <netinet/udp.h> 90df8bae1dSRodney W. Grimes #include <netinet/udp_var.h> 91df8bae1dSRodney W. Grimes 92b2630c29SGeorge V. Neville-Neil #ifdef IPSEC 93b9234fafSSam Leffler #include <netipsec/ipsec.h> 947b495c44SVANHULLEBUS Yvan #include <netipsec/esp.h> 953329b236SRobert Watson #endif 96b9234fafSSam Leffler 97db4f9cc7SJonathan Lemon #include <machine/in_cksum.h> 98db4f9cc7SJonathan Lemon 99aed55708SRobert Watson #include <security/mac/mac_framework.h> 100aed55708SRobert Watson 101df8bae1dSRodney W. Grimes /* 102df8bae1dSRodney W. Grimes * UDP protocol implementation. 103df8bae1dSRodney W. Grimes * Per RFC 768, August, 1980. 104df8bae1dSRodney W. 
Grimes */ 10574eb3236SWarner Losh 10674eb3236SWarner Losh /* 1073329b236SRobert Watson * BSD 4.2 defaulted the udp checksum to be off. Turning off udp checksums 1083329b236SRobert Watson * removes the only data integrity mechanism for packets and malformed 109f5514f08SRobert Watson * packets that would otherwise be discarded due to bad checksums, and may 110f5514f08SRobert Watson * cause problems (especially for NFS data blocks). 11174eb3236SWarner Losh */ 11240b676beSBjoern A. Zeeb VNET_DEFINE(int, udp_cksum) = 1; 11340b676beSBjoern A. Zeeb SYSCTL_VNET_INT(_net_inet_udp, UDPCTL_CHECKSUM, checksum, CTLFLAG_RW, 11440b676beSBjoern A. Zeeb &VNET_NAME(udp_cksum), 0, "compute udp checksum"); 115df8bae1dSRodney W. Grimes 116afdb4274SRobert Watson int udp_log_in_vain = 0; 117816a3d83SPoul-Henning Kamp SYSCTL_INT(_net_inet_udp, OID_AUTO, log_in_vain, CTLFLAG_RW, 118afdb4274SRobert Watson &udp_log_in_vain, 0, "Log all incoming UDP packets"); 119816a3d83SPoul-Henning Kamp 12082cea7e6SBjoern A. Zeeb VNET_DEFINE(int, udp_blackhole) = 0; 121eddfbb76SRobert Watson SYSCTL_VNET_INT(_net_inet_udp, OID_AUTO, blackhole, CTLFLAG_RW, 122eddfbb76SRobert Watson &VNET_NAME(udp_blackhole), 0, 1233329b236SRobert Watson "Do not send port unreachables for refused connects"); 12416f7f31fSGeoff Rehmet 12543bbb6aaSRobert Watson u_long udp_sendspace = 9216; /* really max datagram size */ 12643bbb6aaSRobert Watson /* 40 1K datagrams */ 12743bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_MAXDGRAM, maxdgram, CTLFLAG_RW, 12843bbb6aaSRobert Watson &udp_sendspace, 0, "Maximum outgoing UDP datagram size"); 12943bbb6aaSRobert Watson 13043bbb6aaSRobert Watson u_long udp_recvspace = 40 * (1024 + 13143bbb6aaSRobert Watson #ifdef INET6 13243bbb6aaSRobert Watson sizeof(struct sockaddr_in6) 13343bbb6aaSRobert Watson #else 13443bbb6aaSRobert Watson sizeof(struct sockaddr_in) 13543bbb6aaSRobert Watson #endif 13643bbb6aaSRobert Watson ); 13743bbb6aaSRobert Watson 13843bbb6aaSRobert Watson 
SYSCTL_ULONG(_net_inet_udp, UDPCTL_RECVSPACE, recvspace, CTLFLAG_RW, 13943bbb6aaSRobert Watson &udp_recvspace, 0, "Maximum space for incoming UDP datagrams"); 14043bbb6aaSRobert Watson 141eddfbb76SRobert Watson VNET_DEFINE(struct inpcbhead, udb); /* from udp_var.h */ 142eddfbb76SRobert Watson VNET_DEFINE(struct inpcbinfo, udbinfo); 1433e288e62SDimitry Andric static VNET_DEFINE(uma_zone_t, udpcb_zone); 1441e77c105SRobert Watson #define V_udpcb_zone VNET(udpcb_zone) 14515bd2b43SDavid Greenman 14615bd2b43SDavid Greenman #ifndef UDBHASHSIZE 147e2ed8f35SAlexander Motin #define UDBHASHSIZE 128 14815bd2b43SDavid Greenman #endif 14915bd2b43SDavid Greenman 1505b7cb97cSAndrey V. Elsukov VNET_PCPUSTAT_DEFINE(struct udpstat, udpstat); /* from udp_var.h */ 1515b7cb97cSAndrey V. Elsukov VNET_PCPUSTAT_SYSINIT(udpstat); 1525b7cb97cSAndrey V. Elsukov SYSCTL_VNET_PCPUSTAT(_net_inet_udp, UDPCTL_STATS, stats, struct udpstat, 1535b7cb97cSAndrey V. Elsukov udpstat, "UDP statistics (struct udpstat, netinet/udp_var.h)"); 154f2ea20e6SGarrett Wollman 1555b7cb97cSAndrey V. Elsukov #ifdef VIMAGE 1565b7cb97cSAndrey V. Elsukov VNET_PCPUSTAT_SYSUNINIT(udpstat); 1575b7cb97cSAndrey V. Elsukov #endif /* VIMAGE */ 15879288c11SBjoern A. Zeeb #ifdef INET 159bc725eafSRobert Watson static void udp_detach(struct socket *so); 1604d77a549SAlfred Perlstein static int udp_output(struct inpcb *, struct mbuf *, struct sockaddr *, 1614d77a549SAlfred Perlstein struct mbuf *, struct thread *); 16279288c11SBjoern A. Zeeb #endif 16379288c11SBjoern A. 
Zeeb 1647b495c44SVANHULLEBUS Yvan #ifdef IPSEC 1657b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 1667b495c44SVANHULLEBUS Yvan #define UF_ESPINUDP_ALL (UF_ESPINUDP_NON_IKE|UF_ESPINUDP) 1677b495c44SVANHULLEBUS Yvan #ifdef INET 1687b495c44SVANHULLEBUS Yvan static struct mbuf *udp4_espdecap(struct inpcb *, struct mbuf *, int); 1697b495c44SVANHULLEBUS Yvan #endif 1707b495c44SVANHULLEBUS Yvan #endif /* IPSEC_NAT_T */ 1717b495c44SVANHULLEBUS Yvan #endif /* IPSEC */ 172df8bae1dSRodney W. Grimes 1734f590175SPaul Saab static void 1744f590175SPaul Saab udp_zone_change(void *tag) 1754f590175SPaul Saab { 1764f590175SPaul Saab 177603724d3SBjoern A. Zeeb uma_zone_set_max(V_udbinfo.ipi_zone, maxsockets); 1786a9148feSBjoern A. Zeeb uma_zone_set_max(V_udpcb_zone, maxsockets); 1794f590175SPaul Saab } 1804f590175SPaul Saab 181d915b280SStephan Uphoff static int 182d915b280SStephan Uphoff udp_inpcb_init(void *mem, int size, int flags) 183d915b280SStephan Uphoff { 184af1ee11dSRobert Watson struct inpcb *inp; 18508651e1fSJohn Baldwin 186af1ee11dSRobert Watson inp = mem; 187d915b280SStephan Uphoff INP_LOCK_INIT(inp, "inp", "udpinp"); 188d915b280SStephan Uphoff return (0); 189d915b280SStephan Uphoff } 190d915b280SStephan Uphoff 191df8bae1dSRodney W. Grimes void 192af1ee11dSRobert Watson udp_init(void) 193df8bae1dSRodney W. Grimes { 194af1ee11dSRobert Watson 1959bcd427bSRobert Watson in_pcbinfo_init(&V_udbinfo, "udp", &V_udb, UDBHASHSIZE, UDBHASHSIZE, 19652cd27cbSRobert Watson "udp_inpcb", udp_inpcb_init, NULL, UMA_ZONE_NOFREE, 19752cd27cbSRobert Watson IPI_HASHFIELDS_2TUPLE); 1986a9148feSBjoern A. Zeeb V_udpcb_zone = uma_zcreate("udpcb", sizeof(struct udpcb), 1996a9148feSBjoern A. Zeeb NULL, NULL, NULL, NULL, UMA_ALIGN_PTR, UMA_ZONE_NOFREE); 2006a9148feSBjoern A. 
Zeeb uma_zone_set_max(V_udpcb_zone, maxsockets); 2016acd596eSPawel Jakub Dawidek uma_zone_set_warning(V_udpcb_zone, "kern.ipc.maxsockets limit reached"); 2024f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, udp_zone_change, NULL, 2034f590175SPaul Saab EVENTHANDLER_PRI_ANY); 204df8bae1dSRodney W. Grimes } 205df8bae1dSRodney W. Grimes 206315e3e38SRobert Watson /* 207315e3e38SRobert Watson * Kernel module interface for updating udpstat. The argument is an index 208315e3e38SRobert Watson * into udpstat treated as an array of u_long. While this encodes the 209315e3e38SRobert Watson * general layout of udpstat into the caller, it doesn't encode its location, 210315e3e38SRobert Watson * so that future changes to add, for example, per-CPU stats support won't 211315e3e38SRobert Watson * cause binary compatibility problems for kernel modules. 212315e3e38SRobert Watson */ 213315e3e38SRobert Watson void 214315e3e38SRobert Watson kmod_udpstat_inc(int statnum) 215315e3e38SRobert Watson { 216315e3e38SRobert Watson 2175b7cb97cSAndrey V. Elsukov counter_u64_add(VNET(udpstat)[statnum], 1); 218315e3e38SRobert Watson } 219315e3e38SRobert Watson 2206a9148feSBjoern A. Zeeb int 2216a9148feSBjoern A. Zeeb udp_newudpcb(struct inpcb *inp) 2226a9148feSBjoern A. Zeeb { 2236a9148feSBjoern A. Zeeb struct udpcb *up; 2246a9148feSBjoern A. Zeeb 2256a9148feSBjoern A. Zeeb up = uma_zalloc(V_udpcb_zone, M_NOWAIT | M_ZERO); 2266a9148feSBjoern A. Zeeb if (up == NULL) 2276a9148feSBjoern A. Zeeb return (ENOBUFS); 2286a9148feSBjoern A. Zeeb inp->inp_ppcb = up; 2296a9148feSBjoern A. Zeeb return (0); 2306a9148feSBjoern A. Zeeb } 2316a9148feSBjoern A. Zeeb 2326a9148feSBjoern A. Zeeb void 2336a9148feSBjoern A. Zeeb udp_discardcb(struct udpcb *up) 2346a9148feSBjoern A. Zeeb { 2356a9148feSBjoern A. Zeeb 2366a9148feSBjoern A. Zeeb uma_zfree(V_udpcb_zone, up); 2376a9148feSBjoern A. Zeeb } 2386a9148feSBjoern A. 
#ifdef VIMAGE
/*
 * Per-VNET teardown: release the UDP pcbinfo and the udpcb zone created by
 * udp_init().
 */
void
udp_destroy(void)
{

	in_pcbinfo_destroy(&V_udbinfo);
	uma_zdestroy(V_udpcb_zone);
}
#endif

#ifdef INET
/*
 * Subroutine of udp_input(), which appends the provided mbuf chain to the
 * passed pcb/socket.  The caller must provide a sockaddr_in via udp_in that
 * contains the source address.  If the socket ends up being an IPv6 socket,
 * udp_append() will convert to a sockaddr_in6 before passing the address
 * into the socket code.
 *
 * inp     - destination pcb; must be locked by the caller.
 * ip      - IP header of the datagram, used when saving control options.
 * n       - datagram, starting at the IP header.  May be NULL when the
 *           caller's m_copy() failed; it is still handed to a tunnelling
 *           callback if one is set, otherwise the call is a no-op.
 * off     - offset of the UDP header within n.
 * udp_in  - source address of the datagram.
 *
 * Except for the NULL case, n is always consumed: it is passed on (tunnel
 * callback, ESP decapsulation, socket buffer) or freed here.
 */
static void
udp_append(struct inpcb *inp, struct ip *ip, struct mbuf *n, int off,
    struct sockaddr_in *udp_in)
{
	struct sockaddr *append_sa;
	struct socket *so;
	struct mbuf *opts = NULL;
#ifdef INET6
	struct sockaddr_in6 udp_in6;
#endif
	struct udpcb *up;

	INP_LOCK_ASSERT(inp);

	/*
	 * Every path below dereferences the udpcb, so assert its presence
	 * before the first use rather than after it.
	 */
	up = intoudpcb(inp);
	KASSERT(up != NULL, ("%s: udpcb NULL", __func__));

	/*
	 * Engage the tunneling protocol.
	 */
	if (up->u_tun_func != NULL) {
		(*up->u_tun_func)(n, off, inp);
		return;
	}

	if (n == NULL)
		return;

	/* From here on 'off' addresses the UDP payload. */
	off += sizeof(struct udphdr);

#ifdef IPSEC
	/* Check AH/ESP integrity. */
	if (ipsec4_in_reject(n, inp)) {
		m_freem(n);
		IPSECSTAT_INC(ips_in_polvio);
		return;
	}
#ifdef IPSEC_NAT_T
	if (up->u_flags & UF_ESPINUDP_ALL) {	/* IPSec UDP encaps. */
		n = udp4_espdecap(inp, n, off);
		if (n == NULL)				/* Consumed. */
			return;
	}
#endif /* IPSEC_NAT_T */
#endif /* IPSEC */
#ifdef MAC
	if (mac_inpcb_check_deliver(inp, n) != 0) {
		m_freem(n);
		return;
	}
#endif /* MAC */
	if (inp->inp_flags & INP_CONTROLOPTS ||
	    inp->inp_socket->so_options & (SO_TIMESTAMP | SO_BINTIME)) {
#ifdef INET6
		if (inp->inp_vflag & INP_IPV6)
			(void)ip6_savecontrol_v4(inp, n, &opts, NULL);
		else
#endif /* INET6 */
			ip_savecontrol(inp, &opts, ip, n);
	}
#ifdef INET6
	if (inp->inp_vflag & INP_IPV6) {
		/* IPv6 socket: present the source as a v4-mapped address. */
		bzero(&udp_in6, sizeof(udp_in6));
		udp_in6.sin6_len = sizeof(udp_in6);
		udp_in6.sin6_family = AF_INET6;
		in6_sin_2_v4mapsin6(udp_in, &udp_in6);
		append_sa = (struct sockaddr *)&udp_in6;
	} else
#endif /* INET6 */
		append_sa = (struct sockaddr *)udp_in;

	/* Strip the IP and UDP headers; only payload reaches the socket. */
	m_adj(n, off);

	so = inp->inp_socket;
	SOCKBUF_LOCK(&so->so_rcv);
	if (sbappendaddr_locked(&so->so_rcv, append_sa, n, opts) == 0) {
		/* Append failed: drop the datagram and its control data. */
		SOCKBUF_UNLOCK(&so->so_rcv);
		m_freem(n);
		if (opts)
			m_freem(opts);
		UDPSTAT_INC(udps_fullsock);
	} else
		sorwakeup_locked(so);
}

/*
 * UDP input routine.
 *
 * m    - received packet, starting at the IP header.
 * off  - length of the IP header (including any options).
 *
 * Validates the header, length and checksum, then delivers the datagram:
 * broadcast/multicast destinations are offered to every matching pcb on the
 * UDP pcb list, unicast destinations to the single pcb found by lookup.  If
 * no pcb matches a unicast datagram, an ICMP port unreachable is generated
 * unless the packet was link-level broadcast/multicast, udp_blackhole is
 * set, or the ICMP rate limiter refuses.
 */
void
udp_input(struct mbuf *m, int off)
{
	int iphlen = off;
	struct ip *ip;
	struct udphdr *uh;
	struct ifnet *ifp;
	struct inpcb *inp;
	uint16_t len, ip_len;
	struct ip save_ip;
	struct sockaddr_in udp_in;
	struct m_tag *fwd_tag;

	ifp = m->m_pkthdr.rcvif;
	UDPSTAT_INC(udps_ipackets);

	/*
	 * Strip IP options, if any; should skip this, make available to
	 * user, and use on returned packets, but we don't yet have a way to
	 * check the checksum with options still present.
	 */
	if (iphlen > sizeof (struct ip)) {
		ip_stripoptions(m);
		iphlen = sizeof(struct ip);
	}

	/*
	 * Get IP and UDP header together in first mbuf.
	 */
	ip = mtod(m, struct ip *);
	if (m->m_len < iphlen + sizeof(struct udphdr)) {
		if ((m = m_pullup(m, iphlen + sizeof(struct udphdr))) == NULL) {
			UDPSTAT_INC(udps_hdrops);
			return;
		}
		/* m_pullup() may have replaced the first mbuf. */
		ip = mtod(m, struct ip *);
	}
	uh = (struct udphdr *)((caddr_t)ip + iphlen);

	/*
	 * Destination port of 0 is illegal, based on RFC768.
	 */
	if (uh->uh_dport == 0)
		goto badunlocked;

	/*
	 * Construct sockaddr format source address.  Stuff source address
	 * and datagram in user buffer.
	 */
	bzero(&udp_in, sizeof(udp_in));
	udp_in.sin_len = sizeof(udp_in);
	udp_in.sin_family = AF_INET;
	udp_in.sin_port = uh->uh_sport;
	udp_in.sin_addr = ip->ip_src;

	/*
	 * Make mbuf data length reflect UDP length.  If not enough data to
	 * reflect UDP length, drop.
	 */
	len = ntohs((u_short)uh->uh_ulen);
	ip_len = ntohs(ip->ip_len) - iphlen;
	if (ip_len != len) {
		if (len > ip_len || len < sizeof(struct udphdr)) {
			UDPSTAT_INC(udps_badlen);
			goto badunlocked;
		}
		/* Negative count: trim the excess from the tail. */
		m_adj(m, len - ip_len);
	}

	/*
	 * Save a copy of the IP header in case we want to restore it for
	 * sending an ICMP error message in response.
	 */
	if (!V_udp_blackhole)
		save_ip = *ip;
	else
		memset(&save_ip, 0, sizeof(save_ip));

	/*
	 * Checksum extended UDP header and data.
	 */
	if (uh->uh_sum) {
		u_short uh_sum;

		if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) {
			/* Checksum data supplied in the packet header. */
			if (m->m_pkthdr.csum_flags & CSUM_PSEUDO_HDR)
				uh_sum = m->m_pkthdr.csum_data;
			else
				uh_sum = in_pseudo(ip->ip_src.s_addr,
				    ip->ip_dst.s_addr, htonl((u_short)len +
				    m->m_pkthdr.csum_data + IPPROTO_UDP));
			uh_sum ^= 0xffff;
		} else {
			char b[9];

			/*
			 * Temporarily overlay the IP header with the
			 * pseudo-header for in_cksum(), then put the saved
			 * bytes back.
			 */
			bcopy(((struct ipovly *)ip)->ih_x1, b, 9);
			bzero(((struct ipovly *)ip)->ih_x1, 9);
			((struct ipovly *)ip)->ih_len = uh->uh_ulen;
			uh_sum = in_cksum(m, len + sizeof (struct ip));
			bcopy(b, ((struct ipovly *)ip)->ih_x1, 9);
		}
		if (uh_sum) {
			UDPSTAT_INC(udps_badsum);
			m_freem(m);
			return;
		}
	} else
		UDPSTAT_INC(udps_nosum);

	if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) ||
	    in_broadcast(ip->ip_dst, ifp)) {
		struct inpcb *last;
		struct ip_moptions *imo;

		INP_INFO_RLOCK(&V_udbinfo);
		last = NULL;
		LIST_FOREACH(inp, &V_udb, inp_list) {
			if (inp->inp_lport != uh->uh_dport)
				continue;
#ifdef INET6
			if ((inp->inp_vflag & INP_IPV4) == 0)
				continue;
#endif
			if (inp->inp_laddr.s_addr != INADDR_ANY &&
			    inp->inp_laddr.s_addr != ip->ip_dst.s_addr)
				continue;
			if (inp->inp_faddr.s_addr != INADDR_ANY &&
			    inp->inp_faddr.s_addr != ip->ip_src.s_addr)
				continue;
			if (inp->inp_fport != 0 &&
			    inp->inp_fport != uh->uh_sport)
				continue;

			INP_RLOCK(inp);

			/*
			 * XXXRW: Because we weren't holding either the inpcb
			 * or the hash lock when we checked for a match
			 * before, we should probably recheck now that the
			 * inpcb lock is held.
			 */

			/*
			 * Handle socket delivery policy for any-source
			 * and source-specific multicast. [RFC3678]
			 */
			imo = inp->inp_moptions;
			if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr))) {
				struct sockaddr_in group;
				int blocked;

				if (imo == NULL) {
					INP_RUNLOCK(inp);
					continue;
				}
				bzero(&group, sizeof(struct sockaddr_in));
				group.sin_len = sizeof(struct sockaddr_in);
				group.sin_family = AF_INET;
				group.sin_addr = ip->ip_dst;

				blocked = imo_multi_filter(imo, ifp,
					(struct sockaddr *)&group,
					(struct sockaddr *)&udp_in);
				if (blocked != MCAST_PASS) {
					if (blocked == MCAST_NOTGMEMBER)
						IPSTAT_INC(ips_notmember);
					if (blocked == MCAST_NOTSMEMBER ||
					    blocked == MCAST_MUTED)
						UDPSTAT_INC(udps_filtermcast);
					INP_RUNLOCK(inp);
					continue;
				}
			}

			/*
			 * Delivery runs one match behind: the previous
			 * match gets a copy, so that the final match can be
			 * given the original chain after the loop.
			 */
			if (last != NULL) {
				struct mbuf *n;

				n = m_copy(m, 0, M_COPYALL);
				udp_append(last, ip, n, iphlen, &udp_in);
				INP_RUNLOCK(last);
			}
			last = inp;
			/*
			 * Don't look for additional matches if this one does
			 * not have either the SO_REUSEPORT or SO_REUSEADDR
			 * socket options set.  This heuristic avoids
			 * searching through all pcbs in the common case of a
			 * non-shared port.  It assumes that an application
			 * will never clear these options after setting them.
			 */
			if ((last->inp_socket->so_options &
			    (SO_REUSEPORT|SO_REUSEADDR)) == 0)
				break;
		}

		if (last == NULL) {
			/*
			 * No matching pcb found; discard datagram.  (No need
			 * to send an ICMP Port Unreachable for a broadcast
			 * or multicast datagram.)
			 */
			UDPSTAT_INC(udps_noportbcast);
			if (inp)
				INP_RUNLOCK(inp);
			INP_INFO_RUNLOCK(&V_udbinfo);
			goto badunlocked;
		}
		udp_append(last, ip, m, iphlen, &udp_in);
		INP_RUNLOCK(last);
		INP_INFO_RUNLOCK(&V_udbinfo);
		return;
	}

	/*
	 * Locate pcb for datagram.
	 */

	/*
	 * Grab info from PACKET_TAG_IPFORWARD tag prepended to the chain.
	 */
	if ((m->m_flags & M_IP_NEXTHOP) &&
	    (fwd_tag = m_tag_find(m, PACKET_TAG_IPFORWARD, NULL)) != NULL) {
		struct sockaddr_in *next_hop;

		/* The next-hop sockaddr is stored right after the tag. */
		next_hop = (struct sockaddr_in *)(fwd_tag + 1);

		/*
		 * Transparently forwarded. Pretend to be the destination.
		 * Already got one like this?
		 */
		inp = in_pcblookup_mbuf(&V_udbinfo, ip->ip_src, uh->uh_sport,
		    ip->ip_dst, uh->uh_dport, INPLOOKUP_RLOCKPCB, ifp, m);
		if (!inp) {
			/*
			 * It's new.  Try to find the ambushing socket.
			 * Because we've rewritten the destination address,
			 * any hardware-generated hash is ignored.
			 */
			inp = in_pcblookup(&V_udbinfo, ip->ip_src,
			    uh->uh_sport, next_hop->sin_addr,
			    next_hop->sin_port ? htons(next_hop->sin_port) :
			    uh->uh_dport, INPLOOKUP_WILDCARD |
			    INPLOOKUP_RLOCKPCB, ifp);
		}
		/* Remove the tag from the packet. We don't need it anymore. */
		m_tag_delete(m, fwd_tag);
		m->m_flags &= ~M_IP_NEXTHOP;
	} else
		inp = in_pcblookup_mbuf(&V_udbinfo, ip->ip_src, uh->uh_sport,
		    ip->ip_dst, uh->uh_dport, INPLOOKUP_WILDCARD |
		    INPLOOKUP_RLOCKPCB, ifp, m);
	if (inp == NULL) {
		if (udp_log_in_vain) {
			/* Room for a dotted quad plus the terminating NUL. */
			char buf[4*sizeof "123"];

			/*
			 * inet_ntoa() is called twice for one log line, so
			 * the first result is copied out; keep the copy
			 * bounded by the buffer size.
			 */
			strlcpy(buf, inet_ntoa(ip->ip_dst), sizeof(buf));
			log(LOG_INFO,
			    "Connection attempt to UDP %s:%d from %s:%d\n",
			    buf, ntohs(uh->uh_dport), inet_ntoa(ip->ip_src),
			    ntohs(uh->uh_sport));
		}
		UDPSTAT_INC(udps_noport);
		if (m->m_flags & (M_BCAST | M_MCAST)) {
			UDPSTAT_INC(udps_noportbcast);
			goto badunlocked;
		}
		if (V_udp_blackhole)
			goto badunlocked;
		if (badport_bandlim(BANDLIM_ICMP_UNREACH) < 0)
			goto badunlocked;
		/* Undo the checksum overlay before quoting the header. */
		*ip = save_ip;
		icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_PORT, 0, 0);
		return;
	}

	/*
	 * Check the minimum TTL for socket.
	 */
	INP_RLOCK_ASSERT(inp);
	if (inp->inp_ip_minttl && inp->inp_ip_minttl > ip->ip_ttl) {
		INP_RUNLOCK(inp);
		m_freem(m);
		return;
	}

	UDP_PROBE(receive, NULL, inp, ip, inp, uh);
	udp_append(inp, ip, m, iphlen, &udp_in);
	INP_RUNLOCK(inp);
	return;

badunlocked:
	/* Common drop path; no pcb or pcbinfo lock is held here. */
	m_freem(m);
}
#endif /* INET */
Zeeb #endif /* INET */ 633cfa1ca9dSYoshinobu Inoue 634cfa1ca9dSYoshinobu Inoue /* 6353329b236SRobert Watson * Notify a udp user of an asynchronous error; just wake up so that they can 6363329b236SRobert Watson * collect error status. 637df8bae1dSRodney W. Grimes */ 6383ce144eaSJeffrey Hsu struct inpcb * 6393329b236SRobert Watson udp_notify(struct inpcb *inp, int errno) 640df8bae1dSRodney W. Grimes { 6413329b236SRobert Watson 642ac9ae279SRobert Watson /* 643ac9ae279SRobert Watson * While udp_ctlinput() always calls udp_notify() with a read lock 644ac9ae279SRobert Watson * when invoking it directly, in_pcbnotifyall() currently uses write 645ac9ae279SRobert Watson * locks due to sharing code with TCP. For now, accept either a read 646ac9ae279SRobert Watson * or a write lock, but a read lock is sufficient. 647ac9ae279SRobert Watson */ 648ac9ae279SRobert Watson INP_LOCK_ASSERT(inp); 6498501a69cSRobert Watson 650df8bae1dSRodney W. Grimes inp->inp_socket->so_error = errno; 651df8bae1dSRodney W. Grimes sorwakeup(inp->inp_socket); 652df8bae1dSRodney W. Grimes sowwakeup(inp->inp_socket); 6533329b236SRobert Watson return (inp); 654df8bae1dSRodney W. Grimes } 655df8bae1dSRodney W. Grimes 65679288c11SBjoern A. Zeeb #ifdef INET 657df8bae1dSRodney W. Grimes void 6583329b236SRobert Watson udp_ctlinput(int cmd, struct sockaddr *sa, void *vip) 659df8bae1dSRodney W. Grimes { 660c693a045SJonathan Lemon struct ip *ip = vip; 661c693a045SJonathan Lemon struct udphdr *uh; 662c693a045SJonathan Lemon struct in_addr faddr; 663c693a045SJonathan Lemon struct inpcb *inp; 664c693a045SJonathan Lemon 665c693a045SJonathan Lemon faddr = ((struct sockaddr_in *)sa)->sin_addr; 666c693a045SJonathan Lemon if (sa->sa_family != AF_INET || faddr.s_addr == INADDR_ANY) 667c693a045SJonathan Lemon return; 668df8bae1dSRodney W. Grimes 66997d8d152SAndre Oppermann /* 67097d8d152SAndre Oppermann * Redirects don't need to be handled up here. 
67197d8d152SAndre Oppermann */ 67297d8d152SAndre Oppermann if (PRC_IS_REDIRECT(cmd)) 67397d8d152SAndre Oppermann return; 6743329b236SRobert Watson 67597d8d152SAndre Oppermann /* 67697d8d152SAndre Oppermann * Hostdead is ugly because it goes linearly through all PCBs. 6773329b236SRobert Watson * 6783329b236SRobert Watson * XXX: We never get this from ICMP, otherwise it makes an excellent 6793329b236SRobert Watson * DoS attack on machines with many connections. 68097d8d152SAndre Oppermann */ 68197d8d152SAndre Oppermann if (cmd == PRC_HOSTDEAD) 682af1ee11dSRobert Watson ip = NULL; 683d1c54148SJesper Skriver else if ((unsigned)cmd >= PRC_NCMDS || inetctlerrmap[cmd] == 0) 684df8bae1dSRodney W. Grimes return; 685af1ee11dSRobert Watson if (ip != NULL) { 686df8bae1dSRodney W. Grimes uh = (struct udphdr *)((caddr_t)ip + (ip->ip_hl << 2)); 687fa046d87SRobert Watson inp = in_pcblookup(&V_udbinfo, faddr, uh->uh_dport, 688fa046d87SRobert Watson ip->ip_src, uh->uh_sport, INPLOOKUP_RLOCKPCB, NULL); 689f76fcf6dSJeffrey Hsu if (inp != NULL) { 690fa046d87SRobert Watson INP_RLOCK_ASSERT(inp); 691f76fcf6dSJeffrey Hsu if (inp->inp_socket != NULL) { 692f5514f08SRobert Watson udp_notify(inp, inetctlerrmap[cmd]); 693f76fcf6dSJeffrey Hsu } 694ac9ae279SRobert Watson INP_RUNLOCK(inp); 695f76fcf6dSJeffrey Hsu } 696df8bae1dSRodney W. Grimes } else 697603724d3SBjoern A. Zeeb in_pcbnotifyall(&V_udbinfo, faddr, inetctlerrmap[cmd], 698f5514f08SRobert Watson udp_notify); 699df8bae1dSRodney W. Grimes } 70079288c11SBjoern A. Zeeb #endif /* INET */ 701df8bae1dSRodney W. 
Grimes 7020312fbe9SPoul-Henning Kamp static int 70382d9ae4eSPoul-Henning Kamp udp_pcblist(SYSCTL_HANDLER_ARGS) 70498271db4SGarrett Wollman { 705277afaffSRobert Watson int error, i, n; 70698271db4SGarrett Wollman struct inpcb *inp, **inp_list; 70798271db4SGarrett Wollman inp_gen_t gencnt; 70898271db4SGarrett Wollman struct xinpgen xig; 70998271db4SGarrett Wollman 71098271db4SGarrett Wollman /* 711f5514f08SRobert Watson * The process of preparing the PCB list is too time-consuming and 71298271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 71398271db4SGarrett Wollman */ 71498271db4SGarrett Wollman if (req->oldptr == 0) { 715603724d3SBjoern A. Zeeb n = V_udbinfo.ipi_count; 716c007b96aSJohn Baldwin n += imax(n / 8, 10); 717c007b96aSJohn Baldwin req->oldidx = 2 * (sizeof xig) + n * sizeof(struct xinpcb); 7183329b236SRobert Watson return (0); 71998271db4SGarrett Wollman } 72098271db4SGarrett Wollman 72198271db4SGarrett Wollman if (req->newptr != 0) 7223329b236SRobert Watson return (EPERM); 72398271db4SGarrett Wollman 72498271db4SGarrett Wollman /* 72598271db4SGarrett Wollman * OK, now we're committed to doing something. 72698271db4SGarrett Wollman */ 727603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 728603724d3SBjoern A. Zeeb gencnt = V_udbinfo.ipi_gencnt; 729603724d3SBjoern A. Zeeb n = V_udbinfo.ipi_count; 730603724d3SBjoern A. 
Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 73198271db4SGarrett Wollman 73247934cefSDon Lewis error = sysctl_wire_old_buffer(req, 2 * (sizeof xig) 7335c38b6dbSDon Lewis + n * sizeof(struct xinpcb)); 73447934cefSDon Lewis if (error != 0) 73547934cefSDon Lewis return (error); 7365c38b6dbSDon Lewis 73798271db4SGarrett Wollman xig.xig_len = sizeof xig; 73898271db4SGarrett Wollman xig.xig_count = n; 73998271db4SGarrett Wollman xig.xig_gen = gencnt; 74098271db4SGarrett Wollman xig.xig_sogen = so_gencnt; 74198271db4SGarrett Wollman error = SYSCTL_OUT(req, &xig, sizeof xig); 74298271db4SGarrett Wollman if (error) 7433329b236SRobert Watson return (error); 74498271db4SGarrett Wollman 745a163d034SWarner Losh inp_list = malloc(n * sizeof *inp_list, M_TEMP, M_WAITOK); 74698271db4SGarrett Wollman if (inp_list == 0) 7473329b236SRobert Watson return (ENOMEM); 74898271db4SGarrett Wollman 749603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 750603724d3SBjoern A. Zeeb for (inp = LIST_FIRST(V_udbinfo.ipi_listhead), i = 0; inp && i < n; 751fc2ffbe6SPoul-Henning Kamp inp = LIST_NEXT(inp, inp_list)) { 752d0e157f6SBjoern A. Zeeb INP_WLOCK(inp); 7532ded288cSJeffrey Hsu if (inp->inp_gencnt <= gencnt && 754d0e157f6SBjoern A. Zeeb cr_canseeinpcb(req->td->td_ucred, inp) == 0) { 755d0e157f6SBjoern A. Zeeb in_pcbref(inp); 75698271db4SGarrett Wollman inp_list[i++] = inp; 757d0e157f6SBjoern A. Zeeb } 758d0e157f6SBjoern A. Zeeb INP_WUNLOCK(inp); 7594787fd37SPaul Saab } 760603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 76198271db4SGarrett Wollman n = i; 76298271db4SGarrett Wollman 76398271db4SGarrett Wollman error = 0; 76498271db4SGarrett Wollman for (i = 0; i < n; i++) { 76598271db4SGarrett Wollman inp = inp_list[i]; 7669622e84fSRobert Watson INP_RLOCK(inp); 76798271db4SGarrett Wollman if (inp->inp_gencnt <= gencnt) { 76898271db4SGarrett Wollman struct xinpcb xi; 769d0e157f6SBjoern A. 
Zeeb 770fd94099eSColin Percival bzero(&xi, sizeof(xi)); 77198271db4SGarrett Wollman xi.xi_len = sizeof xi; 77298271db4SGarrett Wollman /* XXX should avoid extra copy */ 77398271db4SGarrett Wollman bcopy(inp, &xi.xi_inp, sizeof *inp); 77498271db4SGarrett Wollman if (inp->inp_socket) 77598271db4SGarrett Wollman sotoxsocket(inp->inp_socket, &xi.xi_socket); 7764b40c56cSJeffrey Hsu xi.xi_inp.inp_gencnt = inp->inp_gencnt; 7779622e84fSRobert Watson INP_RUNLOCK(inp); 77898271db4SGarrett Wollman error = SYSCTL_OUT(req, &xi, sizeof xi); 779d915b280SStephan Uphoff } else 7809622e84fSRobert Watson INP_RUNLOCK(inp); 78198271db4SGarrett Wollman } 782d0e157f6SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 783d0e157f6SBjoern A. Zeeb for (i = 0; i < n; i++) { 784d0e157f6SBjoern A. Zeeb inp = inp_list[i]; 785fa046d87SRobert Watson INP_RLOCK(inp); 786fa046d87SRobert Watson if (!in_pcbrele_rlocked(inp)) 787fa046d87SRobert Watson INP_RUNLOCK(inp); 788d0e157f6SBjoern A. Zeeb } 789d0e157f6SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 790d0e157f6SBjoern A. Zeeb 79198271db4SGarrett Wollman if (!error) { 79298271db4SGarrett Wollman /* 7933329b236SRobert Watson * Give the user an updated idea of our state. If the 7943329b236SRobert Watson * generation differs from what we told her before, she knows 7953329b236SRobert Watson * that something happened while we were processing this 7963329b236SRobert Watson * request, and it might be necessary to retry. 79798271db4SGarrett Wollman */ 798603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 799603724d3SBjoern A. Zeeb xig.xig_gen = V_udbinfo.ipi_gencnt; 80098271db4SGarrett Wollman xig.xig_sogen = so_gencnt; 801603724d3SBjoern A. Zeeb xig.xig_count = V_udbinfo.ipi_count; 802603724d3SBjoern A. 
Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 80398271db4SGarrett Wollman error = SYSCTL_OUT(req, &xig, sizeof xig); 80498271db4SGarrett Wollman } 80598271db4SGarrett Wollman free(inp_list, M_TEMP); 8063329b236SRobert Watson return (error); 80798271db4SGarrett Wollman } 80898271db4SGarrett Wollman 80979c3d51bSMatthew D Fleming SYSCTL_PROC(_net_inet_udp, UDPCTL_PCBLIST, pcblist, 81079c3d51bSMatthew D Fleming CTLTYPE_OPAQUE | CTLFLAG_RD, NULL, 0, 81198271db4SGarrett Wollman udp_pcblist, "S,xinpcb", "List of active UDP sockets"); 81298271db4SGarrett Wollman 81379288c11SBjoern A. Zeeb #ifdef INET 81498271db4SGarrett Wollman static int 81582d9ae4eSPoul-Henning Kamp udp_getcred(SYSCTL_HANDLER_ARGS) 816490d50b6SBrian Feldman { 817c0511d3bSBrian Feldman struct xucred xuc; 818490d50b6SBrian Feldman struct sockaddr_in addrs[2]; 819490d50b6SBrian Feldman struct inpcb *inp; 820277afaffSRobert Watson int error; 821490d50b6SBrian Feldman 82232f9753cSRobert Watson error = priv_check(req->td, PRIV_NETINET_GETCRED); 823490d50b6SBrian Feldman if (error) 824490d50b6SBrian Feldman return (error); 825490d50b6SBrian Feldman error = SYSCTL_IN(req, addrs, sizeof(addrs)); 826490d50b6SBrian Feldman if (error) 827490d50b6SBrian Feldman return (error); 828fa046d87SRobert Watson inp = in_pcblookup(&V_udbinfo, addrs[1].sin_addr, addrs[1].sin_port, 829fa046d87SRobert Watson addrs[0].sin_addr, addrs[0].sin_port, 830fa046d87SRobert Watson INPLOOKUP_WILDCARD | INPLOOKUP_RLOCKPCB, NULL); 8319622e84fSRobert Watson if (inp != NULL) { 832fa046d87SRobert Watson INP_RLOCK_ASSERT(inp); 8339622e84fSRobert Watson if (inp->inp_socket == NULL) 8349622e84fSRobert Watson error = ENOENT; 8359622e84fSRobert Watson if (error == 0) 836f08ef6c5SBjoern A. Zeeb error = cr_canseeinpcb(req->td->td_ucred, inp); 8379622e84fSRobert Watson if (error == 0) 83886d02c5cSBjoern A. 
Zeeb cru2x(inp->inp_cred, &xuc); 8399622e84fSRobert Watson INP_RUNLOCK(inp); 840fa046d87SRobert Watson } else 8419622e84fSRobert Watson error = ENOENT; 8420e1eebb8SDon Lewis if (error == 0) 8430e1eebb8SDon Lewis error = SYSCTL_OUT(req, &xuc, sizeof(struct xucred)); 844490d50b6SBrian Feldman return (error); 845490d50b6SBrian Feldman } 846490d50b6SBrian Feldman 8477ce87f12SDavid Malone SYSCTL_PROC(_net_inet_udp, OID_AUTO, getcred, 8487ce87f12SDavid Malone CTLTYPE_OPAQUE|CTLFLAG_RW|CTLFLAG_PRISON, 0, 0, 8497ce87f12SDavid Malone udp_getcred, "S,xucred", "Get the xucred of a UDP connection"); 85079288c11SBjoern A. Zeeb #endif /* INET */ 851490d50b6SBrian Feldman 8527b495c44SVANHULLEBUS Yvan int 8537b495c44SVANHULLEBUS Yvan udp_ctloutput(struct socket *so, struct sockopt *sopt) 8547b495c44SVANHULLEBUS Yvan { 8557b495c44SVANHULLEBUS Yvan int error = 0, optval; 8567b495c44SVANHULLEBUS Yvan struct inpcb *inp; 8577b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8587b495c44SVANHULLEBUS Yvan struct udpcb *up; 8597b495c44SVANHULLEBUS Yvan #endif 8607b495c44SVANHULLEBUS Yvan 8617b495c44SVANHULLEBUS Yvan inp = sotoinpcb(so); 8627b495c44SVANHULLEBUS Yvan KASSERT(inp != NULL, ("%s: inp == NULL", __func__)); 8637b495c44SVANHULLEBUS Yvan INP_WLOCK(inp); 8647b495c44SVANHULLEBUS Yvan if (sopt->sopt_level != IPPROTO_UDP) { 8657b495c44SVANHULLEBUS Yvan #ifdef INET6 8667b495c44SVANHULLEBUS Yvan if (INP_CHECK_SOCKAF(so, AF_INET6)) { 8677b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8687b495c44SVANHULLEBUS Yvan error = ip6_ctloutput(so, sopt); 86979288c11SBjoern A. Zeeb } 8707b495c44SVANHULLEBUS Yvan #endif 87179288c11SBjoern A. Zeeb #if defined(INET) && defined(INET6) 87279288c11SBjoern A. Zeeb else 87379288c11SBjoern A. Zeeb #endif 87479288c11SBjoern A. Zeeb #ifdef INET 87579288c11SBjoern A. 
Zeeb { 8767b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8777b495c44SVANHULLEBUS Yvan error = ip_ctloutput(so, sopt); 8787b495c44SVANHULLEBUS Yvan } 8797b495c44SVANHULLEBUS Yvan #endif 8807b495c44SVANHULLEBUS Yvan return (error); 8817b495c44SVANHULLEBUS Yvan } 8827b495c44SVANHULLEBUS Yvan 8837b495c44SVANHULLEBUS Yvan switch (sopt->sopt_dir) { 8847b495c44SVANHULLEBUS Yvan case SOPT_SET: 8857b495c44SVANHULLEBUS Yvan switch (sopt->sopt_name) { 8867b495c44SVANHULLEBUS Yvan case UDP_ENCAP: 8877b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 8887b495c44SVANHULLEBUS Yvan error = sooptcopyin(sopt, &optval, sizeof optval, 8897b495c44SVANHULLEBUS Yvan sizeof optval); 8907b495c44SVANHULLEBUS Yvan if (error) 8917b495c44SVANHULLEBUS Yvan break; 8927b495c44SVANHULLEBUS Yvan inp = sotoinpcb(so); 8937b495c44SVANHULLEBUS Yvan KASSERT(inp != NULL, ("%s: inp == NULL", __func__)); 8947b495c44SVANHULLEBUS Yvan INP_WLOCK(inp); 8957b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 8967b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 8977b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: up == NULL", __func__)); 8987b495c44SVANHULLEBUS Yvan #endif 8997b495c44SVANHULLEBUS Yvan switch (optval) { 9007b495c44SVANHULLEBUS Yvan case 0: 9017b495c44SVANHULLEBUS Yvan /* Clear all UDP encap. 
*/ 9027b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 9037b495c44SVANHULLEBUS Yvan up->u_flags &= ~UF_ESPINUDP_ALL; 9047b495c44SVANHULLEBUS Yvan #endif 9057b495c44SVANHULLEBUS Yvan break; 9067b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 9077b495c44SVANHULLEBUS Yvan case UDP_ENCAP_ESPINUDP: 9087b495c44SVANHULLEBUS Yvan case UDP_ENCAP_ESPINUDP_NON_IKE: 9097b495c44SVANHULLEBUS Yvan up->u_flags &= ~UF_ESPINUDP_ALL; 9107b495c44SVANHULLEBUS Yvan if (optval == UDP_ENCAP_ESPINUDP) 9117b495c44SVANHULLEBUS Yvan up->u_flags |= UF_ESPINUDP; 9127b495c44SVANHULLEBUS Yvan else if (optval == UDP_ENCAP_ESPINUDP_NON_IKE) 9137b495c44SVANHULLEBUS Yvan up->u_flags |= UF_ESPINUDP_NON_IKE; 9147b495c44SVANHULLEBUS Yvan break; 9157b495c44SVANHULLEBUS Yvan #endif 9167b495c44SVANHULLEBUS Yvan default: 9177b495c44SVANHULLEBUS Yvan error = EINVAL; 9187b495c44SVANHULLEBUS Yvan break; 9197b495c44SVANHULLEBUS Yvan } 9207b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 9217b495c44SVANHULLEBUS Yvan break; 9227b495c44SVANHULLEBUS Yvan default: 9237b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 9247b495c44SVANHULLEBUS Yvan error = ENOPROTOOPT; 9257b495c44SVANHULLEBUS Yvan break; 9267b495c44SVANHULLEBUS Yvan } 9277b495c44SVANHULLEBUS Yvan break; 9287b495c44SVANHULLEBUS Yvan case SOPT_GET: 9297b495c44SVANHULLEBUS Yvan switch (sopt->sopt_name) { 9307b495c44SVANHULLEBUS Yvan #ifdef IPSEC_NAT_T 9317b495c44SVANHULLEBUS Yvan case UDP_ENCAP: 9327b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 9337b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: up == NULL", __func__)); 9347b495c44SVANHULLEBUS Yvan optval = up->u_flags & UF_ESPINUDP_ALL; 9357b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 9367b495c44SVANHULLEBUS Yvan error = sooptcopyout(sopt, &optval, sizeof optval); 9377b495c44SVANHULLEBUS Yvan break; 9387b495c44SVANHULLEBUS Yvan #endif 9397b495c44SVANHULLEBUS Yvan default: 9407b495c44SVANHULLEBUS Yvan INP_WUNLOCK(inp); 9417b495c44SVANHULLEBUS Yvan error = ENOPROTOOPT; 9427b495c44SVANHULLEBUS Yvan break; 
9437b495c44SVANHULLEBUS Yvan } 9447b495c44SVANHULLEBUS Yvan break; 9457b495c44SVANHULLEBUS Yvan } 9467b495c44SVANHULLEBUS Yvan return (error); 9477b495c44SVANHULLEBUS Yvan } 9487b495c44SVANHULLEBUS Yvan 94979288c11SBjoern A. Zeeb #ifdef INET 950fa046d87SRobert Watson #define UH_WLOCKED 2 951fa046d87SRobert Watson #define UH_RLOCKED 1 952fa046d87SRobert Watson #define UH_UNLOCKED 0 953490d50b6SBrian Feldman static int 9543329b236SRobert Watson udp_output(struct inpcb *inp, struct mbuf *m, struct sockaddr *addr, 9553329b236SRobert Watson struct mbuf *control, struct thread *td) 956df8bae1dSRodney W. Grimes { 9573329b236SRobert Watson struct udpiphdr *ui; 9583329b236SRobert Watson int len = m->m_pkthdr.len; 95990162a4eSIan Dowse struct in_addr faddr, laddr; 960c557ae16SIan Dowse struct cmsghdr *cm; 961c557ae16SIan Dowse struct sockaddr_in *sin, src; 96290162a4eSIan Dowse int error = 0; 9638afa2304SBruce M Simpson int ipflags; 96490162a4eSIan Dowse u_short fport, lport; 9655c32ea65SRobert Watson int unlock_udbinfo; 966f584d74bSMichael Tuexen u_char tos; 967df8bae1dSRodney W. Grimes 9685c32ea65SRobert Watson /* 9695c32ea65SRobert Watson * udp_output() may need to temporarily bind or connect the current 970f5514f08SRobert Watson * inpcb. As such, we don't know up front whether we will need the 971f5514f08SRobert Watson * pcbinfo lock or not. Do any work to decide what is needed up 972f5514f08SRobert Watson * front before acquiring any locks. 9735c32ea65SRobert Watson */ 974430d30d8SBill Fenner if (len + sizeof(struct udpiphdr) > IP_MAXPACKET) { 975c557ae16SIan Dowse if (control) 976c557ae16SIan Dowse m_freem(control); 9775c32ea65SRobert Watson m_freem(m); 9783329b236SRobert Watson return (EMSGSIZE); 979430d30d8SBill Fenner } 980430d30d8SBill Fenner 9811b7f0384SBruce M Simpson src.sin_family = 0; 9820cfdff24SBjoern A. 
Zeeb INP_RLOCK(inp); 983f584d74bSMichael Tuexen tos = inp->inp_ip_tos; 984c557ae16SIan Dowse if (control != NULL) { 985c557ae16SIan Dowse /* 9863329b236SRobert Watson * XXX: Currently, we assume all the optional information is 9873329b236SRobert Watson * stored in a single mbuf. 988c557ae16SIan Dowse */ 989c557ae16SIan Dowse if (control->m_next) { 9900cfdff24SBjoern A. Zeeb INP_RUNLOCK(inp); 991c557ae16SIan Dowse m_freem(control); 9925c32ea65SRobert Watson m_freem(m); 9933329b236SRobert Watson return (EINVAL); 994c557ae16SIan Dowse } 995c557ae16SIan Dowse for (; control->m_len > 0; 996c557ae16SIan Dowse control->m_data += CMSG_ALIGN(cm->cmsg_len), 997c557ae16SIan Dowse control->m_len -= CMSG_ALIGN(cm->cmsg_len)) { 998c557ae16SIan Dowse cm = mtod(control, struct cmsghdr *); 999af1ee11dSRobert Watson if (control->m_len < sizeof(*cm) || cm->cmsg_len == 0 1000af1ee11dSRobert Watson || cm->cmsg_len > control->m_len) { 1001c557ae16SIan Dowse error = EINVAL; 1002c557ae16SIan Dowse break; 1003c557ae16SIan Dowse } 1004c557ae16SIan Dowse if (cm->cmsg_level != IPPROTO_IP) 1005c557ae16SIan Dowse continue; 1006c557ae16SIan Dowse 1007c557ae16SIan Dowse switch (cm->cmsg_type) { 1008c557ae16SIan Dowse case IP_SENDSRCADDR: 1009c557ae16SIan Dowse if (cm->cmsg_len != 1010c557ae16SIan Dowse CMSG_LEN(sizeof(struct in_addr))) { 1011c557ae16SIan Dowse error = EINVAL; 1012c557ae16SIan Dowse break; 1013c557ae16SIan Dowse } 1014c557ae16SIan Dowse bzero(&src, sizeof(src)); 1015c557ae16SIan Dowse src.sin_family = AF_INET; 1016c557ae16SIan Dowse src.sin_len = sizeof(src); 1017c557ae16SIan Dowse src.sin_port = inp->inp_lport; 1018af1ee11dSRobert Watson src.sin_addr = 1019af1ee11dSRobert Watson *(struct in_addr *)CMSG_DATA(cm); 1020c557ae16SIan Dowse break; 1021af1ee11dSRobert Watson 1022f584d74bSMichael Tuexen case IP_TOS: 1023f584d74bSMichael Tuexen if (cm->cmsg_len != CMSG_LEN(sizeof(u_char))) { 1024f584d74bSMichael Tuexen error = EINVAL; 1025f584d74bSMichael Tuexen break; 
1026f584d74bSMichael Tuexen } 1027f584d74bSMichael Tuexen tos = *(u_char *)CMSG_DATA(cm); 1028f584d74bSMichael Tuexen break; 1029f584d74bSMichael Tuexen 1030c557ae16SIan Dowse default: 1031c557ae16SIan Dowse error = ENOPROTOOPT; 1032c557ae16SIan Dowse break; 1033c557ae16SIan Dowse } 1034c557ae16SIan Dowse if (error) 1035c557ae16SIan Dowse break; 1036c557ae16SIan Dowse } 1037c557ae16SIan Dowse m_freem(control); 1038c557ae16SIan Dowse } 10395c32ea65SRobert Watson if (error) { 10400cfdff24SBjoern A. Zeeb INP_RUNLOCK(inp); 10415c32ea65SRobert Watson m_freem(m); 10423329b236SRobert Watson return (error); 10435c32ea65SRobert Watson } 10445c32ea65SRobert Watson 104543cc0bc1SRobert Watson /* 104643cc0bc1SRobert Watson * Depending on whether or not the application has bound or connected 1047ca528788SRobert Watson * the socket, we may have to do varying levels of work. The optimal 1048ca528788SRobert Watson * case is for a connected UDP socket, as a global lock isn't 1049ca528788SRobert Watson * required at all. 105043cc0bc1SRobert Watson * 105143cc0bc1SRobert Watson * In order to decide which we need, we require stability of the 105243cc0bc1SRobert Watson * inpcb binding, which we ensure by acquiring a read lock on the 105343cc0bc1SRobert Watson * inpcb. This doesn't strictly follow the lock order, so we play 105443cc0bc1SRobert Watson * the trylock and retry game; note that we may end up with more 105543cc0bc1SRobert Watson * conservative locks than required the second time around, so later 105643cc0bc1SRobert Watson * assertions have to accept that. Further analysis of the number of 105743cc0bc1SRobert Watson * misses under contention is required. 1058fa046d87SRobert Watson * 1059fa046d87SRobert Watson * XXXRW: Check that hash locking update here is correct. 
106043cc0bc1SRobert Watson */ 106143cc0bc1SRobert Watson sin = (struct sockaddr_in *)addr; 106243cc0bc1SRobert Watson if (sin != NULL && 106343cc0bc1SRobert Watson (inp->inp_laddr.s_addr == INADDR_ANY && inp->inp_lport == 0)) { 106443cc0bc1SRobert Watson INP_RUNLOCK(inp); 10658501a69cSRobert Watson INP_WLOCK(inp); 1066fa046d87SRobert Watson INP_HASH_WLOCK(&V_udbinfo); 1067fa046d87SRobert Watson unlock_udbinfo = UH_WLOCKED; 106843cc0bc1SRobert Watson } else if ((sin != NULL && ( 106943cc0bc1SRobert Watson (sin->sin_addr.s_addr == INADDR_ANY) || 107043cc0bc1SRobert Watson (sin->sin_addr.s_addr == INADDR_BROADCAST) || 107143cc0bc1SRobert Watson (inp->inp_laddr.s_addr == INADDR_ANY) || 107243cc0bc1SRobert Watson (inp->inp_lport == 0))) || 107343cc0bc1SRobert Watson (src.sin_family == AF_INET)) { 1074fa046d87SRobert Watson INP_HASH_RLOCK(&V_udbinfo); 1075fa046d87SRobert Watson unlock_udbinfo = UH_RLOCKED; 107643cc0bc1SRobert Watson } else 1077fa046d87SRobert Watson unlock_udbinfo = UH_UNLOCKED; 10785c32ea65SRobert Watson 10791b7f0384SBruce M Simpson /* 10801b7f0384SBruce M Simpson * If the IP_SENDSRCADDR control message was specified, override the 10811b7f0384SBruce M Simpson * source address for this datagram. Its use is invalidated if the 10821b7f0384SBruce M Simpson * address thus specified is incomplete or clobbers other inpcbs. 
10831b7f0384SBruce M Simpson */ 108490162a4eSIan Dowse laddr = inp->inp_laddr; 108590162a4eSIan Dowse lport = inp->inp_lport; 10861b7f0384SBruce M Simpson if (src.sin_family == AF_INET) { 1087fa046d87SRobert Watson INP_HASH_LOCK_ASSERT(&V_udbinfo); 10881b7f0384SBruce M Simpson if ((lport == 0) || 10891b7f0384SBruce M Simpson (laddr.s_addr == INADDR_ANY && 10901b7f0384SBruce M Simpson src.sin_addr.s_addr == INADDR_ANY)) { 1091c557ae16SIan Dowse error = EINVAL; 1092c557ae16SIan Dowse goto release; 1093c557ae16SIan Dowse } 1094c557ae16SIan Dowse error = in_pcbbind_setup(inp, (struct sockaddr *)&src, 1095b0330ed9SPawel Jakub Dawidek &laddr.s_addr, &lport, td->td_ucred); 1096c557ae16SIan Dowse if (error) 1097c557ae16SIan Dowse goto release; 1098c557ae16SIan Dowse } 1099c557ae16SIan Dowse 11003144b7d3SRobert Watson /* 11013144b7d3SRobert Watson * If a UDP socket has been connected, then a local address/port will 11023144b7d3SRobert Watson * have been selected and bound. 11033144b7d3SRobert Watson * 110443cc0bc1SRobert Watson * If a UDP socket has not been connected to, then an explicit 11053144b7d3SRobert Watson * destination address must be used, in which case a local 11063144b7d3SRobert Watson * address/port may not have been selected and bound. 11073144b7d3SRobert Watson */ 110843cc0bc1SRobert Watson if (sin != NULL) { 1109c4d585aeSRobert Watson INP_LOCK_ASSERT(inp); 1110df8bae1dSRodney W. Grimes if (inp->inp_faddr.s_addr != INADDR_ANY) { 1111df8bae1dSRodney W. Grimes error = EISCONN; 1112df8bae1dSRodney W. Grimes goto release; 1113df8bae1dSRodney W. Grimes } 11143144b7d3SRobert Watson 11153144b7d3SRobert Watson /* 11163144b7d3SRobert Watson * Jail may rewrite the destination address, so let it do 11173144b7d3SRobert Watson * that before we use it. 11183144b7d3SRobert Watson */ 1119b89e82ddSJamie Gritton error = prison_remote_ip4(td->td_ucred, &sin->sin_addr); 1120b89e82ddSJamie Gritton if (error) 1121413628a7SBjoern A. 
Zeeb goto release; 11223144b7d3SRobert Watson 11233144b7d3SRobert Watson /* 112443cc0bc1SRobert Watson * If a local address or port hasn't yet been selected, or if 112543cc0bc1SRobert Watson * the destination address needs to be rewritten due to using 112643cc0bc1SRobert Watson * a special INADDR_ constant, invoke in_pcbconnect_setup() 112743cc0bc1SRobert Watson * to do the heavy lifting. Once a port is selected, we 112843cc0bc1SRobert Watson * commit the binding back to the socket; we also commit the 112943cc0bc1SRobert Watson * binding of the address if in jail. 113043cc0bc1SRobert Watson * 113143cc0bc1SRobert Watson * If we already have a valid binding and we're not 113243cc0bc1SRobert Watson * requesting a destination address rewrite, use a fast path. 11333144b7d3SRobert Watson */ 113443cc0bc1SRobert Watson if (inp->inp_laddr.s_addr == INADDR_ANY || 113543cc0bc1SRobert Watson inp->inp_lport == 0 || 113643cc0bc1SRobert Watson sin->sin_addr.s_addr == INADDR_ANY || 113743cc0bc1SRobert Watson sin->sin_addr.s_addr == INADDR_BROADCAST) { 1138fa046d87SRobert Watson INP_HASH_LOCK_ASSERT(&V_udbinfo); 113943cc0bc1SRobert Watson error = in_pcbconnect_setup(inp, addr, &laddr.s_addr, 114043cc0bc1SRobert Watson &lport, &faddr.s_addr, &fport, NULL, 114143cc0bc1SRobert Watson td->td_ucred); 114290162a4eSIan Dowse if (error) 114390162a4eSIan Dowse goto release; 114490162a4eSIan Dowse 114543cc0bc1SRobert Watson /* 114643cc0bc1SRobert Watson * XXXRW: Why not commit the port if the address is 114743cc0bc1SRobert Watson * !INADDR_ANY? 114843cc0bc1SRobert Watson */ 114990162a4eSIan Dowse /* Commit the local port if newly assigned. 
*/ 115090162a4eSIan Dowse if (inp->inp_laddr.s_addr == INADDR_ANY && 115190162a4eSIan Dowse inp->inp_lport == 0) { 1152c4d585aeSRobert Watson INP_WLOCK_ASSERT(inp); 1153fa046d87SRobert Watson INP_HASH_WLOCK_ASSERT(&V_udbinfo); 11543a1757b9SGleb Smirnoff /* 115543cc0bc1SRobert Watson * Remember addr if jailed, to prevent 115643cc0bc1SRobert Watson * rebinding. 11573a1757b9SGleb Smirnoff */ 11580304c731SJamie Gritton if (prison_flag(td->td_ucred, PR_IP4)) 11593a1757b9SGleb Smirnoff inp->inp_laddr = laddr; 116090162a4eSIan Dowse inp->inp_lport = lport; 116190162a4eSIan Dowse if (in_pcbinshash(inp) != 0) { 116290162a4eSIan Dowse inp->inp_lport = 0; 116390162a4eSIan Dowse error = EAGAIN; 1164df8bae1dSRodney W. Grimes goto release; 1165df8bae1dSRodney W. Grimes } 116690162a4eSIan Dowse inp->inp_flags |= INP_ANONPORT; 116790162a4eSIan Dowse } 1168df8bae1dSRodney W. Grimes } else { 116943cc0bc1SRobert Watson faddr = sin->sin_addr; 117043cc0bc1SRobert Watson fport = sin->sin_port; 117143cc0bc1SRobert Watson } 117243cc0bc1SRobert Watson } else { 1173c4d585aeSRobert Watson INP_LOCK_ASSERT(inp); 117490162a4eSIan Dowse faddr = inp->inp_faddr; 117590162a4eSIan Dowse fport = inp->inp_fport; 117690162a4eSIan Dowse if (faddr.s_addr == INADDR_ANY) { 1177df8bae1dSRodney W. Grimes error = ENOTCONN; 1178df8bae1dSRodney W. Grimes goto release; 1179df8bae1dSRodney W. Grimes } 1180df8bae1dSRodney W. Grimes } 1181e6ccd709SRobert Watson 1182df8bae1dSRodney W. Grimes /* 1183e6ccd709SRobert Watson * Calculate data length and get a mbuf for UDP, IP, and possible 1184392e8407SRobert Watson * link-layer headers. Immediate slide the data pointer back forward 1185392e8407SRobert Watson * since we won't use that space at this layer. 1186df8bae1dSRodney W. Grimes */ 1187eb1b1807SGleb Smirnoff M_PREPEND(m, sizeof(struct udpiphdr) + max_linkhdr, M_NOWAIT); 1188e6ccd709SRobert Watson if (m == NULL) { 1189df8bae1dSRodney W. 
Grimes error = ENOBUFS; 119049b19bfcSBruce M Simpson goto release; 1191df8bae1dSRodney W. Grimes } 1192e6ccd709SRobert Watson m->m_data += max_linkhdr; 1193e6ccd709SRobert Watson m->m_len -= max_linkhdr; 1194392e8407SRobert Watson m->m_pkthdr.len -= max_linkhdr; 1195df8bae1dSRodney W. Grimes 1196df8bae1dSRodney W. Grimes /* 11973329b236SRobert Watson * Fill in mbuf with extended UDP header and addresses and length put 11983329b236SRobert Watson * into network format. 1199df8bae1dSRodney W. Grimes */ 1200df8bae1dSRodney W. Grimes ui = mtod(m, struct udpiphdr *); 1201db4f9cc7SJonathan Lemon bzero(ui->ui_x1, sizeof(ui->ui_x1)); /* XXX still needed? */ 120257f60867SMark Johnston ui->ui_v = IPVERSION << 4; 1203df8bae1dSRodney W. Grimes ui->ui_pr = IPPROTO_UDP; 120490162a4eSIan Dowse ui->ui_src = laddr; 120590162a4eSIan Dowse ui->ui_dst = faddr; 120690162a4eSIan Dowse ui->ui_sport = lport; 120790162a4eSIan Dowse ui->ui_dport = fport; 1208db4f9cc7SJonathan Lemon ui->ui_ulen = htons((u_short)len + sizeof(struct udphdr)); 1209df8bae1dSRodney W. Grimes 1210b2828ad2SAndre Oppermann /* 1211b2828ad2SAndre Oppermann * Set the Don't Fragment bit in the IP header. 
1212b2828ad2SAndre Oppermann */ 1213b2828ad2SAndre Oppermann if (inp->inp_flags & INP_DONTFRAG) { 1214b2828ad2SAndre Oppermann struct ip *ip; 12153329b236SRobert Watson 1216b2828ad2SAndre Oppermann ip = (struct ip *)&ui->ui_i; 12178f134647SGleb Smirnoff ip->ip_off |= htons(IP_DF); 1218b2828ad2SAndre Oppermann } 1219b2828ad2SAndre Oppermann 1220b5d47ff5SJohn-Mark Gurney ipflags = 0; 1221b5d47ff5SJohn-Mark Gurney if (inp->inp_socket->so_options & SO_DONTROUTE) 1222b5d47ff5SJohn-Mark Gurney ipflags |= IP_ROUTETOIF; 1223b5d47ff5SJohn-Mark Gurney if (inp->inp_socket->so_options & SO_BROADCAST) 1224b5d47ff5SJohn-Mark Gurney ipflags |= IP_ALLOWBROADCAST; 12256fbfd582SAndre Oppermann if (inp->inp_flags & INP_ONESBCAST) 12268afa2304SBruce M Simpson ipflags |= IP_SENDONES; 12278afa2304SBruce M Simpson 12281175d9d5SRobert Watson #ifdef MAC 12291175d9d5SRobert Watson mac_inpcb_create_mbuf(inp, m); 12301175d9d5SRobert Watson #endif 12311175d9d5SRobert Watson 1232df8bae1dSRodney W. Grimes /* 1233db4f9cc7SJonathan Lemon * Set up checksum and output datagram. 1234df8bae1dSRodney W. Grimes */ 123540b676beSBjoern A. 
Zeeb if (V_udp_cksum) { 12366fbfd582SAndre Oppermann if (inp->inp_flags & INP_ONESBCAST) 12378a538743SBruce M Simpson faddr.s_addr = INADDR_BROADCAST; 12388a538743SBruce M Simpson ui->ui_sum = in_pseudo(ui->ui_src.s_addr, faddr.s_addr, 1239db4f9cc7SJonathan Lemon htons((u_short)len + sizeof(struct udphdr) + IPPROTO_UDP)); 1240db4f9cc7SJonathan Lemon m->m_pkthdr.csum_flags = CSUM_UDP; 1241db4f9cc7SJonathan Lemon m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum); 12423329b236SRobert Watson } else 1243db4f9cc7SJonathan Lemon ui->ui_sum = 0; 12448f134647SGleb Smirnoff ((struct ip *)ui)->ip_len = htons(sizeof(struct udpiphdr) + len); 1245ca98b82cSDavid Greenman ((struct ip *)ui)->ip_ttl = inp->inp_ip_ttl; /* XXX */ 1246f584d74bSMichael Tuexen ((struct ip *)ui)->ip_tos = tos; /* XXX */ 1247026decb8SRobert Watson UDPSTAT_INC(udps_opackets); 1248cfa1ca9dSYoshinobu Inoue 1249fa046d87SRobert Watson if (unlock_udbinfo == UH_WLOCKED) 1250fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 1251fa046d87SRobert Watson else if (unlock_udbinfo == UH_RLOCKED) 1252fa046d87SRobert Watson INP_HASH_RUNLOCK(&V_udbinfo); 125357f60867SMark Johnston UDP_PROBE(send, NULL, inp, &ui->ui_i, inp, &ui->ui_u); 125497d8d152SAndre Oppermann error = ip_output(m, inp->inp_options, NULL, ipflags, 12555d846453SSam Leffler inp->inp_moptions, inp); 1256fa046d87SRobert Watson if (unlock_udbinfo == UH_WLOCKED) 12578501a69cSRobert Watson INP_WUNLOCK(inp); 1258948d0fc9SRobert Watson else 1259948d0fc9SRobert Watson INP_RUNLOCK(inp); 1260df8bae1dSRodney W. Grimes return (error); 1261df8bae1dSRodney W. Grimes 1262df8bae1dSRodney W. 
Grimes release: 1263fa046d87SRobert Watson if (unlock_udbinfo == UH_WLOCKED) { 1264fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 1265948d0fc9SRobert Watson INP_WUNLOCK(inp); 1266fa046d87SRobert Watson } else if (unlock_udbinfo == UH_RLOCKED) { 1267fa046d87SRobert Watson INP_HASH_RUNLOCK(&V_udbinfo); 126843cc0bc1SRobert Watson INP_RUNLOCK(inp); 1269948d0fc9SRobert Watson } else 1270948d0fc9SRobert Watson INP_RUNLOCK(inp); 1271df8bae1dSRodney W. Grimes m_freem(m); 1272df8bae1dSRodney W. Grimes return (error); 1273df8bae1dSRodney W. Grimes } 1274df8bae1dSRodney W. Grimes 12757b495c44SVANHULLEBUS Yvan 12767b495c44SVANHULLEBUS Yvan #if defined(IPSEC) && defined(IPSEC_NAT_T) 12777b495c44SVANHULLEBUS Yvan /* 12787b495c44SVANHULLEBUS Yvan * Potentially decap ESP in UDP frame. Check for an ESP header 12797b495c44SVANHULLEBUS Yvan * and optional marker; if present, strip the UDP header and 12807b495c44SVANHULLEBUS Yvan * push the result through IPSec. 12817b495c44SVANHULLEBUS Yvan * 12827b495c44SVANHULLEBUS Yvan * Returns mbuf to be processed (potentially re-allocated) or 12837b495c44SVANHULLEBUS Yvan * NULL if consumed and/or processed. 12847b495c44SVANHULLEBUS Yvan */ 12857b495c44SVANHULLEBUS Yvan static struct mbuf * 12867b495c44SVANHULLEBUS Yvan udp4_espdecap(struct inpcb *inp, struct mbuf *m, int off) 12877b495c44SVANHULLEBUS Yvan { 12887b495c44SVANHULLEBUS Yvan size_t minlen, payload, skip, iphlen; 12897b495c44SVANHULLEBUS Yvan caddr_t data; 12907b495c44SVANHULLEBUS Yvan struct udpcb *up; 12917b495c44SVANHULLEBUS Yvan struct m_tag *tag; 12927b495c44SVANHULLEBUS Yvan struct udphdr *udphdr; 12937b495c44SVANHULLEBUS Yvan struct ip *ip; 12947b495c44SVANHULLEBUS Yvan 12957b495c44SVANHULLEBUS Yvan INP_RLOCK_ASSERT(inp); 12967b495c44SVANHULLEBUS Yvan 12977b495c44SVANHULLEBUS Yvan /* 12987b495c44SVANHULLEBUS Yvan * Pull up data so the longest case is contiguous: 12997b495c44SVANHULLEBUS Yvan * IP/UDP hdr + non ESP marker + ESP hdr. 
13007b495c44SVANHULLEBUS Yvan */ 13017b495c44SVANHULLEBUS Yvan minlen = off + sizeof(uint64_t) + sizeof(struct esp); 13027b495c44SVANHULLEBUS Yvan if (minlen > m->m_pkthdr.len) 13037b495c44SVANHULLEBUS Yvan minlen = m->m_pkthdr.len; 13047b495c44SVANHULLEBUS Yvan if ((m = m_pullup(m, minlen)) == NULL) { 13056794f460SAndrey V. Elsukov IPSECSTAT_INC(ips_in_inval); 13067b495c44SVANHULLEBUS Yvan return (NULL); /* Bypass caller processing. */ 13077b495c44SVANHULLEBUS Yvan } 13087b495c44SVANHULLEBUS Yvan data = mtod(m, caddr_t); /* Points to ip header. */ 13097b495c44SVANHULLEBUS Yvan payload = m->m_len - off; /* Size of payload. */ 13107b495c44SVANHULLEBUS Yvan 13117b495c44SVANHULLEBUS Yvan if (payload == 1 && data[off] == '\xff') 13127b495c44SVANHULLEBUS Yvan return (m); /* NB: keepalive packet, no decap. */ 13137b495c44SVANHULLEBUS Yvan 13147b495c44SVANHULLEBUS Yvan up = intoudpcb(inp); 13157b495c44SVANHULLEBUS Yvan KASSERT(up != NULL, ("%s: udpcb NULL", __func__)); 13167b495c44SVANHULLEBUS Yvan KASSERT((up->u_flags & UF_ESPINUDP_ALL) != 0, 13177b495c44SVANHULLEBUS Yvan ("u_flags 0x%x", up->u_flags)); 13187b495c44SVANHULLEBUS Yvan 13197b495c44SVANHULLEBUS Yvan /* 13207b495c44SVANHULLEBUS Yvan * Check that the payload is large enough to hold an 13217b495c44SVANHULLEBUS Yvan * ESP header and compute the amount of data to remove. 13227b495c44SVANHULLEBUS Yvan * 13237b495c44SVANHULLEBUS Yvan * NB: the caller has already done a pullup for us. 13247b495c44SVANHULLEBUS Yvan * XXX can we assume alignment and eliminate bcopys? 13257b495c44SVANHULLEBUS Yvan */ 13267b495c44SVANHULLEBUS Yvan if (up->u_flags & UF_ESPINUDP_NON_IKE) { 13277b495c44SVANHULLEBUS Yvan /* 13287b495c44SVANHULLEBUS Yvan * draft-ietf-ipsec-nat-t-ike-0[01].txt and 13297b495c44SVANHULLEBUS Yvan * draft-ietf-ipsec-udp-encaps-(00/)01.txt, ignoring 13307b495c44SVANHULLEBUS Yvan * possible AH mode non-IKE marker+non-ESP marker 13317b495c44SVANHULLEBUS Yvan * from draft-ietf-ipsec-udp-encaps-00.txt. 
13327b495c44SVANHULLEBUS Yvan */ 13337b495c44SVANHULLEBUS Yvan uint64_t marker; 13347b495c44SVANHULLEBUS Yvan 13357b495c44SVANHULLEBUS Yvan if (payload <= sizeof(uint64_t) + sizeof(struct esp)) 13367b495c44SVANHULLEBUS Yvan return (m); /* NB: no decap. */ 13377b495c44SVANHULLEBUS Yvan bcopy(data + off, &marker, sizeof(uint64_t)); 13387b495c44SVANHULLEBUS Yvan if (marker != 0) /* Non-IKE marker. */ 13397b495c44SVANHULLEBUS Yvan return (m); /* NB: no decap. */ 13407b495c44SVANHULLEBUS Yvan skip = sizeof(uint64_t) + sizeof(struct udphdr); 13417b495c44SVANHULLEBUS Yvan } else { 13427b495c44SVANHULLEBUS Yvan uint32_t spi; 13437b495c44SVANHULLEBUS Yvan 13447b495c44SVANHULLEBUS Yvan if (payload <= sizeof(struct esp)) { 13456794f460SAndrey V. Elsukov IPSECSTAT_INC(ips_in_inval); 13467b495c44SVANHULLEBUS Yvan m_freem(m); 13477b495c44SVANHULLEBUS Yvan return (NULL); /* Discard. */ 13487b495c44SVANHULLEBUS Yvan } 13497b495c44SVANHULLEBUS Yvan bcopy(data + off, &spi, sizeof(uint32_t)); 13507b495c44SVANHULLEBUS Yvan if (spi == 0) /* Non-ESP marker. */ 13517b495c44SVANHULLEBUS Yvan return (m); /* NB: no decap. */ 13527b495c44SVANHULLEBUS Yvan skip = sizeof(struct udphdr); 13537b495c44SVANHULLEBUS Yvan } 13547b495c44SVANHULLEBUS Yvan 13557b495c44SVANHULLEBUS Yvan /* 13567b495c44SVANHULLEBUS Yvan * Setup a PACKET_TAG_IPSEC_NAT_T_PORT tag to remember 13577b495c44SVANHULLEBUS Yvan * the UDP ports. This is required if we want to select 13587b495c44SVANHULLEBUS Yvan * the right SPD for multiple hosts behind same NAT. 13597b495c44SVANHULLEBUS Yvan * 13607b495c44SVANHULLEBUS Yvan * NB: ports are maintained in network byte order everywhere 13617b495c44SVANHULLEBUS Yvan * in the NAT-T code. 13627b495c44SVANHULLEBUS Yvan */ 13637b495c44SVANHULLEBUS Yvan tag = m_tag_get(PACKET_TAG_IPSEC_NAT_T_PORTS, 13647b495c44SVANHULLEBUS Yvan 2 * sizeof(uint16_t), M_NOWAIT); 13657b495c44SVANHULLEBUS Yvan if (tag == NULL) { 13666794f460SAndrey V. 
Elsukov IPSECSTAT_INC(ips_in_nomem); 13677b495c44SVANHULLEBUS Yvan m_freem(m); 13687b495c44SVANHULLEBUS Yvan return (NULL); /* Discard. */ 13697b495c44SVANHULLEBUS Yvan } 13707b495c44SVANHULLEBUS Yvan iphlen = off - sizeof(struct udphdr); 13717b495c44SVANHULLEBUS Yvan udphdr = (struct udphdr *)(data + iphlen); 13727b495c44SVANHULLEBUS Yvan ((uint16_t *)(tag + 1))[0] = udphdr->uh_sport; 13737b495c44SVANHULLEBUS Yvan ((uint16_t *)(tag + 1))[1] = udphdr->uh_dport; 13747b495c44SVANHULLEBUS Yvan m_tag_prepend(m, tag); 13757b495c44SVANHULLEBUS Yvan 13767b495c44SVANHULLEBUS Yvan /* 13777b495c44SVANHULLEBUS Yvan * Remove the UDP header (and possibly the non ESP marker) 13787b495c44SVANHULLEBUS Yvan * IP header length is iphlen 13797b495c44SVANHULLEBUS Yvan * Before: 13807b495c44SVANHULLEBUS Yvan * <--- off ---> 13817b495c44SVANHULLEBUS Yvan * +----+------+-----+ 13827b495c44SVANHULLEBUS Yvan * | IP | UDP | ESP | 13837b495c44SVANHULLEBUS Yvan * +----+------+-----+ 13847b495c44SVANHULLEBUS Yvan * <-skip-> 13857b495c44SVANHULLEBUS Yvan * After: 13867b495c44SVANHULLEBUS Yvan * +----+-----+ 13877b495c44SVANHULLEBUS Yvan * | IP | ESP | 13887b495c44SVANHULLEBUS Yvan * +----+-----+ 13897b495c44SVANHULLEBUS Yvan * <-skip-> 13907b495c44SVANHULLEBUS Yvan */ 13917b495c44SVANHULLEBUS Yvan ovbcopy(data, data + skip, iphlen); 13927b495c44SVANHULLEBUS Yvan m_adj(m, skip); 13937b495c44SVANHULLEBUS Yvan 13947b495c44SVANHULLEBUS Yvan ip = mtod(m, struct ip *); 13958f134647SGleb Smirnoff ip->ip_len = htons(ntohs(ip->ip_len) - skip); 13967b495c44SVANHULLEBUS Yvan ip->ip_p = IPPROTO_ESP; 13977b495c44SVANHULLEBUS Yvan 13987b495c44SVANHULLEBUS Yvan /* 13997b495c44SVANHULLEBUS Yvan * We cannot yet update the cksums so clear any 14007b495c44SVANHULLEBUS Yvan * h/w cksum flags as they are no longer valid. 
14017b495c44SVANHULLEBUS Yvan */ 14027b495c44SVANHULLEBUS Yvan if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) 14037b495c44SVANHULLEBUS Yvan m->m_pkthdr.csum_flags &= ~(CSUM_DATA_VALID|CSUM_PSEUDO_HDR); 14047b495c44SVANHULLEBUS Yvan 14057b495c44SVANHULLEBUS Yvan (void) ipsec4_common_input(m, iphlen, ip->ip_p); 14067b495c44SVANHULLEBUS Yvan return (NULL); /* NB: consumed, bypass processing. */ 14077b495c44SVANHULLEBUS Yvan } 14087b495c44SVANHULLEBUS Yvan #endif /* defined(IPSEC) && defined(IPSEC_NAT_T) */ 14097b495c44SVANHULLEBUS Yvan 1410ac45e92fSRobert Watson static void 1411d0390e05SGarrett Wollman udp_abort(struct socket *so) 1412df8bae1dSRodney W. Grimes { 1413d0390e05SGarrett Wollman struct inpcb *inp; 1414df8bae1dSRodney W. Grimes 1415d0390e05SGarrett Wollman inp = sotoinpcb(so); 141614ba8addSRobert Watson KASSERT(inp != NULL, ("udp_abort: inp == NULL")); 14178501a69cSRobert Watson INP_WLOCK(inp); 1418a152f8a3SRobert Watson if (inp->inp_faddr.s_addr != INADDR_ANY) { 1419fa046d87SRobert Watson INP_HASH_WLOCK(&V_udbinfo); 1420a152f8a3SRobert Watson in_pcbdisconnect(inp); 1421a152f8a3SRobert Watson inp->inp_laddr.s_addr = INADDR_ANY; 1422fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 1423d0390e05SGarrett Wollman soisdisconnected(so); 1424a152f8a3SRobert Watson } 14258501a69cSRobert Watson INP_WUNLOCK(inp); 1426df8bae1dSRodney W. Grimes } 1427df8bae1dSRodney W. Grimes 1428d0390e05SGarrett Wollman static int 1429b40ce416SJulian Elischer udp_attach(struct socket *so, int proto, struct thread *td) 1430d0390e05SGarrett Wollman { 1431d0390e05SGarrett Wollman struct inpcb *inp; 1432277afaffSRobert Watson int error; 1433d0390e05SGarrett Wollman 1434d0390e05SGarrett Wollman inp = sotoinpcb(so); 143514ba8addSRobert Watson KASSERT(inp == NULL, ("udp_attach: inp != NULL")); 1436cfa1ca9dSYoshinobu Inoue error = soreserve(so, udp_sendspace, udp_recvspace); 1437f24618aaSRobert Watson if (error) 14383329b236SRobert Watson return (error); 1439603724d3SBjoern A. 
Zeeb INP_INFO_WLOCK(&V_udbinfo); 1440603724d3SBjoern A. Zeeb error = in_pcballoc(so, &V_udbinfo); 144153b57cd1SSam Leffler if (error) { 1442603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 14433329b236SRobert Watson return (error); 144453b57cd1SSam Leffler } 1445cfa1ca9dSYoshinobu Inoue 144668b5629bSRobert Watson inp = sotoinpcb(so); 1447cfa1ca9dSYoshinobu Inoue inp->inp_vflag |= INP_IPV4; 1448603724d3SBjoern A. Zeeb inp->inp_ip_ttl = V_ip_defttl; 14496a9148feSBjoern A. Zeeb 14506a9148feSBjoern A. Zeeb error = udp_newudpcb(inp); 14516a9148feSBjoern A. Zeeb if (error) { 14526a9148feSBjoern A. Zeeb in_pcbdetach(inp); 14536a9148feSBjoern A. Zeeb in_pcbfree(inp); 14546a9148feSBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 14556a9148feSBjoern A. Zeeb return (error); 14566a9148feSBjoern A. Zeeb } 14576a9148feSBjoern A. Zeeb 1458c7c7ea4bSRandall Stewart INP_WUNLOCK(inp); 14596a9148feSBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1460c7c7ea4bSRandall Stewart return (0); 1461c7c7ea4bSRandall Stewart } 146279288c11SBjoern A. Zeeb #endif /* INET */ 1463c7c7ea4bSRandall Stewart 1464c7c7ea4bSRandall Stewart int 1465c7c7ea4bSRandall Stewart udp_set_kernel_tunneling(struct socket *so, udp_tun_func_t f) 1466c7c7ea4bSRandall Stewart { 1467c7c7ea4bSRandall Stewart struct inpcb *inp; 14686a9148feSBjoern A. Zeeb struct udpcb *up; 1469c7c7ea4bSRandall Stewart 147068b5629bSRobert Watson KASSERT(so->so_type == SOCK_DGRAM, 147168b5629bSRobert Watson ("udp_set_kernel_tunneling: !dgram")); 147268b5629bSRobert Watson inp = sotoinpcb(so); 147368b5629bSRobert Watson KASSERT(inp != NULL, ("udp_set_kernel_tunneling: inp == NULL")); 1474c7c7ea4bSRandall Stewart INP_WLOCK(inp); 14756a9148feSBjoern A. Zeeb up = intoudpcb(inp); 14766a9148feSBjoern A. Zeeb if (up->u_tun_func != NULL) { 1477bbb0e3d9SRandall Stewart INP_WUNLOCK(inp); 1478bbb0e3d9SRandall Stewart return (EBUSY); 1479bbb0e3d9SRandall Stewart } 14806a9148feSBjoern A. 
Zeeb up->u_tun_func = f; 14818501a69cSRobert Watson INP_WUNLOCK(inp); 14823329b236SRobert Watson return (0); 1483df8bae1dSRodney W. Grimes } 1484d0390e05SGarrett Wollman 148579288c11SBjoern A. Zeeb #ifdef INET 1486d0390e05SGarrett Wollman static int 1487b40ce416SJulian Elischer udp_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 1488d0390e05SGarrett Wollman { 1489d0390e05SGarrett Wollman struct inpcb *inp; 1490277afaffSRobert Watson int error; 1491d0390e05SGarrett Wollman 1492d0390e05SGarrett Wollman inp = sotoinpcb(so); 149314ba8addSRobert Watson KASSERT(inp != NULL, ("udp_bind: inp == NULL")); 14948501a69cSRobert Watson INP_WLOCK(inp); 1495fa046d87SRobert Watson INP_HASH_WLOCK(&V_udbinfo); 1496b0330ed9SPawel Jakub Dawidek error = in_pcbbind(inp, nam, td->td_ucred); 1497fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 14988501a69cSRobert Watson INP_WUNLOCK(inp); 14993329b236SRobert Watson return (error); 1500d0390e05SGarrett Wollman } 1501d0390e05SGarrett Wollman 1502a152f8a3SRobert Watson static void 1503a152f8a3SRobert Watson udp_close(struct socket *so) 1504a152f8a3SRobert Watson { 1505a152f8a3SRobert Watson struct inpcb *inp; 1506a152f8a3SRobert Watson 1507a152f8a3SRobert Watson inp = sotoinpcb(so); 1508a152f8a3SRobert Watson KASSERT(inp != NULL, ("udp_close: inp == NULL")); 15098501a69cSRobert Watson INP_WLOCK(inp); 1510a152f8a3SRobert Watson if (inp->inp_faddr.s_addr != INADDR_ANY) { 1511fa046d87SRobert Watson INP_HASH_WLOCK(&V_udbinfo); 1512a152f8a3SRobert Watson in_pcbdisconnect(inp); 1513a152f8a3SRobert Watson inp->inp_laddr.s_addr = INADDR_ANY; 1514fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 1515a152f8a3SRobert Watson soisdisconnected(so); 1516a152f8a3SRobert Watson } 15178501a69cSRobert Watson INP_WUNLOCK(inp); 1518a152f8a3SRobert Watson } 1519a152f8a3SRobert Watson 1520d0390e05SGarrett Wollman static int 1521b40ce416SJulian Elischer udp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 
1522d0390e05SGarrett Wollman { 1523d0390e05SGarrett Wollman struct inpcb *inp; 1524277afaffSRobert Watson int error; 152575c13541SPoul-Henning Kamp struct sockaddr_in *sin; 1526d0390e05SGarrett Wollman 1527d0390e05SGarrett Wollman inp = sotoinpcb(so); 152814ba8addSRobert Watson KASSERT(inp != NULL, ("udp_connect: inp == NULL")); 15298501a69cSRobert Watson INP_WLOCK(inp); 1530f76fcf6dSJeffrey Hsu if (inp->inp_faddr.s_addr != INADDR_ANY) { 15318501a69cSRobert Watson INP_WUNLOCK(inp); 15323329b236SRobert Watson return (EISCONN); 1533f76fcf6dSJeffrey Hsu } 153475c13541SPoul-Henning Kamp sin = (struct sockaddr_in *)nam; 1535b89e82ddSJamie Gritton error = prison_remote_ip4(td->td_ucred, &sin->sin_addr); 1536b89e82ddSJamie Gritton if (error != 0) { 1537413628a7SBjoern A. Zeeb INP_WUNLOCK(inp); 1538b89e82ddSJamie Gritton return (error); 1539413628a7SBjoern A. Zeeb } 1540fa046d87SRobert Watson INP_HASH_WLOCK(&V_udbinfo); 1541b0330ed9SPawel Jakub Dawidek error = in_pcbconnect(inp, nam, td->td_ucred); 1542fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 15434cc20ab1SSeigo Tanimura if (error == 0) 1544df8bae1dSRodney W. Grimes soisconnected(so); 15458501a69cSRobert Watson INP_WUNLOCK(inp); 15463329b236SRobert Watson return (error); 1547df8bae1dSRodney W. Grimes } 1548d0390e05SGarrett Wollman 1549bc725eafSRobert Watson static void 1550d0390e05SGarrett Wollman udp_detach(struct socket *so) 1551d0390e05SGarrett Wollman { 1552d0390e05SGarrett Wollman struct inpcb *inp; 15536a9148feSBjoern A. Zeeb struct udpcb *up; 1554d0390e05SGarrett Wollman 1555d0390e05SGarrett Wollman inp = sotoinpcb(so); 155614ba8addSRobert Watson KASSERT(inp != NULL, ("udp_detach: inp == NULL")); 1557a152f8a3SRobert Watson KASSERT(inp->inp_faddr.s_addr == INADDR_ANY, 1558a152f8a3SRobert Watson ("udp_detach: not disconnected")); 1559603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 15608501a69cSRobert Watson INP_WLOCK(inp); 15616a9148feSBjoern A. Zeeb up = intoudpcb(inp); 15626a9148feSBjoern A. 
Zeeb KASSERT(up != NULL, ("%s: up == NULL", __func__)); 15636a9148feSBjoern A. Zeeb inp->inp_ppcb = NULL; 1564d0390e05SGarrett Wollman in_pcbdetach(inp); 156514ba8addSRobert Watson in_pcbfree(inp); 1566603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 15676a9148feSBjoern A. Zeeb udp_discardcb(up); 1568d0390e05SGarrett Wollman } 1569d0390e05SGarrett Wollman 1570d0390e05SGarrett Wollman static int 1571d0390e05SGarrett Wollman udp_disconnect(struct socket *so) 1572d0390e05SGarrett Wollman { 1573d0390e05SGarrett Wollman struct inpcb *inp; 1574d0390e05SGarrett Wollman 1575d0390e05SGarrett Wollman inp = sotoinpcb(so); 157614ba8addSRobert Watson KASSERT(inp != NULL, ("udp_disconnect: inp == NULL")); 15778501a69cSRobert Watson INP_WLOCK(inp); 1578f76fcf6dSJeffrey Hsu if (inp->inp_faddr.s_addr == INADDR_ANY) { 15798501a69cSRobert Watson INP_WUNLOCK(inp); 15803329b236SRobert Watson return (ENOTCONN); 1581f76fcf6dSJeffrey Hsu } 1582fa046d87SRobert Watson INP_HASH_WLOCK(&V_udbinfo); 1583df8bae1dSRodney W. Grimes in_pcbdisconnect(inp); 1584df8bae1dSRodney W. Grimes inp->inp_laddr.s_addr = INADDR_ANY; 1585fa046d87SRobert Watson INP_HASH_WUNLOCK(&V_udbinfo); 1586d45e4f99SMaxim Konovalov SOCK_LOCK(so); 1587d45e4f99SMaxim Konovalov so->so_state &= ~SS_ISCONNECTED; /* XXX */ 1588d45e4f99SMaxim Konovalov SOCK_UNLOCK(so); 15898501a69cSRobert Watson INP_WUNLOCK(inp); 15903329b236SRobert Watson return (0); 1591df8bae1dSRodney W. Grimes } 1592df8bae1dSRodney W. 
Grimes 1593d0390e05SGarrett Wollman static int 159457bf258eSGarrett Wollman udp_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *addr, 1595b40ce416SJulian Elischer struct mbuf *control, struct thread *td) 1596d0390e05SGarrett Wollman { 1597d0390e05SGarrett Wollman struct inpcb *inp; 1598d0390e05SGarrett Wollman 1599d0390e05SGarrett Wollman inp = sotoinpcb(so); 160014ba8addSRobert Watson KASSERT(inp != NULL, ("udp_send: inp == NULL")); 16013329b236SRobert Watson return (udp_output(inp, m, addr, control, td)); 1602d0390e05SGarrett Wollman } 160379288c11SBjoern A. Zeeb #endif /* INET */ 1604d0390e05SGarrett Wollman 160576429de4SYoshinobu Inoue int 1606d0390e05SGarrett Wollman udp_shutdown(struct socket *so) 1607d0390e05SGarrett Wollman { 1608d0390e05SGarrett Wollman struct inpcb *inp; 1609d0390e05SGarrett Wollman 1610d0390e05SGarrett Wollman inp = sotoinpcb(so); 161114ba8addSRobert Watson KASSERT(inp != NULL, ("udp_shutdown: inp == NULL")); 16128501a69cSRobert Watson INP_WLOCK(inp); 1613d0390e05SGarrett Wollman socantsendmore(so); 16148501a69cSRobert Watson INP_WUNLOCK(inp); 16153329b236SRobert Watson return (0); 1616d0390e05SGarrett Wollman } 1617d0390e05SGarrett Wollman 161879288c11SBjoern A. 
#ifdef INET
/*
 * User-request switch for IPv4 UDP sockets.  Entries are grouped by
 * purpose; designated initializers make the order irrelevant.
 */
struct pr_usrreqs udp_usrreqs = {
	/* Socket lifecycle. */
	.pru_attach =		udp_attach,
	.pru_detach =		udp_detach,
	.pru_close =		udp_close,
	.pru_abort =		udp_abort,
	.pru_shutdown =		udp_shutdown,

	/* Addressing and connection state. */
	.pru_bind =		udp_bind,
	.pru_connect =		udp_connect,
	.pru_disconnect =	udp_disconnect,
	.pru_peeraddr =		in_getpeeraddr,
	.pru_sockaddr =		in_getsockaddr,

	/* Data transfer. */
	.pru_send =		udp_send,
	.pru_sosend =		sosend_dgram,
	.pru_soreceive =	soreceive_dgram,

	/* Control and labelling. */
	.pru_control =		in_control,
	.pru_sosetlabel =	in_pcbsosetlabel,
};
#endif /* INET */