1c398230bSWarner Losh /*- 26dfab5b1SGarrett Wollman * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995 33329b236SRobert Watson * The Regents of the University of California. 43144b7d3SRobert Watson * Copyright (c) 2008 Robert N. M. Watson 53329b236SRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 316dfab5b1SGarrett Wollman * @(#)udp_usrreq.c 8.6 (Berkeley) 5/23/95 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 344b421e2dSMike Silbersack #include <sys/cdefs.h> 354b421e2dSMike Silbersack __FBSDID("$FreeBSD$"); 364b421e2dSMike Silbersack 370b4ae859SGleb Smirnoff #include "opt_ipfw.h" 38cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h" 39f5514f08SRobert Watson #include "opt_ipsec.h" 40bdb3fa18SRobert Watson #include "opt_mac.h" 41cfa1ca9dSYoshinobu Inoue 42df8bae1dSRodney W. Grimes #include <sys/param.h> 43960ed29cSSeigo Tanimura #include <sys/domain.h> 444f590175SPaul Saab #include <sys/eventhandler.h> 45960ed29cSSeigo Tanimura #include <sys/jail.h> 46b110a8a2SGarrett Wollman #include <sys/kernel.h> 47960ed29cSSeigo Tanimura #include <sys/lock.h> 48df8bae1dSRodney W. Grimes #include <sys/malloc.h> 49df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 50acd3428bSRobert Watson #include <sys/priv.h> 51490d50b6SBrian Feldman #include <sys/proc.h> 52df8bae1dSRodney W. Grimes #include <sys/protosw.h> 53960ed29cSSeigo Tanimura #include <sys/signalvar.h> 54df8bae1dSRodney W. Grimes #include <sys/socket.h> 55df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 56960ed29cSSeigo Tanimura #include <sys/sx.h> 57b5e8ce9fSBruce Evans #include <sys/sysctl.h> 58816a3d83SPoul-Henning Kamp #include <sys/syslog.h> 59f5514f08SRobert Watson #include <sys/systm.h> 60603724d3SBjoern A. Zeeb #include <sys/vimage.h> 618781d8e9SBruce Evans 6269c2d429SJeff Roberson #include <vm/uma.h> 63df8bae1dSRodney W. Grimes 64df8bae1dSRodney W. Grimes #include <net/if.h> 65df8bae1dSRodney W. Grimes #include <net/route.h> 66df8bae1dSRodney W. Grimes 67df8bae1dSRodney W. Grimes #include <netinet/in.h> 68960ed29cSSeigo Tanimura #include <netinet/in_pcb.h> 69f5514f08SRobert Watson #include <netinet/in_systm.h> 70960ed29cSSeigo Tanimura #include <netinet/in_var.h> 71df8bae1dSRodney W. Grimes #include <netinet/ip.h> 72cfa1ca9dSYoshinobu Inoue #ifdef INET6 73cfa1ca9dSYoshinobu Inoue #include <netinet/ip6.h> 74cfa1ca9dSYoshinobu Inoue #endif 75960ed29cSSeigo Tanimura #include <netinet/ip_icmp.h> 76960ed29cSSeigo Tanimura #include <netinet/icmp_var.h> 77df8bae1dSRodney W. Grimes #include <netinet/ip_var.h> 78ef39adf0SAndre Oppermann #include <netinet/ip_options.h> 79cfa1ca9dSYoshinobu Inoue #ifdef INET6 80cfa1ca9dSYoshinobu Inoue #include <netinet6/ip6_var.h> 81cfa1ca9dSYoshinobu Inoue #endif 82df8bae1dSRodney W. Grimes #include <netinet/udp.h> 83df8bae1dSRodney W. Grimes #include <netinet/udp_var.h> 84df8bae1dSRodney W. Grimes 85b2630c29SGeorge V. Neville-Neil #ifdef IPSEC 86b9234fafSSam Leffler #include <netipsec/ipsec.h> 873329b236SRobert Watson #endif 88b9234fafSSam Leffler 89db4f9cc7SJonathan Lemon #include <machine/in_cksum.h> 90db4f9cc7SJonathan Lemon 91aed55708SRobert Watson #include <security/mac/mac_framework.h> 92aed55708SRobert Watson 93df8bae1dSRodney W. Grimes /* 94df8bae1dSRodney W. Grimes * UDP protocol implementation. 95df8bae1dSRodney W. Grimes * Per RFC 768, August, 1980. 96df8bae1dSRodney W. Grimes */ 9774eb3236SWarner Losh 9844e33a07SMarko Zec #ifdef VIMAGE_GLOBALS 9944e33a07SMarko Zec int udp_blackhole; 10044e33a07SMarko Zec #endif 10144e33a07SMarko Zec 10274eb3236SWarner Losh /* 1033329b236SRobert Watson * BSD 4.2 defaulted the udp checksum to be off. Turning off udp checksums 1043329b236SRobert Watson * removes the only data integrity mechanism for packets and malformed 105f5514f08SRobert Watson * packets that would otherwise be discarded due to bad checksums, and may 106f5514f08SRobert Watson * cause problems (especially for NFS data blocks). 10774eb3236SWarner Losh */ 108f5514f08SRobert Watson static int udp_cksum = 1; 109f5514f08SRobert Watson SYSCTL_INT(_net_inet_udp, UDPCTL_CHECKSUM, checksum, CTLFLAG_RW, &udp_cksum, 11041698ebfSTom Rhodes 0, "compute udp checksum"); 111df8bae1dSRodney W. Grimes 112afdb4274SRobert Watson int udp_log_in_vain = 0; 113816a3d83SPoul-Henning Kamp SYSCTL_INT(_net_inet_udp, OID_AUTO, log_in_vain, CTLFLAG_RW, 114afdb4274SRobert Watson &udp_log_in_vain, 0, "Log all incoming UDP packets"); 115816a3d83SPoul-Henning Kamp 11697021c24SMarko Zec SYSCTL_V_INT(V_NET, vnet_inet, _net_inet_udp, OID_AUTO, blackhole, 11797021c24SMarko Zec CTLFLAG_RW, udp_blackhole, 0, 1183329b236SRobert Watson "Do not send port unreachables for refused connects"); 11916f7f31fSGeoff Rehmet 12043bbb6aaSRobert Watson u_long udp_sendspace = 9216; /* really max datagram size */ 12143bbb6aaSRobert Watson /* 40 1K datagrams */ 12243bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_MAXDGRAM, maxdgram, CTLFLAG_RW, 12343bbb6aaSRobert Watson &udp_sendspace, 0, "Maximum outgoing UDP datagram size"); 12443bbb6aaSRobert Watson 12543bbb6aaSRobert Watson u_long udp_recvspace = 40 * (1024 + 12643bbb6aaSRobert Watson #ifdef INET6 12743bbb6aaSRobert Watson sizeof(struct sockaddr_in6) 12843bbb6aaSRobert Watson #else 12943bbb6aaSRobert Watson sizeof(struct sockaddr_in) 13043bbb6aaSRobert Watson #endif 13143bbb6aaSRobert Watson ); 13243bbb6aaSRobert Watson 13343bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_RECVSPACE, recvspace, CTLFLAG_RW, 13443bbb6aaSRobert Watson &udp_recvspace, 0, "Maximum space for incoming UDP datagrams"); 13543bbb6aaSRobert Watson 13644e33a07SMarko Zec #ifdef VIMAGE_GLOBALS 13776429de4SYoshinobu Inoue struct inpcbhead udb; /* from udp_var.h */ 1387a2aab80SBrian Feldman struct inpcbinfo udbinfo; 13944e33a07SMarko Zec struct udpstat udpstat; /* from udp_var.h */ 14044e33a07SMarko Zec #endif 14115bd2b43SDavid Greenman 14215bd2b43SDavid Greenman #ifndef UDBHASHSIZE 143e2ed8f35SAlexander Motin #define UDBHASHSIZE 128 14415bd2b43SDavid Greenman #endif 14515bd2b43SDavid Greenman 1468b615593SMarko Zec SYSCTL_V_STRUCT(V_NET, vnet_inet, _net_inet_udp, UDPCTL_STATS, stats, 1478b615593SMarko Zec CTLFLAG_RW, udpstat, udpstat, 1488b615593SMarko Zec "UDP statistics (struct udpstat, netinet/udp_var.h)"); 149f2ea20e6SGarrett Wollman 150bc725eafSRobert Watson static void udp_detach(struct socket *so); 1514d77a549SAlfred Perlstein static int udp_output(struct inpcb *, struct mbuf *, struct sockaddr *, 1524d77a549SAlfred Perlstein struct mbuf *, struct thread *); 153df8bae1dSRodney W. Grimes 1544f590175SPaul Saab static void 1554f590175SPaul Saab udp_zone_change(void *tag) 1564f590175SPaul Saab { 1574f590175SPaul Saab 158603724d3SBjoern A. Zeeb uma_zone_set_max(V_udbinfo.ipi_zone, maxsockets); 1594f590175SPaul Saab } 1604f590175SPaul Saab 161d915b280SStephan Uphoff static int 162d915b280SStephan Uphoff udp_inpcb_init(void *mem, int size, int flags) 163d915b280SStephan Uphoff { 164af1ee11dSRobert Watson struct inpcb *inp; 16508651e1fSJohn Baldwin 166af1ee11dSRobert Watson inp = mem; 167d915b280SStephan Uphoff INP_LOCK_INIT(inp, "inp", "udpinp"); 168d915b280SStephan Uphoff return (0); 169d915b280SStephan Uphoff } 170d915b280SStephan Uphoff 171df8bae1dSRodney W. Grimes void 172af1ee11dSRobert Watson udp_init(void) 173df8bae1dSRodney W. Grimes { 1748b615593SMarko Zec INIT_VNET_INET(curvnet); 175af1ee11dSRobert Watson 17644e33a07SMarko Zec V_udp_blackhole = 0; 17744e33a07SMarko Zec 178603724d3SBjoern A. Zeeb INP_INFO_LOCK_INIT(&V_udbinfo, "udp"); 179603724d3SBjoern A. Zeeb LIST_INIT(&V_udb); 1802c0d658fSJulian Elischer V_udbinfo.ipi_listhead = &V_udb; 181603724d3SBjoern A. Zeeb V_udbinfo.ipi_hashbase = hashinit(UDBHASHSIZE, M_PCB, 182603724d3SBjoern A. Zeeb &V_udbinfo.ipi_hashmask); 183603724d3SBjoern A. Zeeb V_udbinfo.ipi_porthashbase = hashinit(UDBHASHSIZE, M_PCB, 184603724d3SBjoern A. Zeeb &V_udbinfo.ipi_porthashmask); 185603724d3SBjoern A. Zeeb V_udbinfo.ipi_zone = uma_zcreate("udpcb", sizeof(struct inpcb), NULL, 186d915b280SStephan Uphoff NULL, udp_inpcb_init, NULL, UMA_ALIGN_PTR, UMA_ZONE_NOFREE); 187603724d3SBjoern A. Zeeb uma_zone_set_max(V_udbinfo.ipi_zone, maxsockets); 1884f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, udp_zone_change, NULL, 1894f590175SPaul Saab EVENTHANDLER_PRI_ANY); 190df8bae1dSRodney W. Grimes } 191df8bae1dSRodney W. Grimes 19243bbb6aaSRobert Watson /* 19343bbb6aaSRobert Watson * Subroutine of udp_input(), which appends the provided mbuf chain to the 19443bbb6aaSRobert Watson * passed pcb/socket. The caller must provide a sockaddr_in via udp_in that 19543bbb6aaSRobert Watson * contains the source address. If the socket ends up being an IPv6 socket, 19643bbb6aaSRobert Watson * udp_append() will convert to a sockaddr_in6 before passing the address 19743bbb6aaSRobert Watson * into the socket code. 19843bbb6aaSRobert Watson */ 19943bbb6aaSRobert Watson static void 20043bbb6aaSRobert Watson udp_append(struct inpcb *inp, struct ip *ip, struct mbuf *n, int off, 20143bbb6aaSRobert Watson struct sockaddr_in *udp_in) 20243bbb6aaSRobert Watson { 20343bbb6aaSRobert Watson struct sockaddr *append_sa; 20443bbb6aaSRobert Watson struct socket *so; 20543bbb6aaSRobert Watson struct mbuf *opts = 0; 20643bbb6aaSRobert Watson #ifdef INET6 20743bbb6aaSRobert Watson struct sockaddr_in6 udp_in6; 20843bbb6aaSRobert Watson #endif 20943bbb6aaSRobert Watson 210119d85f6SRobert Watson INP_RLOCK_ASSERT(inp); 21143bbb6aaSRobert Watson 21243bbb6aaSRobert Watson #ifdef IPSEC 21343bbb6aaSRobert Watson /* Check AH/ESP integrity. */ 21443bbb6aaSRobert Watson if (ipsec4_in_reject(n, inp)) { 2158b615593SMarko Zec INIT_VNET_IPSEC(curvnet); 21643bbb6aaSRobert Watson m_freem(n); 217603724d3SBjoern A. Zeeb V_ipsec4stat.in_polvio++; 21843bbb6aaSRobert Watson return; 21943bbb6aaSRobert Watson } 22043bbb6aaSRobert Watson #endif /* IPSEC */ 22143bbb6aaSRobert Watson #ifdef MAC 22230d239bcSRobert Watson if (mac_inpcb_check_deliver(inp, n) != 0) { 22343bbb6aaSRobert Watson m_freem(n); 22443bbb6aaSRobert Watson return; 22543bbb6aaSRobert Watson } 22643bbb6aaSRobert Watson #endif 22743bbb6aaSRobert Watson if (inp->inp_flags & INP_CONTROLOPTS || 22843bbb6aaSRobert Watson inp->inp_socket->so_options & (SO_TIMESTAMP | SO_BINTIME)) { 22943bbb6aaSRobert Watson #ifdef INET6 2309a38ba81SBjoern A. Zeeb if (inp->inp_vflag & INP_IPV6) 23148d48eb9SBjoern A. Zeeb (void)ip6_savecontrol_v4(inp, n, &opts, NULL); 2329a38ba81SBjoern A. Zeeb else 23343bbb6aaSRobert Watson #endif 23443bbb6aaSRobert Watson ip_savecontrol(inp, &opts, ip, n); 23543bbb6aaSRobert Watson } 23643bbb6aaSRobert Watson #ifdef INET6 23743bbb6aaSRobert Watson if (inp->inp_vflag & INP_IPV6) { 23843bbb6aaSRobert Watson bzero(&udp_in6, sizeof(udp_in6)); 23943bbb6aaSRobert Watson udp_in6.sin6_len = sizeof(udp_in6); 24043bbb6aaSRobert Watson udp_in6.sin6_family = AF_INET6; 24143bbb6aaSRobert Watson in6_sin_2_v4mapsin6(udp_in, &udp_in6); 24243bbb6aaSRobert Watson append_sa = (struct sockaddr *)&udp_in6; 24343bbb6aaSRobert Watson } else 24443bbb6aaSRobert Watson #endif 24543bbb6aaSRobert Watson append_sa = (struct sockaddr *)udp_in; 24643bbb6aaSRobert Watson m_adj(n, off); 24743bbb6aaSRobert Watson 24843bbb6aaSRobert Watson so = inp->inp_socket; 24943bbb6aaSRobert Watson SOCKBUF_LOCK(&so->so_rcv); 25043bbb6aaSRobert Watson if (sbappendaddr_locked(&so->so_rcv, append_sa, n, opts) == 0) { 2518b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 25243bbb6aaSRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 25343bbb6aaSRobert Watson m_freem(n); 25443bbb6aaSRobert Watson if (opts) 25543bbb6aaSRobert Watson m_freem(opts); 256603724d3SBjoern A. Zeeb V_udpstat.udps_fullsock++; 25743bbb6aaSRobert Watson } else 25843bbb6aaSRobert Watson sorwakeup_locked(so); 25943bbb6aaSRobert Watson } 26043bbb6aaSRobert Watson 261df8bae1dSRodney W. Grimes void 2623329b236SRobert Watson udp_input(struct mbuf *m, int off) 263df8bae1dSRodney W. Grimes { 2648b615593SMarko Zec INIT_VNET_INET(curvnet); 265cfa1ca9dSYoshinobu Inoue int iphlen = off; 2663329b236SRobert Watson struct ip *ip; 2673329b236SRobert Watson struct udphdr *uh; 26871498f30SBruce M Simpson struct ifnet *ifp; 2693329b236SRobert Watson struct inpcb *inp; 270df8bae1dSRodney W. Grimes int len; 271df8bae1dSRodney W. Grimes struct ip save_ip; 272d4b509bdSRobert Watson struct sockaddr_in udp_in; 2730b4ae859SGleb Smirnoff #ifdef IPFIREWALL_FORWARD 2740b4ae859SGleb Smirnoff struct m_tag *fwd_tag; 2750b4ae859SGleb Smirnoff #endif 276df8bae1dSRodney W. Grimes 27771498f30SBruce M Simpson ifp = m->m_pkthdr.rcvif; 278603724d3SBjoern A. Zeeb V_udpstat.udps_ipackets++; 279df8bae1dSRodney W. Grimes 280df8bae1dSRodney W. Grimes /* 2813329b236SRobert Watson * Strip IP options, if any; should skip this, make available to 2823329b236SRobert Watson * user, and use on returned packets, but we don't yet have a way to 2833329b236SRobert Watson * check the checksum with options still present. 284df8bae1dSRodney W. Grimes */ 285df8bae1dSRodney W. Grimes if (iphlen > sizeof (struct ip)) { 286df8bae1dSRodney W. Grimes ip_stripoptions(m, (struct mbuf *)0); 287df8bae1dSRodney W. Grimes iphlen = sizeof(struct ip); 288df8bae1dSRodney W. Grimes } 289df8bae1dSRodney W. Grimes 290df8bae1dSRodney W. Grimes /* 291df8bae1dSRodney W. Grimes * Get IP and UDP header together in first mbuf. 292df8bae1dSRodney W. Grimes */ 293df8bae1dSRodney W. Grimes ip = mtod(m, struct ip *); 294df8bae1dSRodney W. Grimes if (m->m_len < iphlen + sizeof(struct udphdr)) { 295df8bae1dSRodney W. Grimes if ((m = m_pullup(m, iphlen + sizeof(struct udphdr))) == 0) { 296603724d3SBjoern A. Zeeb V_udpstat.udps_hdrops++; 297df8bae1dSRodney W. Grimes return; 298df8bae1dSRodney W. Grimes } 299df8bae1dSRodney W. Grimes ip = mtod(m, struct ip *); 300df8bae1dSRodney W. Grimes } 301df8bae1dSRodney W. Grimes uh = (struct udphdr *)((caddr_t)ip + iphlen); 302df8bae1dSRodney W. Grimes 3033329b236SRobert Watson /* 3043329b236SRobert Watson * Destination port of 0 is illegal, based on RFC768. 3053329b236SRobert Watson */ 306686cdd19SJun-ichiro itojun Hagino if (uh->uh_dport == 0) 307f76fcf6dSJeffrey Hsu goto badunlocked; 308686cdd19SJun-ichiro itojun Hagino 309df8bae1dSRodney W. Grimes /* 3103329b236SRobert Watson * Construct sockaddr format source address. Stuff source address 3113329b236SRobert Watson * and datagram in user buffer. 312b9234fafSSam Leffler */ 313d4b509bdSRobert Watson bzero(&udp_in, sizeof(udp_in)); 314d4b509bdSRobert Watson udp_in.sin_len = sizeof(udp_in); 315d4b509bdSRobert Watson udp_in.sin_family = AF_INET; 316b9234fafSSam Leffler udp_in.sin_port = uh->uh_sport; 317b9234fafSSam Leffler udp_in.sin_addr = ip->ip_src; 318b9234fafSSam Leffler 319b9234fafSSam Leffler /* 320af1ee11dSRobert Watson * Make mbuf data length reflect UDP length. If not enough data to 321af1ee11dSRobert Watson * reflect UDP length, drop. 322df8bae1dSRodney W. Grimes */ 323df8bae1dSRodney W. Grimes len = ntohs((u_short)uh->uh_ulen); 324df8bae1dSRodney W. Grimes if (ip->ip_len != len) { 3257eb7a449SAndras Olah if (len > ip->ip_len || len < sizeof(struct udphdr)) { 326603724d3SBjoern A. Zeeb V_udpstat.udps_badlen++; 327f76fcf6dSJeffrey Hsu goto badunlocked; 328df8bae1dSRodney W. Grimes } 329df8bae1dSRodney W. Grimes m_adj(m, len - ip->ip_len); 330df8bae1dSRodney W. Grimes /* ip->ip_len = len; */ 331df8bae1dSRodney W. Grimes } 3323329b236SRobert Watson 333df8bae1dSRodney W. Grimes /* 3343329b236SRobert Watson * Save a copy of the IP header in case we want restore it for 3353329b236SRobert Watson * sending an ICMP error message in response. 336df8bae1dSRodney W. Grimes */ 337603724d3SBjoern A. Zeeb if (!V_udp_blackhole) 338df8bae1dSRodney W. Grimes save_ip = *ip; 339cce418d3SMatt Jacob else 340cce418d3SMatt Jacob memset(&save_ip, 0, sizeof(save_ip)); 341df8bae1dSRodney W. Grimes 342df8bae1dSRodney W. Grimes /* 343df8bae1dSRodney W. Grimes * Checksum extended UDP header and data. 344df8bae1dSRodney W. Grimes */ 3456dfab5b1SGarrett Wollman if (uh->uh_sum) { 34639629c92SDavid Malone u_short uh_sum; 34739629c92SDavid Malone 348db4f9cc7SJonathan Lemon if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) { 349db4f9cc7SJonathan Lemon if (m->m_pkthdr.csum_flags & CSUM_PSEUDO_HDR) 35039629c92SDavid Malone uh_sum = m->m_pkthdr.csum_data; 351db4f9cc7SJonathan Lemon else 35239629c92SDavid Malone uh_sum = in_pseudo(ip->ip_src.s_addr, 353506f4949SRuslan Ermilov ip->ip_dst.s_addr, htonl((u_short)len + 354db4f9cc7SJonathan Lemon m->m_pkthdr.csum_data + IPPROTO_UDP)); 35539629c92SDavid Malone uh_sum ^= 0xffff; 356db4f9cc7SJonathan Lemon } else { 357cb342100SHajimu UMEMOTO char b[9]; 358af1ee11dSRobert Watson 359cb342100SHajimu UMEMOTO bcopy(((struct ipovly *)ip)->ih_x1, b, 9); 3606effc713SDoug Rabson bzero(((struct ipovly *)ip)->ih_x1, 9); 361df8bae1dSRodney W. Grimes ((struct ipovly *)ip)->ih_len = uh->uh_ulen; 36239629c92SDavid Malone uh_sum = in_cksum(m, len + sizeof (struct ip)); 363cb342100SHajimu UMEMOTO bcopy(b, ((struct ipovly *)ip)->ih_x1, 9); 364db4f9cc7SJonathan Lemon } 36539629c92SDavid Malone if (uh_sum) { 366603724d3SBjoern A. Zeeb V_udpstat.udps_badsum++; 367df8bae1dSRodney W. Grimes m_freem(m); 368df8bae1dSRodney W. Grimes return; 369df8bae1dSRodney W. Grimes } 370fb9aaba0SRuslan Ermilov } else 371603724d3SBjoern A. Zeeb V_udpstat.udps_nosum++; 372df8bae1dSRodney W. Grimes 3730b4ae859SGleb Smirnoff #ifdef IPFIREWALL_FORWARD 3743329b236SRobert Watson /* 3753329b236SRobert Watson * Grab info from PACKET_TAG_IPFORWARD tag prepended to the chain. 3763329b236SRobert Watson */ 3770b4ae859SGleb Smirnoff fwd_tag = m_tag_find(m, PACKET_TAG_IPFORWARD, NULL); 3780b4ae859SGleb Smirnoff if (fwd_tag != NULL) { 3790b4ae859SGleb Smirnoff struct sockaddr_in *next_hop; 3800b4ae859SGleb Smirnoff 3813329b236SRobert Watson /* 3823329b236SRobert Watson * Do the hack. 3833329b236SRobert Watson */ 3840b4ae859SGleb Smirnoff next_hop = (struct sockaddr_in *)(fwd_tag + 1); 3850b4ae859SGleb Smirnoff ip->ip_dst = next_hop->sin_addr; 3860b4ae859SGleb Smirnoff uh->uh_dport = ntohs(next_hop->sin_port); 3873329b236SRobert Watson 3883329b236SRobert Watson /* 3893329b236SRobert Watson * Remove the tag from the packet. We don't need it anymore. 3903329b236SRobert Watson */ 3910b4ae859SGleb Smirnoff m_tag_delete(m, fwd_tag); 3920b4ae859SGleb Smirnoff } 3930b4ae859SGleb Smirnoff #endif 3940b4ae859SGleb Smirnoff 395603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 396df8bae1dSRodney W. Grimes if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) || 39771498f30SBruce M Simpson in_broadcast(ip->ip_dst, ifp)) { 39882c23ebaSBill Fenner struct inpcb *last; 39971498f30SBruce M Simpson struct ip_moptions *imo; 4003329b236SRobert Watson 401df8bae1dSRodney W. Grimes last = NULL; 402603724d3SBjoern A. Zeeb LIST_FOREACH(inp, &V_udb, inp_list) { 4039c1df695SRobert Watson if (inp->inp_lport != uh->uh_dport) 404f76fcf6dSJeffrey Hsu continue; 405cfa1ca9dSYoshinobu Inoue #ifdef INET6 406369dc8ceSEivind Eklund if ((inp->inp_vflag & INP_IPV4) == 0) 4079c1df695SRobert Watson continue; 408cfa1ca9dSYoshinobu Inoue #endif 40971498f30SBruce M Simpson if (inp->inp_laddr.s_addr != INADDR_ANY && 41071498f30SBruce M Simpson inp->inp_laddr.s_addr != ip->ip_dst.s_addr) 4119c1df695SRobert Watson continue; 41271498f30SBruce M Simpson if (inp->inp_faddr.s_addr != INADDR_ANY && 41371498f30SBruce M Simpson inp->inp_faddr.s_addr != ip->ip_src.s_addr) 41471498f30SBruce M Simpson continue; 41571498f30SBruce M Simpson /* 41671498f30SBruce M Simpson * XXX: Do not check source port of incoming datagram 41771498f30SBruce M Simpson * unless inp_connect() has been called to bind the 41871498f30SBruce M Simpson * fport part of the 4-tuple; the source could be 41971498f30SBruce M Simpson * trying to talk to us with an ephemeral port. 42071498f30SBruce M Simpson */ 42171498f30SBruce M Simpson if (inp->inp_fport != 0 && 422df8bae1dSRodney W. Grimes inp->inp_fport != uh->uh_sport) 4239c1df695SRobert Watson continue; 42471498f30SBruce M Simpson 425119d85f6SRobert Watson INP_RLOCK(inp); 426df8bae1dSRodney W. Grimes 42783453a06SBruce M Simpson /* 42871498f30SBruce M Simpson * Handle socket delivery policy for any-source 42971498f30SBruce M Simpson * and source-specific multicast. [RFC3678] 43083453a06SBruce M Simpson */ 43171498f30SBruce M Simpson imo = inp->inp_moptions; 43271498f30SBruce M Simpson if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) && 43371498f30SBruce M Simpson imo != NULL) { 43471498f30SBruce M Simpson struct sockaddr_in sin; 43571498f30SBruce M Simpson struct in_msource *ims; 43671498f30SBruce M Simpson int blocked, mode; 43771498f30SBruce M Simpson size_t idx; 43883453a06SBruce M Simpson 43971498f30SBruce M Simpson bzero(&sin, sizeof(struct sockaddr_in)); 44071498f30SBruce M Simpson sin.sin_len = sizeof(struct sockaddr_in); 44171498f30SBruce M Simpson sin.sin_family = AF_INET; 44271498f30SBruce M Simpson sin.sin_addr = ip->ip_dst; 44371498f30SBruce M Simpson 44471498f30SBruce M Simpson blocked = 0; 44571498f30SBruce M Simpson idx = imo_match_group(imo, ifp, 44671498f30SBruce M Simpson (struct sockaddr *)&sin); 44771498f30SBruce M Simpson if (idx == -1) { 44871498f30SBruce M Simpson /* 44971498f30SBruce M Simpson * No group membership for this socket. 45071498f30SBruce M Simpson * Do not bump udps_noportbcast, as 45171498f30SBruce M Simpson * this will happen further down. 45271498f30SBruce M Simpson */ 45371498f30SBruce M Simpson blocked++; 45471498f30SBruce M Simpson } else { 45571498f30SBruce M Simpson /* 45671498f30SBruce M Simpson * Check for a multicast source filter 45771498f30SBruce M Simpson * entry on this socket for this group. 45871498f30SBruce M Simpson * MCAST_EXCLUDE is the default 45971498f30SBruce M Simpson * behaviour. It means default accept; 46071498f30SBruce M Simpson * entries, if present, denote sources 46171498f30SBruce M Simpson * to be excluded from delivery. 46271498f30SBruce M Simpson */ 46371498f30SBruce M Simpson ims = imo_match_source(imo, idx, 46471498f30SBruce M Simpson (struct sockaddr *)&udp_in); 46571498f30SBruce M Simpson mode = imo->imo_mfilters[idx].imf_fmode; 46671498f30SBruce M Simpson if ((ims != NULL && 46771498f30SBruce M Simpson mode == MCAST_EXCLUDE) || 46871498f30SBruce M Simpson (ims == NULL && 46971498f30SBruce M Simpson mode == MCAST_INCLUDE)) { 47071498f30SBruce M Simpson #ifdef DIAGNOSTIC 47171498f30SBruce M Simpson if (bootverbose) { 47271498f30SBruce M Simpson printf("%s: blocked by" 47371498f30SBruce M Simpson " source filter\n", 47471498f30SBruce M Simpson __func__); 47571498f30SBruce M Simpson } 47671498f30SBruce M Simpson #endif 477603724d3SBjoern A. Zeeb V_udpstat.udps_filtermcast++; 47871498f30SBruce M Simpson blocked++; 47983453a06SBruce M Simpson } 48083453a06SBruce M Simpson } 48171498f30SBruce M Simpson if (blocked != 0) { 482119d85f6SRobert Watson INP_RUNLOCK(inp); 4839c1df695SRobert Watson continue; 4849c1df695SRobert Watson } 48583453a06SBruce M Simpson } 486df8bae1dSRodney W. Grimes if (last != NULL) { 487df8bae1dSRodney W. Grimes struct mbuf *n; 488df8bae1dSRodney W. Grimes 489032dcc76SLuigi Rizzo n = m_copy(m, 0, M_COPYALL); 490365433d9SRobert Watson if (n != NULL) 4913329b236SRobert Watson udp_append(last, ip, n, iphlen + 4923329b236SRobert Watson sizeof(struct udphdr), &udp_in); 493119d85f6SRobert Watson INP_RUNLOCK(last); 494df8bae1dSRodney W. Grimes } 49582c23ebaSBill Fenner last = inp; 496df8bae1dSRodney W. Grimes /* 497df8bae1dSRodney W. Grimes * Don't look for additional matches if this one does 498df8bae1dSRodney W. Grimes * not have either the SO_REUSEPORT or SO_REUSEADDR 4993329b236SRobert Watson * socket options set. This heuristic avoids 5003329b236SRobert Watson * searching through all pcbs in the common case of a 5013329b236SRobert Watson * non-shared port. It assumes that an application 5023329b236SRobert Watson * will never clear these options after setting them. 503df8bae1dSRodney W. Grimes */ 5043329b236SRobert Watson if ((last->inp_socket->so_options & 5053329b236SRobert Watson (SO_REUSEPORT|SO_REUSEADDR)) == 0) 506df8bae1dSRodney W. Grimes break; 507df8bae1dSRodney W. Grimes } 508df8bae1dSRodney W. Grimes 509df8bae1dSRodney W. Grimes if (last == NULL) { 510df8bae1dSRodney W. Grimes /* 5113329b236SRobert Watson * No matching pcb found; discard datagram. (No need 5123329b236SRobert Watson * to send an ICMP Port Unreachable for a broadcast 5133329b236SRobert Watson * or multicast datgram.) 514df8bae1dSRodney W. Grimes */ 515603724d3SBjoern A. Zeeb V_udpstat.udps_noportbcast++; 51661ffc0b1SJeffrey Hsu goto badheadlocked; 517df8bae1dSRodney W. Grimes } 518d4b509bdSRobert Watson udp_append(last, ip, m, iphlen + sizeof(struct udphdr), 519d4b509bdSRobert Watson &udp_in); 520119d85f6SRobert Watson INP_RUNLOCK(last); 521603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 522df8bae1dSRodney W. Grimes return; 523df8bae1dSRodney W. Grimes } 5243329b236SRobert Watson 525df8bae1dSRodney W. Grimes /* 5266d6a026bSDavid Greenman * Locate pcb for datagram. 527df8bae1dSRodney W. Grimes */ 528603724d3SBjoern A. Zeeb inp = in_pcblookup_hash(&V_udbinfo, ip->ip_src, uh->uh_sport, 52971498f30SBruce M Simpson ip->ip_dst, uh->uh_dport, 1, ifp); 53015bd2b43SDavid Greenman if (inp == NULL) { 531afdb4274SRobert Watson if (udp_log_in_vain) { 532df5c0b8aSBill Fenner char buf[4*sizeof "123"]; 53375cfc95fSAndrey A. Chernov 53475cfc95fSAndrey A. Chernov strcpy(buf, inet_ntoa(ip->ip_dst)); 535592071e8SBruce Evans log(LOG_INFO, 536592071e8SBruce Evans "Connection attempt to UDP %s:%d from %s:%d\n", 537592071e8SBruce Evans buf, ntohs(uh->uh_dport), inet_ntoa(ip->ip_src), 538592071e8SBruce Evans ntohs(uh->uh_sport)); 53975cfc95fSAndrey A. Chernov } 540603724d3SBjoern A. Zeeb V_udpstat.udps_noport++; 541df8bae1dSRodney W. Grimes if (m->m_flags & (M_BCAST | M_MCAST)) { 542603724d3SBjoern A. Zeeb V_udpstat.udps_noportbcast++; 54361ffc0b1SJeffrey Hsu goto badheadlocked; 544df8bae1dSRodney W. Grimes } 545603724d3SBjoern A. Zeeb if (V_udp_blackhole) 54661ffc0b1SJeffrey Hsu goto badheadlocked; 5471cbd978eSLuigi Rizzo if (badport_bandlim(BANDLIM_ICMP_UNREACH) < 0) 5481cbd978eSLuigi Rizzo goto badheadlocked; 54904287599SRuslan Ermilov *ip = save_ip; 55004287599SRuslan Ermilov ip->ip_len += iphlen; 551582a7760SBruce Evans icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_PORT, 0, 0); 552603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 553df8bae1dSRodney W. Grimes return; 554df8bae1dSRodney W. Grimes } 5553329b236SRobert Watson 5563329b236SRobert Watson /* 5573329b236SRobert Watson * Check the minimum TTL for socket. 5583329b236SRobert Watson */ 559119d85f6SRobert Watson INP_RLOCK(inp); 560603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 56110cc62b7SRobert Watson if (inp->inp_ip_minttl && inp->inp_ip_minttl > ip->ip_ttl) { 56210cc62b7SRobert Watson INP_RUNLOCK(inp); 56310cc62b7SRobert Watson goto badunlocked; 56410cc62b7SRobert Watson } 565d4b509bdSRobert Watson udp_append(inp, ip, m, iphlen + sizeof(struct udphdr), &udp_in); 566119d85f6SRobert Watson INP_RUNLOCK(inp); 567df8bae1dSRodney W. Grimes return; 56861ffc0b1SJeffrey Hsu 56961ffc0b1SJeffrey Hsu badheadlocked: 570f76fcf6dSJeffrey Hsu if (inp) 571119d85f6SRobert Watson INP_RUNLOCK(inp); 572603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 573f76fcf6dSJeffrey Hsu badunlocked: 574df8bae1dSRodney W. Grimes m_freem(m); 575cfa1ca9dSYoshinobu Inoue } 576cfa1ca9dSYoshinobu Inoue 577cfa1ca9dSYoshinobu Inoue /* 5783329b236SRobert Watson * Notify a udp user of an asynchronous error; just wake up so that they can 5793329b236SRobert Watson * collect error status. 580df8bae1dSRodney W. Grimes */ 5813ce144eaSJeffrey Hsu struct inpcb * 5823329b236SRobert Watson udp_notify(struct inpcb *inp, int errno) 583df8bae1dSRodney W. Grimes { 5843329b236SRobert Watson 585ac9ae279SRobert Watson /* 586ac9ae279SRobert Watson * While udp_ctlinput() always calls udp_notify() with a read lock 587ac9ae279SRobert Watson * when invoking it directly, in_pcbnotifyall() currently uses write 588ac9ae279SRobert Watson * locks due to sharing code with TCP. For now, accept either a read 589ac9ae279SRobert Watson * or a write lock, but a read lock is sufficient. 590ac9ae279SRobert Watson */ 591ac9ae279SRobert Watson INP_LOCK_ASSERT(inp); 5928501a69cSRobert Watson 593df8bae1dSRodney W. Grimes inp->inp_socket->so_error = errno; 594df8bae1dSRodney W. Grimes sorwakeup(inp->inp_socket); 595df8bae1dSRodney W. Grimes sowwakeup(inp->inp_socket); 5963329b236SRobert Watson return (inp); 597df8bae1dSRodney W. Grimes } 598df8bae1dSRodney W. Grimes 599df8bae1dSRodney W. Grimes void 6003329b236SRobert Watson udp_ctlinput(int cmd, struct sockaddr *sa, void *vip) 601df8bae1dSRodney W. Grimes { 6028b615593SMarko Zec INIT_VNET_INET(curvnet); 603c693a045SJonathan Lemon struct ip *ip = vip; 604c693a045SJonathan Lemon struct udphdr *uh; 605c693a045SJonathan Lemon struct in_addr faddr; 606c693a045SJonathan Lemon struct inpcb *inp; 607c693a045SJonathan Lemon 608c693a045SJonathan Lemon faddr = ((struct sockaddr_in *)sa)->sin_addr; 609c693a045SJonathan Lemon if (sa->sa_family != AF_INET || faddr.s_addr == INADDR_ANY) 610c693a045SJonathan Lemon return; 611df8bae1dSRodney W. Grimes 61297d8d152SAndre Oppermann /* 61397d8d152SAndre Oppermann * Redirects don't need to be handled up here. 61497d8d152SAndre Oppermann */ 61597d8d152SAndre Oppermann if (PRC_IS_REDIRECT(cmd)) 61697d8d152SAndre Oppermann return; 6173329b236SRobert Watson 61897d8d152SAndre Oppermann /* 61997d8d152SAndre Oppermann * Hostdead is ugly because it goes linearly through all PCBs. 6203329b236SRobert Watson * 6213329b236SRobert Watson * XXX: We never get this from ICMP, otherwise it makes an excellent 6223329b236SRobert Watson * DoS attack on machines with many connections. 62397d8d152SAndre Oppermann */ 62497d8d152SAndre Oppermann if (cmd == PRC_HOSTDEAD) 625af1ee11dSRobert Watson ip = NULL; 626d1c54148SJesper Skriver else if ((unsigned)cmd >= PRC_NCMDS || inetctlerrmap[cmd] == 0) 627df8bae1dSRodney W. Grimes return; 628af1ee11dSRobert Watson if (ip != NULL) { 629df8bae1dSRodney W. Grimes uh = (struct udphdr *)((caddr_t)ip + (ip->ip_hl << 2)); 630603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 631603724d3SBjoern A. Zeeb inp = in_pcblookup_hash(&V_udbinfo, faddr, uh->uh_dport, 632c693a045SJonathan Lemon ip->ip_src, uh->uh_sport, 0, NULL); 633f76fcf6dSJeffrey Hsu if (inp != NULL) { 634ac9ae279SRobert Watson INP_RLOCK(inp); 635f76fcf6dSJeffrey Hsu if (inp->inp_socket != NULL) { 636f5514f08SRobert Watson udp_notify(inp, inetctlerrmap[cmd]); 637f76fcf6dSJeffrey Hsu } 638ac9ae279SRobert Watson INP_RUNLOCK(inp); 639f76fcf6dSJeffrey Hsu } 640603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 641df8bae1dSRodney W. Grimes } else 642603724d3SBjoern A. Zeeb in_pcbnotifyall(&V_udbinfo, faddr, inetctlerrmap[cmd], 643f5514f08SRobert Watson udp_notify); 644df8bae1dSRodney W. Grimes } 645df8bae1dSRodney W. Grimes 6460312fbe9SPoul-Henning Kamp static int 64782d9ae4eSPoul-Henning Kamp udp_pcblist(SYSCTL_HANDLER_ARGS) 64898271db4SGarrett Wollman { 6498b615593SMarko Zec INIT_VNET_INET(curvnet); 650277afaffSRobert Watson int error, i, n; 65198271db4SGarrett Wollman struct inpcb *inp, **inp_list; 65298271db4SGarrett Wollman inp_gen_t gencnt; 65398271db4SGarrett Wollman struct xinpgen xig; 65498271db4SGarrett Wollman 65598271db4SGarrett Wollman /* 656f5514f08SRobert Watson * The process of preparing the PCB list is too time-consuming and 65798271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 65898271db4SGarrett Wollman */ 65998271db4SGarrett Wollman if (req->oldptr == 0) { 660603724d3SBjoern A. Zeeb n = V_udbinfo.ipi_count; 66198271db4SGarrett Wollman req->oldidx = 2 * (sizeof xig) 66298271db4SGarrett Wollman + (n + n/8) * sizeof(struct xinpcb); 6633329b236SRobert Watson return (0); 66498271db4SGarrett Wollman } 66598271db4SGarrett Wollman 66698271db4SGarrett Wollman if (req->newptr != 0) 6673329b236SRobert Watson return (EPERM); 66898271db4SGarrett Wollman 66998271db4SGarrett Wollman /* 67098271db4SGarrett Wollman * OK, now we're committed to doing something. 67198271db4SGarrett Wollman */ 672603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 673603724d3SBjoern A. Zeeb gencnt = V_udbinfo.ipi_gencnt; 674603724d3SBjoern A. Zeeb n = V_udbinfo.ipi_count; 675603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 67698271db4SGarrett Wollman 67747934cefSDon Lewis error = sysctl_wire_old_buffer(req, 2 * (sizeof xig) 6785c38b6dbSDon Lewis + n * sizeof(struct xinpcb)); 67947934cefSDon Lewis if (error != 0) 68047934cefSDon Lewis return (error); 6815c38b6dbSDon Lewis 68298271db4SGarrett Wollman xig.xig_len = sizeof xig; 68398271db4SGarrett Wollman xig.xig_count = n; 68498271db4SGarrett Wollman xig.xig_gen = gencnt; 68598271db4SGarrett Wollman xig.xig_sogen = so_gencnt; 68698271db4SGarrett Wollman error = SYSCTL_OUT(req, &xig, sizeof xig); 68798271db4SGarrett Wollman if (error) 6883329b236SRobert Watson return (error); 68998271db4SGarrett Wollman 690a163d034SWarner Losh inp_list = malloc(n * sizeof *inp_list, M_TEMP, M_WAITOK); 69198271db4SGarrett Wollman if (inp_list == 0) 6923329b236SRobert Watson return (ENOMEM); 69398271db4SGarrett Wollman 694603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 695603724d3SBjoern A. Zeeb for (inp = LIST_FIRST(V_udbinfo.ipi_listhead), i = 0; inp && i < n; 696fc2ffbe6SPoul-Henning Kamp inp = LIST_NEXT(inp, inp_list)) { 6979622e84fSRobert Watson INP_RLOCK(inp); 6982ded288cSJeffrey Hsu if (inp->inp_gencnt <= gencnt && 699f08ef6c5SBjoern A. Zeeb cr_canseeinpcb(req->td->td_ucred, inp) == 0) 70098271db4SGarrett Wollman inp_list[i++] = inp; 7019622e84fSRobert Watson INP_RUNLOCK(inp); 7024787fd37SPaul Saab } 703603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 70498271db4SGarrett Wollman n = i; 70598271db4SGarrett Wollman 70698271db4SGarrett Wollman error = 0; 70798271db4SGarrett Wollman for (i = 0; i < n; i++) { 70898271db4SGarrett Wollman inp = inp_list[i]; 7099622e84fSRobert Watson INP_RLOCK(inp); 71098271db4SGarrett Wollman if (inp->inp_gencnt <= gencnt) { 71198271db4SGarrett Wollman struct xinpcb xi; 712fd94099eSColin Percival bzero(&xi, sizeof(xi)); 71398271db4SGarrett Wollman xi.xi_len = sizeof xi; 71498271db4SGarrett Wollman /* XXX should avoid extra copy */ 71598271db4SGarrett Wollman bcopy(inp, &xi.xi_inp, sizeof *inp); 71698271db4SGarrett Wollman if (inp->inp_socket) 71798271db4SGarrett Wollman sotoxsocket(inp->inp_socket, &xi.xi_socket); 7184b40c56cSJeffrey Hsu xi.xi_inp.inp_gencnt = inp->inp_gencnt; 7199622e84fSRobert Watson INP_RUNLOCK(inp); 72098271db4SGarrett Wollman error = SYSCTL_OUT(req, &xi, sizeof xi); 721d915b280SStephan Uphoff } else 7229622e84fSRobert Watson INP_RUNLOCK(inp); 72398271db4SGarrett Wollman } 72498271db4SGarrett Wollman if (!error) { 72598271db4SGarrett Wollman /* 7263329b236SRobert Watson * Give the user an updated idea of our state. If the 7273329b236SRobert Watson * generation differs from what we told her before, she knows 7283329b236SRobert Watson * that something happened while we were processing this 7293329b236SRobert Watson * request, and it might be necessary to retry. 73098271db4SGarrett Wollman */ 731603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 732603724d3SBjoern A. Zeeb xig.xig_gen = V_udbinfo.ipi_gencnt; 73398271db4SGarrett Wollman xig.xig_sogen = so_gencnt; 734603724d3SBjoern A. Zeeb xig.xig_count = V_udbinfo.ipi_count; 735603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 73698271db4SGarrett Wollman error = SYSCTL_OUT(req, &xig, sizeof xig); 73798271db4SGarrett Wollman } 73898271db4SGarrett Wollman free(inp_list, M_TEMP); 7393329b236SRobert Watson return (error); 74098271db4SGarrett Wollman } 74198271db4SGarrett Wollman 74298271db4SGarrett Wollman SYSCTL_PROC(_net_inet_udp, UDPCTL_PCBLIST, pcblist, CTLFLAG_RD, 0, 0, 74398271db4SGarrett Wollman udp_pcblist, "S,xinpcb", "List of active UDP sockets"); 74498271db4SGarrett Wollman 74598271db4SGarrett Wollman static int 74682d9ae4eSPoul-Henning Kamp udp_getcred(SYSCTL_HANDLER_ARGS) 747490d50b6SBrian Feldman { 7488b615593SMarko Zec INIT_VNET_INET(curvnet); 749c0511d3bSBrian Feldman struct xucred xuc; 750490d50b6SBrian Feldman struct sockaddr_in addrs[2]; 751490d50b6SBrian Feldman struct inpcb *inp; 752277afaffSRobert Watson int error; 753490d50b6SBrian Feldman 75432f9753cSRobert Watson error = priv_check(req->td, PRIV_NETINET_GETCRED); 755490d50b6SBrian Feldman if (error) 756490d50b6SBrian Feldman return (error); 757490d50b6SBrian Feldman error = SYSCTL_IN(req, addrs, sizeof(addrs)); 758490d50b6SBrian Feldman if (error) 759490d50b6SBrian Feldman return (error); 760603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 761603724d3SBjoern A. Zeeb inp = in_pcblookup_hash(&V_udbinfo, addrs[1].sin_addr, addrs[1].sin_port, 762cfa1ca9dSYoshinobu Inoue addrs[0].sin_addr, addrs[0].sin_port, 1, NULL); 7639622e84fSRobert Watson if (inp != NULL) { 7649622e84fSRobert Watson INP_RLOCK(inp); 765603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 7669622e84fSRobert Watson if (inp->inp_socket == NULL) 7679622e84fSRobert Watson error = ENOENT; 7689622e84fSRobert Watson if (error == 0) 769f08ef6c5SBjoern A. Zeeb error = cr_canseeinpcb(req->td->td_ucred, inp); 7709622e84fSRobert Watson if (error == 0) 77186d02c5cSBjoern A. Zeeb cru2x(inp->inp_cred, &xuc); 7729622e84fSRobert Watson INP_RUNLOCK(inp); 7739622e84fSRobert Watson } else { 774603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 7759622e84fSRobert Watson error = ENOENT; 7769622e84fSRobert Watson } 7770e1eebb8SDon Lewis if (error == 0) 7780e1eebb8SDon Lewis error = SYSCTL_OUT(req, &xuc, sizeof(struct xucred)); 779490d50b6SBrian Feldman return (error); 780490d50b6SBrian Feldman } 781490d50b6SBrian Feldman 7827ce87f12SDavid Malone SYSCTL_PROC(_net_inet_udp, OID_AUTO, getcred, 7837ce87f12SDavid Malone CTLTYPE_OPAQUE|CTLFLAG_RW|CTLFLAG_PRISON, 0, 0, 7847ce87f12SDavid Malone udp_getcred, "S,xucred", "Get the xucred of a UDP connection"); 785490d50b6SBrian Feldman 786490d50b6SBrian Feldman static int 7873329b236SRobert Watson udp_output(struct inpcb *inp, struct mbuf *m, struct sockaddr *addr, 7883329b236SRobert Watson struct mbuf *control, struct thread *td) 789df8bae1dSRodney W. Grimes { 7908b615593SMarko Zec INIT_VNET_INET(inp->inp_vnet); 7913329b236SRobert Watson struct udpiphdr *ui; 7923329b236SRobert Watson int len = m->m_pkthdr.len; 79390162a4eSIan Dowse struct in_addr faddr, laddr; 794c557ae16SIan Dowse struct cmsghdr *cm; 795c557ae16SIan Dowse struct sockaddr_in *sin, src; 79690162a4eSIan Dowse int error = 0; 7978afa2304SBruce M Simpson int ipflags; 79890162a4eSIan Dowse u_short fport, lport; 7995c32ea65SRobert Watson int unlock_udbinfo; 800df8bae1dSRodney W. Grimes 8015c32ea65SRobert Watson /* 8025c32ea65SRobert Watson * udp_output() may need to temporarily bind or connect the current 803f5514f08SRobert Watson * inpcb. As such, we don't know up front whether we will need the 804f5514f08SRobert Watson * pcbinfo lock or not. Do any work to decide what is needed up 805f5514f08SRobert Watson * front before acquiring any locks. 8065c32ea65SRobert Watson */ 807430d30d8SBill Fenner if (len + sizeof(struct udpiphdr) > IP_MAXPACKET) { 808c557ae16SIan Dowse if (control) 809c557ae16SIan Dowse m_freem(control); 8105c32ea65SRobert Watson m_freem(m); 8113329b236SRobert Watson return (EMSGSIZE); 812430d30d8SBill Fenner } 813430d30d8SBill Fenner 8141b7f0384SBruce M Simpson src.sin_family = 0; 815c557ae16SIan Dowse if (control != NULL) { 816c557ae16SIan Dowse /* 8173329b236SRobert Watson * XXX: Currently, we assume all the optional information is 8183329b236SRobert Watson * stored in a single mbuf. 819c557ae16SIan Dowse */ 820c557ae16SIan Dowse if (control->m_next) { 821c557ae16SIan Dowse m_freem(control); 8225c32ea65SRobert Watson m_freem(m); 8233329b236SRobert Watson return (EINVAL); 824c557ae16SIan Dowse } 825c557ae16SIan Dowse for (; control->m_len > 0; 826c557ae16SIan Dowse control->m_data += CMSG_ALIGN(cm->cmsg_len), 827c557ae16SIan Dowse control->m_len -= CMSG_ALIGN(cm->cmsg_len)) { 828c557ae16SIan Dowse cm = mtod(control, struct cmsghdr *); 829af1ee11dSRobert Watson if (control->m_len < sizeof(*cm) || cm->cmsg_len == 0 830af1ee11dSRobert Watson || cm->cmsg_len > control->m_len) { 831c557ae16SIan Dowse error = EINVAL; 832c557ae16SIan Dowse break; 833c557ae16SIan Dowse } 834c557ae16SIan Dowse if (cm->cmsg_level != IPPROTO_IP) 835c557ae16SIan Dowse continue; 836c557ae16SIan Dowse 837c557ae16SIan Dowse switch (cm->cmsg_type) { 838c557ae16SIan Dowse case IP_SENDSRCADDR: 839c557ae16SIan Dowse if (cm->cmsg_len != 840c557ae16SIan Dowse CMSG_LEN(sizeof(struct in_addr))) { 841c557ae16SIan Dowse error = EINVAL; 842c557ae16SIan Dowse break; 843c557ae16SIan Dowse } 844c557ae16SIan Dowse bzero(&src, sizeof(src)); 845c557ae16SIan Dowse src.sin_family = AF_INET; 846c557ae16SIan Dowse src.sin_len = sizeof(src); 847c557ae16SIan Dowse src.sin_port = inp->inp_lport; 848af1ee11dSRobert Watson src.sin_addr = 849af1ee11dSRobert Watson *(struct in_addr *)CMSG_DATA(cm); 850c557ae16SIan Dowse break; 851af1ee11dSRobert Watson 852c557ae16SIan Dowse default: 853c557ae16SIan Dowse error = ENOPROTOOPT; 854c557ae16SIan Dowse break; 855c557ae16SIan Dowse } 856c557ae16SIan Dowse if (error) 857c557ae16SIan Dowse break; 858c557ae16SIan Dowse } 859c557ae16SIan Dowse m_freem(control); 860c557ae16SIan Dowse } 8615c32ea65SRobert Watson if (error) { 8625c32ea65SRobert Watson m_freem(m); 8633329b236SRobert Watson return (error); 8645c32ea65SRobert Watson } 8655c32ea65SRobert Watson 86643cc0bc1SRobert Watson /* 86743cc0bc1SRobert Watson * Depending on whether or not the application has bound or connected 868ca528788SRobert Watson * the socket, we may have to do varying levels of work. The optimal 869ca528788SRobert Watson * case is for a connected UDP socket, as a global lock isn't 870ca528788SRobert Watson * required at all. 87143cc0bc1SRobert Watson * 87243cc0bc1SRobert Watson * In order to decide which we need, we require stability of the 87343cc0bc1SRobert Watson * inpcb binding, which we ensure by acquiring a read lock on the 87443cc0bc1SRobert Watson * inpcb. This doesn't strictly follow the lock order, so we play 87543cc0bc1SRobert Watson * the trylock and retry game; note that we may end up with more 87643cc0bc1SRobert Watson * conservative locks than required the second time around, so later 87743cc0bc1SRobert Watson * assertions have to accept that. Further analysis of the number of 87843cc0bc1SRobert Watson * misses under contention is required. 87943cc0bc1SRobert Watson */ 88043cc0bc1SRobert Watson sin = (struct sockaddr_in *)addr; 88143cc0bc1SRobert Watson INP_RLOCK(inp); 88243cc0bc1SRobert Watson if (sin != NULL && 88343cc0bc1SRobert Watson (inp->inp_laddr.s_addr == INADDR_ANY && inp->inp_lport == 0)) { 88443cc0bc1SRobert Watson INP_RUNLOCK(inp); 885603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 8868501a69cSRobert Watson INP_WLOCK(inp); 88743cc0bc1SRobert Watson unlock_udbinfo = 2; 88843cc0bc1SRobert Watson } else if ((sin != NULL && ( 88943cc0bc1SRobert Watson (sin->sin_addr.s_addr == INADDR_ANY) || 89043cc0bc1SRobert Watson (sin->sin_addr.s_addr == INADDR_BROADCAST) || 89143cc0bc1SRobert Watson (inp->inp_laddr.s_addr == INADDR_ANY) || 89243cc0bc1SRobert Watson (inp->inp_lport == 0))) || 89343cc0bc1SRobert Watson (src.sin_family == AF_INET)) { 894603724d3SBjoern A. Zeeb if (!INP_INFO_TRY_RLOCK(&V_udbinfo)) { 89543cc0bc1SRobert Watson INP_RUNLOCK(inp); 896603724d3SBjoern A. Zeeb INP_INFO_RLOCK(&V_udbinfo); 897948d0fc9SRobert Watson INP_RLOCK(inp); 898948d0fc9SRobert Watson } 89943cc0bc1SRobert Watson unlock_udbinfo = 1; 90043cc0bc1SRobert Watson } else 90143cc0bc1SRobert Watson unlock_udbinfo = 0; 9025c32ea65SRobert Watson 9031b7f0384SBruce M Simpson /* 9041b7f0384SBruce M Simpson * If the IP_SENDSRCADDR control message was specified, override the 9051b7f0384SBruce M Simpson * source address for this datagram. Its use is invalidated if the 9061b7f0384SBruce M Simpson * address thus specified is incomplete or clobbers other inpcbs. 9071b7f0384SBruce M Simpson */ 90890162a4eSIan Dowse laddr = inp->inp_laddr; 90990162a4eSIan Dowse lport = inp->inp_lport; 9101b7f0384SBruce M Simpson if (src.sin_family == AF_INET) { 911603724d3SBjoern A. Zeeb INP_INFO_LOCK_ASSERT(&V_udbinfo); 9121b7f0384SBruce M Simpson if ((lport == 0) || 9131b7f0384SBruce M Simpson (laddr.s_addr == INADDR_ANY && 9141b7f0384SBruce M Simpson src.sin_addr.s_addr == INADDR_ANY)) { 915c557ae16SIan Dowse error = EINVAL; 916c557ae16SIan Dowse goto release; 917c557ae16SIan Dowse } 918c557ae16SIan Dowse error = in_pcbbind_setup(inp, (struct sockaddr *)&src, 919b0330ed9SPawel Jakub Dawidek &laddr.s_addr, &lport, td->td_ucred); 920c557ae16SIan Dowse if (error) 921c557ae16SIan Dowse goto release; 922c557ae16SIan Dowse } 923c557ae16SIan Dowse 9243144b7d3SRobert Watson /* 9253144b7d3SRobert Watson * If a UDP socket has been connected, then a local address/port will 9263144b7d3SRobert Watson * have been selected and bound. 9273144b7d3SRobert Watson * 92843cc0bc1SRobert Watson * If a UDP socket has not been connected to, then an explicit 9293144b7d3SRobert Watson * destination address must be used, in which case a local 9303144b7d3SRobert Watson * address/port may not have been selected and bound. 9313144b7d3SRobert Watson */ 93243cc0bc1SRobert Watson if (sin != NULL) { 933c4d585aeSRobert Watson INP_LOCK_ASSERT(inp); 934df8bae1dSRodney W. Grimes if (inp->inp_faddr.s_addr != INADDR_ANY) { 935df8bae1dSRodney W. Grimes error = EISCONN; 936df8bae1dSRodney W. Grimes goto release; 937df8bae1dSRodney W. Grimes } 9383144b7d3SRobert Watson 9393144b7d3SRobert Watson /* 9403144b7d3SRobert Watson * Jail may rewrite the destination address, so let it do 9413144b7d3SRobert Watson * that before we use it. 9423144b7d3SRobert Watson */ 943413628a7SBjoern A. Zeeb if (prison_remote_ip4(td->td_ucred, &sin->sin_addr) != 0) { 944413628a7SBjoern A. Zeeb error = EINVAL; 945413628a7SBjoern A. Zeeb goto release; 946413628a7SBjoern A. Zeeb } 9473144b7d3SRobert Watson 9483144b7d3SRobert Watson /* 94943cc0bc1SRobert Watson * If a local address or port hasn't yet been selected, or if 95043cc0bc1SRobert Watson * the destination address needs to be rewritten due to using 95143cc0bc1SRobert Watson * a special INADDR_ constant, invoke in_pcbconnect_setup() 95243cc0bc1SRobert Watson * to do the heavy lifting. Once a port is selected, we 95343cc0bc1SRobert Watson * commit the binding back to the socket; we also commit the 95443cc0bc1SRobert Watson * binding of the address if in jail. 95543cc0bc1SRobert Watson * 95643cc0bc1SRobert Watson * If we already have a valid binding and we're not 95743cc0bc1SRobert Watson * requesting a destination address rewrite, use a fast path. 9583144b7d3SRobert Watson */ 95943cc0bc1SRobert Watson if (inp->inp_laddr.s_addr == INADDR_ANY || 96043cc0bc1SRobert Watson inp->inp_lport == 0 || 96143cc0bc1SRobert Watson sin->sin_addr.s_addr == INADDR_ANY || 96243cc0bc1SRobert Watson sin->sin_addr.s_addr == INADDR_BROADCAST) { 963603724d3SBjoern A. Zeeb INP_INFO_LOCK_ASSERT(&V_udbinfo); 96443cc0bc1SRobert Watson error = in_pcbconnect_setup(inp, addr, &laddr.s_addr, 96543cc0bc1SRobert Watson &lport, &faddr.s_addr, &fport, NULL, 96643cc0bc1SRobert Watson td->td_ucred); 96790162a4eSIan Dowse if (error) 96890162a4eSIan Dowse goto release; 96990162a4eSIan Dowse 97043cc0bc1SRobert Watson /* 97143cc0bc1SRobert Watson * XXXRW: Why not commit the port if the address is 97243cc0bc1SRobert Watson * !INADDR_ANY? 97343cc0bc1SRobert Watson */ 97490162a4eSIan Dowse /* Commit the local port if newly assigned. */ 97590162a4eSIan Dowse if (inp->inp_laddr.s_addr == INADDR_ANY && 97690162a4eSIan Dowse inp->inp_lport == 0) { 977603724d3SBjoern A. Zeeb INP_INFO_WLOCK_ASSERT(&V_udbinfo); 978c4d585aeSRobert Watson INP_WLOCK_ASSERT(inp); 9793a1757b9SGleb Smirnoff /* 98043cc0bc1SRobert Watson * Remember addr if jailed, to prevent 98143cc0bc1SRobert Watson * rebinding. 9823a1757b9SGleb Smirnoff */ 9833a1757b9SGleb Smirnoff if (jailed(td->td_ucred)) 9843a1757b9SGleb Smirnoff inp->inp_laddr = laddr; 98590162a4eSIan Dowse inp->inp_lport = lport; 98690162a4eSIan Dowse if (in_pcbinshash(inp) != 0) { 98790162a4eSIan Dowse inp->inp_lport = 0; 98890162a4eSIan Dowse error = EAGAIN; 989df8bae1dSRodney W. Grimes goto release; 990df8bae1dSRodney W. Grimes } 99190162a4eSIan Dowse inp->inp_flags |= INP_ANONPORT; 99290162a4eSIan Dowse } 993df8bae1dSRodney W. Grimes } else { 99443cc0bc1SRobert Watson faddr = sin->sin_addr; 99543cc0bc1SRobert Watson fport = sin->sin_port; 99643cc0bc1SRobert Watson } 99743cc0bc1SRobert Watson } else { 998c4d585aeSRobert Watson INP_LOCK_ASSERT(inp); 99990162a4eSIan Dowse faddr = inp->inp_faddr; 100090162a4eSIan Dowse fport = inp->inp_fport; 100190162a4eSIan Dowse if (faddr.s_addr == INADDR_ANY) { 1002df8bae1dSRodney W. Grimes error = ENOTCONN; 1003df8bae1dSRodney W. Grimes goto release; 1004df8bae1dSRodney W. Grimes } 1005df8bae1dSRodney W. Grimes } 1006e6ccd709SRobert Watson 1007df8bae1dSRodney W. Grimes /* 1008e6ccd709SRobert Watson * Calculate data length and get a mbuf for UDP, IP, and possible 1009392e8407SRobert Watson * link-layer headers. Immediate slide the data pointer back forward 1010392e8407SRobert Watson * since we won't use that space at this layer. 1011df8bae1dSRodney W. Grimes */ 1012e6ccd709SRobert Watson M_PREPEND(m, sizeof(struct udpiphdr) + max_linkhdr, M_DONTWAIT); 1013e6ccd709SRobert Watson if (m == NULL) { 1014df8bae1dSRodney W. Grimes error = ENOBUFS; 101549b19bfcSBruce M Simpson goto release; 1016df8bae1dSRodney W. Grimes } 1017e6ccd709SRobert Watson m->m_data += max_linkhdr; 1018e6ccd709SRobert Watson m->m_len -= max_linkhdr; 1019392e8407SRobert Watson m->m_pkthdr.len -= max_linkhdr; 1020df8bae1dSRodney W. Grimes 1021df8bae1dSRodney W. Grimes /* 10223329b236SRobert Watson * Fill in mbuf with extended UDP header and addresses and length put 10233329b236SRobert Watson * into network format. 1024df8bae1dSRodney W. Grimes */ 1025df8bae1dSRodney W. Grimes ui = mtod(m, struct udpiphdr *); 1026db4f9cc7SJonathan Lemon bzero(ui->ui_x1, sizeof(ui->ui_x1)); /* XXX still needed? */ 1027df8bae1dSRodney W. Grimes ui->ui_pr = IPPROTO_UDP; 102890162a4eSIan Dowse ui->ui_src = laddr; 102990162a4eSIan Dowse ui->ui_dst = faddr; 103090162a4eSIan Dowse ui->ui_sport = lport; 103190162a4eSIan Dowse ui->ui_dport = fport; 1032db4f9cc7SJonathan Lemon ui->ui_ulen = htons((u_short)len + sizeof(struct udphdr)); 1033df8bae1dSRodney W. Grimes 1034b2828ad2SAndre Oppermann /* 1035b2828ad2SAndre Oppermann * Set the Don't Fragment bit in the IP header. 1036b2828ad2SAndre Oppermann */ 1037b2828ad2SAndre Oppermann if (inp->inp_flags & INP_DONTFRAG) { 1038b2828ad2SAndre Oppermann struct ip *ip; 10393329b236SRobert Watson 1040b2828ad2SAndre Oppermann ip = (struct ip *)&ui->ui_i; 1041b2828ad2SAndre Oppermann ip->ip_off |= IP_DF; 1042b2828ad2SAndre Oppermann } 1043b2828ad2SAndre Oppermann 1044b5d47ff5SJohn-Mark Gurney ipflags = 0; 1045b5d47ff5SJohn-Mark Gurney if (inp->inp_socket->so_options & SO_DONTROUTE) 1046b5d47ff5SJohn-Mark Gurney ipflags |= IP_ROUTETOIF; 1047b5d47ff5SJohn-Mark Gurney if (inp->inp_socket->so_options & SO_BROADCAST) 1048b5d47ff5SJohn-Mark Gurney ipflags |= IP_ALLOWBROADCAST; 10496fbfd582SAndre Oppermann if (inp->inp_flags & INP_ONESBCAST) 10508afa2304SBruce M Simpson ipflags |= IP_SENDONES; 10518afa2304SBruce M Simpson 10521175d9d5SRobert Watson #ifdef MAC 10531175d9d5SRobert Watson mac_inpcb_create_mbuf(inp, m); 10541175d9d5SRobert Watson #endif 10551175d9d5SRobert Watson 1056df8bae1dSRodney W. Grimes /* 1057db4f9cc7SJonathan Lemon * Set up checksum and output datagram. 1058df8bae1dSRodney W. Grimes */ 1059f5514f08SRobert Watson if (udp_cksum) { 10606fbfd582SAndre Oppermann if (inp->inp_flags & INP_ONESBCAST) 10618a538743SBruce M Simpson faddr.s_addr = INADDR_BROADCAST; 10628a538743SBruce M Simpson ui->ui_sum = in_pseudo(ui->ui_src.s_addr, faddr.s_addr, 1063db4f9cc7SJonathan Lemon htons((u_short)len + sizeof(struct udphdr) + IPPROTO_UDP)); 1064db4f9cc7SJonathan Lemon m->m_pkthdr.csum_flags = CSUM_UDP; 1065db4f9cc7SJonathan Lemon m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum); 10663329b236SRobert Watson } else 1067db4f9cc7SJonathan Lemon ui->ui_sum = 0; 1068df8bae1dSRodney W. Grimes ((struct ip *)ui)->ip_len = sizeof (struct udpiphdr) + len; 1069ca98b82cSDavid Greenman ((struct ip *)ui)->ip_ttl = inp->inp_ip_ttl; /* XXX */ 1070ca98b82cSDavid Greenman ((struct ip *)ui)->ip_tos = inp->inp_ip_tos; /* XXX */ 1071603724d3SBjoern A. Zeeb V_udpstat.udps_opackets++; 1072cfa1ca9dSYoshinobu Inoue 107343cc0bc1SRobert Watson if (unlock_udbinfo == 2) 1074603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 107543cc0bc1SRobert Watson else if (unlock_udbinfo == 1) 1076603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 107797d8d152SAndre Oppermann error = ip_output(m, inp->inp_options, NULL, ipflags, 10785d846453SSam Leffler inp->inp_moptions, inp); 107943cc0bc1SRobert Watson if (unlock_udbinfo == 2) 10808501a69cSRobert Watson INP_WUNLOCK(inp); 1081948d0fc9SRobert Watson else 1082948d0fc9SRobert Watson INP_RUNLOCK(inp); 1083df8bae1dSRodney W. Grimes return (error); 1084df8bae1dSRodney W. Grimes 1085df8bae1dSRodney W. Grimes release: 108643cc0bc1SRobert Watson if (unlock_udbinfo == 2) { 1087948d0fc9SRobert Watson INP_WUNLOCK(inp); 1088603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 108943cc0bc1SRobert Watson } else if (unlock_udbinfo == 1) { 109043cc0bc1SRobert Watson INP_RUNLOCK(inp); 1091603724d3SBjoern A. Zeeb INP_INFO_RUNLOCK(&V_udbinfo); 1092948d0fc9SRobert Watson } else 1093948d0fc9SRobert Watson INP_RUNLOCK(inp); 1094df8bae1dSRodney W. Grimes m_freem(m); 1095df8bae1dSRodney W. Grimes return (error); 1096df8bae1dSRodney W. Grimes } 1097df8bae1dSRodney W. Grimes 1098ac45e92fSRobert Watson static void 1099d0390e05SGarrett Wollman udp_abort(struct socket *so) 1100df8bae1dSRodney W. Grimes { 11018b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1102d0390e05SGarrett Wollman struct inpcb *inp; 1103df8bae1dSRodney W. Grimes 1104d0390e05SGarrett Wollman inp = sotoinpcb(so); 110514ba8addSRobert Watson KASSERT(inp != NULL, ("udp_abort: inp == NULL")); 1106603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 11078501a69cSRobert Watson INP_WLOCK(inp); 1108a152f8a3SRobert Watson if (inp->inp_faddr.s_addr != INADDR_ANY) { 1109a152f8a3SRobert Watson in_pcbdisconnect(inp); 1110a152f8a3SRobert Watson inp->inp_laddr.s_addr = INADDR_ANY; 1111d0390e05SGarrett Wollman soisdisconnected(so); 1112a152f8a3SRobert Watson } 11138501a69cSRobert Watson INP_WUNLOCK(inp); 1114603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1115df8bae1dSRodney W. Grimes } 1116df8bae1dSRodney W. Grimes 1117d0390e05SGarrett Wollman static int 1118b40ce416SJulian Elischer udp_attach(struct socket *so, int proto, struct thread *td) 1119d0390e05SGarrett Wollman { 11208b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1121d0390e05SGarrett Wollman struct inpcb *inp; 1122277afaffSRobert Watson int error; 1123d0390e05SGarrett Wollman 1124d0390e05SGarrett Wollman inp = sotoinpcb(so); 112514ba8addSRobert Watson KASSERT(inp == NULL, ("udp_attach: inp != NULL")); 1126cfa1ca9dSYoshinobu Inoue error = soreserve(so, udp_sendspace, udp_recvspace); 1127f24618aaSRobert Watson if (error) 11283329b236SRobert Watson return (error); 1129603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 1130603724d3SBjoern A. Zeeb error = in_pcballoc(so, &V_udbinfo); 113153b57cd1SSam Leffler if (error) { 1132603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 11333329b236SRobert Watson return (error); 113453b57cd1SSam Leffler } 1135cfa1ca9dSYoshinobu Inoue 1136cfa1ca9dSYoshinobu Inoue inp = (struct inpcb *)so->so_pcb; 1137603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1138cfa1ca9dSYoshinobu Inoue inp->inp_vflag |= INP_IPV4; 1139603724d3SBjoern A. Zeeb inp->inp_ip_ttl = V_ip_defttl; 11408501a69cSRobert Watson INP_WUNLOCK(inp); 11413329b236SRobert Watson return (0); 1142df8bae1dSRodney W. Grimes } 1143d0390e05SGarrett Wollman 1144d0390e05SGarrett Wollman static int 1145b40ce416SJulian Elischer udp_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 1146d0390e05SGarrett Wollman { 11478b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1148d0390e05SGarrett Wollman struct inpcb *inp; 1149277afaffSRobert Watson int error; 1150d0390e05SGarrett Wollman 1151d0390e05SGarrett Wollman inp = sotoinpcb(so); 115214ba8addSRobert Watson KASSERT(inp != NULL, ("udp_bind: inp == NULL")); 1153603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 11548501a69cSRobert Watson INP_WLOCK(inp); 1155b0330ed9SPawel Jakub Dawidek error = in_pcbbind(inp, nam, td->td_ucred); 11568501a69cSRobert Watson INP_WUNLOCK(inp); 1157603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 11583329b236SRobert Watson return (error); 1159d0390e05SGarrett Wollman } 1160d0390e05SGarrett Wollman 1161a152f8a3SRobert Watson static void 1162a152f8a3SRobert Watson udp_close(struct socket *so) 1163a152f8a3SRobert Watson { 11648b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1165a152f8a3SRobert Watson struct inpcb *inp; 1166a152f8a3SRobert Watson 1167a152f8a3SRobert Watson inp = sotoinpcb(so); 1168a152f8a3SRobert Watson KASSERT(inp != NULL, ("udp_close: inp == NULL")); 1169603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 11708501a69cSRobert Watson INP_WLOCK(inp); 1171a152f8a3SRobert Watson if (inp->inp_faddr.s_addr != INADDR_ANY) { 1172a152f8a3SRobert Watson in_pcbdisconnect(inp); 1173a152f8a3SRobert Watson inp->inp_laddr.s_addr = INADDR_ANY; 1174a152f8a3SRobert Watson soisdisconnected(so); 1175a152f8a3SRobert Watson } 11768501a69cSRobert Watson INP_WUNLOCK(inp); 1177603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1178a152f8a3SRobert Watson } 1179a152f8a3SRobert Watson 1180d0390e05SGarrett Wollman static int 1181b40ce416SJulian Elischer udp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 1182d0390e05SGarrett Wollman { 11838b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1184d0390e05SGarrett Wollman struct inpcb *inp; 1185277afaffSRobert Watson int error; 118675c13541SPoul-Henning Kamp struct sockaddr_in *sin; 1187d0390e05SGarrett Wollman 1188d0390e05SGarrett Wollman inp = sotoinpcb(so); 118914ba8addSRobert Watson KASSERT(inp != NULL, ("udp_connect: inp == NULL")); 1190603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 11918501a69cSRobert Watson INP_WLOCK(inp); 1192f76fcf6dSJeffrey Hsu if (inp->inp_faddr.s_addr != INADDR_ANY) { 11938501a69cSRobert Watson INP_WUNLOCK(inp); 1194603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 11953329b236SRobert Watson return (EISCONN); 1196f76fcf6dSJeffrey Hsu } 119775c13541SPoul-Henning Kamp sin = (struct sockaddr_in *)nam; 1198413628a7SBjoern A. Zeeb if (prison_remote_ip4(td->td_ucred, &sin->sin_addr) != 0) { 1199413628a7SBjoern A. Zeeb INP_WUNLOCK(inp); 1200413628a7SBjoern A. Zeeb INP_INFO_WUNLOCK(&udbinfo); 1201413628a7SBjoern A. Zeeb return (EAFNOSUPPORT); 1202413628a7SBjoern A. Zeeb } 1203b0330ed9SPawel Jakub Dawidek error = in_pcbconnect(inp, nam, td->td_ucred); 12044cc20ab1SSeigo Tanimura if (error == 0) 1205df8bae1dSRodney W. Grimes soisconnected(so); 12068501a69cSRobert Watson INP_WUNLOCK(inp); 1207603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 12083329b236SRobert Watson return (error); 1209df8bae1dSRodney W. Grimes } 1210d0390e05SGarrett Wollman 1211bc725eafSRobert Watson static void 1212d0390e05SGarrett Wollman udp_detach(struct socket *so) 1213d0390e05SGarrett Wollman { 12148b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1215d0390e05SGarrett Wollman struct inpcb *inp; 1216d0390e05SGarrett Wollman 1217d0390e05SGarrett Wollman inp = sotoinpcb(so); 121814ba8addSRobert Watson KASSERT(inp != NULL, ("udp_detach: inp == NULL")); 1219a152f8a3SRobert Watson KASSERT(inp->inp_faddr.s_addr == INADDR_ANY, 1220a152f8a3SRobert Watson ("udp_detach: not disconnected")); 1221603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 12228501a69cSRobert Watson INP_WLOCK(inp); 1223d0390e05SGarrett Wollman in_pcbdetach(inp); 122414ba8addSRobert Watson in_pcbfree(inp); 1225603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 1226d0390e05SGarrett Wollman } 1227d0390e05SGarrett Wollman 1228d0390e05SGarrett Wollman static int 1229d0390e05SGarrett Wollman udp_disconnect(struct socket *so) 1230d0390e05SGarrett Wollman { 12318b615593SMarko Zec INIT_VNET_INET(so->so_vnet); 1232d0390e05SGarrett Wollman struct inpcb *inp; 1233d0390e05SGarrett Wollman 1234d0390e05SGarrett Wollman inp = sotoinpcb(so); 123514ba8addSRobert Watson KASSERT(inp != NULL, ("udp_disconnect: inp == NULL")); 1236603724d3SBjoern A. Zeeb INP_INFO_WLOCK(&V_udbinfo); 12378501a69cSRobert Watson INP_WLOCK(inp); 1238f76fcf6dSJeffrey Hsu if (inp->inp_faddr.s_addr == INADDR_ANY) { 12398501a69cSRobert Watson INP_WUNLOCK(inp); 1240603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 12413329b236SRobert Watson return (ENOTCONN); 1242f76fcf6dSJeffrey Hsu } 1243d0390e05SGarrett Wollman 1244df8bae1dSRodney W. Grimes in_pcbdisconnect(inp); 1245df8bae1dSRodney W. Grimes inp->inp_laddr.s_addr = INADDR_ANY; 1246d45e4f99SMaxim Konovalov SOCK_LOCK(so); 1247d45e4f99SMaxim Konovalov so->so_state &= ~SS_ISCONNECTED; /* XXX */ 1248d45e4f99SMaxim Konovalov SOCK_UNLOCK(so); 12498501a69cSRobert Watson INP_WUNLOCK(inp); 1250603724d3SBjoern A. Zeeb INP_INFO_WUNLOCK(&V_udbinfo); 12513329b236SRobert Watson return (0); 1252df8bae1dSRodney W. Grimes } 1253df8bae1dSRodney W. Grimes 1254d0390e05SGarrett Wollman static int 125557bf258eSGarrett Wollman udp_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *addr, 1256b40ce416SJulian Elischer struct mbuf *control, struct thread *td) 1257d0390e05SGarrett Wollman { 1258d0390e05SGarrett Wollman struct inpcb *inp; 1259d0390e05SGarrett Wollman 1260d0390e05SGarrett Wollman inp = sotoinpcb(so); 126114ba8addSRobert Watson KASSERT(inp != NULL, ("udp_send: inp == NULL")); 12623329b236SRobert Watson return (udp_output(inp, m, addr, control, td)); 1263d0390e05SGarrett Wollman } 1264d0390e05SGarrett Wollman 126576429de4SYoshinobu Inoue int 1266d0390e05SGarrett Wollman udp_shutdown(struct socket *so) 1267d0390e05SGarrett Wollman { 1268d0390e05SGarrett Wollman struct inpcb *inp; 1269d0390e05SGarrett Wollman 1270d0390e05SGarrett Wollman inp = sotoinpcb(so); 127114ba8addSRobert Watson KASSERT(inp != NULL, ("udp_shutdown: inp == NULL")); 12728501a69cSRobert Watson INP_WLOCK(inp); 1273d0390e05SGarrett Wollman socantsendmore(so); 12748501a69cSRobert Watson INP_WUNLOCK(inp); 12753329b236SRobert Watson return (0); 1276d0390e05SGarrett Wollman } 1277d0390e05SGarrett Wollman 1278d0390e05SGarrett Wollman struct pr_usrreqs udp_usrreqs = { 1279756d52a1SPoul-Henning Kamp .pru_abort = udp_abort, 1280756d52a1SPoul-Henning Kamp .pru_attach = udp_attach, 1281756d52a1SPoul-Henning Kamp .pru_bind = udp_bind, 1282756d52a1SPoul-Henning Kamp .pru_connect = udp_connect, 1283756d52a1SPoul-Henning Kamp .pru_control = in_control, 1284756d52a1SPoul-Henning Kamp .pru_detach = udp_detach, 1285756d52a1SPoul-Henning Kamp .pru_disconnect = udp_disconnect, 128654d642bbSRobert Watson .pru_peeraddr = in_getpeeraddr, 1287756d52a1SPoul-Henning Kamp .pru_send = udp_send, 12885df3e839SRobert Watson .pru_soreceive = soreceive_dgram, 128959b8854eSRobert Watson .pru_sosend = sosend_dgram, 1290756d52a1SPoul-Henning Kamp .pru_shutdown = udp_shutdown, 129154d642bbSRobert Watson .pru_sockaddr = in_getsockaddr, 1292a152f8a3SRobert Watson .pru_sosetlabel = in_pcbsosetlabel, 1293a152f8a3SRobert Watson .pru_close = udp_close, 1294d0390e05SGarrett Wollman }; 1295