xref: /freebsd/sys/netinet/udp_usrreq.c (revision 413628a7e3d23a897cd959638d325395e4c9691b)
1c398230bSWarner Losh /*-
26dfab5b1SGarrett Wollman  * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995
33329b236SRobert Watson  *	The Regents of the University of California.
43144b7d3SRobert Watson  * Copyright (c) 2008 Robert N. M. Watson
53329b236SRobert Watson  * All rights reserved.
6df8bae1dSRodney W. Grimes  *
7df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
8df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
9df8bae1dSRodney W. Grimes  * are met:
10df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
12df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
13df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
14df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
15df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
16df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
17df8bae1dSRodney W. Grimes  *    without specific prior written permission.
18df8bae1dSRodney W. Grimes  *
19df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
30df8bae1dSRodney W. Grimes  *
316dfab5b1SGarrett Wollman  *	@(#)udp_usrreq.c	8.6 (Berkeley) 5/23/95
32df8bae1dSRodney W. Grimes  */
33df8bae1dSRodney W. Grimes 
344b421e2dSMike Silbersack #include <sys/cdefs.h>
354b421e2dSMike Silbersack __FBSDID("$FreeBSD$");
364b421e2dSMike Silbersack 
370b4ae859SGleb Smirnoff #include "opt_ipfw.h"
38cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h"
39f5514f08SRobert Watson #include "opt_ipsec.h"
40bdb3fa18SRobert Watson #include "opt_mac.h"
41cfa1ca9dSYoshinobu Inoue 
42df8bae1dSRodney W. Grimes #include <sys/param.h>
43960ed29cSSeigo Tanimura #include <sys/domain.h>
444f590175SPaul Saab #include <sys/eventhandler.h>
45960ed29cSSeigo Tanimura #include <sys/jail.h>
46b110a8a2SGarrett Wollman #include <sys/kernel.h>
47960ed29cSSeigo Tanimura #include <sys/lock.h>
48df8bae1dSRodney W. Grimes #include <sys/malloc.h>
49df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
50acd3428bSRobert Watson #include <sys/priv.h>
51490d50b6SBrian Feldman #include <sys/proc.h>
52df8bae1dSRodney W. Grimes #include <sys/protosw.h>
53960ed29cSSeigo Tanimura #include <sys/signalvar.h>
54df8bae1dSRodney W. Grimes #include <sys/socket.h>
55df8bae1dSRodney W. Grimes #include <sys/socketvar.h>
56960ed29cSSeigo Tanimura #include <sys/sx.h>
57b5e8ce9fSBruce Evans #include <sys/sysctl.h>
58816a3d83SPoul-Henning Kamp #include <sys/syslog.h>
59f5514f08SRobert Watson #include <sys/systm.h>
60603724d3SBjoern A. Zeeb #include <sys/vimage.h>
618781d8e9SBruce Evans 
6269c2d429SJeff Roberson #include <vm/uma.h>
63df8bae1dSRodney W. Grimes 
64df8bae1dSRodney W. Grimes #include <net/if.h>
65df8bae1dSRodney W. Grimes #include <net/route.h>
66df8bae1dSRodney W. Grimes 
67df8bae1dSRodney W. Grimes #include <netinet/in.h>
68960ed29cSSeigo Tanimura #include <netinet/in_pcb.h>
69f5514f08SRobert Watson #include <netinet/in_systm.h>
70960ed29cSSeigo Tanimura #include <netinet/in_var.h>
71df8bae1dSRodney W. Grimes #include <netinet/ip.h>
72cfa1ca9dSYoshinobu Inoue #ifdef INET6
73cfa1ca9dSYoshinobu Inoue #include <netinet/ip6.h>
74cfa1ca9dSYoshinobu Inoue #endif
75960ed29cSSeigo Tanimura #include <netinet/ip_icmp.h>
76960ed29cSSeigo Tanimura #include <netinet/icmp_var.h>
77df8bae1dSRodney W. Grimes #include <netinet/ip_var.h>
78ef39adf0SAndre Oppermann #include <netinet/ip_options.h>
79cfa1ca9dSYoshinobu Inoue #ifdef INET6
80cfa1ca9dSYoshinobu Inoue #include <netinet6/ip6_var.h>
81cfa1ca9dSYoshinobu Inoue #endif
82df8bae1dSRodney W. Grimes #include <netinet/udp.h>
83df8bae1dSRodney W. Grimes #include <netinet/udp_var.h>
84df8bae1dSRodney W. Grimes 
85b2630c29SGeorge V. Neville-Neil #ifdef IPSEC
86b9234fafSSam Leffler #include <netipsec/ipsec.h>
873329b236SRobert Watson #endif
88b9234fafSSam Leffler 
89db4f9cc7SJonathan Lemon #include <machine/in_cksum.h>
90db4f9cc7SJonathan Lemon 
91aed55708SRobert Watson #include <security/mac/mac_framework.h>
92aed55708SRobert Watson 
93df8bae1dSRodney W. Grimes /*
94df8bae1dSRodney W. Grimes  * UDP protocol implementation.
95df8bae1dSRodney W. Grimes  * Per RFC 768, August, 1980.
96df8bae1dSRodney W. Grimes  */
9774eb3236SWarner Losh 
9844e33a07SMarko Zec #ifdef VIMAGE_GLOBALS
9944e33a07SMarko Zec int	udp_blackhole;
10044e33a07SMarko Zec #endif
10144e33a07SMarko Zec 
10274eb3236SWarner Losh /*
1033329b236SRobert Watson  * BSD 4.2 defaulted the udp checksum to be off.  Turning off udp checksums
1043329b236SRobert Watson  * removes the only data integrity mechanism for packets and malformed
105f5514f08SRobert Watson  * packets that would otherwise be discarded due to bad checksums, and may
106f5514f08SRobert Watson  * cause problems (especially for NFS data blocks).
10774eb3236SWarner Losh  */
108f5514f08SRobert Watson static int	udp_cksum = 1;
109f5514f08SRobert Watson SYSCTL_INT(_net_inet_udp, UDPCTL_CHECKSUM, checksum, CTLFLAG_RW, &udp_cksum,
11041698ebfSTom Rhodes     0, "compute udp checksum");
111df8bae1dSRodney W. Grimes 
112afdb4274SRobert Watson int	udp_log_in_vain = 0;
113816a3d83SPoul-Henning Kamp SYSCTL_INT(_net_inet_udp, OID_AUTO, log_in_vain, CTLFLAG_RW,
114afdb4274SRobert Watson     &udp_log_in_vain, 0, "Log all incoming UDP packets");
115816a3d83SPoul-Henning Kamp 
11697021c24SMarko Zec SYSCTL_V_INT(V_NET, vnet_inet, _net_inet_udp, OID_AUTO, blackhole,
11797021c24SMarko Zec     CTLFLAG_RW, udp_blackhole, 0,
1183329b236SRobert Watson     "Do not send port unreachables for refused connects");
11916f7f31fSGeoff Rehmet 
12043bbb6aaSRobert Watson u_long	udp_sendspace = 9216;		/* really max datagram size */
12143bbb6aaSRobert Watson 					/* 40 1K datagrams */
12243bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_MAXDGRAM, maxdgram, CTLFLAG_RW,
12343bbb6aaSRobert Watson     &udp_sendspace, 0, "Maximum outgoing UDP datagram size");
12443bbb6aaSRobert Watson 
12543bbb6aaSRobert Watson u_long	udp_recvspace = 40 * (1024 +
12643bbb6aaSRobert Watson #ifdef INET6
12743bbb6aaSRobert Watson 				      sizeof(struct sockaddr_in6)
12843bbb6aaSRobert Watson #else
12943bbb6aaSRobert Watson 				      sizeof(struct sockaddr_in)
13043bbb6aaSRobert Watson #endif
13143bbb6aaSRobert Watson 				      );
13243bbb6aaSRobert Watson 
13343bbb6aaSRobert Watson SYSCTL_ULONG(_net_inet_udp, UDPCTL_RECVSPACE, recvspace, CTLFLAG_RW,
13443bbb6aaSRobert Watson     &udp_recvspace, 0, "Maximum space for incoming UDP datagrams");
13543bbb6aaSRobert Watson 
13644e33a07SMarko Zec #ifdef VIMAGE_GLOBALS
13776429de4SYoshinobu Inoue struct inpcbhead	udb;		/* from udp_var.h */
1387a2aab80SBrian Feldman struct inpcbinfo	udbinfo;
13944e33a07SMarko Zec struct udpstat		udpstat;	/* from udp_var.h */
14044e33a07SMarko Zec #endif
14115bd2b43SDavid Greenman 
14215bd2b43SDavid Greenman #ifndef UDBHASHSIZE
143e2ed8f35SAlexander Motin #define	UDBHASHSIZE	128
14415bd2b43SDavid Greenman #endif
14515bd2b43SDavid Greenman 
1468b615593SMarko Zec SYSCTL_V_STRUCT(V_NET, vnet_inet, _net_inet_udp, UDPCTL_STATS, stats,
1478b615593SMarko Zec     CTLFLAG_RW, udpstat, udpstat,
1488b615593SMarko Zec     "UDP statistics (struct udpstat, netinet/udp_var.h)");
149f2ea20e6SGarrett Wollman 
150bc725eafSRobert Watson static void	udp_detach(struct socket *so);
1514d77a549SAlfred Perlstein static int	udp_output(struct inpcb *, struct mbuf *, struct sockaddr *,
1524d77a549SAlfred Perlstein 		    struct mbuf *, struct thread *);
153df8bae1dSRodney W. Grimes 
1544f590175SPaul Saab static void
1554f590175SPaul Saab udp_zone_change(void *tag)
1564f590175SPaul Saab {
1574f590175SPaul Saab 
158603724d3SBjoern A. Zeeb 	uma_zone_set_max(V_udbinfo.ipi_zone, maxsockets);
1594f590175SPaul Saab }
1604f590175SPaul Saab 
/*
 * Initialisation hook handed to uma_zcreate() for the UDP pcb zone: set up
 * the lock embedded in the inpcb stored at 'mem'.  'size' and 'flags' are
 * not consulted.  Always returns 0.
 */
static int
udp_inpcb_init(void *mem, int size, int flags)
{
	struct inpcb *pcb = mem;

	INP_LOCK_INIT(pcb, "inp", "udpinp");
	return (0);
}
170d915b280SStephan Uphoff 
171df8bae1dSRodney W. Grimes void
172af1ee11dSRobert Watson udp_init(void)
173df8bae1dSRodney W. Grimes {
1748b615593SMarko Zec 	INIT_VNET_INET(curvnet);
175af1ee11dSRobert Watson 
17644e33a07SMarko Zec 	V_udp_blackhole = 0;
17744e33a07SMarko Zec 
178603724d3SBjoern A. Zeeb 	INP_INFO_LOCK_INIT(&V_udbinfo, "udp");
179603724d3SBjoern A. Zeeb 	LIST_INIT(&V_udb);
1802c0d658fSJulian Elischer 	V_udbinfo.ipi_listhead = &V_udb;
181603724d3SBjoern A. Zeeb 	V_udbinfo.ipi_hashbase = hashinit(UDBHASHSIZE, M_PCB,
182603724d3SBjoern A. Zeeb 	    &V_udbinfo.ipi_hashmask);
183603724d3SBjoern A. Zeeb 	V_udbinfo.ipi_porthashbase = hashinit(UDBHASHSIZE, M_PCB,
184603724d3SBjoern A. Zeeb 	    &V_udbinfo.ipi_porthashmask);
185603724d3SBjoern A. Zeeb 	V_udbinfo.ipi_zone = uma_zcreate("udpcb", sizeof(struct inpcb), NULL,
186d915b280SStephan Uphoff 	    NULL, udp_inpcb_init, NULL, UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
187603724d3SBjoern A. Zeeb 	uma_zone_set_max(V_udbinfo.ipi_zone, maxsockets);
1884f590175SPaul Saab 	EVENTHANDLER_REGISTER(maxsockets_change, udp_zone_change, NULL,
1894f590175SPaul Saab 	    EVENTHANDLER_PRI_ANY);
190df8bae1dSRodney W. Grimes }
191df8bae1dSRodney W. Grimes 
19243bbb6aaSRobert Watson /*
19343bbb6aaSRobert Watson  * Subroutine of udp_input(), which appends the provided mbuf chain to the
19443bbb6aaSRobert Watson  * passed pcb/socket.  The caller must provide a sockaddr_in via udp_in that
19543bbb6aaSRobert Watson  * contains the source address.  If the socket ends up being an IPv6 socket,
19643bbb6aaSRobert Watson  * udp_append() will convert to a sockaddr_in6 before passing the address
19743bbb6aaSRobert Watson  * into the socket code.
19843bbb6aaSRobert Watson  */
19943bbb6aaSRobert Watson static void
20043bbb6aaSRobert Watson udp_append(struct inpcb *inp, struct ip *ip, struct mbuf *n, int off,
20143bbb6aaSRobert Watson     struct sockaddr_in *udp_in)
20243bbb6aaSRobert Watson {
20343bbb6aaSRobert Watson 	struct sockaddr *append_sa;
20443bbb6aaSRobert Watson 	struct socket *so;
20543bbb6aaSRobert Watson 	struct mbuf *opts = 0;
20643bbb6aaSRobert Watson #ifdef INET6
20743bbb6aaSRobert Watson 	struct sockaddr_in6 udp_in6;
20843bbb6aaSRobert Watson #endif
20943bbb6aaSRobert Watson 
210119d85f6SRobert Watson 	INP_RLOCK_ASSERT(inp);
21143bbb6aaSRobert Watson 
21243bbb6aaSRobert Watson #ifdef IPSEC
21343bbb6aaSRobert Watson 	/* Check AH/ESP integrity. */
21443bbb6aaSRobert Watson 	if (ipsec4_in_reject(n, inp)) {
2158b615593SMarko Zec 		INIT_VNET_IPSEC(curvnet);
21643bbb6aaSRobert Watson 		m_freem(n);
217603724d3SBjoern A. Zeeb 		V_ipsec4stat.in_polvio++;
21843bbb6aaSRobert Watson 		return;
21943bbb6aaSRobert Watson 	}
22043bbb6aaSRobert Watson #endif /* IPSEC */
22143bbb6aaSRobert Watson #ifdef MAC
22230d239bcSRobert Watson 	if (mac_inpcb_check_deliver(inp, n) != 0) {
22343bbb6aaSRobert Watson 		m_freem(n);
22443bbb6aaSRobert Watson 		return;
22543bbb6aaSRobert Watson 	}
22643bbb6aaSRobert Watson #endif
22743bbb6aaSRobert Watson 	if (inp->inp_flags & INP_CONTROLOPTS ||
22843bbb6aaSRobert Watson 	    inp->inp_socket->so_options & (SO_TIMESTAMP | SO_BINTIME)) {
22943bbb6aaSRobert Watson #ifdef INET6
2309a38ba81SBjoern A. Zeeb 		if (inp->inp_vflag & INP_IPV6)
23148d48eb9SBjoern A. Zeeb 			(void)ip6_savecontrol_v4(inp, n, &opts, NULL);
2329a38ba81SBjoern A. Zeeb 		else
23343bbb6aaSRobert Watson #endif
23443bbb6aaSRobert Watson 			ip_savecontrol(inp, &opts, ip, n);
23543bbb6aaSRobert Watson 	}
23643bbb6aaSRobert Watson #ifdef INET6
23743bbb6aaSRobert Watson 	if (inp->inp_vflag & INP_IPV6) {
23843bbb6aaSRobert Watson 		bzero(&udp_in6, sizeof(udp_in6));
23943bbb6aaSRobert Watson 		udp_in6.sin6_len = sizeof(udp_in6);
24043bbb6aaSRobert Watson 		udp_in6.sin6_family = AF_INET6;
24143bbb6aaSRobert Watson 		in6_sin_2_v4mapsin6(udp_in, &udp_in6);
24243bbb6aaSRobert Watson 		append_sa = (struct sockaddr *)&udp_in6;
24343bbb6aaSRobert Watson 	} else
24443bbb6aaSRobert Watson #endif
24543bbb6aaSRobert Watson 		append_sa = (struct sockaddr *)udp_in;
24643bbb6aaSRobert Watson 	m_adj(n, off);
24743bbb6aaSRobert Watson 
24843bbb6aaSRobert Watson 	so = inp->inp_socket;
24943bbb6aaSRobert Watson 	SOCKBUF_LOCK(&so->so_rcv);
25043bbb6aaSRobert Watson 	if (sbappendaddr_locked(&so->so_rcv, append_sa, n, opts) == 0) {
2518b615593SMarko Zec 		INIT_VNET_INET(so->so_vnet);
25243bbb6aaSRobert Watson 		SOCKBUF_UNLOCK(&so->so_rcv);
25343bbb6aaSRobert Watson 		m_freem(n);
25443bbb6aaSRobert Watson 		if (opts)
25543bbb6aaSRobert Watson 			m_freem(opts);
256603724d3SBjoern A. Zeeb 		V_udpstat.udps_fullsock++;
25743bbb6aaSRobert Watson 	} else
25843bbb6aaSRobert Watson 		sorwakeup_locked(so);
25943bbb6aaSRobert Watson }
26043bbb6aaSRobert Watson 
261df8bae1dSRodney W. Grimes void
2623329b236SRobert Watson udp_input(struct mbuf *m, int off)
263df8bae1dSRodney W. Grimes {
2648b615593SMarko Zec 	INIT_VNET_INET(curvnet);
265cfa1ca9dSYoshinobu Inoue 	int iphlen = off;
2663329b236SRobert Watson 	struct ip *ip;
2673329b236SRobert Watson 	struct udphdr *uh;
26871498f30SBruce M Simpson 	struct ifnet *ifp;
2693329b236SRobert Watson 	struct inpcb *inp;
270df8bae1dSRodney W. Grimes 	int len;
271df8bae1dSRodney W. Grimes 	struct ip save_ip;
272d4b509bdSRobert Watson 	struct sockaddr_in udp_in;
2730b4ae859SGleb Smirnoff #ifdef IPFIREWALL_FORWARD
2740b4ae859SGleb Smirnoff 	struct m_tag *fwd_tag;
2750b4ae859SGleb Smirnoff #endif
276df8bae1dSRodney W. Grimes 
27771498f30SBruce M Simpson 	ifp = m->m_pkthdr.rcvif;
278603724d3SBjoern A. Zeeb 	V_udpstat.udps_ipackets++;
279df8bae1dSRodney W. Grimes 
280df8bae1dSRodney W. Grimes 	/*
2813329b236SRobert Watson 	 * Strip IP options, if any; should skip this, make available to
2823329b236SRobert Watson 	 * user, and use on returned packets, but we don't yet have a way to
2833329b236SRobert Watson 	 * check the checksum with options still present.
284df8bae1dSRodney W. Grimes 	 */
285df8bae1dSRodney W. Grimes 	if (iphlen > sizeof (struct ip)) {
286df8bae1dSRodney W. Grimes 		ip_stripoptions(m, (struct mbuf *)0);
287df8bae1dSRodney W. Grimes 		iphlen = sizeof(struct ip);
288df8bae1dSRodney W. Grimes 	}
289df8bae1dSRodney W. Grimes 
290df8bae1dSRodney W. Grimes 	/*
291df8bae1dSRodney W. Grimes 	 * Get IP and UDP header together in first mbuf.
292df8bae1dSRodney W. Grimes 	 */
293df8bae1dSRodney W. Grimes 	ip = mtod(m, struct ip *);
294df8bae1dSRodney W. Grimes 	if (m->m_len < iphlen + sizeof(struct udphdr)) {
295df8bae1dSRodney W. Grimes 		if ((m = m_pullup(m, iphlen + sizeof(struct udphdr))) == 0) {
296603724d3SBjoern A. Zeeb 			V_udpstat.udps_hdrops++;
297df8bae1dSRodney W. Grimes 			return;
298df8bae1dSRodney W. Grimes 		}
299df8bae1dSRodney W. Grimes 		ip = mtod(m, struct ip *);
300df8bae1dSRodney W. Grimes 	}
301df8bae1dSRodney W. Grimes 	uh = (struct udphdr *)((caddr_t)ip + iphlen);
302df8bae1dSRodney W. Grimes 
3033329b236SRobert Watson 	/*
3043329b236SRobert Watson 	 * Destination port of 0 is illegal, based on RFC768.
3053329b236SRobert Watson 	 */
306686cdd19SJun-ichiro itojun Hagino 	if (uh->uh_dport == 0)
307f76fcf6dSJeffrey Hsu 		goto badunlocked;
308686cdd19SJun-ichiro itojun Hagino 
309df8bae1dSRodney W. Grimes 	/*
3103329b236SRobert Watson 	 * Construct sockaddr format source address.  Stuff source address
3113329b236SRobert Watson 	 * and datagram in user buffer.
312b9234fafSSam Leffler 	 */
313d4b509bdSRobert Watson 	bzero(&udp_in, sizeof(udp_in));
314d4b509bdSRobert Watson 	udp_in.sin_len = sizeof(udp_in);
315d4b509bdSRobert Watson 	udp_in.sin_family = AF_INET;
316b9234fafSSam Leffler 	udp_in.sin_port = uh->uh_sport;
317b9234fafSSam Leffler 	udp_in.sin_addr = ip->ip_src;
318b9234fafSSam Leffler 
319b9234fafSSam Leffler 	/*
320af1ee11dSRobert Watson 	 * Make mbuf data length reflect UDP length.  If not enough data to
321af1ee11dSRobert Watson 	 * reflect UDP length, drop.
322df8bae1dSRodney W. Grimes 	 */
323df8bae1dSRodney W. Grimes 	len = ntohs((u_short)uh->uh_ulen);
324df8bae1dSRodney W. Grimes 	if (ip->ip_len != len) {
3257eb7a449SAndras Olah 		if (len > ip->ip_len || len < sizeof(struct udphdr)) {
326603724d3SBjoern A. Zeeb 			V_udpstat.udps_badlen++;
327f76fcf6dSJeffrey Hsu 			goto badunlocked;
328df8bae1dSRodney W. Grimes 		}
329df8bae1dSRodney W. Grimes 		m_adj(m, len - ip->ip_len);
330df8bae1dSRodney W. Grimes 		/* ip->ip_len = len; */
331df8bae1dSRodney W. Grimes 	}
3323329b236SRobert Watson 
333df8bae1dSRodney W. Grimes 	/*
3343329b236SRobert Watson 	 * Save a copy of the IP header in case we want restore it for
3353329b236SRobert Watson 	 * sending an ICMP error message in response.
336df8bae1dSRodney W. Grimes 	 */
337603724d3SBjoern A. Zeeb 	if (!V_udp_blackhole)
338df8bae1dSRodney W. Grimes 		save_ip = *ip;
339cce418d3SMatt Jacob 	else
340cce418d3SMatt Jacob 		memset(&save_ip, 0, sizeof(save_ip));
341df8bae1dSRodney W. Grimes 
342df8bae1dSRodney W. Grimes 	/*
343df8bae1dSRodney W. Grimes 	 * Checksum extended UDP header and data.
344df8bae1dSRodney W. Grimes 	 */
3456dfab5b1SGarrett Wollman 	if (uh->uh_sum) {
34639629c92SDavid Malone 		u_short uh_sum;
34739629c92SDavid Malone 
348db4f9cc7SJonathan Lemon 		if (m->m_pkthdr.csum_flags & CSUM_DATA_VALID) {
349db4f9cc7SJonathan Lemon 			if (m->m_pkthdr.csum_flags & CSUM_PSEUDO_HDR)
35039629c92SDavid Malone 				uh_sum = m->m_pkthdr.csum_data;
351db4f9cc7SJonathan Lemon 			else
35239629c92SDavid Malone 				uh_sum = in_pseudo(ip->ip_src.s_addr,
353506f4949SRuslan Ermilov 				    ip->ip_dst.s_addr, htonl((u_short)len +
354db4f9cc7SJonathan Lemon 				    m->m_pkthdr.csum_data + IPPROTO_UDP));
35539629c92SDavid Malone 			uh_sum ^= 0xffff;
356db4f9cc7SJonathan Lemon 		} else {
357cb342100SHajimu UMEMOTO 			char b[9];
358af1ee11dSRobert Watson 
359cb342100SHajimu UMEMOTO 			bcopy(((struct ipovly *)ip)->ih_x1, b, 9);
3606effc713SDoug Rabson 			bzero(((struct ipovly *)ip)->ih_x1, 9);
361df8bae1dSRodney W. Grimes 			((struct ipovly *)ip)->ih_len = uh->uh_ulen;
36239629c92SDavid Malone 			uh_sum = in_cksum(m, len + sizeof (struct ip));
363cb342100SHajimu UMEMOTO 			bcopy(b, ((struct ipovly *)ip)->ih_x1, 9);
364db4f9cc7SJonathan Lemon 		}
36539629c92SDavid Malone 		if (uh_sum) {
366603724d3SBjoern A. Zeeb 			V_udpstat.udps_badsum++;
367df8bae1dSRodney W. Grimes 			m_freem(m);
368df8bae1dSRodney W. Grimes 			return;
369df8bae1dSRodney W. Grimes 		}
370fb9aaba0SRuslan Ermilov 	} else
371603724d3SBjoern A. Zeeb 		V_udpstat.udps_nosum++;
372df8bae1dSRodney W. Grimes 
3730b4ae859SGleb Smirnoff #ifdef IPFIREWALL_FORWARD
3743329b236SRobert Watson 	/*
3753329b236SRobert Watson 	 * Grab info from PACKET_TAG_IPFORWARD tag prepended to the chain.
3763329b236SRobert Watson 	 */
3770b4ae859SGleb Smirnoff 	fwd_tag = m_tag_find(m, PACKET_TAG_IPFORWARD, NULL);
3780b4ae859SGleb Smirnoff 	if (fwd_tag != NULL) {
3790b4ae859SGleb Smirnoff 		struct sockaddr_in *next_hop;
3800b4ae859SGleb Smirnoff 
3813329b236SRobert Watson 		/*
3823329b236SRobert Watson 		 * Do the hack.
3833329b236SRobert Watson 		 */
3840b4ae859SGleb Smirnoff 		next_hop = (struct sockaddr_in *)(fwd_tag + 1);
3850b4ae859SGleb Smirnoff 		ip->ip_dst = next_hop->sin_addr;
3860b4ae859SGleb Smirnoff 		uh->uh_dport = ntohs(next_hop->sin_port);
3873329b236SRobert Watson 
3883329b236SRobert Watson 		/*
3893329b236SRobert Watson 		 * Remove the tag from the packet.  We don't need it anymore.
3903329b236SRobert Watson 		 */
3910b4ae859SGleb Smirnoff 		m_tag_delete(m, fwd_tag);
3920b4ae859SGleb Smirnoff 	}
3930b4ae859SGleb Smirnoff #endif
3940b4ae859SGleb Smirnoff 
395603724d3SBjoern A. Zeeb 	INP_INFO_RLOCK(&V_udbinfo);
396df8bae1dSRodney W. Grimes 	if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) ||
39771498f30SBruce M Simpson 	    in_broadcast(ip->ip_dst, ifp)) {
39882c23ebaSBill Fenner 		struct inpcb *last;
39971498f30SBruce M Simpson 		struct ip_moptions *imo;
4003329b236SRobert Watson 
401df8bae1dSRodney W. Grimes 		last = NULL;
402603724d3SBjoern A. Zeeb 		LIST_FOREACH(inp, &V_udb, inp_list) {
4039c1df695SRobert Watson 			if (inp->inp_lport != uh->uh_dport)
404f76fcf6dSJeffrey Hsu 				continue;
405cfa1ca9dSYoshinobu Inoue #ifdef INET6
406369dc8ceSEivind Eklund 			if ((inp->inp_vflag & INP_IPV4) == 0)
4079c1df695SRobert Watson 				continue;
408cfa1ca9dSYoshinobu Inoue #endif
40971498f30SBruce M Simpson 			if (inp->inp_laddr.s_addr != INADDR_ANY &&
41071498f30SBruce M Simpson 			    inp->inp_laddr.s_addr != ip->ip_dst.s_addr)
4119c1df695SRobert Watson 				continue;
41271498f30SBruce M Simpson 			if (inp->inp_faddr.s_addr != INADDR_ANY &&
41371498f30SBruce M Simpson 			    inp->inp_faddr.s_addr != ip->ip_src.s_addr)
41471498f30SBruce M Simpson 				continue;
41571498f30SBruce M Simpson 			/*
41671498f30SBruce M Simpson 			 * XXX: Do not check source port of incoming datagram
41771498f30SBruce M Simpson 			 * unless inp_connect() has been called to bind the
41871498f30SBruce M Simpson 			 * fport part of the 4-tuple; the source could be
41971498f30SBruce M Simpson 			 * trying to talk to us with an ephemeral port.
42071498f30SBruce M Simpson 			 */
42171498f30SBruce M Simpson 			if (inp->inp_fport != 0 &&
422df8bae1dSRodney W. Grimes 			    inp->inp_fport != uh->uh_sport)
4239c1df695SRobert Watson 				continue;
42471498f30SBruce M Simpson 
425119d85f6SRobert Watson 			INP_RLOCK(inp);
426df8bae1dSRodney W. Grimes 
42783453a06SBruce M Simpson 			/*
42871498f30SBruce M Simpson 			 * Handle socket delivery policy for any-source
42971498f30SBruce M Simpson 			 * and source-specific multicast. [RFC3678]
43083453a06SBruce M Simpson 			 */
43171498f30SBruce M Simpson 			imo = inp->inp_moptions;
43271498f30SBruce M Simpson 			if (IN_MULTICAST(ntohl(ip->ip_dst.s_addr)) &&
43371498f30SBruce M Simpson 			    imo != NULL) {
43471498f30SBruce M Simpson 				struct sockaddr_in	 sin;
43571498f30SBruce M Simpson 				struct in_msource	*ims;
43671498f30SBruce M Simpson 				int			 blocked, mode;
43771498f30SBruce M Simpson 				size_t			 idx;
43883453a06SBruce M Simpson 
43971498f30SBruce M Simpson 				bzero(&sin, sizeof(struct sockaddr_in));
44071498f30SBruce M Simpson 				sin.sin_len = sizeof(struct sockaddr_in);
44171498f30SBruce M Simpson 				sin.sin_family = AF_INET;
44271498f30SBruce M Simpson 				sin.sin_addr = ip->ip_dst;
44371498f30SBruce M Simpson 
44471498f30SBruce M Simpson 				blocked = 0;
44571498f30SBruce M Simpson 				idx = imo_match_group(imo, ifp,
44671498f30SBruce M Simpson 				    (struct sockaddr *)&sin);
44771498f30SBruce M Simpson 				if (idx == -1) {
44871498f30SBruce M Simpson 					/*
44971498f30SBruce M Simpson 					 * No group membership for this socket.
45071498f30SBruce M Simpson 					 * Do not bump udps_noportbcast, as
45171498f30SBruce M Simpson 					 * this will happen further down.
45271498f30SBruce M Simpson 					 */
45371498f30SBruce M Simpson 					blocked++;
45471498f30SBruce M Simpson 				} else {
45571498f30SBruce M Simpson 					/*
45671498f30SBruce M Simpson 					 * Check for a multicast source filter
45771498f30SBruce M Simpson 					 * entry on this socket for this group.
45871498f30SBruce M Simpson 					 * MCAST_EXCLUDE is the default
45971498f30SBruce M Simpson 					 * behaviour.  It means default accept;
46071498f30SBruce M Simpson 					 * entries, if present, denote sources
46171498f30SBruce M Simpson 					 * to be excluded from delivery.
46271498f30SBruce M Simpson 					 */
46371498f30SBruce M Simpson 					ims = imo_match_source(imo, idx,
46471498f30SBruce M Simpson 					    (struct sockaddr *)&udp_in);
46571498f30SBruce M Simpson 					mode = imo->imo_mfilters[idx].imf_fmode;
46671498f30SBruce M Simpson 					if ((ims != NULL &&
46771498f30SBruce M Simpson 					     mode == MCAST_EXCLUDE) ||
46871498f30SBruce M Simpson 					    (ims == NULL &&
46971498f30SBruce M Simpson 					     mode == MCAST_INCLUDE)) {
47071498f30SBruce M Simpson #ifdef DIAGNOSTIC
47171498f30SBruce M Simpson 						if (bootverbose) {
47271498f30SBruce M Simpson 							printf("%s: blocked by"
47371498f30SBruce M Simpson 							    " source filter\n",
47471498f30SBruce M Simpson 							    __func__);
47571498f30SBruce M Simpson 						}
47671498f30SBruce M Simpson #endif
477603724d3SBjoern A. Zeeb 						V_udpstat.udps_filtermcast++;
47871498f30SBruce M Simpson 						blocked++;
47983453a06SBruce M Simpson 					}
48083453a06SBruce M Simpson 				}
48171498f30SBruce M Simpson 				if (blocked != 0) {
482119d85f6SRobert Watson 					INP_RUNLOCK(inp);
4839c1df695SRobert Watson 					continue;
4849c1df695SRobert Watson 				}
48583453a06SBruce M Simpson 			}
486df8bae1dSRodney W. Grimes 			if (last != NULL) {
487df8bae1dSRodney W. Grimes 				struct mbuf *n;
488df8bae1dSRodney W. Grimes 
489032dcc76SLuigi Rizzo 				n = m_copy(m, 0, M_COPYALL);
490365433d9SRobert Watson 				if (n != NULL)
4913329b236SRobert Watson 					udp_append(last, ip, n, iphlen +
4923329b236SRobert Watson 					    sizeof(struct udphdr), &udp_in);
493119d85f6SRobert Watson 				INP_RUNLOCK(last);
494df8bae1dSRodney W. Grimes 			}
49582c23ebaSBill Fenner 			last = inp;
496df8bae1dSRodney W. Grimes 			/*
497df8bae1dSRodney W. Grimes 			 * Don't look for additional matches if this one does
498df8bae1dSRodney W. Grimes 			 * not have either the SO_REUSEPORT or SO_REUSEADDR
4993329b236SRobert Watson 			 * socket options set.  This heuristic avoids
5003329b236SRobert Watson 			 * searching through all pcbs in the common case of a
5013329b236SRobert Watson 			 * non-shared port.  It assumes that an application
5023329b236SRobert Watson 			 * will never clear these options after setting them.
503df8bae1dSRodney W. Grimes 			 */
5043329b236SRobert Watson 			if ((last->inp_socket->so_options &
5053329b236SRobert Watson 			    (SO_REUSEPORT|SO_REUSEADDR)) == 0)
506df8bae1dSRodney W. Grimes 				break;
507df8bae1dSRodney W. Grimes 		}
508df8bae1dSRodney W. Grimes 
509df8bae1dSRodney W. Grimes 		if (last == NULL) {
510df8bae1dSRodney W. Grimes 			/*
5113329b236SRobert Watson 			 * No matching pcb found; discard datagram.  (No need
5123329b236SRobert Watson 			 * to send an ICMP Port Unreachable for a broadcast
5133329b236SRobert Watson 			 * or multicast datgram.)
514df8bae1dSRodney W. Grimes 			 */
515603724d3SBjoern A. Zeeb 			V_udpstat.udps_noportbcast++;
51661ffc0b1SJeffrey Hsu 			goto badheadlocked;
517df8bae1dSRodney W. Grimes 		}
518d4b509bdSRobert Watson 		udp_append(last, ip, m, iphlen + sizeof(struct udphdr),
519d4b509bdSRobert Watson 		    &udp_in);
520119d85f6SRobert Watson 		INP_RUNLOCK(last);
521603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
522df8bae1dSRodney W. Grimes 		return;
523df8bae1dSRodney W. Grimes 	}
5243329b236SRobert Watson 
525df8bae1dSRodney W. Grimes 	/*
5266d6a026bSDavid Greenman 	 * Locate pcb for datagram.
527df8bae1dSRodney W. Grimes 	 */
528603724d3SBjoern A. Zeeb 	inp = in_pcblookup_hash(&V_udbinfo, ip->ip_src, uh->uh_sport,
52971498f30SBruce M Simpson 	    ip->ip_dst, uh->uh_dport, 1, ifp);
53015bd2b43SDavid Greenman 	if (inp == NULL) {
531afdb4274SRobert Watson 		if (udp_log_in_vain) {
532df5c0b8aSBill Fenner 			char buf[4*sizeof "123"];
53375cfc95fSAndrey A. Chernov 
53475cfc95fSAndrey A. Chernov 			strcpy(buf, inet_ntoa(ip->ip_dst));
535592071e8SBruce Evans 			log(LOG_INFO,
536592071e8SBruce Evans 			    "Connection attempt to UDP %s:%d from %s:%d\n",
537592071e8SBruce Evans 			    buf, ntohs(uh->uh_dport), inet_ntoa(ip->ip_src),
538592071e8SBruce Evans 			    ntohs(uh->uh_sport));
53975cfc95fSAndrey A. Chernov 		}
540603724d3SBjoern A. Zeeb 		V_udpstat.udps_noport++;
541df8bae1dSRodney W. Grimes 		if (m->m_flags & (M_BCAST | M_MCAST)) {
542603724d3SBjoern A. Zeeb 			V_udpstat.udps_noportbcast++;
54361ffc0b1SJeffrey Hsu 			goto badheadlocked;
544df8bae1dSRodney W. Grimes 		}
545603724d3SBjoern A. Zeeb 		if (V_udp_blackhole)
54661ffc0b1SJeffrey Hsu 			goto badheadlocked;
5471cbd978eSLuigi Rizzo 		if (badport_bandlim(BANDLIM_ICMP_UNREACH) < 0)
5481cbd978eSLuigi Rizzo 			goto badheadlocked;
54904287599SRuslan Ermilov 		*ip = save_ip;
55004287599SRuslan Ermilov 		ip->ip_len += iphlen;
551582a7760SBruce Evans 		icmp_error(m, ICMP_UNREACH, ICMP_UNREACH_PORT, 0, 0);
552603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
553df8bae1dSRodney W. Grimes 		return;
554df8bae1dSRodney W. Grimes 	}
5553329b236SRobert Watson 
5563329b236SRobert Watson 	/*
5573329b236SRobert Watson 	 * Check the minimum TTL for socket.
5583329b236SRobert Watson 	 */
559119d85f6SRobert Watson 	INP_RLOCK(inp);
560603724d3SBjoern A. Zeeb 	INP_INFO_RUNLOCK(&V_udbinfo);
56110cc62b7SRobert Watson 	if (inp->inp_ip_minttl && inp->inp_ip_minttl > ip->ip_ttl) {
56210cc62b7SRobert Watson 		INP_RUNLOCK(inp);
56310cc62b7SRobert Watson 		goto badunlocked;
56410cc62b7SRobert Watson 	}
565d4b509bdSRobert Watson 	udp_append(inp, ip, m, iphlen + sizeof(struct udphdr), &udp_in);
566119d85f6SRobert Watson 	INP_RUNLOCK(inp);
567df8bae1dSRodney W. Grimes 	return;
56861ffc0b1SJeffrey Hsu 
56961ffc0b1SJeffrey Hsu badheadlocked:
570f76fcf6dSJeffrey Hsu 	if (inp)
571119d85f6SRobert Watson 		INP_RUNLOCK(inp);
572603724d3SBjoern A. Zeeb 	INP_INFO_RUNLOCK(&V_udbinfo);
573f76fcf6dSJeffrey Hsu badunlocked:
574df8bae1dSRodney W. Grimes 	m_freem(m);
575cfa1ca9dSYoshinobu Inoue }
576cfa1ca9dSYoshinobu Inoue 
577cfa1ca9dSYoshinobu Inoue /*
5783329b236SRobert Watson  * Notify a udp user of an asynchronous error; just wake up so that they can
5793329b236SRobert Watson  * collect error status.
580df8bae1dSRodney W. Grimes  */
5813ce144eaSJeffrey Hsu struct inpcb *
5823329b236SRobert Watson udp_notify(struct inpcb *inp, int errno)
583df8bae1dSRodney W. Grimes {
5843329b236SRobert Watson 
585ac9ae279SRobert Watson 	/*
586ac9ae279SRobert Watson 	 * While udp_ctlinput() always calls udp_notify() with a read lock
587ac9ae279SRobert Watson 	 * when invoking it directly, in_pcbnotifyall() currently uses write
588ac9ae279SRobert Watson 	 * locks due to sharing code with TCP.  For now, accept either a read
589ac9ae279SRobert Watson 	 * or a write lock, but a read lock is sufficient.
590ac9ae279SRobert Watson 	 */
591ac9ae279SRobert Watson 	INP_LOCK_ASSERT(inp);
5928501a69cSRobert Watson 
593df8bae1dSRodney W. Grimes 	inp->inp_socket->so_error = errno;
594df8bae1dSRodney W. Grimes 	sorwakeup(inp->inp_socket);
595df8bae1dSRodney W. Grimes 	sowwakeup(inp->inp_socket);
5963329b236SRobert Watson 	return (inp);
597df8bae1dSRodney W. Grimes }
598df8bae1dSRodney W. Grimes 
599df8bae1dSRodney W. Grimes void
6003329b236SRobert Watson udp_ctlinput(int cmd, struct sockaddr *sa, void *vip)
601df8bae1dSRodney W. Grimes {
6028b615593SMarko Zec 	INIT_VNET_INET(curvnet);
603c693a045SJonathan Lemon 	struct ip *ip = vip;
604c693a045SJonathan Lemon 	struct udphdr *uh;
605c693a045SJonathan Lemon 	struct in_addr faddr;
606c693a045SJonathan Lemon 	struct inpcb *inp;
607c693a045SJonathan Lemon 
608c693a045SJonathan Lemon 	faddr = ((struct sockaddr_in *)sa)->sin_addr;
609c693a045SJonathan Lemon 	if (sa->sa_family != AF_INET || faddr.s_addr == INADDR_ANY)
610c693a045SJonathan Lemon 		return;
611df8bae1dSRodney W. Grimes 
61297d8d152SAndre Oppermann 	/*
61397d8d152SAndre Oppermann 	 * Redirects don't need to be handled up here.
61497d8d152SAndre Oppermann 	 */
61597d8d152SAndre Oppermann 	if (PRC_IS_REDIRECT(cmd))
61697d8d152SAndre Oppermann 		return;
6173329b236SRobert Watson 
61897d8d152SAndre Oppermann 	/*
61997d8d152SAndre Oppermann 	 * Hostdead is ugly because it goes linearly through all PCBs.
6203329b236SRobert Watson 	 *
6213329b236SRobert Watson 	 * XXX: We never get this from ICMP, otherwise it makes an excellent
6223329b236SRobert Watson 	 * DoS attack on machines with many connections.
62397d8d152SAndre Oppermann 	 */
62497d8d152SAndre Oppermann 	if (cmd == PRC_HOSTDEAD)
625af1ee11dSRobert Watson 		ip = NULL;
626d1c54148SJesper Skriver 	else if ((unsigned)cmd >= PRC_NCMDS || inetctlerrmap[cmd] == 0)
627df8bae1dSRodney W. Grimes 		return;
628af1ee11dSRobert Watson 	if (ip != NULL) {
629df8bae1dSRodney W. Grimes 		uh = (struct udphdr *)((caddr_t)ip + (ip->ip_hl << 2));
630603724d3SBjoern A. Zeeb 		INP_INFO_RLOCK(&V_udbinfo);
631603724d3SBjoern A. Zeeb 		inp = in_pcblookup_hash(&V_udbinfo, faddr, uh->uh_dport,
632c693a045SJonathan Lemon 		    ip->ip_src, uh->uh_sport, 0, NULL);
633f76fcf6dSJeffrey Hsu 		if (inp != NULL) {
634ac9ae279SRobert Watson 			INP_RLOCK(inp);
635f76fcf6dSJeffrey Hsu 			if (inp->inp_socket != NULL) {
636f5514f08SRobert Watson 				udp_notify(inp, inetctlerrmap[cmd]);
637f76fcf6dSJeffrey Hsu 			}
638ac9ae279SRobert Watson 			INP_RUNLOCK(inp);
639f76fcf6dSJeffrey Hsu 		}
640603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
641df8bae1dSRodney W. Grimes 	} else
642603724d3SBjoern A. Zeeb 		in_pcbnotifyall(&V_udbinfo, faddr, inetctlerrmap[cmd],
643f5514f08SRobert Watson 		    udp_notify);
644df8bae1dSRodney W. Grimes }
645df8bae1dSRodney W. Grimes 
6460312fbe9SPoul-Henning Kamp static int
64782d9ae4eSPoul-Henning Kamp udp_pcblist(SYSCTL_HANDLER_ARGS)
64898271db4SGarrett Wollman {
6498b615593SMarko Zec 	INIT_VNET_INET(curvnet);
650277afaffSRobert Watson 	int error, i, n;
65198271db4SGarrett Wollman 	struct inpcb *inp, **inp_list;
65298271db4SGarrett Wollman 	inp_gen_t gencnt;
65398271db4SGarrett Wollman 	struct xinpgen xig;
65498271db4SGarrett Wollman 
65598271db4SGarrett Wollman 	/*
656f5514f08SRobert Watson 	 * The process of preparing the PCB list is too time-consuming and
65798271db4SGarrett Wollman 	 * resource-intensive to repeat twice on every request.
65898271db4SGarrett Wollman 	 */
65998271db4SGarrett Wollman 	if (req->oldptr == 0) {
660603724d3SBjoern A. Zeeb 		n = V_udbinfo.ipi_count;
66198271db4SGarrett Wollman 		req->oldidx = 2 * (sizeof xig)
66298271db4SGarrett Wollman 			+ (n + n/8) * sizeof(struct xinpcb);
6633329b236SRobert Watson 		return (0);
66498271db4SGarrett Wollman 	}
66598271db4SGarrett Wollman 
66698271db4SGarrett Wollman 	if (req->newptr != 0)
6673329b236SRobert Watson 		return (EPERM);
66898271db4SGarrett Wollman 
66998271db4SGarrett Wollman 	/*
67098271db4SGarrett Wollman 	 * OK, now we're committed to doing something.
67198271db4SGarrett Wollman 	 */
672603724d3SBjoern A. Zeeb 	INP_INFO_RLOCK(&V_udbinfo);
673603724d3SBjoern A. Zeeb 	gencnt = V_udbinfo.ipi_gencnt;
674603724d3SBjoern A. Zeeb 	n = V_udbinfo.ipi_count;
675603724d3SBjoern A. Zeeb 	INP_INFO_RUNLOCK(&V_udbinfo);
67698271db4SGarrett Wollman 
67747934cefSDon Lewis 	error = sysctl_wire_old_buffer(req, 2 * (sizeof xig)
6785c38b6dbSDon Lewis 		+ n * sizeof(struct xinpcb));
67947934cefSDon Lewis 	if (error != 0)
68047934cefSDon Lewis 		return (error);
6815c38b6dbSDon Lewis 
68298271db4SGarrett Wollman 	xig.xig_len = sizeof xig;
68398271db4SGarrett Wollman 	xig.xig_count = n;
68498271db4SGarrett Wollman 	xig.xig_gen = gencnt;
68598271db4SGarrett Wollman 	xig.xig_sogen = so_gencnt;
68698271db4SGarrett Wollman 	error = SYSCTL_OUT(req, &xig, sizeof xig);
68798271db4SGarrett Wollman 	if (error)
6883329b236SRobert Watson 		return (error);
68998271db4SGarrett Wollman 
690a163d034SWarner Losh 	inp_list = malloc(n * sizeof *inp_list, M_TEMP, M_WAITOK);
69198271db4SGarrett Wollman 	if (inp_list == 0)
6923329b236SRobert Watson 		return (ENOMEM);
69398271db4SGarrett Wollman 
694603724d3SBjoern A. Zeeb 	INP_INFO_RLOCK(&V_udbinfo);
695603724d3SBjoern A. Zeeb 	for (inp = LIST_FIRST(V_udbinfo.ipi_listhead), i = 0; inp && i < n;
696fc2ffbe6SPoul-Henning Kamp 	     inp = LIST_NEXT(inp, inp_list)) {
6979622e84fSRobert Watson 		INP_RLOCK(inp);
6982ded288cSJeffrey Hsu 		if (inp->inp_gencnt <= gencnt &&
699f08ef6c5SBjoern A. Zeeb 		    cr_canseeinpcb(req->td->td_ucred, inp) == 0)
70098271db4SGarrett Wollman 			inp_list[i++] = inp;
7019622e84fSRobert Watson 		INP_RUNLOCK(inp);
7024787fd37SPaul Saab 	}
703603724d3SBjoern A. Zeeb 	INP_INFO_RUNLOCK(&V_udbinfo);
70498271db4SGarrett Wollman 	n = i;
70598271db4SGarrett Wollman 
70698271db4SGarrett Wollman 	error = 0;
70798271db4SGarrett Wollman 	for (i = 0; i < n; i++) {
70898271db4SGarrett Wollman 		inp = inp_list[i];
7099622e84fSRobert Watson 		INP_RLOCK(inp);
71098271db4SGarrett Wollman 		if (inp->inp_gencnt <= gencnt) {
71198271db4SGarrett Wollman 			struct xinpcb xi;
712fd94099eSColin Percival 			bzero(&xi, sizeof(xi));
71398271db4SGarrett Wollman 			xi.xi_len = sizeof xi;
71498271db4SGarrett Wollman 			/* XXX should avoid extra copy */
71598271db4SGarrett Wollman 			bcopy(inp, &xi.xi_inp, sizeof *inp);
71698271db4SGarrett Wollman 			if (inp->inp_socket)
71798271db4SGarrett Wollman 				sotoxsocket(inp->inp_socket, &xi.xi_socket);
7184b40c56cSJeffrey Hsu 			xi.xi_inp.inp_gencnt = inp->inp_gencnt;
7199622e84fSRobert Watson 			INP_RUNLOCK(inp);
72098271db4SGarrett Wollman 			error = SYSCTL_OUT(req, &xi, sizeof xi);
721d915b280SStephan Uphoff 		} else
7229622e84fSRobert Watson 			INP_RUNLOCK(inp);
72398271db4SGarrett Wollman 	}
72498271db4SGarrett Wollman 	if (!error) {
72598271db4SGarrett Wollman 		/*
7263329b236SRobert Watson 		 * Give the user an updated idea of our state.  If the
7273329b236SRobert Watson 		 * generation differs from what we told her before, she knows
7283329b236SRobert Watson 		 * that something happened while we were processing this
7293329b236SRobert Watson 		 * request, and it might be necessary to retry.
73098271db4SGarrett Wollman 		 */
731603724d3SBjoern A. Zeeb 		INP_INFO_RLOCK(&V_udbinfo);
732603724d3SBjoern A. Zeeb 		xig.xig_gen = V_udbinfo.ipi_gencnt;
73398271db4SGarrett Wollman 		xig.xig_sogen = so_gencnt;
734603724d3SBjoern A. Zeeb 		xig.xig_count = V_udbinfo.ipi_count;
735603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
73698271db4SGarrett Wollman 		error = SYSCTL_OUT(req, &xig, sizeof xig);
73798271db4SGarrett Wollman 	}
73898271db4SGarrett Wollman 	free(inp_list, M_TEMP);
7393329b236SRobert Watson 	return (error);
74098271db4SGarrett Wollman }
74198271db4SGarrett Wollman 
74298271db4SGarrett Wollman SYSCTL_PROC(_net_inet_udp, UDPCTL_PCBLIST, pcblist, CTLFLAG_RD, 0, 0,
74398271db4SGarrett Wollman     udp_pcblist, "S,xinpcb", "List of active UDP sockets");
74498271db4SGarrett Wollman 
74598271db4SGarrett Wollman static int
74682d9ae4eSPoul-Henning Kamp udp_getcred(SYSCTL_HANDLER_ARGS)
747490d50b6SBrian Feldman {
7488b615593SMarko Zec 	INIT_VNET_INET(curvnet);
749c0511d3bSBrian Feldman 	struct xucred xuc;
750490d50b6SBrian Feldman 	struct sockaddr_in addrs[2];
751490d50b6SBrian Feldman 	struct inpcb *inp;
752277afaffSRobert Watson 	int error;
753490d50b6SBrian Feldman 
75432f9753cSRobert Watson 	error = priv_check(req->td, PRIV_NETINET_GETCRED);
755490d50b6SBrian Feldman 	if (error)
756490d50b6SBrian Feldman 		return (error);
757490d50b6SBrian Feldman 	error = SYSCTL_IN(req, addrs, sizeof(addrs));
758490d50b6SBrian Feldman 	if (error)
759490d50b6SBrian Feldman 		return (error);
760603724d3SBjoern A. Zeeb 	INP_INFO_RLOCK(&V_udbinfo);
761603724d3SBjoern A. Zeeb 	inp = in_pcblookup_hash(&V_udbinfo, addrs[1].sin_addr, addrs[1].sin_port,
762cfa1ca9dSYoshinobu Inoue 				addrs[0].sin_addr, addrs[0].sin_port, 1, NULL);
7639622e84fSRobert Watson 	if (inp != NULL) {
7649622e84fSRobert Watson 		INP_RLOCK(inp);
765603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
7669622e84fSRobert Watson 		if (inp->inp_socket == NULL)
7679622e84fSRobert Watson 			error = ENOENT;
7689622e84fSRobert Watson 		if (error == 0)
769f08ef6c5SBjoern A. Zeeb 			error = cr_canseeinpcb(req->td->td_ucred, inp);
7709622e84fSRobert Watson 		if (error == 0)
77186d02c5cSBjoern A. Zeeb 			cru2x(inp->inp_cred, &xuc);
7729622e84fSRobert Watson 		INP_RUNLOCK(inp);
7739622e84fSRobert Watson 	} else {
774603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
7759622e84fSRobert Watson 		error = ENOENT;
7769622e84fSRobert Watson 	}
7770e1eebb8SDon Lewis 	if (error == 0)
7780e1eebb8SDon Lewis 		error = SYSCTL_OUT(req, &xuc, sizeof(struct xucred));
779490d50b6SBrian Feldman 	return (error);
780490d50b6SBrian Feldman }
781490d50b6SBrian Feldman 
7827ce87f12SDavid Malone SYSCTL_PROC(_net_inet_udp, OID_AUTO, getcred,
7837ce87f12SDavid Malone     CTLTYPE_OPAQUE|CTLFLAG_RW|CTLFLAG_PRISON, 0, 0,
7847ce87f12SDavid Malone     udp_getcred, "S,xucred", "Get the xucred of a UDP connection");
785490d50b6SBrian Feldman 
786490d50b6SBrian Feldman static int
7873329b236SRobert Watson udp_output(struct inpcb *inp, struct mbuf *m, struct sockaddr *addr,
7883329b236SRobert Watson     struct mbuf *control, struct thread *td)
789df8bae1dSRodney W. Grimes {
7908b615593SMarko Zec 	INIT_VNET_INET(inp->inp_vnet);
7913329b236SRobert Watson 	struct udpiphdr *ui;
7923329b236SRobert Watson 	int len = m->m_pkthdr.len;
79390162a4eSIan Dowse 	struct in_addr faddr, laddr;
794c557ae16SIan Dowse 	struct cmsghdr *cm;
795c557ae16SIan Dowse 	struct sockaddr_in *sin, src;
79690162a4eSIan Dowse 	int error = 0;
7978afa2304SBruce M Simpson 	int ipflags;
79890162a4eSIan Dowse 	u_short fport, lport;
7995c32ea65SRobert Watson 	int unlock_udbinfo;
800df8bae1dSRodney W. Grimes 
8015c32ea65SRobert Watson 	/*
8025c32ea65SRobert Watson 	 * udp_output() may need to temporarily bind or connect the current
803f5514f08SRobert Watson 	 * inpcb.  As such, we don't know up front whether we will need the
804f5514f08SRobert Watson 	 * pcbinfo lock or not.  Do any work to decide what is needed up
805f5514f08SRobert Watson 	 * front before acquiring any locks.
8065c32ea65SRobert Watson 	 */
807430d30d8SBill Fenner 	if (len + sizeof(struct udpiphdr) > IP_MAXPACKET) {
808c557ae16SIan Dowse 		if (control)
809c557ae16SIan Dowse 			m_freem(control);
8105c32ea65SRobert Watson 		m_freem(m);
8113329b236SRobert Watson 		return (EMSGSIZE);
812430d30d8SBill Fenner 	}
813430d30d8SBill Fenner 
8141b7f0384SBruce M Simpson 	src.sin_family = 0;
815c557ae16SIan Dowse 	if (control != NULL) {
816c557ae16SIan Dowse 		/*
8173329b236SRobert Watson 		 * XXX: Currently, we assume all the optional information is
8183329b236SRobert Watson 		 * stored in a single mbuf.
819c557ae16SIan Dowse 		 */
820c557ae16SIan Dowse 		if (control->m_next) {
821c557ae16SIan Dowse 			m_freem(control);
8225c32ea65SRobert Watson 			m_freem(m);
8233329b236SRobert Watson 			return (EINVAL);
824c557ae16SIan Dowse 		}
825c557ae16SIan Dowse 		for (; control->m_len > 0;
826c557ae16SIan Dowse 		    control->m_data += CMSG_ALIGN(cm->cmsg_len),
827c557ae16SIan Dowse 		    control->m_len -= CMSG_ALIGN(cm->cmsg_len)) {
828c557ae16SIan Dowse 			cm = mtod(control, struct cmsghdr *);
829af1ee11dSRobert Watson 			if (control->m_len < sizeof(*cm) || cm->cmsg_len == 0
830af1ee11dSRobert Watson 			    || cm->cmsg_len > control->m_len) {
831c557ae16SIan Dowse 				error = EINVAL;
832c557ae16SIan Dowse 				break;
833c557ae16SIan Dowse 			}
834c557ae16SIan Dowse 			if (cm->cmsg_level != IPPROTO_IP)
835c557ae16SIan Dowse 				continue;
836c557ae16SIan Dowse 
837c557ae16SIan Dowse 			switch (cm->cmsg_type) {
838c557ae16SIan Dowse 			case IP_SENDSRCADDR:
839c557ae16SIan Dowse 				if (cm->cmsg_len !=
840c557ae16SIan Dowse 				    CMSG_LEN(sizeof(struct in_addr))) {
841c557ae16SIan Dowse 					error = EINVAL;
842c557ae16SIan Dowse 					break;
843c557ae16SIan Dowse 				}
844c557ae16SIan Dowse 				bzero(&src, sizeof(src));
845c557ae16SIan Dowse 				src.sin_family = AF_INET;
846c557ae16SIan Dowse 				src.sin_len = sizeof(src);
847c557ae16SIan Dowse 				src.sin_port = inp->inp_lport;
848af1ee11dSRobert Watson 				src.sin_addr =
849af1ee11dSRobert Watson 				    *(struct in_addr *)CMSG_DATA(cm);
850c557ae16SIan Dowse 				break;
851af1ee11dSRobert Watson 
852c557ae16SIan Dowse 			default:
853c557ae16SIan Dowse 				error = ENOPROTOOPT;
854c557ae16SIan Dowse 				break;
855c557ae16SIan Dowse 			}
856c557ae16SIan Dowse 			if (error)
857c557ae16SIan Dowse 				break;
858c557ae16SIan Dowse 		}
859c557ae16SIan Dowse 		m_freem(control);
860c557ae16SIan Dowse 	}
8615c32ea65SRobert Watson 	if (error) {
8625c32ea65SRobert Watson 		m_freem(m);
8633329b236SRobert Watson 		return (error);
8645c32ea65SRobert Watson 	}
8655c32ea65SRobert Watson 
86643cc0bc1SRobert Watson 	/*
86743cc0bc1SRobert Watson 	 * Depending on whether or not the application has bound or connected
868ca528788SRobert Watson 	 * the socket, we may have to do varying levels of work.  The optimal
869ca528788SRobert Watson 	 * case is for a connected UDP socket, as a global lock isn't
870ca528788SRobert Watson 	 * required at all.
87143cc0bc1SRobert Watson 	 *
87243cc0bc1SRobert Watson 	 * In order to decide which we need, we require stability of the
87343cc0bc1SRobert Watson 	 * inpcb binding, which we ensure by acquiring a read lock on the
87443cc0bc1SRobert Watson 	 * inpcb.  This doesn't strictly follow the lock order, so we play
87543cc0bc1SRobert Watson 	 * the trylock and retry game; note that we may end up with more
87643cc0bc1SRobert Watson 	 * conservative locks than required the second time around, so later
87743cc0bc1SRobert Watson 	 * assertions have to accept that.  Further analysis of the number of
87843cc0bc1SRobert Watson 	 * misses under contention is required.
87943cc0bc1SRobert Watson 	 */
88043cc0bc1SRobert Watson 	sin = (struct sockaddr_in *)addr;
88143cc0bc1SRobert Watson 	INP_RLOCK(inp);
88243cc0bc1SRobert Watson 	if (sin != NULL &&
88343cc0bc1SRobert Watson 	    (inp->inp_laddr.s_addr == INADDR_ANY && inp->inp_lport == 0)) {
88443cc0bc1SRobert Watson 		INP_RUNLOCK(inp);
885603724d3SBjoern A. Zeeb 		INP_INFO_WLOCK(&V_udbinfo);
8868501a69cSRobert Watson 		INP_WLOCK(inp);
88743cc0bc1SRobert Watson 		unlock_udbinfo = 2;
88843cc0bc1SRobert Watson 	} else if ((sin != NULL && (
88943cc0bc1SRobert Watson 	    (sin->sin_addr.s_addr == INADDR_ANY) ||
89043cc0bc1SRobert Watson 	    (sin->sin_addr.s_addr == INADDR_BROADCAST) ||
89143cc0bc1SRobert Watson 	    (inp->inp_laddr.s_addr == INADDR_ANY) ||
89243cc0bc1SRobert Watson 	    (inp->inp_lport == 0))) ||
89343cc0bc1SRobert Watson 	    (src.sin_family == AF_INET)) {
894603724d3SBjoern A. Zeeb 		if (!INP_INFO_TRY_RLOCK(&V_udbinfo)) {
89543cc0bc1SRobert Watson 			INP_RUNLOCK(inp);
896603724d3SBjoern A. Zeeb 			INP_INFO_RLOCK(&V_udbinfo);
897948d0fc9SRobert Watson 			INP_RLOCK(inp);
898948d0fc9SRobert Watson 		}
89943cc0bc1SRobert Watson 		unlock_udbinfo = 1;
90043cc0bc1SRobert Watson 	} else
90143cc0bc1SRobert Watson 		unlock_udbinfo = 0;
9025c32ea65SRobert Watson 
9031b7f0384SBruce M Simpson 	/*
9041b7f0384SBruce M Simpson 	 * If the IP_SENDSRCADDR control message was specified, override the
9051b7f0384SBruce M Simpson 	 * source address for this datagram.  Its use is invalidated if the
9061b7f0384SBruce M Simpson 	 * address thus specified is incomplete or clobbers other inpcbs.
9071b7f0384SBruce M Simpson 	 */
90890162a4eSIan Dowse 	laddr = inp->inp_laddr;
90990162a4eSIan Dowse 	lport = inp->inp_lport;
9101b7f0384SBruce M Simpson 	if (src.sin_family == AF_INET) {
911603724d3SBjoern A. Zeeb 		INP_INFO_LOCK_ASSERT(&V_udbinfo);
9121b7f0384SBruce M Simpson 		if ((lport == 0) ||
9131b7f0384SBruce M Simpson 		    (laddr.s_addr == INADDR_ANY &&
9141b7f0384SBruce M Simpson 		     src.sin_addr.s_addr == INADDR_ANY)) {
915c557ae16SIan Dowse 			error = EINVAL;
916c557ae16SIan Dowse 			goto release;
917c557ae16SIan Dowse 		}
918c557ae16SIan Dowse 		error = in_pcbbind_setup(inp, (struct sockaddr *)&src,
919b0330ed9SPawel Jakub Dawidek 		    &laddr.s_addr, &lport, td->td_ucred);
920c557ae16SIan Dowse 		if (error)
921c557ae16SIan Dowse 			goto release;
922c557ae16SIan Dowse 	}
923c557ae16SIan Dowse 
9243144b7d3SRobert Watson 	/*
9253144b7d3SRobert Watson 	 * If a UDP socket has been connected, then a local address/port will
9263144b7d3SRobert Watson 	 * have been selected and bound.
9273144b7d3SRobert Watson 	 *
92843cc0bc1SRobert Watson 	 * If a UDP socket has not been connected to, then an explicit
9293144b7d3SRobert Watson 	 * destination address must be used, in which case a local
9303144b7d3SRobert Watson 	 * address/port may not have been selected and bound.
9313144b7d3SRobert Watson 	 */
93243cc0bc1SRobert Watson 	if (sin != NULL) {
933c4d585aeSRobert Watson 		INP_LOCK_ASSERT(inp);
934df8bae1dSRodney W. Grimes 		if (inp->inp_faddr.s_addr != INADDR_ANY) {
935df8bae1dSRodney W. Grimes 			error = EISCONN;
936df8bae1dSRodney W. Grimes 			goto release;
937df8bae1dSRodney W. Grimes 		}
9383144b7d3SRobert Watson 
9393144b7d3SRobert Watson 		/*
9403144b7d3SRobert Watson 		 * Jail may rewrite the destination address, so let it do
9413144b7d3SRobert Watson 		 * that before we use it.
9423144b7d3SRobert Watson 		 */
943413628a7SBjoern A. Zeeb 		if (prison_remote_ip4(td->td_ucred, &sin->sin_addr) != 0) {
944413628a7SBjoern A. Zeeb 			error = EINVAL;
945413628a7SBjoern A. Zeeb 			goto release;
946413628a7SBjoern A. Zeeb 		}
9473144b7d3SRobert Watson 
9483144b7d3SRobert Watson 		/*
94943cc0bc1SRobert Watson 		 * If a local address or port hasn't yet been selected, or if
95043cc0bc1SRobert Watson 		 * the destination address needs to be rewritten due to using
95143cc0bc1SRobert Watson 		 * a special INADDR_ constant, invoke in_pcbconnect_setup()
95243cc0bc1SRobert Watson 		 * to do the heavy lifting.  Once a port is selected, we
95343cc0bc1SRobert Watson 		 * commit the binding back to the socket; we also commit the
95443cc0bc1SRobert Watson 		 * binding of the address if in jail.
95543cc0bc1SRobert Watson 		 *
95643cc0bc1SRobert Watson 		 * If we already have a valid binding and we're not
95743cc0bc1SRobert Watson 		 * requesting a destination address rewrite, use a fast path.
9583144b7d3SRobert Watson 		 */
95943cc0bc1SRobert Watson 		if (inp->inp_laddr.s_addr == INADDR_ANY ||
96043cc0bc1SRobert Watson 		    inp->inp_lport == 0 ||
96143cc0bc1SRobert Watson 		    sin->sin_addr.s_addr == INADDR_ANY ||
96243cc0bc1SRobert Watson 		    sin->sin_addr.s_addr == INADDR_BROADCAST) {
963603724d3SBjoern A. Zeeb 			INP_INFO_LOCK_ASSERT(&V_udbinfo);
96443cc0bc1SRobert Watson 			error = in_pcbconnect_setup(inp, addr, &laddr.s_addr,
96543cc0bc1SRobert Watson 			    &lport, &faddr.s_addr, &fport, NULL,
96643cc0bc1SRobert Watson 			    td->td_ucred);
96790162a4eSIan Dowse 			if (error)
96890162a4eSIan Dowse 				goto release;
96990162a4eSIan Dowse 
97043cc0bc1SRobert Watson 			/*
97143cc0bc1SRobert Watson 			 * XXXRW: Why not commit the port if the address is
97243cc0bc1SRobert Watson 			 * !INADDR_ANY?
97343cc0bc1SRobert Watson 			 */
97490162a4eSIan Dowse 			/* Commit the local port if newly assigned. */
97590162a4eSIan Dowse 			if (inp->inp_laddr.s_addr == INADDR_ANY &&
97690162a4eSIan Dowse 			    inp->inp_lport == 0) {
977603724d3SBjoern A. Zeeb 				INP_INFO_WLOCK_ASSERT(&V_udbinfo);
978c4d585aeSRobert Watson 				INP_WLOCK_ASSERT(inp);
9793a1757b9SGleb Smirnoff 				/*
98043cc0bc1SRobert Watson 				 * Remember addr if jailed, to prevent
98143cc0bc1SRobert Watson 				 * rebinding.
9823a1757b9SGleb Smirnoff 				 */
9833a1757b9SGleb Smirnoff 				if (jailed(td->td_ucred))
9843a1757b9SGleb Smirnoff 					inp->inp_laddr = laddr;
98590162a4eSIan Dowse 				inp->inp_lport = lport;
98690162a4eSIan Dowse 				if (in_pcbinshash(inp) != 0) {
98790162a4eSIan Dowse 					inp->inp_lport = 0;
98890162a4eSIan Dowse 					error = EAGAIN;
989df8bae1dSRodney W. Grimes 					goto release;
990df8bae1dSRodney W. Grimes 				}
99190162a4eSIan Dowse 				inp->inp_flags |= INP_ANONPORT;
99290162a4eSIan Dowse 			}
993df8bae1dSRodney W. Grimes 		} else {
99443cc0bc1SRobert Watson 			faddr = sin->sin_addr;
99543cc0bc1SRobert Watson 			fport = sin->sin_port;
99643cc0bc1SRobert Watson 		}
99743cc0bc1SRobert Watson 	} else {
998c4d585aeSRobert Watson 		INP_LOCK_ASSERT(inp);
99990162a4eSIan Dowse 		faddr = inp->inp_faddr;
100090162a4eSIan Dowse 		fport = inp->inp_fport;
100190162a4eSIan Dowse 		if (faddr.s_addr == INADDR_ANY) {
1002df8bae1dSRodney W. Grimes 			error = ENOTCONN;
1003df8bae1dSRodney W. Grimes 			goto release;
1004df8bae1dSRodney W. Grimes 		}
1005df8bae1dSRodney W. Grimes 	}
1006e6ccd709SRobert Watson 
1007df8bae1dSRodney W. Grimes 	/*
1008e6ccd709SRobert Watson 	 * Calculate data length and get a mbuf for UDP, IP, and possible
1009392e8407SRobert Watson 	 * link-layer headers.  Immediate slide the data pointer back forward
1010392e8407SRobert Watson 	 * since we won't use that space at this layer.
1011df8bae1dSRodney W. Grimes 	 */
1012e6ccd709SRobert Watson 	M_PREPEND(m, sizeof(struct udpiphdr) + max_linkhdr, M_DONTWAIT);
1013e6ccd709SRobert Watson 	if (m == NULL) {
1014df8bae1dSRodney W. Grimes 		error = ENOBUFS;
101549b19bfcSBruce M Simpson 		goto release;
1016df8bae1dSRodney W. Grimes 	}
1017e6ccd709SRobert Watson 	m->m_data += max_linkhdr;
1018e6ccd709SRobert Watson 	m->m_len -= max_linkhdr;
1019392e8407SRobert Watson 	m->m_pkthdr.len -= max_linkhdr;
1020df8bae1dSRodney W. Grimes 
1021df8bae1dSRodney W. Grimes 	/*
10223329b236SRobert Watson 	 * Fill in mbuf with extended UDP header and addresses and length put
10233329b236SRobert Watson 	 * into network format.
1024df8bae1dSRodney W. Grimes 	 */
1025df8bae1dSRodney W. Grimes 	ui = mtod(m, struct udpiphdr *);
1026db4f9cc7SJonathan Lemon 	bzero(ui->ui_x1, sizeof(ui->ui_x1));	/* XXX still needed? */
1027df8bae1dSRodney W. Grimes 	ui->ui_pr = IPPROTO_UDP;
102890162a4eSIan Dowse 	ui->ui_src = laddr;
102990162a4eSIan Dowse 	ui->ui_dst = faddr;
103090162a4eSIan Dowse 	ui->ui_sport = lport;
103190162a4eSIan Dowse 	ui->ui_dport = fport;
1032db4f9cc7SJonathan Lemon 	ui->ui_ulen = htons((u_short)len + sizeof(struct udphdr));
1033df8bae1dSRodney W. Grimes 
1034b2828ad2SAndre Oppermann 	/*
1035b2828ad2SAndre Oppermann 	 * Set the Don't Fragment bit in the IP header.
1036b2828ad2SAndre Oppermann 	 */
1037b2828ad2SAndre Oppermann 	if (inp->inp_flags & INP_DONTFRAG) {
1038b2828ad2SAndre Oppermann 		struct ip *ip;
10393329b236SRobert Watson 
1040b2828ad2SAndre Oppermann 		ip = (struct ip *)&ui->ui_i;
1041b2828ad2SAndre Oppermann 		ip->ip_off |= IP_DF;
1042b2828ad2SAndre Oppermann 	}
1043b2828ad2SAndre Oppermann 
1044b5d47ff5SJohn-Mark Gurney 	ipflags = 0;
1045b5d47ff5SJohn-Mark Gurney 	if (inp->inp_socket->so_options & SO_DONTROUTE)
1046b5d47ff5SJohn-Mark Gurney 		ipflags |= IP_ROUTETOIF;
1047b5d47ff5SJohn-Mark Gurney 	if (inp->inp_socket->so_options & SO_BROADCAST)
1048b5d47ff5SJohn-Mark Gurney 		ipflags |= IP_ALLOWBROADCAST;
10496fbfd582SAndre Oppermann 	if (inp->inp_flags & INP_ONESBCAST)
10508afa2304SBruce M Simpson 		ipflags |= IP_SENDONES;
10518afa2304SBruce M Simpson 
10521175d9d5SRobert Watson #ifdef MAC
10531175d9d5SRobert Watson 	mac_inpcb_create_mbuf(inp, m);
10541175d9d5SRobert Watson #endif
10551175d9d5SRobert Watson 
1056df8bae1dSRodney W. Grimes 	/*
1057db4f9cc7SJonathan Lemon 	 * Set up checksum and output datagram.
1058df8bae1dSRodney W. Grimes 	 */
1059f5514f08SRobert Watson 	if (udp_cksum) {
10606fbfd582SAndre Oppermann 		if (inp->inp_flags & INP_ONESBCAST)
10618a538743SBruce M Simpson 			faddr.s_addr = INADDR_BROADCAST;
10628a538743SBruce M Simpson 		ui->ui_sum = in_pseudo(ui->ui_src.s_addr, faddr.s_addr,
1063db4f9cc7SJonathan Lemon 		    htons((u_short)len + sizeof(struct udphdr) + IPPROTO_UDP));
1064db4f9cc7SJonathan Lemon 		m->m_pkthdr.csum_flags = CSUM_UDP;
1065db4f9cc7SJonathan Lemon 		m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum);
10663329b236SRobert Watson 	} else
1067db4f9cc7SJonathan Lemon 		ui->ui_sum = 0;
1068df8bae1dSRodney W. Grimes 	((struct ip *)ui)->ip_len = sizeof (struct udpiphdr) + len;
1069ca98b82cSDavid Greenman 	((struct ip *)ui)->ip_ttl = inp->inp_ip_ttl;	/* XXX */
1070ca98b82cSDavid Greenman 	((struct ip *)ui)->ip_tos = inp->inp_ip_tos;	/* XXX */
1071603724d3SBjoern A. Zeeb 	V_udpstat.udps_opackets++;
1072cfa1ca9dSYoshinobu Inoue 
107343cc0bc1SRobert Watson 	if (unlock_udbinfo == 2)
1074603724d3SBjoern A. Zeeb 		INP_INFO_WUNLOCK(&V_udbinfo);
107543cc0bc1SRobert Watson 	else if (unlock_udbinfo == 1)
1076603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
107797d8d152SAndre Oppermann 	error = ip_output(m, inp->inp_options, NULL, ipflags,
10785d846453SSam Leffler 	    inp->inp_moptions, inp);
107943cc0bc1SRobert Watson 	if (unlock_udbinfo == 2)
10808501a69cSRobert Watson 		INP_WUNLOCK(inp);
1081948d0fc9SRobert Watson 	else
1082948d0fc9SRobert Watson 		INP_RUNLOCK(inp);
1083df8bae1dSRodney W. Grimes 	return (error);
1084df8bae1dSRodney W. Grimes 
1085df8bae1dSRodney W. Grimes release:
108643cc0bc1SRobert Watson 	if (unlock_udbinfo == 2) {
1087948d0fc9SRobert Watson 		INP_WUNLOCK(inp);
1088603724d3SBjoern A. Zeeb 		INP_INFO_WUNLOCK(&V_udbinfo);
108943cc0bc1SRobert Watson 	} else if (unlock_udbinfo == 1) {
109043cc0bc1SRobert Watson 		INP_RUNLOCK(inp);
1091603724d3SBjoern A. Zeeb 		INP_INFO_RUNLOCK(&V_udbinfo);
1092948d0fc9SRobert Watson 	} else
1093948d0fc9SRobert Watson 		INP_RUNLOCK(inp);
1094df8bae1dSRodney W. Grimes 	m_freem(m);
1095df8bae1dSRodney W. Grimes 	return (error);
1096df8bae1dSRodney W. Grimes }
1097df8bae1dSRodney W. Grimes 
1098ac45e92fSRobert Watson static void
1099d0390e05SGarrett Wollman udp_abort(struct socket *so)
1100df8bae1dSRodney W. Grimes {
11018b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1102d0390e05SGarrett Wollman 	struct inpcb *inp;
1103df8bae1dSRodney W. Grimes 
1104d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
110514ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_abort: inp == NULL"));
1106603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
11078501a69cSRobert Watson 	INP_WLOCK(inp);
1108a152f8a3SRobert Watson 	if (inp->inp_faddr.s_addr != INADDR_ANY) {
1109a152f8a3SRobert Watson 		in_pcbdisconnect(inp);
1110a152f8a3SRobert Watson 		inp->inp_laddr.s_addr = INADDR_ANY;
1111d0390e05SGarrett Wollman 		soisdisconnected(so);
1112a152f8a3SRobert Watson 	}
11138501a69cSRobert Watson 	INP_WUNLOCK(inp);
1114603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
1115df8bae1dSRodney W. Grimes }
1116df8bae1dSRodney W. Grimes 
1117d0390e05SGarrett Wollman static int
1118b40ce416SJulian Elischer udp_attach(struct socket *so, int proto, struct thread *td)
1119d0390e05SGarrett Wollman {
11208b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1121d0390e05SGarrett Wollman 	struct inpcb *inp;
1122277afaffSRobert Watson 	int error;
1123d0390e05SGarrett Wollman 
1124d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
112514ba8addSRobert Watson 	KASSERT(inp == NULL, ("udp_attach: inp != NULL"));
1126cfa1ca9dSYoshinobu Inoue 	error = soreserve(so, udp_sendspace, udp_recvspace);
1127f24618aaSRobert Watson 	if (error)
11283329b236SRobert Watson 		return (error);
1129603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
1130603724d3SBjoern A. Zeeb 	error = in_pcballoc(so, &V_udbinfo);
113153b57cd1SSam Leffler 	if (error) {
1132603724d3SBjoern A. Zeeb 		INP_INFO_WUNLOCK(&V_udbinfo);
11333329b236SRobert Watson 		return (error);
113453b57cd1SSam Leffler 	}
1135cfa1ca9dSYoshinobu Inoue 
1136cfa1ca9dSYoshinobu Inoue 	inp = (struct inpcb *)so->so_pcb;
1137603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
1138cfa1ca9dSYoshinobu Inoue 	inp->inp_vflag |= INP_IPV4;
1139603724d3SBjoern A. Zeeb 	inp->inp_ip_ttl = V_ip_defttl;
11408501a69cSRobert Watson 	INP_WUNLOCK(inp);
11413329b236SRobert Watson 	return (0);
1142df8bae1dSRodney W. Grimes }
1143d0390e05SGarrett Wollman 
1144d0390e05SGarrett Wollman static int
1145b40ce416SJulian Elischer udp_bind(struct socket *so, struct sockaddr *nam, struct thread *td)
1146d0390e05SGarrett Wollman {
11478b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1148d0390e05SGarrett Wollman 	struct inpcb *inp;
1149277afaffSRobert Watson 	int error;
1150d0390e05SGarrett Wollman 
1151d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
115214ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_bind: inp == NULL"));
1153603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
11548501a69cSRobert Watson 	INP_WLOCK(inp);
1155b0330ed9SPawel Jakub Dawidek 	error = in_pcbbind(inp, nam, td->td_ucred);
11568501a69cSRobert Watson 	INP_WUNLOCK(inp);
1157603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
11583329b236SRobert Watson 	return (error);
1159d0390e05SGarrett Wollman }
1160d0390e05SGarrett Wollman 
1161a152f8a3SRobert Watson static void
1162a152f8a3SRobert Watson udp_close(struct socket *so)
1163a152f8a3SRobert Watson {
11648b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1165a152f8a3SRobert Watson 	struct inpcb *inp;
1166a152f8a3SRobert Watson 
1167a152f8a3SRobert Watson 	inp = sotoinpcb(so);
1168a152f8a3SRobert Watson 	KASSERT(inp != NULL, ("udp_close: inp == NULL"));
1169603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
11708501a69cSRobert Watson 	INP_WLOCK(inp);
1171a152f8a3SRobert Watson 	if (inp->inp_faddr.s_addr != INADDR_ANY) {
1172a152f8a3SRobert Watson 		in_pcbdisconnect(inp);
1173a152f8a3SRobert Watson 		inp->inp_laddr.s_addr = INADDR_ANY;
1174a152f8a3SRobert Watson 		soisdisconnected(so);
1175a152f8a3SRobert Watson 	}
11768501a69cSRobert Watson 	INP_WUNLOCK(inp);
1177603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
1178a152f8a3SRobert Watson }
1179a152f8a3SRobert Watson 
1180d0390e05SGarrett Wollman static int
1181b40ce416SJulian Elischer udp_connect(struct socket *so, struct sockaddr *nam, struct thread *td)
1182d0390e05SGarrett Wollman {
11838b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1184d0390e05SGarrett Wollman 	struct inpcb *inp;
1185277afaffSRobert Watson 	int error;
118675c13541SPoul-Henning Kamp 	struct sockaddr_in *sin;
1187d0390e05SGarrett Wollman 
1188d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
118914ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_connect: inp == NULL"));
1190603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
11918501a69cSRobert Watson 	INP_WLOCK(inp);
1192f76fcf6dSJeffrey Hsu 	if (inp->inp_faddr.s_addr != INADDR_ANY) {
11938501a69cSRobert Watson 		INP_WUNLOCK(inp);
1194603724d3SBjoern A. Zeeb 		INP_INFO_WUNLOCK(&V_udbinfo);
11953329b236SRobert Watson 		return (EISCONN);
1196f76fcf6dSJeffrey Hsu 	}
119775c13541SPoul-Henning Kamp 	sin = (struct sockaddr_in *)nam;
1198413628a7SBjoern A. Zeeb 	if (prison_remote_ip4(td->td_ucred, &sin->sin_addr) != 0) {
1199413628a7SBjoern A. Zeeb 		INP_WUNLOCK(inp);
1200413628a7SBjoern A. Zeeb 		INP_INFO_WUNLOCK(&udbinfo);
1201413628a7SBjoern A. Zeeb 		return (EAFNOSUPPORT);
1202413628a7SBjoern A. Zeeb 	}
1203b0330ed9SPawel Jakub Dawidek 	error = in_pcbconnect(inp, nam, td->td_ucred);
12044cc20ab1SSeigo Tanimura 	if (error == 0)
1205df8bae1dSRodney W. Grimes 		soisconnected(so);
12068501a69cSRobert Watson 	INP_WUNLOCK(inp);
1207603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
12083329b236SRobert Watson 	return (error);
1209df8bae1dSRodney W. Grimes }
1210d0390e05SGarrett Wollman 
1211bc725eafSRobert Watson static void
1212d0390e05SGarrett Wollman udp_detach(struct socket *so)
1213d0390e05SGarrett Wollman {
12148b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1215d0390e05SGarrett Wollman 	struct inpcb *inp;
1216d0390e05SGarrett Wollman 
1217d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
121814ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_detach: inp == NULL"));
1219a152f8a3SRobert Watson 	KASSERT(inp->inp_faddr.s_addr == INADDR_ANY,
1220a152f8a3SRobert Watson 	    ("udp_detach: not disconnected"));
1221603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
12228501a69cSRobert Watson 	INP_WLOCK(inp);
1223d0390e05SGarrett Wollman 	in_pcbdetach(inp);
122414ba8addSRobert Watson 	in_pcbfree(inp);
1225603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
1226d0390e05SGarrett Wollman }
1227d0390e05SGarrett Wollman 
1228d0390e05SGarrett Wollman static int
1229d0390e05SGarrett Wollman udp_disconnect(struct socket *so)
1230d0390e05SGarrett Wollman {
12318b615593SMarko Zec 	INIT_VNET_INET(so->so_vnet);
1232d0390e05SGarrett Wollman 	struct inpcb *inp;
1233d0390e05SGarrett Wollman 
1234d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
123514ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_disconnect: inp == NULL"));
1236603724d3SBjoern A. Zeeb 	INP_INFO_WLOCK(&V_udbinfo);
12378501a69cSRobert Watson 	INP_WLOCK(inp);
1238f76fcf6dSJeffrey Hsu 	if (inp->inp_faddr.s_addr == INADDR_ANY) {
12398501a69cSRobert Watson 		INP_WUNLOCK(inp);
1240603724d3SBjoern A. Zeeb 		INP_INFO_WUNLOCK(&V_udbinfo);
12413329b236SRobert Watson 		return (ENOTCONN);
1242f76fcf6dSJeffrey Hsu 	}
1243d0390e05SGarrett Wollman 
1244df8bae1dSRodney W. Grimes 	in_pcbdisconnect(inp);
1245df8bae1dSRodney W. Grimes 	inp->inp_laddr.s_addr = INADDR_ANY;
1246d45e4f99SMaxim Konovalov 	SOCK_LOCK(so);
1247d45e4f99SMaxim Konovalov 	so->so_state &= ~SS_ISCONNECTED;		/* XXX */
1248d45e4f99SMaxim Konovalov 	SOCK_UNLOCK(so);
12498501a69cSRobert Watson 	INP_WUNLOCK(inp);
1250603724d3SBjoern A. Zeeb 	INP_INFO_WUNLOCK(&V_udbinfo);
12513329b236SRobert Watson 	return (0);
1252df8bae1dSRodney W. Grimes }
1253df8bae1dSRodney W. Grimes 
1254d0390e05SGarrett Wollman static int
125557bf258eSGarrett Wollman udp_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *addr,
1256b40ce416SJulian Elischer     struct mbuf *control, struct thread *td)
1257d0390e05SGarrett Wollman {
1258d0390e05SGarrett Wollman 	struct inpcb *inp;
1259d0390e05SGarrett Wollman 
1260d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
126114ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_send: inp == NULL"));
12623329b236SRobert Watson 	return (udp_output(inp, m, addr, control, td));
1263d0390e05SGarrett Wollman }
1264d0390e05SGarrett Wollman 
126576429de4SYoshinobu Inoue int
1266d0390e05SGarrett Wollman udp_shutdown(struct socket *so)
1267d0390e05SGarrett Wollman {
1268d0390e05SGarrett Wollman 	struct inpcb *inp;
1269d0390e05SGarrett Wollman 
1270d0390e05SGarrett Wollman 	inp = sotoinpcb(so);
127114ba8addSRobert Watson 	KASSERT(inp != NULL, ("udp_shutdown: inp == NULL"));
12728501a69cSRobert Watson 	INP_WLOCK(inp);
1273d0390e05SGarrett Wollman 	socantsendmore(so);
12748501a69cSRobert Watson 	INP_WUNLOCK(inp);
12753329b236SRobert Watson 	return (0);
1276d0390e05SGarrett Wollman }
1277d0390e05SGarrett Wollman 
1278d0390e05SGarrett Wollman struct pr_usrreqs udp_usrreqs = {
1279756d52a1SPoul-Henning Kamp 	.pru_abort =		udp_abort,
1280756d52a1SPoul-Henning Kamp 	.pru_attach =		udp_attach,
1281756d52a1SPoul-Henning Kamp 	.pru_bind =		udp_bind,
1282756d52a1SPoul-Henning Kamp 	.pru_connect =		udp_connect,
1283756d52a1SPoul-Henning Kamp 	.pru_control =		in_control,
1284756d52a1SPoul-Henning Kamp 	.pru_detach =		udp_detach,
1285756d52a1SPoul-Henning Kamp 	.pru_disconnect =	udp_disconnect,
128654d642bbSRobert Watson 	.pru_peeraddr =		in_getpeeraddr,
1287756d52a1SPoul-Henning Kamp 	.pru_send =		udp_send,
12885df3e839SRobert Watson 	.pru_soreceive =	soreceive_dgram,
128959b8854eSRobert Watson 	.pru_sosend =		sosend_dgram,
1290756d52a1SPoul-Henning Kamp 	.pru_shutdown =		udp_shutdown,
129154d642bbSRobert Watson 	.pru_sockaddr =		in_getsockaddr,
1292a152f8a3SRobert Watson 	.pru_sosetlabel =	in_pcbsosetlabel,
1293a152f8a3SRobert Watson 	.pru_close =		udp_close,
1294d0390e05SGarrett Wollman };
1295