19454b2d8SWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1982, 1986, 1989, 1991, 1993 3e1ac28e2SRobert Watson * The Regents of the University of California. 446a1d9bfSRobert Watson * Copyright (c) 2004-2007 Robert N. M. Watson 5e1ac28e2SRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 31748e0b0aSGarrett Wollman * From: @(#)uipc_usrreq.c 8.3 (Berkeley) 1/4/94 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 34f23929fbSRobert Watson /* 35f23929fbSRobert Watson * UNIX Domain (Local) Sockets 36f23929fbSRobert Watson * 37f23929fbSRobert Watson * This is an implementation of UNIX (local) domain sockets. Each socket has 38f23929fbSRobert Watson * an associated struct unpcb (UNIX protocol control block). Stream sockets 39f23929fbSRobert Watson * may be connected to 0 or 1 other socket. Datagram sockets may be 40f23929fbSRobert Watson * connected to 0, 1, or many other sockets. Sockets may be created and 41f23929fbSRobert Watson * connected in pairs (socketpair(2)), or bound/connected to using the file 42f23929fbSRobert Watson * system name space. For most purposes, only the receive socket buffer is 43f23929fbSRobert Watson * used, as sending on one socket delivers directly to the receive socket 445b950deaSRobert Watson * buffer of a second socket. 455b950deaSRobert Watson * 465b950deaSRobert Watson * The implementation is substantially complicated by the fact that 475b950deaSRobert Watson * "ancillary data", such as file descriptors or credentials, may be passed 485b950deaSRobert Watson * across UNIX domain sockets. The potential for passing UNIX domain sockets 495b950deaSRobert Watson * over other UNIX domain sockets requires the implementation of a simple 505b950deaSRobert Watson * garbage collector to find and tear down cycles of disconnected sockets. 51aea52f1bSRobert Watson * 52aea52f1bSRobert Watson * TODO: 53aea52f1bSRobert Watson * SEQPACKET, RDM 54aea52f1bSRobert Watson * rethink name space problems 55aea52f1bSRobert Watson * need a proper out-of-band 56aea52f1bSRobert Watson * lock pushdown 57f23929fbSRobert Watson */ 58f23929fbSRobert Watson 59677b542eSDavid E. O'Brien #include <sys/cdefs.h> 60677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 61677b542eSDavid E. O'Brien 62335654d7SRobert Watson #include "opt_mac.h" 63335654d7SRobert Watson 64df8bae1dSRodney W. Grimes #include <sys/param.h> 65fb919e4dSMark Murray #include <sys/domain.h> 66960ed29cSSeigo Tanimura #include <sys/fcntl.h> 67d826c479SBruce Evans #include <sys/malloc.h> /* XXX must be before <sys/file.h> */ 684f590175SPaul Saab #include <sys/eventhandler.h> 69639acc13SGarrett Wollman #include <sys/file.h> 70960ed29cSSeigo Tanimura #include <sys/filedesc.h> 71960ed29cSSeigo Tanimura #include <sys/jail.h> 72960ed29cSSeigo Tanimura #include <sys/kernel.h> 73960ed29cSSeigo Tanimura #include <sys/lock.h> 74639acc13SGarrett Wollman #include <sys/mbuf.h> 75033eb86eSJeff Roberson #include <sys/mount.h> 76960ed29cSSeigo Tanimura #include <sys/mutex.h> 77639acc13SGarrett Wollman #include <sys/namei.h> 78639acc13SGarrett Wollman #include <sys/proc.h> 79df8bae1dSRodney W. Grimes #include <sys/protosw.h> 80960ed29cSSeigo Tanimura #include <sys/resourcevar.h> 81df8bae1dSRodney W. Grimes #include <sys/socket.h> 82df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 83960ed29cSSeigo Tanimura #include <sys/signalvar.h> 84df8bae1dSRodney W. Grimes #include <sys/stat.h> 85960ed29cSSeigo Tanimura #include <sys/sx.h> 86639acc13SGarrett Wollman #include <sys/sysctl.h> 87960ed29cSSeigo Tanimura #include <sys/systm.h> 88a0ec558aSRobert Watson #include <sys/taskqueue.h> 89639acc13SGarrett Wollman #include <sys/un.h> 9098271db4SGarrett Wollman #include <sys/unpcb.h> 91639acc13SGarrett Wollman #include <sys/vnode.h> 92df8bae1dSRodney W. Grimes 93aed55708SRobert Watson #include <security/mac/mac_framework.h> 94aed55708SRobert Watson 959e9d298aSJeff Roberson #include <vm/uma.h> 9698271db4SGarrett Wollman 979e9d298aSJeff Roberson static uma_zone_t unp_zone; 9898271db4SGarrett Wollman static unp_gen_t unp_gencnt; 99aea52f1bSRobert Watson static u_int unp_count; /* Count of local sockets. */ 100aea52f1bSRobert Watson static ino_t unp_ino; /* Prototype for fake inode numbers. */ 101aea52f1bSRobert Watson static int unp_rights; /* File descriptors in flight. */ 102aea52f1bSRobert Watson static struct unp_head unp_shead; /* List of local stream sockets. */ 103aea52f1bSRobert Watson static struct unp_head unp_dhead; /* List of local datagram sockets. */ 10498271db4SGarrett Wollman 105aea52f1bSRobert Watson static const struct sockaddr sun_noname = { sizeof(sun_noname), AF_LOCAL }; 10698271db4SGarrett Wollman 107df8bae1dSRodney W. Grimes /* 108aea52f1bSRobert Watson * Garbage collection of cyclic file descriptor/socket references occurs 109aea52f1bSRobert Watson * asynchronously in a taskqueue context in order to avoid recursion and 110aea52f1bSRobert Watson * reentrance in the UNIX domain socket, file descriptor, and socket layer 111aea52f1bSRobert Watson * code. See unp_gc() for a full description. 112df8bae1dSRodney W. Grimes */ 113aea52f1bSRobert Watson static struct task unp_gc_task; 114f708ef1bSPoul-Henning Kamp 115ce5f32deSRobert Watson /* 1167e711c3aSRobert Watson * Both send and receive buffers are allocated PIPSIZ bytes of buffering for 1177e711c3aSRobert Watson * stream sockets, although the total for sender and receiver is actually 1187e711c3aSRobert Watson * only PIPSIZ. 1197e711c3aSRobert Watson * 1207e711c3aSRobert Watson * Datagram sockets really use the sendspace as the maximum datagram size, 1217e711c3aSRobert Watson * and don't really want to reserve the sendspace. Their recvspace should be 1227e711c3aSRobert Watson * large enough for at least one max-size datagram plus address. 1237e711c3aSRobert Watson */ 1247e711c3aSRobert Watson #ifndef PIPSIZ 1257e711c3aSRobert Watson #define PIPSIZ 8192 1267e711c3aSRobert Watson #endif 1277e711c3aSRobert Watson static u_long unpst_sendspace = PIPSIZ; 1287e711c3aSRobert Watson static u_long unpst_recvspace = PIPSIZ; 1297e711c3aSRobert Watson static u_long unpdg_sendspace = 2*1024; /* really max datagram size */ 1307e711c3aSRobert Watson static u_long unpdg_recvspace = 4*1024; 1317e711c3aSRobert Watson 132e4445a03SRobert Watson SYSCTL_NODE(_net, PF_LOCAL, local, CTLFLAG_RW, 0, "Local domain"); 133e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_STREAM, stream, CTLFLAG_RW, 0, "SOCK_STREAM"); 134e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_DGRAM, dgram, CTLFLAG_RW, 0, "SOCK_DGRAM"); 135e4445a03SRobert Watson 1367e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, sendspace, CTLFLAG_RW, 1377e711c3aSRobert Watson &unpst_sendspace, 0, ""); 1387e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, recvspace, CTLFLAG_RW, 1397e711c3aSRobert Watson &unpst_recvspace, 0, ""); 1407e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, maxdgram, CTLFLAG_RW, 1417e711c3aSRobert Watson &unpdg_sendspace, 0, ""); 1427e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, recvspace, CTLFLAG_RW, 1437e711c3aSRobert Watson &unpdg_recvspace, 0, ""); 1447e711c3aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, inflight, CTLFLAG_RD, &unp_rights, 0, ""); 1457e711c3aSRobert Watson 1467e711c3aSRobert Watson /* 147ce5f32deSRobert Watson * Currently, UNIX domain sockets are protected by a single subsystem lock, 148ce5f32deSRobert Watson * which covers global data structures and variables, the contents of each 149ce5f32deSRobert Watson * per-socket unpcb structure, and the so_pcb field in sockets attached to 150ce5f32deSRobert Watson * the UNIX domain. This provides for a moderate degree of paralellism, as 151ce5f32deSRobert Watson * receive operations on UNIX domain sockets do not need to acquire the 152ce5f32deSRobert Watson * subsystem lock. Finer grained locking to permit send() without acquiring 153ce5f32deSRobert Watson * a global lock would be a logical next step. 154ce5f32deSRobert Watson * 155ce5f32deSRobert Watson * The UNIX domain socket lock preceds all socket layer locks, including the 156ce5f32deSRobert Watson * socket lock and socket buffer lock, permitting UNIX domain socket code to 157ce5f32deSRobert Watson * call into socket support routines without releasing its locks. 158ce5f32deSRobert Watson * 159ce5f32deSRobert Watson * Some caution is required in areas where the UNIX domain socket code enters 160ce5f32deSRobert Watson * VFS in order to create or find rendezvous points. This results in 161ce5f32deSRobert Watson * dropping of the UNIX domain socket subsystem lock, acquisition of the 162ce5f32deSRobert Watson * Giant lock, and potential sleeping. This increases the chances of races, 163ce5f32deSRobert Watson * and exposes weaknesses in the socket->protocol API by offering poor 164ce5f32deSRobert Watson * failure modes. 165ce5f32deSRobert Watson */ 1660d9ce3a1SRobert Watson static struct mtx unp_mtx; 1670d9ce3a1SRobert Watson #define UNP_LOCK_INIT() \ 16846a1d9bfSRobert Watson mtx_init(&unp_mtx, "unp", NULL, MTX_DEF | MTX_RECURSE) 1690d9ce3a1SRobert Watson #define UNP_LOCK() mtx_lock(&unp_mtx) 1700d9ce3a1SRobert Watson #define UNP_UNLOCK() mtx_unlock(&unp_mtx) 1710d9ce3a1SRobert Watson #define UNP_LOCK_ASSERT() mtx_assert(&unp_mtx, MA_OWNED) 1724c5bc1caSRobert Watson #define UNP_UNLOCK_ASSERT() mtx_assert(&unp_mtx, MA_NOTOWNED) 1730d9ce3a1SRobert Watson 174aea52f1bSRobert Watson static int unp_connect(struct socket *, struct sockaddr *, 175aea52f1bSRobert Watson struct thread *); 1766a2989fdSMatthew N. Dodd static int unp_connect2(struct socket *so, struct socket *so2, int); 1774d77a549SAlfred Perlstein static void unp_disconnect(struct unpcb *); 1784d77a549SAlfred Perlstein static void unp_shutdown(struct unpcb *); 1794d77a549SAlfred Perlstein static void unp_drop(struct unpcb *, int); 180a0ec558aSRobert Watson static void unp_gc(__unused void *, int); 1814d77a549SAlfred Perlstein static void unp_scan(struct mbuf *, void (*)(struct file *)); 1824d77a549SAlfred Perlstein static void unp_mark(struct file *); 1834d77a549SAlfred Perlstein static void unp_discard(struct file *); 1844d77a549SAlfred Perlstein static void unp_freerights(struct file **, int); 1854d77a549SAlfred Perlstein static int unp_internalize(struct mbuf **, struct thread *); 186d374e81eSRobert Watson static int unp_listen(struct socket *, struct unpcb *, int, 187d374e81eSRobert Watson struct thread *); 1885b950deaSRobert Watson static struct mbuf *unp_addsockcred(struct thread *, struct mbuf *); 189f708ef1bSPoul-Henning Kamp 190e4445a03SRobert Watson /* 191e4445a03SRobert Watson * Definitions of protocols supported in the LOCAL domain. 192e4445a03SRobert Watson */ 193e4445a03SRobert Watson static struct domain localdomain; 194e4445a03SRobert Watson static struct protosw localsw[] = { 195e4445a03SRobert Watson { 196e4445a03SRobert Watson .pr_type = SOCK_STREAM, 197e4445a03SRobert Watson .pr_domain = &localdomain, 198e4445a03SRobert Watson .pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_RIGHTS, 199e4445a03SRobert Watson .pr_ctloutput = &uipc_ctloutput, 200e4445a03SRobert Watson .pr_usrreqs = &uipc_usrreqs 201e4445a03SRobert Watson }, 202e4445a03SRobert Watson { 203e4445a03SRobert Watson .pr_type = SOCK_DGRAM, 204e4445a03SRobert Watson .pr_domain = &localdomain, 205e4445a03SRobert Watson .pr_flags = PR_ATOMIC|PR_ADDR|PR_RIGHTS, 206e4445a03SRobert Watson .pr_usrreqs = &uipc_usrreqs 207e4445a03SRobert Watson }, 208e4445a03SRobert Watson }; 209e4445a03SRobert Watson 210e4445a03SRobert Watson static struct domain localdomain = { 211e4445a03SRobert Watson .dom_family = AF_LOCAL, 212e4445a03SRobert Watson .dom_name = "local", 213e4445a03SRobert Watson .dom_init = unp_init, 214e4445a03SRobert Watson .dom_externalize = unp_externalize, 215e4445a03SRobert Watson .dom_dispose = unp_dispose, 216e4445a03SRobert Watson .dom_protosw = localsw, 217e4445a03SRobert Watson .dom_protoswNPROTOSW = &localsw[sizeof(localsw)/sizeof(localsw[0])] 218e4445a03SRobert Watson }; 219e4445a03SRobert Watson DOMAIN_SET(local); 220e4445a03SRobert Watson 221ac45e92fSRobert Watson static void 222a29f300eSGarrett Wollman uipc_abort(struct socket *so) 223df8bae1dSRodney W. Grimes { 22440f2ac28SRobert Watson struct unpcb *unp; 225df8bae1dSRodney W. Grimes 22640f2ac28SRobert Watson unp = sotounpcb(so); 2274d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_abort: unp == NULL")); 2284d4b555eSRobert Watson UNP_LOCK(); 229a29f300eSGarrett Wollman unp_drop(unp, ECONNABORTED); 230a152f8a3SRobert Watson UNP_UNLOCK(); 231df8bae1dSRodney W. Grimes } 232df8bae1dSRodney W. Grimes 233a29f300eSGarrett Wollman static int 23457bf258eSGarrett Wollman uipc_accept(struct socket *so, struct sockaddr **nam) 235a29f300eSGarrett Wollman { 23640f2ac28SRobert Watson struct unpcb *unp; 2370d9ce3a1SRobert Watson const struct sockaddr *sa; 238df8bae1dSRodney W. Grimes 239df8bae1dSRodney W. Grimes /* 2401c381b19SRobert Watson * Pass back name of connected socket, if it was bound and we are 2411c381b19SRobert Watson * still connected (our peer may have closed already!). 242df8bae1dSRodney W. Grimes */ 2434d4b555eSRobert Watson unp = sotounpcb(so); 2444d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_accept: unp == NULL")); 2450d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 2460d9ce3a1SRobert Watson UNP_LOCK(); 2470d9ce3a1SRobert Watson if (unp->unp_conn != NULL && unp->unp_conn->unp_addr != NULL) 2480d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_conn->unp_addr; 2490d9ce3a1SRobert Watson else 2500d9ce3a1SRobert Watson sa = &sun_noname; 2510d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 2520d9ce3a1SRobert Watson UNP_UNLOCK(); 253e5aeaa0cSDag-Erling Smørgrav return (0); 254a29f300eSGarrett Wollman } 255df8bae1dSRodney W. Grimes 256a29f300eSGarrett Wollman static int 257b40ce416SJulian Elischer uipc_attach(struct socket *so, int proto, struct thread *td) 258a29f300eSGarrett Wollman { 2596d32873cSRobert Watson struct unpcb *unp; 2606d32873cSRobert Watson int error; 261df8bae1dSRodney W. Grimes 2626d32873cSRobert Watson KASSERT(so->so_pcb == NULL, ("uipc_attach: so_pcb != NULL")); 2636d32873cSRobert Watson if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) { 2646d32873cSRobert Watson switch (so->so_type) { 2656d32873cSRobert Watson case SOCK_STREAM: 2666d32873cSRobert Watson error = soreserve(so, unpst_sendspace, unpst_recvspace); 2676d32873cSRobert Watson break; 2686d32873cSRobert Watson 2696d32873cSRobert Watson case SOCK_DGRAM: 2706d32873cSRobert Watson error = soreserve(so, unpdg_sendspace, unpdg_recvspace); 2716d32873cSRobert Watson break; 2726d32873cSRobert Watson 2736d32873cSRobert Watson default: 2746d32873cSRobert Watson panic("unp_attach"); 2756d32873cSRobert Watson } 2766d32873cSRobert Watson if (error) 2776d32873cSRobert Watson return (error); 2786d32873cSRobert Watson } 27946a1d9bfSRobert Watson unp = uma_zalloc(unp_zone, M_NOWAIT | M_ZERO); 2806d32873cSRobert Watson if (unp == NULL) 2816d32873cSRobert Watson return (ENOBUFS); 2826d32873cSRobert Watson LIST_INIT(&unp->unp_refs); 2836d32873cSRobert Watson unp->unp_socket = so; 2846d32873cSRobert Watson so->so_pcb = unp; 2856d32873cSRobert Watson 2869ae328fcSJohn Baldwin unp->unp_refcount = 1; 2876d32873cSRobert Watson UNP_LOCK(); 2886d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 2896d32873cSRobert Watson unp_count++; 290b7e2f3ecSRobert Watson LIST_INSERT_HEAD(so->so_type == SOCK_DGRAM ? &unp_dhead : &unp_shead, 291b7e2f3ecSRobert Watson unp, unp_link); 2926d32873cSRobert Watson UNP_UNLOCK(); 2936d32873cSRobert Watson 2946d32873cSRobert Watson return (0); 295a29f300eSGarrett Wollman } 296a29f300eSGarrett Wollman 297a29f300eSGarrett Wollman static int 298b40ce416SJulian Elischer uipc_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 299a29f300eSGarrett Wollman { 300dd47f5caSRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 301dd47f5caSRobert Watson struct vattr vattr; 302dd47f5caSRobert Watson int error, namelen; 303dd47f5caSRobert Watson struct nameidata nd; 30440f2ac28SRobert Watson struct unpcb *unp; 305dd47f5caSRobert Watson struct vnode *vp; 306dd47f5caSRobert Watson struct mount *mp; 307dd47f5caSRobert Watson char *buf; 308a29f300eSGarrett Wollman 30940f2ac28SRobert Watson unp = sotounpcb(so); 3104d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_bind: unp == NULL")); 3114f1f0ef5SRobert Watson 3124f1f0ef5SRobert Watson namelen = soun->sun_len - offsetof(struct sockaddr_un, sun_path); 3134f1f0ef5SRobert Watson if (namelen <= 0) 3144f1f0ef5SRobert Watson return (EINVAL); 315dd47f5caSRobert Watson 316dd47f5caSRobert Watson /* 3174f1f0ef5SRobert Watson * We don't allow simultaneous bind() calls on a single UNIX domain 3184f1f0ef5SRobert Watson * socket, so flag in-progress operations, and return an error if an 3194f1f0ef5SRobert Watson * operation is already in progress. 3204f1f0ef5SRobert Watson * 3214f1f0ef5SRobert Watson * Historically, we have not allowed a socket to be rebound, so this 3224f1f0ef5SRobert Watson * also returns an error. Not allowing re-binding certainly 3234f1f0ef5SRobert Watson * simplifies the implementation and avoids a great many possible 3244f1f0ef5SRobert Watson * failure modes. 325dd47f5caSRobert Watson */ 3264f1f0ef5SRobert Watson UNP_LOCK(); 327dd47f5caSRobert Watson if (unp->unp_vnode != NULL) { 32840f2ac28SRobert Watson UNP_UNLOCK(); 329dd47f5caSRobert Watson return (EINVAL); 330dd47f5caSRobert Watson } 3314f1f0ef5SRobert Watson if (unp->unp_flags & UNP_BINDING) { 332dd47f5caSRobert Watson UNP_UNLOCK(); 3334f1f0ef5SRobert Watson return (EALREADY); 334dd47f5caSRobert Watson } 3354f1f0ef5SRobert Watson unp->unp_flags |= UNP_BINDING; 336dd47f5caSRobert Watson UNP_UNLOCK(); 337dd47f5caSRobert Watson 338dd47f5caSRobert Watson buf = malloc(namelen + 1, M_TEMP, M_WAITOK); 339dd47f5caSRobert Watson strlcpy(buf, soun->sun_path, namelen + 1); 340dd47f5caSRobert Watson 341dd47f5caSRobert Watson mtx_lock(&Giant); 342dd47f5caSRobert Watson restart: 343dd47f5caSRobert Watson mtx_assert(&Giant, MA_OWNED); 344dd47f5caSRobert Watson NDINIT(&nd, CREATE, NOFOLLOW | LOCKPARENT | SAVENAME, UIO_SYSSPACE, 345dd47f5caSRobert Watson buf, td); 346dd47f5caSRobert Watson /* SHOULD BE ABLE TO ADOPT EXISTING AND wakeup() ALA FIFO's */ 347dd47f5caSRobert Watson error = namei(&nd); 348dd47f5caSRobert Watson if (error) 3494f1f0ef5SRobert Watson goto error; 350dd47f5caSRobert Watson vp = nd.ni_vp; 351dd47f5caSRobert Watson if (vp != NULL || vn_start_write(nd.ni_dvp, &mp, V_NOWAIT) != 0) { 352dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 353dd47f5caSRobert Watson if (nd.ni_dvp == vp) 354dd47f5caSRobert Watson vrele(nd.ni_dvp); 355dd47f5caSRobert Watson else 356dd47f5caSRobert Watson vput(nd.ni_dvp); 357dd47f5caSRobert Watson if (vp != NULL) { 358dd47f5caSRobert Watson vrele(vp); 359dd47f5caSRobert Watson error = EADDRINUSE; 3604f1f0ef5SRobert Watson goto error; 361dd47f5caSRobert Watson } 362dd47f5caSRobert Watson error = vn_start_write(NULL, &mp, V_XSLEEP | PCATCH); 363dd47f5caSRobert Watson if (error) 3644f1f0ef5SRobert Watson goto error; 365dd47f5caSRobert Watson goto restart; 366dd47f5caSRobert Watson } 367dd47f5caSRobert Watson VATTR_NULL(&vattr); 368dd47f5caSRobert Watson vattr.va_type = VSOCK; 369dd47f5caSRobert Watson vattr.va_mode = (ACCESSPERMS & ~td->td_proc->p_fd->fd_cmask); 370dd47f5caSRobert Watson #ifdef MAC 371dd47f5caSRobert Watson error = mac_check_vnode_create(td->td_ucred, nd.ni_dvp, &nd.ni_cnd, 372dd47f5caSRobert Watson &vattr); 373dd47f5caSRobert Watson #endif 374dd47f5caSRobert Watson if (error == 0) { 375dd47f5caSRobert Watson VOP_LEASE(nd.ni_dvp, td, td->td_ucred, LEASE_WRITE); 376dd47f5caSRobert Watson error = VOP_CREATE(nd.ni_dvp, &nd.ni_vp, &nd.ni_cnd, &vattr); 377dd47f5caSRobert Watson } 378dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 379dd47f5caSRobert Watson vput(nd.ni_dvp); 380dd47f5caSRobert Watson if (error) { 381dd47f5caSRobert Watson vn_finished_write(mp); 3824f1f0ef5SRobert Watson goto error; 383dd47f5caSRobert Watson } 384dd47f5caSRobert Watson vp = nd.ni_vp; 3854f1f0ef5SRobert Watson ASSERT_VOP_LOCKED(vp, "uipc_bind"); 386dd47f5caSRobert Watson soun = (struct sockaddr_un *)sodupsockaddr(nam, M_WAITOK); 387dd47f5caSRobert Watson UNP_LOCK(); 388dd47f5caSRobert Watson vp->v_socket = unp->unp_socket; 389dd47f5caSRobert Watson unp->unp_vnode = vp; 390dd47f5caSRobert Watson unp->unp_addr = soun; 3914f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 392dd47f5caSRobert Watson UNP_UNLOCK(); 393dd47f5caSRobert Watson VOP_UNLOCK(vp, 0, td); 394dd47f5caSRobert Watson vn_finished_write(mp); 3954f1f0ef5SRobert Watson mtx_unlock(&Giant); 3964f1f0ef5SRobert Watson free(buf, M_TEMP); 3974f1f0ef5SRobert Watson return (0); 3984f1f0ef5SRobert Watson error: 3994f1f0ef5SRobert Watson UNP_LOCK(); 4004f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 4014f1f0ef5SRobert Watson UNP_UNLOCK(); 402dd47f5caSRobert Watson mtx_unlock(&Giant); 403dd47f5caSRobert Watson free(buf, M_TEMP); 40440f2ac28SRobert Watson return (error); 405a29f300eSGarrett Wollman } 406a29f300eSGarrett Wollman 407a29f300eSGarrett Wollman static int 408b40ce416SJulian Elischer uipc_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 409a29f300eSGarrett Wollman { 4100d9ce3a1SRobert Watson int error; 411a29f300eSGarrett Wollman 412fd179ee9SRobert Watson KASSERT(td == curthread, ("uipc_connect: td != curthread")); 4134d4b555eSRobert Watson UNP_LOCK(); 414fd179ee9SRobert Watson error = unp_connect(so, nam, td); 4150d9ce3a1SRobert Watson UNP_UNLOCK(); 4160d9ce3a1SRobert Watson return (error); 417a29f300eSGarrett Wollman } 418a29f300eSGarrett Wollman 419a152f8a3SRobert Watson /* 420a152f8a3SRobert Watson * XXXRW: Should also unbind? 421a152f8a3SRobert Watson */ 422a152f8a3SRobert Watson static void 423a152f8a3SRobert Watson uipc_close(struct socket *so) 424a152f8a3SRobert Watson { 425a152f8a3SRobert Watson struct unpcb *unp; 426a152f8a3SRobert Watson 427a152f8a3SRobert Watson unp = sotounpcb(so); 428a152f8a3SRobert Watson KASSERT(unp != NULL, ("uipc_close: unp == NULL")); 429a152f8a3SRobert Watson UNP_LOCK(); 430a152f8a3SRobert Watson unp_disconnect(unp); 431a152f8a3SRobert Watson UNP_UNLOCK(); 432a152f8a3SRobert Watson } 433a152f8a3SRobert Watson 434db48c0d2SRobert Watson int 435a29f300eSGarrett Wollman uipc_connect2(struct socket *so1, struct socket *so2) 436a29f300eSGarrett Wollman { 43740f2ac28SRobert Watson struct unpcb *unp; 4380d9ce3a1SRobert Watson int error; 439a29f300eSGarrett Wollman 44040f2ac28SRobert Watson unp = sotounpcb(so1); 4414d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_connect2: unp == NULL")); 4424d4b555eSRobert Watson UNP_LOCK(); 4436a2989fdSMatthew N. Dodd error = unp_connect2(so1, so2, PRU_CONNECT2); 4440d9ce3a1SRobert Watson UNP_UNLOCK(); 4450d9ce3a1SRobert Watson return (error); 446a29f300eSGarrett Wollman } 447a29f300eSGarrett Wollman 448a29f300eSGarrett Wollman /* control is EOPNOTSUPP */ 449a29f300eSGarrett Wollman 450bc725eafSRobert Watson static void 451a29f300eSGarrett Wollman uipc_detach(struct socket *so) 452a29f300eSGarrett Wollman { 4539ae328fcSJohn Baldwin struct sockaddr_un *saved_unp_addr; 45440f2ac28SRobert Watson struct unpcb *unp; 4556d32873cSRobert Watson struct vnode *vp; 4569ae328fcSJohn Baldwin int freeunp, local_unp_rights; 457a29f300eSGarrett Wollman 45840f2ac28SRobert Watson unp = sotounpcb(so); 4594d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_detach: unp == NULL")); 4604d4b555eSRobert Watson UNP_LOCK(); 4616d32873cSRobert Watson LIST_REMOVE(unp, unp_link); 4626d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 4636d32873cSRobert Watson --unp_count; 4646d32873cSRobert Watson if ((vp = unp->unp_vnode) != NULL) { 4656d32873cSRobert Watson unp->unp_vnode->v_socket = NULL; 4666d32873cSRobert Watson unp->unp_vnode = NULL; 4676d32873cSRobert Watson } 4686d32873cSRobert Watson if (unp->unp_conn != NULL) 4696d32873cSRobert Watson unp_disconnect(unp); 4706d32873cSRobert Watson while (!LIST_EMPTY(&unp->unp_refs)) { 4716d32873cSRobert Watson struct unpcb *ref = LIST_FIRST(&unp->unp_refs); 4726d32873cSRobert Watson unp_drop(ref, ECONNRESET); 4736d32873cSRobert Watson } 4746d32873cSRobert Watson unp->unp_socket->so_pcb = NULL; 4756d32873cSRobert Watson local_unp_rights = unp_rights; 4769ae328fcSJohn Baldwin saved_unp_addr = unp->unp_addr; 4779ae328fcSJohn Baldwin unp->unp_addr = NULL; 4789ae328fcSJohn Baldwin unp->unp_refcount--; 4799ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 4806d32873cSRobert Watson UNP_UNLOCK(); 4819ae328fcSJohn Baldwin if (saved_unp_addr != NULL) 4829ae328fcSJohn Baldwin FREE(saved_unp_addr, M_SONAME); 4839ae328fcSJohn Baldwin if (freeunp) 4846d32873cSRobert Watson uma_zfree(unp_zone, unp); 4856d32873cSRobert Watson if (vp) { 4866d32873cSRobert Watson int vfslocked; 4876d32873cSRobert Watson 4886d32873cSRobert Watson vfslocked = VFS_LOCK_GIANT(vp->v_mount); 4896d32873cSRobert Watson vrele(vp); 4906d32873cSRobert Watson VFS_UNLOCK_GIANT(vfslocked); 4916d32873cSRobert Watson } 4926d32873cSRobert Watson if (local_unp_rights) 4936d32873cSRobert Watson taskqueue_enqueue(taskqueue_thread, &unp_gc_task); 494a29f300eSGarrett Wollman } 495a29f300eSGarrett Wollman 496a29f300eSGarrett Wollman static int 497a29f300eSGarrett Wollman uipc_disconnect(struct socket *so) 498a29f300eSGarrett Wollman { 49940f2ac28SRobert Watson struct unpcb *unp; 500a29f300eSGarrett Wollman 50140f2ac28SRobert Watson unp = sotounpcb(so); 5024d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_disconnect: unp == NULL")); 5034d4b555eSRobert Watson UNP_LOCK(); 504a29f300eSGarrett Wollman unp_disconnect(unp); 5050d9ce3a1SRobert Watson UNP_UNLOCK(); 506e5aeaa0cSDag-Erling Smørgrav return (0); 507a29f300eSGarrett Wollman } 508a29f300eSGarrett Wollman 509a29f300eSGarrett Wollman static int 510d374e81eSRobert Watson uipc_listen(struct socket *so, int backlog, struct thread *td) 511a29f300eSGarrett Wollman { 51240f2ac28SRobert Watson struct unpcb *unp; 5130d9ce3a1SRobert Watson int error; 514a29f300eSGarrett Wollman 51540f2ac28SRobert Watson unp = sotounpcb(so); 5164d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_listen: unp == NULL")); 5174d4b555eSRobert Watson UNP_LOCK(); 5184d4b555eSRobert Watson if (unp->unp_vnode == NULL) { 51940f2ac28SRobert Watson UNP_UNLOCK(); 52040f2ac28SRobert Watson return (EINVAL); 52140f2ac28SRobert Watson } 522d374e81eSRobert Watson error = unp_listen(so, unp, backlog, td); 5230d9ce3a1SRobert Watson UNP_UNLOCK(); 5240d9ce3a1SRobert Watson return (error); 525a29f300eSGarrett Wollman } 526a29f300eSGarrett Wollman 527a29f300eSGarrett Wollman static int 52857bf258eSGarrett Wollman uipc_peeraddr(struct socket *so, struct sockaddr **nam) 529a29f300eSGarrett Wollman { 53040f2ac28SRobert Watson struct unpcb *unp; 5310d9ce3a1SRobert Watson const struct sockaddr *sa; 532a29f300eSGarrett Wollman 5334d4b555eSRobert Watson unp = sotounpcb(so); 5344d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_peeraddr: unp == NULL")); 5350d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 5360d9ce3a1SRobert Watson UNP_LOCK(); 537fc3fcacfSRobert Watson if (unp->unp_conn != NULL && unp->unp_conn->unp_addr!= NULL) 5380d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_conn->unp_addr; 539bdc5f6a3SHajimu UMEMOTO else { 540bdc5f6a3SHajimu UMEMOTO /* 541bdc5f6a3SHajimu UMEMOTO * XXX: It seems that this test always fails even when 542bdc5f6a3SHajimu UMEMOTO * connection is established. So, this else clause is 543bdc5f6a3SHajimu UMEMOTO * added as workaround to return PF_LOCAL sockaddr. 544bdc5f6a3SHajimu UMEMOTO */ 5450d9ce3a1SRobert Watson sa = &sun_noname; 546bdc5f6a3SHajimu UMEMOTO } 5470d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 5480d9ce3a1SRobert Watson UNP_UNLOCK(); 549e5aeaa0cSDag-Erling Smørgrav return (0); 550a29f300eSGarrett Wollman } 551a29f300eSGarrett Wollman 552a29f300eSGarrett Wollman static int 553a29f300eSGarrett Wollman uipc_rcvd(struct socket *so, int flags) 554a29f300eSGarrett Wollman { 55540f2ac28SRobert Watson struct unpcb *unp; 556a29f300eSGarrett Wollman struct socket *so2; 557337cc6b6SRobert Watson u_int mbcnt, sbcc; 5586aef685fSBrian Feldman u_long newhiwat; 559a29f300eSGarrett Wollman 56040f2ac28SRobert Watson unp = sotounpcb(so); 5614d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_rcvd: unp == NULL")); 562df8bae1dSRodney W. Grimes switch (so->so_type) { 563df8bae1dSRodney W. Grimes case SOCK_DGRAM: 564a29f300eSGarrett Wollman panic("uipc_rcvd DGRAM?"); 565df8bae1dSRodney W. Grimes /*NOTREACHED*/ 566df8bae1dSRodney W. Grimes 567df8bae1dSRodney W. Grimes case SOCK_STREAM: 568df8bae1dSRodney W. Grimes /* 5691c381b19SRobert Watson * Adjust backpressure on sender and wakeup any waiting to 5701c381b19SRobert Watson * write. 571df8bae1dSRodney W. Grimes */ 572337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 573337cc6b6SRobert Watson mbcnt = so->so_rcv.sb_mbcnt; 574337cc6b6SRobert Watson sbcc = so->so_rcv.sb_cc; 575337cc6b6SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 576337cc6b6SRobert Watson UNP_LOCK(); 577337cc6b6SRobert Watson if (unp->unp_conn == NULL) { 578337cc6b6SRobert Watson UNP_UNLOCK(); 579337cc6b6SRobert Watson break; 580337cc6b6SRobert Watson } 581337cc6b6SRobert Watson so2 = unp->unp_conn->unp_socket; 582337cc6b6SRobert Watson SOCKBUF_LOCK(&so2->so_snd); 583337cc6b6SRobert Watson so2->so_snd.sb_mbmax += unp->unp_mbcnt - mbcnt; 584337cc6b6SRobert Watson newhiwat = so2->so_snd.sb_hiwat + unp->unp_cc - sbcc; 585f535380cSDon Lewis (void)chgsbsize(so2->so_cred->cr_uidinfo, &so2->so_snd.sb_hiwat, 5866aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 5871e4d7da7SRobert Watson sowwakeup_locked(so2); 588337cc6b6SRobert Watson unp->unp_mbcnt = mbcnt; 589337cc6b6SRobert Watson unp->unp_cc = sbcc; 590337cc6b6SRobert Watson UNP_UNLOCK(); 591df8bae1dSRodney W. Grimes break; 592df8bae1dSRodney W. Grimes 593df8bae1dSRodney W. Grimes default: 594a29f300eSGarrett Wollman panic("uipc_rcvd unknown socktype"); 595df8bae1dSRodney W. Grimes } 596e5aeaa0cSDag-Erling Smørgrav return (0); 597a29f300eSGarrett Wollman } 598df8bae1dSRodney W. Grimes 599a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */ 600a29f300eSGarrett Wollman 601a29f300eSGarrett Wollman static int 60257bf258eSGarrett Wollman uipc_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam, 603b40ce416SJulian Elischer struct mbuf *control, struct thread *td) 604a29f300eSGarrett Wollman { 605f3f49bbbSRobert Watson struct unpcb *unp, *unp2; 606a29f300eSGarrett Wollman struct socket *so2; 607337cc6b6SRobert Watson u_int mbcnt, sbcc; 6086aef685fSBrian Feldman u_long newhiwat; 609f3f49bbbSRobert Watson int error = 0; 610a29f300eSGarrett Wollman 61140f2ac28SRobert Watson unp = sotounpcb(so); 6124d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_send: unp == NULL")); 613a29f300eSGarrett Wollman if (flags & PRUS_OOB) { 614a29f300eSGarrett Wollman error = EOPNOTSUPP; 615a29f300eSGarrett Wollman goto release; 616a29f300eSGarrett Wollman } 617a29f300eSGarrett Wollman 618fc3fcacfSRobert Watson if (control != NULL && (error = unp_internalize(&control, td))) 619a29f300eSGarrett Wollman goto release; 620df8bae1dSRodney W. Grimes 6210d9ce3a1SRobert Watson UNP_LOCK(); 622a29f300eSGarrett Wollman switch (so->so_type) { 623a29f300eSGarrett Wollman case SOCK_DGRAM: 624a29f300eSGarrett Wollman { 625e7dd9a10SRobert Watson const struct sockaddr *from; 626df8bae1dSRodney W. Grimes 627fc3fcacfSRobert Watson if (nam != NULL) { 628fc3fcacfSRobert Watson if (unp->unp_conn != NULL) { 629df8bae1dSRodney W. Grimes error = EISCONN; 630df8bae1dSRodney W. Grimes break; 631df8bae1dSRodney W. Grimes } 632b40ce416SJulian Elischer error = unp_connect(so, nam, td); 633df8bae1dSRodney W. Grimes if (error) 634df8bae1dSRodney W. Grimes break; 635df8bae1dSRodney W. Grimes } 636b5ff0914SRobert Watson /* 637b5ff0914SRobert Watson * Because connect() and send() are non-atomic in a sendto() 638b5ff0914SRobert Watson * with a target address, it's possible that the socket will 639b5ff0914SRobert Watson * have disconnected before the send() can run. In that case 640b5ff0914SRobert Watson * return the slightly counter-intuitive but otherwise 641b5ff0914SRobert Watson * correct error that the socket is not connected. 642b5ff0914SRobert Watson */ 643f3f49bbbSRobert Watson unp2 = unp->unp_conn; 644b5ff0914SRobert Watson if (unp2 == NULL) { 645b5ff0914SRobert Watson error = ENOTCONN; 646b5ff0914SRobert Watson break; 647b5ff0914SRobert Watson } 648f3f49bbbSRobert Watson so2 = unp2->unp_socket; 649fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 65057bf258eSGarrett Wollman from = (struct sockaddr *)unp->unp_addr; 651df8bae1dSRodney W. Grimes else 652df8bae1dSRodney W. Grimes from = &sun_noname; 653f3f49bbbSRobert Watson if (unp2->unp_flags & UNP_WANTCRED) 6546a2989fdSMatthew N. Dodd control = unp_addsockcred(td, control); 655a34b7046SRobert Watson SOCKBUF_LOCK(&so2->so_rcv); 656a34b7046SRobert Watson if (sbappendaddr_locked(&so2->so_rcv, from, m, control)) { 6571e4d7da7SRobert Watson sorwakeup_locked(so2); 658fc3fcacfSRobert Watson m = NULL; 659fc3fcacfSRobert Watson control = NULL; 660e5aeaa0cSDag-Erling Smørgrav } else { 661a34b7046SRobert Watson SOCKBUF_UNLOCK(&so2->so_rcv); 662df8bae1dSRodney W. Grimes error = ENOBUFS; 663e5aeaa0cSDag-Erling Smørgrav } 664fc3fcacfSRobert Watson if (nam != NULL) 665df8bae1dSRodney W. Grimes unp_disconnect(unp); 666df8bae1dSRodney W. Grimes break; 667df8bae1dSRodney W. Grimes } 668df8bae1dSRodney W. Grimes 669df8bae1dSRodney W. Grimes case SOCK_STREAM: 6706b8fda4dSGarrett Wollman /* 6711c381b19SRobert Watson * Connect if not connected yet. 6721c381b19SRobert Watson * 6731c381b19SRobert Watson * Note: A better implementation would complain if not equal 6741c381b19SRobert Watson * to the peer's address. 6756b8fda4dSGarrett Wollman */ 676402cc72dSDavid Greenman if ((so->so_state & SS_ISCONNECTED) == 0) { 677fc3fcacfSRobert Watson if (nam != NULL) { 678b40ce416SJulian Elischer error = unp_connect(so, nam, td); 679402cc72dSDavid Greenman if (error) 6806b8fda4dSGarrett Wollman break; /* XXX */ 681402cc72dSDavid Greenman } else { 682402cc72dSDavid Greenman error = ENOTCONN; 683402cc72dSDavid Greenman break; 684402cc72dSDavid Greenman } 685402cc72dSDavid Greenman } 686402cc72dSDavid Greenman 687337cc6b6SRobert Watson /* Lockless read. */ 688c0b99ffaSRobert Watson if (so->so_snd.sb_state & SBS_CANTSENDMORE) { 689df8bae1dSRodney W. Grimes error = EPIPE; 690df8bae1dSRodney W. Grimes break; 691df8bae1dSRodney W. Grimes } 692b5ff0914SRobert Watson /* 693b5ff0914SRobert Watson * Because connect() and send() are non-atomic in a sendto() 694b5ff0914SRobert Watson * with a target address, it's possible that the socket will 695b5ff0914SRobert Watson * have disconnected before the send() can run. In that case 696b5ff0914SRobert Watson * return the slightly counter-intuitive but otherwise 697b5ff0914SRobert Watson * correct error that the socket is not connected. 698b5ff0914SRobert Watson */ 699f3f49bbbSRobert Watson unp2 = unp->unp_conn; 700b5ff0914SRobert Watson if (unp2 == NULL) { 701b5ff0914SRobert Watson error = ENOTCONN; 702b5ff0914SRobert Watson break; 703b5ff0914SRobert Watson } 704f3f49bbbSRobert Watson so2 = unp2->unp_socket; 705a34b7046SRobert Watson SOCKBUF_LOCK(&so2->so_rcv); 706f3f49bbbSRobert Watson if (unp2->unp_flags & UNP_WANTCRED) { 7076a2989fdSMatthew N. Dodd /* 7086a2989fdSMatthew N. Dodd * Credentials are passed only once on 7096a2989fdSMatthew N. Dodd * SOCK_STREAM. 7106a2989fdSMatthew N. Dodd */ 711f3f49bbbSRobert Watson unp2->unp_flags &= ~UNP_WANTCRED; 7126a2989fdSMatthew N. Dodd control = unp_addsockcred(td, control); 7136a2989fdSMatthew N. Dodd } 714df8bae1dSRodney W. Grimes /* 7151c381b19SRobert Watson * Send to paired receive port, and then reduce send buffer 7161c381b19SRobert Watson * hiwater marks to maintain backpressure. Wake up readers. 717df8bae1dSRodney W. Grimes */ 718fc3fcacfSRobert Watson if (control != NULL) { 719a34b7046SRobert Watson if (sbappendcontrol_locked(&so2->so_rcv, m, control)) 720fc3fcacfSRobert Watson control = NULL; 721e5aeaa0cSDag-Erling Smørgrav } else { 722a34b7046SRobert Watson sbappend_locked(&so2->so_rcv, m); 723e5aeaa0cSDag-Erling Smørgrav } 724f3f49bbbSRobert Watson mbcnt = so2->so_rcv.sb_mbcnt - unp2->unp_mbcnt; 725f3f49bbbSRobert Watson unp2->unp_mbcnt = so2->so_rcv.sb_mbcnt; 726337cc6b6SRobert Watson sbcc = so2->so_rcv.sb_cc; 727337cc6b6SRobert Watson sorwakeup_locked(so2); 728337cc6b6SRobert Watson 729337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_snd); 730f3f49bbbSRobert Watson newhiwat = so->so_snd.sb_hiwat - (sbcc - unp2->unp_cc); 731f535380cSDon Lewis (void)chgsbsize(so->so_cred->cr_uidinfo, &so->so_snd.sb_hiwat, 7326aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 733337cc6b6SRobert Watson so->so_snd.sb_mbmax -= mbcnt; 7347abe2ac2SAlan Cox SOCKBUF_UNLOCK(&so->so_snd); 735337cc6b6SRobert Watson 736f3f49bbbSRobert Watson unp2->unp_cc = sbcc; 737fc3fcacfSRobert Watson m = NULL; 738df8bae1dSRodney W. Grimes break; 739df8bae1dSRodney W. Grimes 740df8bae1dSRodney W. Grimes default: 741a29f300eSGarrett Wollman panic("uipc_send unknown socktype"); 742df8bae1dSRodney W. Grimes } 743a29f300eSGarrett Wollman 7446b8fda4dSGarrett Wollman /* 7456b8fda4dSGarrett Wollman * SEND_EOF is equivalent to a SEND followed by 7466b8fda4dSGarrett Wollman * a SHUTDOWN. 7476b8fda4dSGarrett Wollman */ 748a29f300eSGarrett Wollman if (flags & PRUS_EOF) { 7496b8fda4dSGarrett Wollman socantsendmore(so); 7506b8fda4dSGarrett Wollman unp_shutdown(unp); 7516b8fda4dSGarrett Wollman } 7520d9ce3a1SRobert Watson UNP_UNLOCK(); 753df8bae1dSRodney W. Grimes 754fc3fcacfSRobert Watson if (control != NULL && error != 0) 755bd508d39SDon Lewis unp_dispose(control); 756bd508d39SDon Lewis 757a29f300eSGarrett Wollman release: 758fc3fcacfSRobert Watson if (control != NULL) 759a29f300eSGarrett Wollman m_freem(control); 760fc3fcacfSRobert Watson if (m != NULL) 761a29f300eSGarrett Wollman m_freem(m); 762e5aeaa0cSDag-Erling Smørgrav return (error); 763a29f300eSGarrett Wollman } 764df8bae1dSRodney W. Grimes 765a29f300eSGarrett Wollman static int 766a29f300eSGarrett Wollman uipc_sense(struct socket *so, struct stat *sb) 767a29f300eSGarrett Wollman { 76840f2ac28SRobert Watson struct unpcb *unp; 769a29f300eSGarrett Wollman struct socket *so2; 770a29f300eSGarrett Wollman 77140f2ac28SRobert Watson unp = sotounpcb(so); 7724d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sense: unp == NULL")); 7734d4b555eSRobert Watson UNP_LOCK(); 774a29f300eSGarrett Wollman sb->st_blksize = so->so_snd.sb_hiwat; 775fc3fcacfSRobert Watson if (so->so_type == SOCK_STREAM && unp->unp_conn != NULL) { 776df8bae1dSRodney W. Grimes so2 = unp->unp_conn->unp_socket; 777a29f300eSGarrett Wollman sb->st_blksize += so2->so_rcv.sb_cc; 778df8bae1dSRodney W. Grimes } 779f3732fd1SPoul-Henning Kamp sb->st_dev = NODEV; 780df8bae1dSRodney W. Grimes if (unp->unp_ino == 0) 7816f782c46SJeffrey Hsu unp->unp_ino = (++unp_ino == 0) ? ++unp_ino : unp_ino; 782a29f300eSGarrett Wollman sb->st_ino = unp->unp_ino; 7830d9ce3a1SRobert Watson UNP_UNLOCK(); 784df8bae1dSRodney W. Grimes return (0); 785a29f300eSGarrett Wollman } 786df8bae1dSRodney W. Grimes 787a29f300eSGarrett Wollman static int 788a29f300eSGarrett Wollman uipc_shutdown(struct socket *so) 789a29f300eSGarrett Wollman { 79040f2ac28SRobert Watson struct unpcb *unp; 791df8bae1dSRodney W. Grimes 79240f2ac28SRobert Watson unp = sotounpcb(so); 7934d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_shutdown: unp == NULL")); 7944d4b555eSRobert Watson UNP_LOCK(); 795a29f300eSGarrett Wollman socantsendmore(so); 796a29f300eSGarrett Wollman unp_shutdown(unp); 7970d9ce3a1SRobert Watson UNP_UNLOCK(); 798e5aeaa0cSDag-Erling Smørgrav return (0); 799a29f300eSGarrett Wollman } 800df8bae1dSRodney W. Grimes 801a29f300eSGarrett Wollman static int 80257bf258eSGarrett Wollman uipc_sockaddr(struct socket *so, struct sockaddr **nam) 803a29f300eSGarrett Wollman { 80440f2ac28SRobert Watson struct unpcb *unp; 8050d9ce3a1SRobert Watson const struct sockaddr *sa; 806a29f300eSGarrett Wollman 8074d4b555eSRobert Watson unp = sotounpcb(so); 8084d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sockaddr: unp == NULL")); 8090d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 8100d9ce3a1SRobert Watson UNP_LOCK(); 811fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 8120d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_addr; 81383f3198bSThomas Moestl else 8140d9ce3a1SRobert Watson sa = &sun_noname; 8150d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 8160d9ce3a1SRobert Watson UNP_UNLOCK(); 817e5aeaa0cSDag-Erling Smørgrav return (0); 818df8bae1dSRodney W. Grimes } 819a29f300eSGarrett Wollman 820a29f300eSGarrett Wollman struct pr_usrreqs uipc_usrreqs = { 821756d52a1SPoul-Henning Kamp .pru_abort = uipc_abort, 822756d52a1SPoul-Henning Kamp .pru_accept = uipc_accept, 823756d52a1SPoul-Henning Kamp .pru_attach = uipc_attach, 824756d52a1SPoul-Henning Kamp .pru_bind = uipc_bind, 825756d52a1SPoul-Henning Kamp .pru_connect = uipc_connect, 826756d52a1SPoul-Henning Kamp .pru_connect2 = uipc_connect2, 827756d52a1SPoul-Henning Kamp .pru_detach = uipc_detach, 828756d52a1SPoul-Henning Kamp .pru_disconnect = uipc_disconnect, 829756d52a1SPoul-Henning Kamp .pru_listen = uipc_listen, 830756d52a1SPoul-Henning Kamp .pru_peeraddr = uipc_peeraddr, 831756d52a1SPoul-Henning Kamp .pru_rcvd = uipc_rcvd, 832756d52a1SPoul-Henning Kamp .pru_send = uipc_send, 833756d52a1SPoul-Henning Kamp .pru_sense = uipc_sense, 834756d52a1SPoul-Henning Kamp .pru_shutdown = uipc_shutdown, 835756d52a1SPoul-Henning Kamp .pru_sockaddr = uipc_sockaddr, 836a152f8a3SRobert Watson .pru_close = uipc_close, 837a29f300eSGarrett Wollman }; 838df8bae1dSRodney W. Grimes 8390c1bb4fbSDima Dorfman int 840892af6b9SRobert Watson uipc_ctloutput(struct socket *so, struct sockopt *sopt) 8410c1bb4fbSDima Dorfman { 84240f2ac28SRobert Watson struct unpcb *unp; 8430d9ce3a1SRobert Watson struct xucred xu; 8446a2989fdSMatthew N. Dodd int error, optval; 8456a2989fdSMatthew N. Dodd 84696a041b5SMatthew N. Dodd if (sopt->sopt_level != 0) 84796a041b5SMatthew N. Dodd return (EINVAL); 84896a041b5SMatthew N. Dodd 8496a2989fdSMatthew N. Dodd unp = sotounpcb(so); 8504d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_ctloutput: unp == NULL")); 8516a2989fdSMatthew N. Dodd error = 0; 8520c1bb4fbSDima Dorfman switch (sopt->sopt_dir) { 8530c1bb4fbSDima Dorfman case SOPT_GET: 8540c1bb4fbSDima Dorfman switch (sopt->sopt_name) { 8550c1bb4fbSDima Dorfman case LOCAL_PEERCRED: 8561f837c47SRobert Watson UNP_LOCK(); 8570c1bb4fbSDima Dorfman if (unp->unp_flags & UNP_HAVEPC) 8580d9ce3a1SRobert Watson xu = unp->unp_peercred; 8590c1bb4fbSDima Dorfman else { 8600c1bb4fbSDima Dorfman if (so->so_type == SOCK_STREAM) 8610c1bb4fbSDima Dorfman error = ENOTCONN; 8620c1bb4fbSDima Dorfman else 8630c1bb4fbSDima Dorfman error = EINVAL; 8640c1bb4fbSDima Dorfman } 8651f837c47SRobert Watson UNP_UNLOCK(); 8660d9ce3a1SRobert Watson if (error == 0) 8670d9ce3a1SRobert Watson error = sooptcopyout(sopt, &xu, sizeof(xu)); 8680c1bb4fbSDima Dorfman break; 8696a2989fdSMatthew N. Dodd case LOCAL_CREDS: 8701f837c47SRobert Watson /* Unocked read. */ 8716a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_WANTCRED ? 1 : 0; 8726a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 8736a2989fdSMatthew N. Dodd break; 8746a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 8751f837c47SRobert Watson /* Unocked read. */ 8766a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_CONNWAIT ? 1 : 0; 8776a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 8786a2989fdSMatthew N. Dodd break; 8790c1bb4fbSDima Dorfman default: 8800c1bb4fbSDima Dorfman error = EOPNOTSUPP; 8810c1bb4fbSDima Dorfman break; 8820c1bb4fbSDima Dorfman } 8830c1bb4fbSDima Dorfman break; 8840c1bb4fbSDima Dorfman case SOPT_SET: 8856a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 8866a2989fdSMatthew N. Dodd case LOCAL_CREDS: 8876a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 8886a2989fdSMatthew N. Dodd error = sooptcopyin(sopt, &optval, sizeof(optval), 8896a2989fdSMatthew N. Dodd sizeof(optval)); 8906a2989fdSMatthew N. Dodd if (error) 8916a2989fdSMatthew N. Dodd break; 8926a2989fdSMatthew N. Dodd 8936a2989fdSMatthew N. Dodd #define OPTSET(bit) \ 8946a2989fdSMatthew N. Dodd if (optval) \ 8956a2989fdSMatthew N. Dodd unp->unp_flags |= bit; \ 8966a2989fdSMatthew N. Dodd else \ 8976a2989fdSMatthew N. Dodd unp->unp_flags &= ~bit; 8986a2989fdSMatthew N. Dodd 8991f837c47SRobert Watson UNP_LOCK(); 9006a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 9016a2989fdSMatthew N. Dodd case LOCAL_CREDS: 9026a2989fdSMatthew N. Dodd OPTSET(UNP_WANTCRED); 9036a2989fdSMatthew N. Dodd break; 9046a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 9056a2989fdSMatthew N. Dodd OPTSET(UNP_CONNWAIT); 9066a2989fdSMatthew N. Dodd break; 9076a2989fdSMatthew N. Dodd default: 9086a2989fdSMatthew N. Dodd break; 9096a2989fdSMatthew N. Dodd } 9101f837c47SRobert Watson UNP_UNLOCK(); 9116a2989fdSMatthew N. Dodd break; 9126a2989fdSMatthew N. Dodd #undef OPTSET 9136a2989fdSMatthew N. Dodd default: 9146a2989fdSMatthew N. Dodd error = ENOPROTOOPT; 9156a2989fdSMatthew N. Dodd break; 9166a2989fdSMatthew N. Dodd } 917abb886faSMatthew N. Dodd break; 9180c1bb4fbSDima Dorfman default: 9190c1bb4fbSDima Dorfman error = EOPNOTSUPP; 9200c1bb4fbSDima Dorfman break; 9210c1bb4fbSDima Dorfman } 9220c1bb4fbSDima Dorfman return (error); 9230c1bb4fbSDima Dorfman } 9240c1bb4fbSDima Dorfman 925f708ef1bSPoul-Henning Kamp static int 926892af6b9SRobert Watson unp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 927df8bae1dSRodney W. Grimes { 928892af6b9SRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 929892af6b9SRobert Watson struct vnode *vp; 930892af6b9SRobert Watson struct socket *so2, *so3; 931b295bdcdSRobert Watson struct unpcb *unp, *unp2, *unp3; 93257bf258eSGarrett Wollman int error, len; 933df8bae1dSRodney W. Grimes struct nameidata nd; 93457bf258eSGarrett Wollman char buf[SOCK_MAXADDRLEN]; 9350d9ce3a1SRobert Watson struct sockaddr *sa; 9360d9ce3a1SRobert Watson 9370d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 938df8bae1dSRodney W. Grimes 9394d4b555eSRobert Watson unp = sotounpcb(so); 9404d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 94157bf258eSGarrett Wollman len = nam->sa_len - offsetof(struct sockaddr_un, sun_path); 94257bf258eSGarrett Wollman if (len <= 0) 943e5aeaa0cSDag-Erling Smørgrav return (EINVAL); 94455c85568SRobert Drehmel strlcpy(buf, soun->sun_path, len + 1); 9454f1f0ef5SRobert Watson if (unp->unp_flags & UNP_CONNECTING) { 9464f1f0ef5SRobert Watson UNP_UNLOCK(); 9474f1f0ef5SRobert Watson return (EALREADY); 9484f1f0ef5SRobert Watson } 94905102f04SRobert Watson unp->unp_flags |= UNP_CONNECTING; 9500d9ce3a1SRobert Watson UNP_UNLOCK(); 9510d9ce3a1SRobert Watson sa = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 9520d9ce3a1SRobert Watson mtx_lock(&Giant); 953b40ce416SJulian Elischer NDINIT(&nd, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, buf, td); 954797f2d22SPoul-Henning Kamp error = namei(&nd); 955797f2d22SPoul-Henning Kamp if (error) 9560d9ce3a1SRobert Watson vp = NULL; 9570d9ce3a1SRobert Watson else 958df8bae1dSRodney W. Grimes vp = nd.ni_vp; 9590d9ce3a1SRobert Watson ASSERT_VOP_LOCKED(vp, "unp_connect"); 960762e6b85SEivind Eklund NDFREE(&nd, NDF_ONLY_PNBUF); 9610d9ce3a1SRobert Watson if (error) 9620d9ce3a1SRobert Watson goto bad; 9630d9ce3a1SRobert Watson 964df8bae1dSRodney W. Grimes if (vp->v_type != VSOCK) { 965df8bae1dSRodney W. Grimes error = ENOTSOCK; 966df8bae1dSRodney W. Grimes goto bad; 967df8bae1dSRodney W. Grimes } 9686fac927cSRobert Watson #ifdef MAC 9696fac927cSRobert Watson error = mac_check_vnode_open(td->td_ucred, vp, VWRITE | VREAD); 9706fac927cSRobert Watson if (error) 9716fac927cSRobert Watson goto bad; 9726fac927cSRobert Watson #endif 973a854ed98SJohn Baldwin error = VOP_ACCESS(vp, VWRITE, td->td_ucred, td); 974797f2d22SPoul-Henning Kamp if (error) 975df8bae1dSRodney W. Grimes goto bad; 9762260c03dSRobert Watson mtx_unlock(&Giant); 9772260c03dSRobert Watson UNP_LOCK(); 978b295bdcdSRobert Watson unp = sotounpcb(so); 9794d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 980df8bae1dSRodney W. Grimes so2 = vp->v_socket; 981fc3fcacfSRobert Watson if (so2 == NULL) { 982df8bae1dSRodney W. Grimes error = ECONNREFUSED; 9832260c03dSRobert Watson goto bad2; 984df8bae1dSRodney W. Grimes } 985df8bae1dSRodney W. Grimes if (so->so_type != so2->so_type) { 986df8bae1dSRodney W. Grimes error = EPROTOTYPE; 9872260c03dSRobert Watson goto bad2; 988df8bae1dSRodney W. Grimes } 989df8bae1dSRodney W. Grimes if (so->so_proto->pr_flags & PR_CONNREQUIRED) { 99046a1d9bfSRobert Watson if (so2->so_options & SO_ACCEPTCONN) 9910d9ce3a1SRobert Watson so3 = sonewconn(so2, 0); 99246a1d9bfSRobert Watson else 9930d9ce3a1SRobert Watson so3 = NULL; 9940d9ce3a1SRobert Watson if (so3 == NULL) { 995df8bae1dSRodney W. Grimes error = ECONNREFUSED; 9960d9ce3a1SRobert Watson goto bad2; 997df8bae1dSRodney W. Grimes } 9980c1bb4fbSDima Dorfman unp = sotounpcb(so); 999df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 1000df8bae1dSRodney W. Grimes unp3 = sotounpcb(so3); 10010d9ce3a1SRobert Watson if (unp2->unp_addr != NULL) { 10020d9ce3a1SRobert Watson bcopy(unp2->unp_addr, sa, unp2->unp_addr->sun_len); 10030d9ce3a1SRobert Watson unp3->unp_addr = (struct sockaddr_un *) sa; 10040d9ce3a1SRobert Watson sa = NULL; 10050d9ce3a1SRobert Watson } 10060c1bb4fbSDima Dorfman /* 10070c1bb4fbSDima Dorfman * unp_peercred management: 10080c1bb4fbSDima Dorfman * 10091c381b19SRobert Watson * The connecter's (client's) credentials are copied from its 10101c381b19SRobert Watson * process structure at the time of connect() (which is now). 10110c1bb4fbSDima Dorfman */ 1012a854ed98SJohn Baldwin cru2x(td->td_ucred, &unp3->unp_peercred); 10130c1bb4fbSDima Dorfman unp3->unp_flags |= UNP_HAVEPC; 10140c1bb4fbSDima Dorfman /* 10151c381b19SRobert Watson * The receiver's (server's) credentials are copied from the 10161c381b19SRobert Watson * unp_peercred member of socket on which the former called 10171c381b19SRobert Watson * listen(); unp_listen() cached that process's credentials 10181c381b19SRobert Watson * at that time so we can use them now. 10190c1bb4fbSDima Dorfman */ 10200c1bb4fbSDima Dorfman KASSERT(unp2->unp_flags & UNP_HAVEPCCACHED, 10210c1bb4fbSDima Dorfman ("unp_connect: listener without cached peercred")); 10220c1bb4fbSDima Dorfman memcpy(&unp->unp_peercred, &unp2->unp_peercred, 10230c1bb4fbSDima Dorfman sizeof(unp->unp_peercred)); 10240c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPC; 1025481f8fe8SMaxim Konovalov if (unp2->unp_flags & UNP_WANTCRED) 1026481f8fe8SMaxim Konovalov unp3->unp_flags |= UNP_WANTCRED; 1027335654d7SRobert Watson #ifdef MAC 1028310e7cebSRobert Watson SOCK_LOCK(so); 1029335654d7SRobert Watson mac_set_socket_peer_from_socket(so, so3); 1030335654d7SRobert Watson mac_set_socket_peer_from_socket(so3, so); 1031310e7cebSRobert Watson SOCK_UNLOCK(so); 1032335654d7SRobert Watson #endif 10330c1bb4fbSDima Dorfman 1034df8bae1dSRodney W. Grimes so2 = so3; 1035df8bae1dSRodney W. Grimes } 10366a2989fdSMatthew N. Dodd error = unp_connect2(so, so2, PRU_CONNECT); 10370d9ce3a1SRobert Watson bad2: 10380d9ce3a1SRobert Watson UNP_UNLOCK(); 10390d9ce3a1SRobert Watson mtx_lock(&Giant); 1040df8bae1dSRodney W. Grimes bad: 10410d9ce3a1SRobert Watson mtx_assert(&Giant, MA_OWNED); 10420d9ce3a1SRobert Watson if (vp != NULL) 1043df8bae1dSRodney W. Grimes vput(vp); 10440d9ce3a1SRobert Watson mtx_unlock(&Giant); 10450d9ce3a1SRobert Watson free(sa, M_SONAME); 10460d9ce3a1SRobert Watson UNP_LOCK(); 10474f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_CONNECTING; 1048df8bae1dSRodney W. Grimes return (error); 1049df8bae1dSRodney W. Grimes } 1050df8bae1dSRodney W. Grimes 1051db48c0d2SRobert Watson static int 10526a2989fdSMatthew N. Dodd unp_connect2(struct socket *so, struct socket *so2, int req) 1053df8bae1dSRodney W. Grimes { 1054892af6b9SRobert Watson struct unpcb *unp = sotounpcb(so); 1055892af6b9SRobert Watson struct unpcb *unp2; 1056df8bae1dSRodney W. Grimes 10570d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 10580d9ce3a1SRobert Watson 1059df8bae1dSRodney W. Grimes if (so2->so_type != so->so_type) 1060df8bae1dSRodney W. Grimes return (EPROTOTYPE); 1061df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 10624d4b555eSRobert Watson KASSERT(unp2 != NULL, ("unp_connect2: unp2 == NULL")); 1063df8bae1dSRodney W. Grimes unp->unp_conn = unp2; 1064df8bae1dSRodney W. Grimes switch (so->so_type) { 1065df8bae1dSRodney W. Grimes case SOCK_DGRAM: 106698271db4SGarrett Wollman LIST_INSERT_HEAD(&unp2->unp_refs, unp, unp_reflink); 1067df8bae1dSRodney W. Grimes soisconnected(so); 1068df8bae1dSRodney W. Grimes break; 1069df8bae1dSRodney W. Grimes 1070df8bae1dSRodney W. Grimes case SOCK_STREAM: 1071df8bae1dSRodney W. Grimes unp2->unp_conn = unp; 10726a2989fdSMatthew N. Dodd if (req == PRU_CONNECT && 10736a2989fdSMatthew N. Dodd ((unp->unp_flags | unp2->unp_flags) & UNP_CONNWAIT)) 10746a2989fdSMatthew N. Dodd soisconnecting(so); 10756a2989fdSMatthew N. Dodd else 1076df8bae1dSRodney W. Grimes soisconnected(so); 1077df8bae1dSRodney W. Grimes soisconnected(so2); 1078df8bae1dSRodney W. Grimes break; 1079df8bae1dSRodney W. Grimes 1080df8bae1dSRodney W. Grimes default: 1081df8bae1dSRodney W. Grimes panic("unp_connect2"); 1082df8bae1dSRodney W. Grimes } 1083df8bae1dSRodney W. Grimes return (0); 1084df8bae1dSRodney W. Grimes } 1085df8bae1dSRodney W. Grimes 1086f708ef1bSPoul-Henning Kamp static void 1087892af6b9SRobert Watson unp_disconnect(struct unpcb *unp) 1088df8bae1dSRodney W. Grimes { 1089892af6b9SRobert Watson struct unpcb *unp2 = unp->unp_conn; 10901b2e3b4bSRobert Watson struct socket *so; 1091df8bae1dSRodney W. Grimes 10920d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 10930d9ce3a1SRobert Watson 1094fc3fcacfSRobert Watson if (unp2 == NULL) 1095df8bae1dSRodney W. Grimes return; 1096fc3fcacfSRobert Watson unp->unp_conn = NULL; 1097df8bae1dSRodney W. Grimes switch (unp->unp_socket->so_type) { 1098df8bae1dSRodney W. Grimes case SOCK_DGRAM: 109998271db4SGarrett Wollman LIST_REMOVE(unp, unp_reflink); 11001b2e3b4bSRobert Watson so = unp->unp_socket; 11011b2e3b4bSRobert Watson SOCK_LOCK(so); 11021b2e3b4bSRobert Watson so->so_state &= ~SS_ISCONNECTED; 11031b2e3b4bSRobert Watson SOCK_UNLOCK(so); 1104df8bae1dSRodney W. Grimes break; 1105df8bae1dSRodney W. Grimes 1106df8bae1dSRodney W. Grimes case SOCK_STREAM: 1107df8bae1dSRodney W. Grimes soisdisconnected(unp->unp_socket); 1108fc3fcacfSRobert Watson unp2->unp_conn = NULL; 1109df8bae1dSRodney W. Grimes soisdisconnected(unp2->unp_socket); 1110df8bae1dSRodney W. Grimes break; 1111df8bae1dSRodney W. Grimes } 1112df8bae1dSRodney W. Grimes } 1113df8bae1dSRodney W. Grimes 11140d9ce3a1SRobert Watson /* 11151c381b19SRobert Watson * unp_pcblist() assumes that UNIX domain socket memory is never reclaimed by 11161c381b19SRobert Watson * the zone (UMA_ZONE_NOFREE), and as such potentially stale pointers are 11171c381b19SRobert Watson * safe to reference. It first scans the list of struct unpcb's to generate 11181c381b19SRobert Watson * a pointer list, then it rescans its list one entry at a time to 11190d9ce3a1SRobert Watson * externalize and copyout. It checks the generation number to see if a 11200d9ce3a1SRobert Watson * struct unpcb has been reused, and will skip it if so. 11210d9ce3a1SRobert Watson */ 112298271db4SGarrett Wollman static int 112382d9ae4eSPoul-Henning Kamp unp_pcblist(SYSCTL_HANDLER_ARGS) 112498271db4SGarrett Wollman { 1125f5ef029eSPoul-Henning Kamp int error, i, n; 11269ae328fcSJohn Baldwin int freeunp; 112798271db4SGarrett Wollman struct unpcb *unp, **unp_list; 112898271db4SGarrett Wollman unp_gen_t gencnt; 11298f364875SJulian Elischer struct xunpgen *xug; 113098271db4SGarrett Wollman struct unp_head *head; 11318f364875SJulian Elischer struct xunpcb *xu; 113298271db4SGarrett Wollman 1133a23d65bfSBruce Evans head = ((intptr_t)arg1 == SOCK_DGRAM ? &unp_dhead : &unp_shead); 113498271db4SGarrett Wollman 113598271db4SGarrett Wollman /* 113698271db4SGarrett Wollman * The process of preparing the PCB list is too time-consuming and 113798271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 113898271db4SGarrett Wollman */ 1139fc3fcacfSRobert Watson if (req->oldptr == NULL) { 114098271db4SGarrett Wollman n = unp_count; 11418f364875SJulian Elischer req->oldidx = 2 * (sizeof *xug) 114298271db4SGarrett Wollman + (n + n/8) * sizeof(struct xunpcb); 1143e5aeaa0cSDag-Erling Smørgrav return (0); 114498271db4SGarrett Wollman } 114598271db4SGarrett Wollman 1146fc3fcacfSRobert Watson if (req->newptr != NULL) 1147e5aeaa0cSDag-Erling Smørgrav return (EPERM); 114898271db4SGarrett Wollman 114998271db4SGarrett Wollman /* 115098271db4SGarrett Wollman * OK, now we're committed to doing something. 115198271db4SGarrett Wollman */ 1152a163d034SWarner Losh xug = malloc(sizeof(*xug), M_TEMP, M_WAITOK); 11530d9ce3a1SRobert Watson UNP_LOCK(); 115498271db4SGarrett Wollman gencnt = unp_gencnt; 115598271db4SGarrett Wollman n = unp_count; 11560d9ce3a1SRobert Watson UNP_UNLOCK(); 115798271db4SGarrett Wollman 11588f364875SJulian Elischer xug->xug_len = sizeof *xug; 11598f364875SJulian Elischer xug->xug_count = n; 11608f364875SJulian Elischer xug->xug_gen = gencnt; 11618f364875SJulian Elischer xug->xug_sogen = so_gencnt; 11628f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 11638f364875SJulian Elischer if (error) { 11648f364875SJulian Elischer free(xug, M_TEMP); 1165e5aeaa0cSDag-Erling Smørgrav return (error); 11668f364875SJulian Elischer } 116798271db4SGarrett Wollman 1168a163d034SWarner Losh unp_list = malloc(n * sizeof *unp_list, M_TEMP, M_WAITOK); 116998271db4SGarrett Wollman 11700d9ce3a1SRobert Watson UNP_LOCK(); 11712e3c8fcbSPoul-Henning Kamp for (unp = LIST_FIRST(head), i = 0; unp && i < n; 11722e3c8fcbSPoul-Henning Kamp unp = LIST_NEXT(unp, unp_link)) { 11738a7d8cc6SRobert Watson if (unp->unp_gencnt <= gencnt) { 1174a854ed98SJohn Baldwin if (cr_cansee(req->td->td_ucred, 11758a7d8cc6SRobert Watson unp->unp_socket->so_cred)) 11764787fd37SPaul Saab continue; 117798271db4SGarrett Wollman unp_list[i++] = unp; 11789ae328fcSJohn Baldwin unp->unp_refcount++; 117998271db4SGarrett Wollman } 11804787fd37SPaul Saab } 11810d9ce3a1SRobert Watson UNP_UNLOCK(); 11821c381b19SRobert Watson n = i; /* In case we lost some during malloc. */ 118398271db4SGarrett Wollman 118498271db4SGarrett Wollman error = 0; 1185fe2eee82SColin Percival xu = malloc(sizeof(*xu), M_TEMP, M_WAITOK | M_ZERO); 118698271db4SGarrett Wollman for (i = 0; i < n; i++) { 118798271db4SGarrett Wollman unp = unp_list[i]; 11889ae328fcSJohn Baldwin UNP_LOCK(); 11899ae328fcSJohn Baldwin unp->unp_refcount--; 11909ae328fcSJohn Baldwin if (unp->unp_refcount != 0 && unp->unp_gencnt <= gencnt) { 11918f364875SJulian Elischer xu->xu_len = sizeof *xu; 11928f364875SJulian Elischer xu->xu_unpp = unp; 119398271db4SGarrett Wollman /* 119498271db4SGarrett Wollman * XXX - need more locking here to protect against 119598271db4SGarrett Wollman * connect/disconnect races for SMP. 119698271db4SGarrett Wollman */ 1197fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 11988f364875SJulian Elischer bcopy(unp->unp_addr, &xu->xu_addr, 119998271db4SGarrett Wollman unp->unp_addr->sun_len); 1200fc3fcacfSRobert Watson if (unp->unp_conn != NULL && 1201fc3fcacfSRobert Watson unp->unp_conn->unp_addr != NULL) 120298271db4SGarrett Wollman bcopy(unp->unp_conn->unp_addr, 12038f364875SJulian Elischer &xu->xu_caddr, 120498271db4SGarrett Wollman unp->unp_conn->unp_addr->sun_len); 12058f364875SJulian Elischer bcopy(unp, &xu->xu_unp, sizeof *unp); 12068f364875SJulian Elischer sotoxsocket(unp->unp_socket, &xu->xu_socket); 12079ae328fcSJohn Baldwin UNP_UNLOCK(); 12088f364875SJulian Elischer error = SYSCTL_OUT(req, xu, sizeof *xu); 12099ae328fcSJohn Baldwin } else { 12109ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 12119ae328fcSJohn Baldwin UNP_UNLOCK(); 12129ae328fcSJohn Baldwin if (freeunp) 12139ae328fcSJohn Baldwin uma_zfree(unp_zone, unp); 121498271db4SGarrett Wollman } 121598271db4SGarrett Wollman } 12168f364875SJulian Elischer free(xu, M_TEMP); 121798271db4SGarrett Wollman if (!error) { 121898271db4SGarrett Wollman /* 12191c381b19SRobert Watson * Give the user an updated idea of our state. If the 12201c381b19SRobert Watson * generation differs from what we told her before, she knows 12211c381b19SRobert Watson * that something happened while we were processing this 12221c381b19SRobert Watson * request, and it might be necessary to retry. 122398271db4SGarrett Wollman */ 12248f364875SJulian Elischer xug->xug_gen = unp_gencnt; 12258f364875SJulian Elischer xug->xug_sogen = so_gencnt; 12268f364875SJulian Elischer xug->xug_count = unp_count; 12278f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 122898271db4SGarrett Wollman } 122998271db4SGarrett Wollman free(unp_list, M_TEMP); 12308f364875SJulian Elischer free(xug, M_TEMP); 1231e5aeaa0cSDag-Erling Smørgrav return (error); 123298271db4SGarrett Wollman } 123398271db4SGarrett Wollman 123498271db4SGarrett Wollman SYSCTL_PROC(_net_local_dgram, OID_AUTO, pcblist, CTLFLAG_RD, 123598271db4SGarrett Wollman (caddr_t)(long)SOCK_DGRAM, 0, unp_pcblist, "S,xunpcb", 123698271db4SGarrett Wollman "List of active local datagram sockets"); 123798271db4SGarrett Wollman SYSCTL_PROC(_net_local_stream, OID_AUTO, pcblist, CTLFLAG_RD, 123898271db4SGarrett Wollman (caddr_t)(long)SOCK_STREAM, 0, unp_pcblist, "S,xunpcb", 123998271db4SGarrett Wollman "List of active local stream sockets"); 124098271db4SGarrett Wollman 1241f708ef1bSPoul-Henning Kamp static void 1242892af6b9SRobert Watson unp_shutdown(struct unpcb *unp) 1243df8bae1dSRodney W. Grimes { 1244df8bae1dSRodney W. Grimes struct socket *so; 1245df8bae1dSRodney W. Grimes 12460d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 12470d9ce3a1SRobert Watson 1248df8bae1dSRodney W. Grimes if (unp->unp_socket->so_type == SOCK_STREAM && unp->unp_conn && 1249df8bae1dSRodney W. Grimes (so = unp->unp_conn->unp_socket)) 1250df8bae1dSRodney W. Grimes socantrcvmore(so); 1251df8bae1dSRodney W. Grimes } 1252df8bae1dSRodney W. Grimes 1253f708ef1bSPoul-Henning Kamp static void 1254892af6b9SRobert Watson unp_drop(struct unpcb *unp, int errno) 1255df8bae1dSRodney W. Grimes { 1256df8bae1dSRodney W. Grimes struct socket *so = unp->unp_socket; 1257df8bae1dSRodney W. Grimes 12580d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 12590d9ce3a1SRobert Watson 1260df8bae1dSRodney W. Grimes so->so_error = errno; 1261df8bae1dSRodney W. Grimes unp_disconnect(unp); 1262df8bae1dSRodney W. Grimes } 1263df8bae1dSRodney W. Grimes 12642bc21ed9SDavid Malone static void 1265892af6b9SRobert Watson unp_freerights(struct file **rp, int fdcount) 1266df8bae1dSRodney W. Grimes { 12672bc21ed9SDavid Malone int i; 12682bc21ed9SDavid Malone struct file *fp; 1269df8bae1dSRodney W. Grimes 12702bc21ed9SDavid Malone for (i = 0; i < fdcount; i++) { 1271df8bae1dSRodney W. Grimes fp = *rp; 12728692c025SYoshinobu Inoue /* 12731c381b19SRobert Watson * Zero the pointer before calling unp_discard since it may 12741c381b19SRobert Watson * end up in unp_gc().. 1275d7dca903SRobert Watson * 1276d7dca903SRobert Watson * XXXRW: This is less true than it used to be. 12778692c025SYoshinobu Inoue */ 1278df8bae1dSRodney W. Grimes *rp++ = 0; 12798692c025SYoshinobu Inoue unp_discard(fp); 1280df8bae1dSRodney W. Grimes } 12812bc21ed9SDavid Malone } 12822bc21ed9SDavid Malone 12832bc21ed9SDavid Malone int 1284892af6b9SRobert Watson unp_externalize(struct mbuf *control, struct mbuf **controlp) 12852bc21ed9SDavid Malone { 12862bc21ed9SDavid Malone struct thread *td = curthread; /* XXX */ 12872bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 12882bc21ed9SDavid Malone int i; 12892bc21ed9SDavid Malone int *fdp; 12902bc21ed9SDavid Malone struct file **rp; 12912bc21ed9SDavid Malone struct file *fp; 12922bc21ed9SDavid Malone void *data; 12932bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 12942bc21ed9SDavid Malone int error, newfds; 12952bc21ed9SDavid Malone int f; 12962bc21ed9SDavid Malone u_int newlen; 12972bc21ed9SDavid Malone 12984c5bc1caSRobert Watson UNP_UNLOCK_ASSERT(); 12994c5bc1caSRobert Watson 13002bc21ed9SDavid Malone error = 0; 13012bc21ed9SDavid Malone if (controlp != NULL) /* controlp == NULL => free control messages */ 13022bc21ed9SDavid Malone *controlp = NULL; 13032bc21ed9SDavid Malone 13042bc21ed9SDavid Malone while (cm != NULL) { 13052bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) { 13062bc21ed9SDavid Malone error = EINVAL; 13072bc21ed9SDavid Malone break; 13082bc21ed9SDavid Malone } 13092bc21ed9SDavid Malone 13102bc21ed9SDavid Malone data = CMSG_DATA(cm); 13112bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 13122bc21ed9SDavid Malone 13132bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET 13142bc21ed9SDavid Malone && cm->cmsg_type == SCM_RIGHTS) { 13152bc21ed9SDavid Malone newfds = datalen / sizeof(struct file *); 13162bc21ed9SDavid Malone rp = data; 13172bc21ed9SDavid Malone 1318e2f9a08bSOlivier Houchard /* If we're not outputting the descriptors free them. */ 13192bc21ed9SDavid Malone if (error || controlp == NULL) { 13202bc21ed9SDavid Malone unp_freerights(rp, newfds); 13212bc21ed9SDavid Malone goto next; 13222bc21ed9SDavid Malone } 1323426da3bcSAlfred Perlstein FILEDESC_LOCK(td->td_proc->p_fd); 13242bc21ed9SDavid Malone /* if the new FD's will not fit free them. */ 13252bc21ed9SDavid Malone if (!fdavail(td, newfds)) { 1326426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13272bc21ed9SDavid Malone error = EMSGSIZE; 13282bc21ed9SDavid Malone unp_freerights(rp, newfds); 13292bc21ed9SDavid Malone goto next; 1330df8bae1dSRodney W. Grimes } 1331ed5b7817SJulian Elischer /* 13321c381b19SRobert Watson * Now change each pointer to an fd in the global 13331c381b19SRobert Watson * table to an integer that is the index to the local 13341c381b19SRobert Watson * fd table entry that we set up to point to the 13351c381b19SRobert Watson * global one we are transferring. 1336ed5b7817SJulian Elischer */ 13372bc21ed9SDavid Malone newlen = newfds * sizeof(int); 13382bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 13392bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 13402bc21ed9SDavid Malone if (*controlp == NULL) { 1341426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13422bc21ed9SDavid Malone error = E2BIG; 13432bc21ed9SDavid Malone unp_freerights(rp, newfds); 13442bc21ed9SDavid Malone goto next; 13452bc21ed9SDavid Malone } 13462bc21ed9SDavid Malone 13472bc21ed9SDavid Malone fdp = (int *) 13482bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 1349df8bae1dSRodney W. Grimes for (i = 0; i < newfds; i++) { 1350a6d4491cSDag-Erling Smørgrav if (fdalloc(td, 0, &f)) 13512bc21ed9SDavid Malone panic("unp_externalize fdalloc failed"); 13528692c025SYoshinobu Inoue fp = *rp++; 1353b40ce416SJulian Elischer td->td_proc->p_fd->fd_ofiles[f] = fp; 1354426da3bcSAlfred Perlstein FILE_LOCK(fp); 1355df8bae1dSRodney W. Grimes fp->f_msgcount--; 1356426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1357df8bae1dSRodney W. Grimes unp_rights--; 13588692c025SYoshinobu Inoue *fdp++ = f; 1359df8bae1dSRodney W. Grimes } 1360426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13611c381b19SRobert Watson } else { 13621c381b19SRobert Watson /* We can just copy anything else across. */ 13632bc21ed9SDavid Malone if (error || controlp == NULL) 13642bc21ed9SDavid Malone goto next; 13652bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, datalen, 13662bc21ed9SDavid Malone cm->cmsg_type, cm->cmsg_level); 13672bc21ed9SDavid Malone if (*controlp == NULL) { 13682bc21ed9SDavid Malone error = ENOBUFS; 13692bc21ed9SDavid Malone goto next; 13702bc21ed9SDavid Malone } 13712bc21ed9SDavid Malone bcopy(data, 13722bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)), 13732bc21ed9SDavid Malone datalen); 13742bc21ed9SDavid Malone } 13752bc21ed9SDavid Malone 13762bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 13772bc21ed9SDavid Malone 13782bc21ed9SDavid Malone next: 13792bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 13802bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 13812bc21ed9SDavid Malone cm = (struct cmsghdr *) 13822bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 13838692c025SYoshinobu Inoue } else { 13842bc21ed9SDavid Malone clen = 0; 13852bc21ed9SDavid Malone cm = NULL; 13868692c025SYoshinobu Inoue } 13878692c025SYoshinobu Inoue } 13888692c025SYoshinobu Inoue 13892bc21ed9SDavid Malone m_freem(control); 13902bc21ed9SDavid Malone 13912bc21ed9SDavid Malone return (error); 1392df8bae1dSRodney W. Grimes } 1393df8bae1dSRodney W. Grimes 13944f590175SPaul Saab static void 13954f590175SPaul Saab unp_zone_change(void *tag) 13964f590175SPaul Saab { 13974f590175SPaul Saab 13984f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 13994f590175SPaul Saab } 14004f590175SPaul Saab 140198271db4SGarrett Wollman void 140298271db4SGarrett Wollman unp_init(void) 140398271db4SGarrett Wollman { 14041c381b19SRobert Watson 14059e9d298aSJeff Roberson unp_zone = uma_zcreate("unpcb", sizeof(struct unpcb), NULL, NULL, 14069ae328fcSJohn Baldwin NULL, NULL, UMA_ALIGN_PTR, 0); 1407fc3fcacfSRobert Watson if (unp_zone == NULL) 140898271db4SGarrett Wollman panic("unp_init"); 14094f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 14104f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, unp_zone_change, 14114f590175SPaul Saab NULL, EVENTHANDLER_PRI_ANY); 141298271db4SGarrett Wollman LIST_INIT(&unp_dhead); 141398271db4SGarrett Wollman LIST_INIT(&unp_shead); 1414a0ec558aSRobert Watson TASK_INIT(&unp_gc_task, 0, unp_gc, NULL); 14150d9ce3a1SRobert Watson UNP_LOCK_INIT(); 141698271db4SGarrett Wollman } 141798271db4SGarrett Wollman 1418f708ef1bSPoul-Henning Kamp static int 1419892af6b9SRobert Watson unp_internalize(struct mbuf **controlp, struct thread *td) 1420df8bae1dSRodney W. Grimes { 14212bc21ed9SDavid Malone struct mbuf *control = *controlp; 1422b40ce416SJulian Elischer struct proc *p = td->td_proc; 14238692c025SYoshinobu Inoue struct filedesc *fdescp = p->p_fd; 14242bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 14252bc21ed9SDavid Malone struct cmsgcred *cmcred; 14262bc21ed9SDavid Malone struct file **rp; 14272bc21ed9SDavid Malone struct file *fp; 14282bc21ed9SDavid Malone struct timeval *tv; 14292bc21ed9SDavid Malone int i, fd, *fdp; 14302bc21ed9SDavid Malone void *data; 14312bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 14322bc21ed9SDavid Malone int error, oldfds; 14338692c025SYoshinobu Inoue u_int newlen; 1434df8bae1dSRodney W. Grimes 14354c5bc1caSRobert Watson UNP_UNLOCK_ASSERT(); 14364c5bc1caSRobert Watson 14372bc21ed9SDavid Malone error = 0; 14382bc21ed9SDavid Malone *controlp = NULL; 14390b788fa1SBill Paul 14402bc21ed9SDavid Malone while (cm != NULL) { 14412bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_level != SOL_SOCKET 14422bc21ed9SDavid Malone || cm->cmsg_len > clen) { 14432bc21ed9SDavid Malone error = EINVAL; 14442bc21ed9SDavid Malone goto out; 14452bc21ed9SDavid Malone } 14462bc21ed9SDavid Malone 14472bc21ed9SDavid Malone data = CMSG_DATA(cm); 14482bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 14492bc21ed9SDavid Malone 14502bc21ed9SDavid Malone switch (cm->cmsg_type) { 14510b788fa1SBill Paul /* 14520b788fa1SBill Paul * Fill in credential information. 14530b788fa1SBill Paul */ 14542bc21ed9SDavid Malone case SCM_CREDS: 14552bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*cmcred), 14562bc21ed9SDavid Malone SCM_CREDS, SOL_SOCKET); 14572bc21ed9SDavid Malone if (*controlp == NULL) { 14582bc21ed9SDavid Malone error = ENOBUFS; 14592bc21ed9SDavid Malone goto out; 14602bc21ed9SDavid Malone } 14612bc21ed9SDavid Malone 14622bc21ed9SDavid Malone cmcred = (struct cmsgcred *) 14632bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 14640b788fa1SBill Paul cmcred->cmcred_pid = p->p_pid; 1465a854ed98SJohn Baldwin cmcred->cmcred_uid = td->td_ucred->cr_ruid; 1466a854ed98SJohn Baldwin cmcred->cmcred_gid = td->td_ucred->cr_rgid; 1467a854ed98SJohn Baldwin cmcred->cmcred_euid = td->td_ucred->cr_uid; 1468a854ed98SJohn Baldwin cmcred->cmcred_ngroups = MIN(td->td_ucred->cr_ngroups, 14690b788fa1SBill Paul CMGROUP_MAX); 14700b788fa1SBill Paul for (i = 0; i < cmcred->cmcred_ngroups; i++) 14712bc21ed9SDavid Malone cmcred->cmcred_groups[i] = 1472a854ed98SJohn Baldwin td->td_ucred->cr_groups[i]; 14732bc21ed9SDavid Malone break; 14740b788fa1SBill Paul 14752bc21ed9SDavid Malone case SCM_RIGHTS: 14762bc21ed9SDavid Malone oldfds = datalen / sizeof (int); 1477ed5b7817SJulian Elischer /* 14781c381b19SRobert Watson * Check that all the FDs passed in refer to legal 14791c381b19SRobert Watson * files. If not, reject the entire operation. 1480ed5b7817SJulian Elischer */ 14812bc21ed9SDavid Malone fdp = data; 1482426da3bcSAlfred Perlstein FILEDESC_LOCK(fdescp); 1483df8bae1dSRodney W. Grimes for (i = 0; i < oldfds; i++) { 14848692c025SYoshinobu Inoue fd = *fdp++; 14858692c025SYoshinobu Inoue if ((unsigned)fd >= fdescp->fd_nfiles || 14862bc21ed9SDavid Malone fdescp->fd_ofiles[fd] == NULL) { 1487426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 14882bc21ed9SDavid Malone error = EBADF; 14892bc21ed9SDavid Malone goto out; 14902bc21ed9SDavid Malone } 1491e7d6662fSAlfred Perlstein fp = fdescp->fd_ofiles[fd]; 1492e7d6662fSAlfred Perlstein if (!(fp->f_ops->fo_flags & DFLAG_PASSABLE)) { 1493e7d6662fSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 1494e7d6662fSAlfred Perlstein error = EOPNOTSUPP; 1495e7d6662fSAlfred Perlstein goto out; 1496e7d6662fSAlfred Perlstein } 1497e7d6662fSAlfred Perlstein 1498df8bae1dSRodney W. Grimes } 1499ed5b7817SJulian Elischer /* 15001c381b19SRobert Watson * Now replace the integer FDs with pointers to the 15011c381b19SRobert Watson * associated global file table entry.. 1502ed5b7817SJulian Elischer */ 15032bc21ed9SDavid Malone newlen = oldfds * sizeof(struct file *); 15042bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 15052bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 15062bc21ed9SDavid Malone if (*controlp == NULL) { 1507426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 15082bc21ed9SDavid Malone error = E2BIG; 15092bc21ed9SDavid Malone goto out; 15108692c025SYoshinobu Inoue } 15118692c025SYoshinobu Inoue 15122bc21ed9SDavid Malone fdp = data; 15132bc21ed9SDavid Malone rp = (struct file **) 15142bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 15158692c025SYoshinobu Inoue for (i = 0; i < oldfds; i++) { 15168692c025SYoshinobu Inoue fp = fdescp->fd_ofiles[*fdp++]; 1517df8bae1dSRodney W. Grimes *rp++ = fp; 1518426da3bcSAlfred Perlstein FILE_LOCK(fp); 1519df8bae1dSRodney W. Grimes fp->f_count++; 1520df8bae1dSRodney W. Grimes fp->f_msgcount++; 1521426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1522df8bae1dSRodney W. Grimes unp_rights++; 1523df8bae1dSRodney W. Grimes } 1524426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 15252bc21ed9SDavid Malone break; 15262bc21ed9SDavid Malone 15272bc21ed9SDavid Malone case SCM_TIMESTAMP: 15282bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*tv), 15292bc21ed9SDavid Malone SCM_TIMESTAMP, SOL_SOCKET); 15302bc21ed9SDavid Malone if (*controlp == NULL) { 15312bc21ed9SDavid Malone error = ENOBUFS; 15322bc21ed9SDavid Malone goto out; 15338692c025SYoshinobu Inoue } 15342bc21ed9SDavid Malone tv = (struct timeval *) 15352bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 15362bc21ed9SDavid Malone microtime(tv); 15372bc21ed9SDavid Malone break; 15382bc21ed9SDavid Malone 15392bc21ed9SDavid Malone default: 15402bc21ed9SDavid Malone error = EINVAL; 15412bc21ed9SDavid Malone goto out; 15422bc21ed9SDavid Malone } 15432bc21ed9SDavid Malone 15442bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 15452bc21ed9SDavid Malone 15462bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 15472bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 15482bc21ed9SDavid Malone cm = (struct cmsghdr *) 15492bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 15502bc21ed9SDavid Malone } else { 15512bc21ed9SDavid Malone clen = 0; 15522bc21ed9SDavid Malone cm = NULL; 15532bc21ed9SDavid Malone } 15542bc21ed9SDavid Malone } 15552bc21ed9SDavid Malone 15562bc21ed9SDavid Malone out: 15572bc21ed9SDavid Malone m_freem(control); 15582bc21ed9SDavid Malone 15592bc21ed9SDavid Malone return (error); 1560df8bae1dSRodney W. Grimes } 1561df8bae1dSRodney W. Grimes 15625b950deaSRobert Watson static struct mbuf * 15636a2989fdSMatthew N. Dodd unp_addsockcred(struct thread *td, struct mbuf *control) 15646a2989fdSMatthew N. Dodd { 156570df31f4SMaxim Konovalov struct mbuf *m, *n, *n_prev; 15666a2989fdSMatthew N. Dodd struct sockcred *sc; 156770df31f4SMaxim Konovalov const struct cmsghdr *cm; 15686a2989fdSMatthew N. Dodd int ngroups; 15696a2989fdSMatthew N. Dodd int i; 15706a2989fdSMatthew N. Dodd 15716a2989fdSMatthew N. Dodd ngroups = MIN(td->td_ucred->cr_ngroups, CMGROUP_MAX); 15726a2989fdSMatthew N. Dodd 15736a2989fdSMatthew N. Dodd m = sbcreatecontrol(NULL, SOCKCREDSIZE(ngroups), SCM_CREDS, SOL_SOCKET); 15746a2989fdSMatthew N. Dodd if (m == NULL) 15756a2989fdSMatthew N. Dodd return (control); 15766a2989fdSMatthew N. Dodd 15776a2989fdSMatthew N. Dodd sc = (struct sockcred *) CMSG_DATA(mtod(m, struct cmsghdr *)); 15786a2989fdSMatthew N. Dodd sc->sc_uid = td->td_ucred->cr_ruid; 15796a2989fdSMatthew N. Dodd sc->sc_euid = td->td_ucred->cr_uid; 15806a2989fdSMatthew N. Dodd sc->sc_gid = td->td_ucred->cr_rgid; 15816a2989fdSMatthew N. Dodd sc->sc_egid = td->td_ucred->cr_gid; 15826a2989fdSMatthew N. Dodd sc->sc_ngroups = ngroups; 15836a2989fdSMatthew N. Dodd for (i = 0; i < sc->sc_ngroups; i++) 15846a2989fdSMatthew N. Dodd sc->sc_groups[i] = td->td_ucred->cr_groups[i]; 15856a2989fdSMatthew N. Dodd 15866a2989fdSMatthew N. Dodd /* 15871c381b19SRobert Watson * Unlink SCM_CREDS control messages (struct cmsgcred), since just 15881c381b19SRobert Watson * created SCM_CREDS control message (struct sockcred) has another 15891c381b19SRobert Watson * format. 15906a2989fdSMatthew N. Dodd */ 159170df31f4SMaxim Konovalov if (control != NULL) 159270df31f4SMaxim Konovalov for (n = control, n_prev = NULL; n != NULL;) { 159370df31f4SMaxim Konovalov cm = mtod(n, struct cmsghdr *); 159470df31f4SMaxim Konovalov if (cm->cmsg_level == SOL_SOCKET && 159570df31f4SMaxim Konovalov cm->cmsg_type == SCM_CREDS) { 159670df31f4SMaxim Konovalov if (n_prev == NULL) 159770df31f4SMaxim Konovalov control = n->m_next; 159870df31f4SMaxim Konovalov else 159970df31f4SMaxim Konovalov n_prev->m_next = n->m_next; 160070df31f4SMaxim Konovalov n = m_free(n); 160170df31f4SMaxim Konovalov } else { 160270df31f4SMaxim Konovalov n_prev = n; 160370df31f4SMaxim Konovalov n = n->m_next; 160470df31f4SMaxim Konovalov } 160570df31f4SMaxim Konovalov } 16066a2989fdSMatthew N. Dodd 160770df31f4SMaxim Konovalov /* Prepend it to the head. */ 160870df31f4SMaxim Konovalov m->m_next = control; 160970df31f4SMaxim Konovalov 161070df31f4SMaxim Konovalov return (m); 16116a2989fdSMatthew N. Dodd } 16126a2989fdSMatthew N. Dodd 1613161a0c7cSRobert Watson /* 1614a0ec558aSRobert Watson * unp_defer indicates whether additional work has been defered for a future 1615a0ec558aSRobert Watson * pass through unp_gc(). It is thread local and does not require explicit 1616a0ec558aSRobert Watson * synchronization. 1617161a0c7cSRobert Watson */ 1618a0ec558aSRobert Watson static int unp_defer; 1619a0ec558aSRobert Watson 1620a0ec558aSRobert Watson static int unp_taskcount; 1621a0ec558aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, taskcount, CTLFLAG_RD, &unp_taskcount, 0, ""); 1622a0ec558aSRobert Watson 1623a0ec558aSRobert Watson static int unp_recycled; 1624a0ec558aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, recycled, CTLFLAG_RD, &unp_recycled, 0, ""); 1625df8bae1dSRodney W. Grimes 1626f708ef1bSPoul-Henning Kamp static void 1627a0ec558aSRobert Watson unp_gc(__unused void *arg, int pending) 1628df8bae1dSRodney W. Grimes { 1629892af6b9SRobert Watson struct file *fp, *nextfp; 1630892af6b9SRobert Watson struct socket *so; 1631df8bae1dSRodney W. Grimes struct file **extra_ref, **fpp; 1632df8bae1dSRodney W. Grimes int nunref, i; 163395f004dcSAlfred Perlstein int nfiles_snap; 163495f004dcSAlfred Perlstein int nfiles_slack = 20; 1635df8bae1dSRodney W. Grimes 1636a0ec558aSRobert Watson unp_taskcount++; 1637df8bae1dSRodney W. Grimes unp_defer = 0; 1638ed5b7817SJulian Elischer /* 16399ae328fcSJohn Baldwin * Before going through all this, set all FDs to be NOT deferred and 16401c381b19SRobert Watson * NOT externally accessible. 1641ed5b7817SJulian Elischer */ 1642426da3bcSAlfred Perlstein sx_slock(&filelist_lock); 16432e3c8fcbSPoul-Henning Kamp LIST_FOREACH(fp, &filehead, f_list) 1644426da3bcSAlfred Perlstein fp->f_gcflag &= ~(FMARK|FDEFER); 1645df8bae1dSRodney W. Grimes do { 16465bb84bc8SRobert Watson KASSERT(unp_defer >= 0, ("unp_gc: unp_defer %d", unp_defer)); 16472e3c8fcbSPoul-Henning Kamp LIST_FOREACH(fp, &filehead, f_list) { 1648426da3bcSAlfred Perlstein FILE_LOCK(fp); 1649ed5b7817SJulian Elischer /* 1650a0ec558aSRobert Watson * If the file is not open, skip it -- could be a 1651a0ec558aSRobert Watson * file in the process of being opened, or in the 1652a0ec558aSRobert Watson * process of being closed. If the file is 1653a0ec558aSRobert Watson * "closing", it may have been marked for deferred 1654a0ec558aSRobert Watson * consideration. Clear the flag now if so. 1655ed5b7817SJulian Elischer */ 1656426da3bcSAlfred Perlstein if (fp->f_count == 0) { 1657a0ec558aSRobert Watson if (fp->f_gcflag & FDEFER) 1658a0ec558aSRobert Watson unp_defer--; 1659a0ec558aSRobert Watson fp->f_gcflag &= ~(FMARK|FDEFER); 1660426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1661df8bae1dSRodney W. Grimes continue; 1662426da3bcSAlfred Perlstein } 1663ed5b7817SJulian Elischer /* 16649ae328fcSJohn Baldwin * If we already marked it as 'defer' in a 16659ae328fcSJohn Baldwin * previous pass, then try to process it this 16669ae328fcSJohn Baldwin * time and un-mark it. 1667ed5b7817SJulian Elischer */ 1668426da3bcSAlfred Perlstein if (fp->f_gcflag & FDEFER) { 1669426da3bcSAlfred Perlstein fp->f_gcflag &= ~FDEFER; 1670df8bae1dSRodney W. Grimes unp_defer--; 1671df8bae1dSRodney W. Grimes } else { 1672ed5b7817SJulian Elischer /* 16739ae328fcSJohn Baldwin * if it's not deferred, then check if it's 1674ed5b7817SJulian Elischer * already marked.. if so skip it 1675ed5b7817SJulian Elischer */ 1676426da3bcSAlfred Perlstein if (fp->f_gcflag & FMARK) { 1677426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1678df8bae1dSRodney W. Grimes continue; 1679426da3bcSAlfred Perlstein } 1680ed5b7817SJulian Elischer /* 16811c381b19SRobert Watson * If all references are from messages in 16821c381b19SRobert Watson * transit, then skip it. it's not externally 16831c381b19SRobert Watson * accessible. 1684ed5b7817SJulian Elischer */ 1685426da3bcSAlfred Perlstein if (fp->f_count == fp->f_msgcount) { 1686426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1687df8bae1dSRodney W. Grimes continue; 1688426da3bcSAlfred Perlstein } 1689ed5b7817SJulian Elischer /* 1690ed5b7817SJulian Elischer * If it got this far then it must be 1691ed5b7817SJulian Elischer * externally accessible. 1692ed5b7817SJulian Elischer */ 1693426da3bcSAlfred Perlstein fp->f_gcflag |= FMARK; 1694df8bae1dSRodney W. Grimes } 1695ed5b7817SJulian Elischer /* 16969ae328fcSJohn Baldwin * Either it was deferred, or it is externally 16971c381b19SRobert Watson * accessible and not already marked so. Now check 16981c381b19SRobert Watson * if it is possibly one of OUR sockets. 1699ed5b7817SJulian Elischer */ 1700df8bae1dSRodney W. Grimes if (fp->f_type != DTYPE_SOCKET || 170148e3128bSMatthew Dillon (so = fp->f_data) == NULL) { 1702426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1703df8bae1dSRodney W. Grimes continue; 1704426da3bcSAlfred Perlstein } 1705748e0b0aSGarrett Wollman if (so->so_proto->pr_domain != &localdomain || 17069ae328fcSJohn Baldwin (so->so_proto->pr_flags & PR_RIGHTS) == 0) { 17079ae328fcSJohn Baldwin FILE_UNLOCK(fp); 1708df8bae1dSRodney W. Grimes continue; 17099ae328fcSJohn Baldwin } 17109ae328fcSJohn Baldwin 17119ae328fcSJohn Baldwin /* 17129ae328fcSJohn Baldwin * Tell any other threads that do a subsequent 17139ae328fcSJohn Baldwin * fdrop() that we are scanning the message 17149ae328fcSJohn Baldwin * buffers. 17159ae328fcSJohn Baldwin */ 17169ae328fcSJohn Baldwin fp->f_gcflag |= FWAIT; 17179ae328fcSJohn Baldwin FILE_UNLOCK(fp); 17189ae328fcSJohn Baldwin 1719ed5b7817SJulian Elischer /* 17201c381b19SRobert Watson * So, Ok, it's one of our sockets and it IS 17219ae328fcSJohn Baldwin * externally accessible (or was deferred). Now we 17221c381b19SRobert Watson * look to see if we hold any file descriptors in its 1723ed5b7817SJulian Elischer * message buffers. Follow those links and mark them 1724ed5b7817SJulian Elischer * as accessible too. 1725ed5b7817SJulian Elischer */ 17267717cf07SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 1727df8bae1dSRodney W. Grimes unp_scan(so->so_rcv.sb_mb, unp_mark); 17287717cf07SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 17299ae328fcSJohn Baldwin 17309ae328fcSJohn Baldwin /* 17319ae328fcSJohn Baldwin * Wake up any threads waiting in fdrop(). 17329ae328fcSJohn Baldwin */ 17339ae328fcSJohn Baldwin FILE_LOCK(fp); 17349ae328fcSJohn Baldwin fp->f_gcflag &= ~FWAIT; 17359ae328fcSJohn Baldwin wakeup(&fp->f_gcflag); 17369ae328fcSJohn Baldwin FILE_UNLOCK(fp); 1737df8bae1dSRodney W. Grimes } 1738df8bae1dSRodney W. Grimes } while (unp_defer); 1739426da3bcSAlfred Perlstein sx_sunlock(&filelist_lock); 1740df8bae1dSRodney W. Grimes /* 1741a0ec558aSRobert Watson * XXXRW: The following comments need updating for a post-SMPng and 1742a0ec558aSRobert Watson * deferred unp_gc() world, but are still generally accurate. 1743a0ec558aSRobert Watson * 17441c381b19SRobert Watson * We grab an extra reference to each of the file table entries that 17451c381b19SRobert Watson * are not otherwise accessible and then free the rights that are 17461c381b19SRobert Watson * stored in messages on them. 1747df8bae1dSRodney W. Grimes * 1748df8bae1dSRodney W. Grimes * The bug in the orginal code is a little tricky, so I'll describe 1749df8bae1dSRodney W. Grimes * what's wrong with it here. 1750df8bae1dSRodney W. Grimes * 1751df8bae1dSRodney W. Grimes * It is incorrect to simply unp_discard each entry for f_msgcount 1752df8bae1dSRodney W. Grimes * times -- consider the case of sockets A and B that contain 1753df8bae1dSRodney W. Grimes * references to each other. On a last close of some other socket, 1754df8bae1dSRodney W. Grimes * we trigger a gc since the number of outstanding rights (unp_rights) 1755a0ec558aSRobert Watson * is non-zero. If during the sweep phase the gc code unp_discards, 1756df8bae1dSRodney W. Grimes * we end up doing a (full) closef on the descriptor. A closef on A 1757df8bae1dSRodney W. Grimes * results in the following chain. Closef calls soo_close, which 1758df8bae1dSRodney W. Grimes * calls soclose. Soclose calls first (through the switch 1759df8bae1dSRodney W. Grimes * uipc_usrreq) unp_detach, which re-invokes unp_gc. Unp_gc simply 17601c381b19SRobert Watson * returns because the previous instance had set unp_gcing, and we 17611c381b19SRobert Watson * return all the way back to soclose, which marks the socket with 17621c381b19SRobert Watson * SS_NOFDREF, and then calls sofree. Sofree calls sorflush to free 17631c381b19SRobert Watson * up the rights that are queued in messages on the socket A, i.e., 17641c381b19SRobert Watson * the reference on B. The sorflush calls via the dom_dispose switch 17651c381b19SRobert Watson * unp_dispose, which unp_scans with unp_discard. This second 1766df8bae1dSRodney W. Grimes * instance of unp_discard just calls closef on B. 1767df8bae1dSRodney W. Grimes * 1768df8bae1dSRodney W. Grimes * Well, a similar chain occurs on B, resulting in a sorflush on B, 1769df8bae1dSRodney W. Grimes * which results in another closef on A. Unfortunately, A is already 1770df8bae1dSRodney W. Grimes * being closed, and the descriptor has already been marked with 1771df8bae1dSRodney W. Grimes * SS_NOFDREF, and soclose panics at this point. 1772df8bae1dSRodney W. Grimes * 1773df8bae1dSRodney W. Grimes * Here, we first take an extra reference to each inaccessible 17741c381b19SRobert Watson * descriptor. Then, we call sorflush ourself, since we know it is a 17751c381b19SRobert Watson * Unix domain socket anyhow. After we destroy all the rights 17761c381b19SRobert Watson * carried in messages, we do a last closef to get rid of our extra 17771c381b19SRobert Watson * reference. This is the last close, and the unp_detach etc will 17781c381b19SRobert Watson * shut down the socket. 1779df8bae1dSRodney W. Grimes * 1780df8bae1dSRodney W. Grimes * 91/09/19, bsy@cs.cmu.edu 1781df8bae1dSRodney W. Grimes */ 178295f004dcSAlfred Perlstein again: 1783e4643c73SPoul-Henning Kamp nfiles_snap = openfiles + nfiles_slack; /* some slack */ 178495f004dcSAlfred Perlstein extra_ref = malloc(nfiles_snap * sizeof(struct file *), M_TEMP, 178595f004dcSAlfred Perlstein M_WAITOK); 1786426da3bcSAlfred Perlstein sx_slock(&filelist_lock); 1787e4643c73SPoul-Henning Kamp if (nfiles_snap < openfiles) { 178895f004dcSAlfred Perlstein sx_sunlock(&filelist_lock); 178995f004dcSAlfred Perlstein free(extra_ref, M_TEMP); 179095f004dcSAlfred Perlstein nfiles_slack += 20; 179195f004dcSAlfred Perlstein goto again; 179295f004dcSAlfred Perlstein } 1793fc3fcacfSRobert Watson for (nunref = 0, fp = LIST_FIRST(&filehead), fpp = extra_ref; 1794fc3fcacfSRobert Watson fp != NULL; fp = nextfp) { 17952e3c8fcbSPoul-Henning Kamp nextfp = LIST_NEXT(fp, f_list); 1796426da3bcSAlfred Perlstein FILE_LOCK(fp); 1797ed5b7817SJulian Elischer /* 1798ed5b7817SJulian Elischer * If it's not open, skip it 1799ed5b7817SJulian Elischer */ 1800426da3bcSAlfred Perlstein if (fp->f_count == 0) { 1801426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1802df8bae1dSRodney W. Grimes continue; 1803426da3bcSAlfred Perlstein } 1804ed5b7817SJulian Elischer /* 1805ed5b7817SJulian Elischer * If all refs are from msgs, and it's not marked accessible 18061c381b19SRobert Watson * then it must be referenced from some unreachable cycle of 18071c381b19SRobert Watson * (shut-down) FDs, so include it in our list of FDs to 18081c381b19SRobert Watson * remove. 1809ed5b7817SJulian Elischer */ 1810426da3bcSAlfred Perlstein if (fp->f_count == fp->f_msgcount && !(fp->f_gcflag & FMARK)) { 1811df8bae1dSRodney W. Grimes *fpp++ = fp; 1812df8bae1dSRodney W. Grimes nunref++; 1813df8bae1dSRodney W. Grimes fp->f_count++; 1814df8bae1dSRodney W. Grimes } 1815426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1816df8bae1dSRodney W. Grimes } 1817426da3bcSAlfred Perlstein sx_sunlock(&filelist_lock); 1818ed5b7817SJulian Elischer /* 18191c381b19SRobert Watson * For each FD on our hit list, do the following two things: 1820ed5b7817SJulian Elischer */ 18211c7c3c6aSMatthew Dillon for (i = nunref, fpp = extra_ref; --i >= 0; ++fpp) { 18221c7c3c6aSMatthew Dillon struct file *tfp = *fpp; 1823426da3bcSAlfred Perlstein FILE_LOCK(tfp); 1824cd72f218SMatthew Dillon if (tfp->f_type == DTYPE_SOCKET && 182548e3128bSMatthew Dillon tfp->f_data != NULL) { 1826426da3bcSAlfred Perlstein FILE_UNLOCK(tfp); 182748e3128bSMatthew Dillon sorflush(tfp->f_data); 1828e5aeaa0cSDag-Erling Smørgrav } else { 1829426da3bcSAlfred Perlstein FILE_UNLOCK(tfp); 18301c7c3c6aSMatthew Dillon } 1831e5aeaa0cSDag-Erling Smørgrav } 1832a0ec558aSRobert Watson for (i = nunref, fpp = extra_ref; --i >= 0; ++fpp) { 1833b40ce416SJulian Elischer closef(*fpp, (struct thread *) NULL); 1834a0ec558aSRobert Watson unp_recycled++; 1835a0ec558aSRobert Watson } 1836210a5a71SAlfred Perlstein free(extra_ref, M_TEMP); 1837df8bae1dSRodney W. Grimes } 1838df8bae1dSRodney W. Grimes 183926f9a767SRodney W. Grimes void 1840892af6b9SRobert Watson unp_dispose(struct mbuf *m) 1841df8bae1dSRodney W. Grimes { 1842996c772fSJohn Dyson 1843df8bae1dSRodney W. Grimes if (m) 1844df8bae1dSRodney W. Grimes unp_scan(m, unp_discard); 1845df8bae1dSRodney W. Grimes } 1846df8bae1dSRodney W. Grimes 18470c1bb4fbSDima Dorfman static int 1848d374e81eSRobert Watson unp_listen(struct socket *so, struct unpcb *unp, int backlog, 1849d374e81eSRobert Watson struct thread *td) 18500c1bb4fbSDima Dorfman { 18510daccb9cSRobert Watson int error; 18520daccb9cSRobert Watson 18530d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 18540c1bb4fbSDima Dorfman 18550daccb9cSRobert Watson SOCK_LOCK(so); 18560daccb9cSRobert Watson error = solisten_proto_check(so); 18570daccb9cSRobert Watson if (error == 0) { 18586f105b34SJohn Baldwin cru2x(td->td_ucred, &unp->unp_peercred); 18590c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPCCACHED; 1860d374e81eSRobert Watson solisten_proto(so, backlog); 18610daccb9cSRobert Watson } 18620daccb9cSRobert Watson SOCK_UNLOCK(so); 18630daccb9cSRobert Watson return (error); 18640c1bb4fbSDima Dorfman } 18650c1bb4fbSDima Dorfman 1866f708ef1bSPoul-Henning Kamp static void 1867892af6b9SRobert Watson unp_scan(struct mbuf *m0, void (*op)(struct file *)) 1868df8bae1dSRodney W. Grimes { 18692bc21ed9SDavid Malone struct mbuf *m; 18702bc21ed9SDavid Malone struct file **rp; 18712bc21ed9SDavid Malone struct cmsghdr *cm; 18722bc21ed9SDavid Malone void *data; 18732bc21ed9SDavid Malone int i; 18742bc21ed9SDavid Malone socklen_t clen, datalen; 1875df8bae1dSRodney W. Grimes int qfds; 1876df8bae1dSRodney W. Grimes 1877fc3fcacfSRobert Watson while (m0 != NULL) { 18782bc21ed9SDavid Malone for (m = m0; m; m = m->m_next) { 187912396bdcSDavid Malone if (m->m_type != MT_CONTROL) 1880df8bae1dSRodney W. Grimes continue; 18812bc21ed9SDavid Malone 18822bc21ed9SDavid Malone cm = mtod(m, struct cmsghdr *); 18832bc21ed9SDavid Malone clen = m->m_len; 18842bc21ed9SDavid Malone 18852bc21ed9SDavid Malone while (cm != NULL) { 18862bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) 18872bc21ed9SDavid Malone break; 18882bc21ed9SDavid Malone 18892bc21ed9SDavid Malone data = CMSG_DATA(cm); 18902bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len 18912bc21ed9SDavid Malone - (caddr_t)data; 18922bc21ed9SDavid Malone 18932bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET && 18942bc21ed9SDavid Malone cm->cmsg_type == SCM_RIGHTS) { 18952bc21ed9SDavid Malone qfds = datalen / sizeof (struct file *); 18962bc21ed9SDavid Malone rp = data; 1897df8bae1dSRodney W. Grimes for (i = 0; i < qfds; i++) 1898df8bae1dSRodney W. Grimes (*op)(*rp++); 18992bc21ed9SDavid Malone } 19002bc21ed9SDavid Malone 19012bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 19022bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 19032bc21ed9SDavid Malone cm = (struct cmsghdr *) 19042bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 19052bc21ed9SDavid Malone } else { 19062bc21ed9SDavid Malone clen = 0; 19072bc21ed9SDavid Malone cm = NULL; 19082bc21ed9SDavid Malone } 19092bc21ed9SDavid Malone } 1910df8bae1dSRodney W. Grimes } 1911df8bae1dSRodney W. Grimes m0 = m0->m_act; 1912df8bae1dSRodney W. Grimes } 1913df8bae1dSRodney W. Grimes } 1914df8bae1dSRodney W. Grimes 1915f708ef1bSPoul-Henning Kamp static void 1916892af6b9SRobert Watson unp_mark(struct file *fp) 1917df8bae1dSRodney W. Grimes { 1918426da3bcSAlfred Perlstein if (fp->f_gcflag & FMARK) 1919df8bae1dSRodney W. Grimes return; 1920df8bae1dSRodney W. Grimes unp_defer++; 1921426da3bcSAlfred Perlstein fp->f_gcflag |= (FMARK|FDEFER); 1922df8bae1dSRodney W. Grimes } 1923df8bae1dSRodney W. Grimes 1924f708ef1bSPoul-Henning Kamp static void 1925892af6b9SRobert Watson unp_discard(struct file *fp) 1926df8bae1dSRodney W. Grimes { 1927a0ec558aSRobert Watson UNP_LOCK(); 1928426da3bcSAlfred Perlstein FILE_LOCK(fp); 1929df8bae1dSRodney W. Grimes fp->f_msgcount--; 1930df8bae1dSRodney W. Grimes unp_rights--; 1931426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1932a0ec558aSRobert Watson UNP_UNLOCK(); 1933b40ce416SJulian Elischer (void) closef(fp, (struct thread *)NULL); 1934df8bae1dSRodney W. Grimes } 1935