19454b2d8SWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1982, 1986, 1989, 1991, 1993 3e1ac28e2SRobert Watson * The Regents of the University of California. 446a1d9bfSRobert Watson * Copyright (c) 2004-2007 Robert N. M. Watson 5e1ac28e2SRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 31748e0b0aSGarrett Wollman * From: @(#)uipc_usrreq.c 8.3 (Berkeley) 1/4/94 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 34f23929fbSRobert Watson /* 35f23929fbSRobert Watson * UNIX Domain (Local) Sockets 36f23929fbSRobert Watson * 37f23929fbSRobert Watson * This is an implementation of UNIX (local) domain sockets. Each socket has 38f23929fbSRobert Watson * an associated struct unpcb (UNIX protocol control block). Stream sockets 39f23929fbSRobert Watson * may be connected to 0 or 1 other socket. Datagram sockets may be 40f23929fbSRobert Watson * connected to 0, 1, or many other sockets. Sockets may be created and 41f23929fbSRobert Watson * connected in pairs (socketpair(2)), or bound/connected to using the file 42f23929fbSRobert Watson * system name space. For most purposes, only the receive socket buffer is 43f23929fbSRobert Watson * used, as sending on one socket delivers directly to the receive socket 44f23929fbSRobert Watson * buffer of a second socket. The implementation is substantially 45f23929fbSRobert Watson * complicated by the fact that "ancillary data", such as file descriptors or 46ca948c5eSRobert Watson * credentials, may be passed across UNIX domain sockets. The potential for 47ca948c5eSRobert Watson * passing UNIX domain sockets over other UNIX domain sockets requires the 48ca948c5eSRobert Watson * implementation of a simple garbage collector to find and tear down cycles 49ca948c5eSRobert Watson * of disconnected sockets. 50aea52f1bSRobert Watson * 51aea52f1bSRobert Watson * TODO: 52aea52f1bSRobert Watson * SEQPACKET, RDM 53aea52f1bSRobert Watson * rethink name space problems 54aea52f1bSRobert Watson * need a proper out-of-band 55aea52f1bSRobert Watson * lock pushdown 56f23929fbSRobert Watson */ 57f23929fbSRobert Watson 58677b542eSDavid E. O'Brien #include <sys/cdefs.h> 59677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 60677b542eSDavid E. O'Brien 61335654d7SRobert Watson #include "opt_mac.h" 62335654d7SRobert Watson 63df8bae1dSRodney W. Grimes #include <sys/param.h> 64fb919e4dSMark Murray #include <sys/domain.h> 65960ed29cSSeigo Tanimura #include <sys/fcntl.h> 66d826c479SBruce Evans #include <sys/malloc.h> /* XXX must be before <sys/file.h> */ 674f590175SPaul Saab #include <sys/eventhandler.h> 68639acc13SGarrett Wollman #include <sys/file.h> 69960ed29cSSeigo Tanimura #include <sys/filedesc.h> 70960ed29cSSeigo Tanimura #include <sys/jail.h> 71960ed29cSSeigo Tanimura #include <sys/kernel.h> 72960ed29cSSeigo Tanimura #include <sys/lock.h> 73639acc13SGarrett Wollman #include <sys/mbuf.h> 74033eb86eSJeff Roberson #include <sys/mount.h> 75960ed29cSSeigo Tanimura #include <sys/mutex.h> 76639acc13SGarrett Wollman #include <sys/namei.h> 77639acc13SGarrett Wollman #include <sys/proc.h> 78df8bae1dSRodney W. Grimes #include <sys/protosw.h> 79960ed29cSSeigo Tanimura #include <sys/resourcevar.h> 80df8bae1dSRodney W. Grimes #include <sys/socket.h> 81df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 82960ed29cSSeigo Tanimura #include <sys/signalvar.h> 83df8bae1dSRodney W. Grimes #include <sys/stat.h> 84960ed29cSSeigo Tanimura #include <sys/sx.h> 85639acc13SGarrett Wollman #include <sys/sysctl.h> 86960ed29cSSeigo Tanimura #include <sys/systm.h> 87a0ec558aSRobert Watson #include <sys/taskqueue.h> 88639acc13SGarrett Wollman #include <sys/un.h> 8998271db4SGarrett Wollman #include <sys/unpcb.h> 90639acc13SGarrett Wollman #include <sys/vnode.h> 91df8bae1dSRodney W. Grimes 92aed55708SRobert Watson #include <security/mac/mac_framework.h> 93aed55708SRobert Watson 949e9d298aSJeff Roberson #include <vm/uma.h> 9598271db4SGarrett Wollman 969e9d298aSJeff Roberson static uma_zone_t unp_zone; 9798271db4SGarrett Wollman static unp_gen_t unp_gencnt; 98aea52f1bSRobert Watson static u_int unp_count; /* Count of local sockets. */ 99aea52f1bSRobert Watson static ino_t unp_ino; /* Prototype for fake inode numbers. */ 100aea52f1bSRobert Watson static int unp_rights; /* File descriptors in flight. */ 101aea52f1bSRobert Watson static struct unp_head unp_shead; /* List of local stream sockets. */ 102aea52f1bSRobert Watson static struct unp_head unp_dhead; /* List of local datagram sockets. */ 10398271db4SGarrett Wollman 104aea52f1bSRobert Watson static const struct sockaddr sun_noname = { sizeof(sun_noname), AF_LOCAL }; 10598271db4SGarrett Wollman 106df8bae1dSRodney W. Grimes /* 107aea52f1bSRobert Watson * Garbage collection of cyclic file descriptor/socket references occurs 108aea52f1bSRobert Watson * asynchronously in a taskqueue context in order to avoid recursion and 109aea52f1bSRobert Watson * reentrance in the UNIX domain socket, file descriptor, and socket layer 110aea52f1bSRobert Watson * code. See unp_gc() for a full description. 111df8bae1dSRodney W. Grimes */ 112aea52f1bSRobert Watson static struct task unp_gc_task; 113f708ef1bSPoul-Henning Kamp 114ce5f32deSRobert Watson /* 1157e711c3aSRobert Watson * Both send and receive buffers are allocated PIPSIZ bytes of buffering for 1167e711c3aSRobert Watson * stream sockets, although the total for sender and receiver is actually 1177e711c3aSRobert Watson * only PIPSIZ. 1187e711c3aSRobert Watson * 1197e711c3aSRobert Watson * Datagram sockets really use the sendspace as the maximum datagram size, 1207e711c3aSRobert Watson * and don't really want to reserve the sendspace. Their recvspace should be 1217e711c3aSRobert Watson * large enough for at least one max-size datagram plus address. 1227e711c3aSRobert Watson */ 1237e711c3aSRobert Watson #ifndef PIPSIZ 1247e711c3aSRobert Watson #define PIPSIZ 8192 1257e711c3aSRobert Watson #endif 1267e711c3aSRobert Watson static u_long unpst_sendspace = PIPSIZ; 1277e711c3aSRobert Watson static u_long unpst_recvspace = PIPSIZ; 1287e711c3aSRobert Watson static u_long unpdg_sendspace = 2*1024; /* really max datagram size */ 1297e711c3aSRobert Watson static u_long unpdg_recvspace = 4*1024; 1307e711c3aSRobert Watson 131e4445a03SRobert Watson SYSCTL_NODE(_net, PF_LOCAL, local, CTLFLAG_RW, 0, "Local domain"); 132e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_STREAM, stream, CTLFLAG_RW, 0, "SOCK_STREAM"); 133e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_DGRAM, dgram, CTLFLAG_RW, 0, "SOCK_DGRAM"); 134e4445a03SRobert Watson 1357e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, sendspace, CTLFLAG_RW, 1367e711c3aSRobert Watson &unpst_sendspace, 0, ""); 1377e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, recvspace, CTLFLAG_RW, 1387e711c3aSRobert Watson &unpst_recvspace, 0, ""); 1397e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, maxdgram, CTLFLAG_RW, 1407e711c3aSRobert Watson &unpdg_sendspace, 0, ""); 1417e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, recvspace, CTLFLAG_RW, 1427e711c3aSRobert Watson &unpdg_recvspace, 0, ""); 1437e711c3aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, inflight, CTLFLAG_RD, &unp_rights, 0, ""); 1447e711c3aSRobert Watson 1457e711c3aSRobert Watson /* 146ce5f32deSRobert Watson * Currently, UNIX domain sockets are protected by a single subsystem lock, 147ce5f32deSRobert Watson * which covers global data structures and variables, the contents of each 148ce5f32deSRobert Watson * per-socket unpcb structure, and the so_pcb field in sockets attached to 149ce5f32deSRobert Watson * the UNIX domain. This provides for a moderate degree of paralellism, as 150ce5f32deSRobert Watson * receive operations on UNIX domain sockets do not need to acquire the 151ce5f32deSRobert Watson * subsystem lock. Finer grained locking to permit send() without acquiring 152ce5f32deSRobert Watson * a global lock would be a logical next step. 153ce5f32deSRobert Watson * 154ce5f32deSRobert Watson * The UNIX domain socket lock preceds all socket layer locks, including the 155ce5f32deSRobert Watson * socket lock and socket buffer lock, permitting UNIX domain socket code to 156ce5f32deSRobert Watson * call into socket support routines without releasing its locks. 157ce5f32deSRobert Watson * 158ce5f32deSRobert Watson * Some caution is required in areas where the UNIX domain socket code enters 159ce5f32deSRobert Watson * VFS in order to create or find rendezvous points. This results in 160ce5f32deSRobert Watson * dropping of the UNIX domain socket subsystem lock, acquisition of the 161ce5f32deSRobert Watson * Giant lock, and potential sleeping. This increases the chances of races, 162ce5f32deSRobert Watson * and exposes weaknesses in the socket->protocol API by offering poor 163ce5f32deSRobert Watson * failure modes. 164ce5f32deSRobert Watson */ 1650d9ce3a1SRobert Watson static struct mtx unp_mtx; 1660d9ce3a1SRobert Watson #define UNP_LOCK_INIT() \ 16746a1d9bfSRobert Watson mtx_init(&unp_mtx, "unp", NULL, MTX_DEF | MTX_RECURSE) 1680d9ce3a1SRobert Watson #define UNP_LOCK() mtx_lock(&unp_mtx) 1690d9ce3a1SRobert Watson #define UNP_UNLOCK() mtx_unlock(&unp_mtx) 1700d9ce3a1SRobert Watson #define UNP_LOCK_ASSERT() mtx_assert(&unp_mtx, MA_OWNED) 1714c5bc1caSRobert Watson #define UNP_UNLOCK_ASSERT() mtx_assert(&unp_mtx, MA_NOTOWNED) 1720d9ce3a1SRobert Watson 173aea52f1bSRobert Watson static int unp_connect(struct socket *, struct sockaddr *, 174aea52f1bSRobert Watson struct thread *); 1756a2989fdSMatthew N. Dodd static int unp_connect2(struct socket *so, struct socket *so2, int); 1764d77a549SAlfred Perlstein static void unp_disconnect(struct unpcb *); 1774d77a549SAlfred Perlstein static void unp_shutdown(struct unpcb *); 1784d77a549SAlfred Perlstein static void unp_drop(struct unpcb *, int); 179a0ec558aSRobert Watson static void unp_gc(__unused void *, int); 1804d77a549SAlfred Perlstein static void unp_scan(struct mbuf *, void (*)(struct file *)); 1814d77a549SAlfred Perlstein static void unp_mark(struct file *); 1824d77a549SAlfred Perlstein static void unp_discard(struct file *); 1834d77a549SAlfred Perlstein static void unp_freerights(struct file **, int); 1844d77a549SAlfred Perlstein static int unp_internalize(struct mbuf **, struct thread *); 185d374e81eSRobert Watson static int unp_listen(struct socket *, struct unpcb *, int, 186d374e81eSRobert Watson struct thread *); 187aea52f1bSRobert Watson struct mbuf *unp_addsockcred(struct thread *, struct mbuf *); 188f708ef1bSPoul-Henning Kamp 189e4445a03SRobert Watson /* 190e4445a03SRobert Watson * Definitions of protocols supported in the LOCAL domain. 191e4445a03SRobert Watson */ 192e4445a03SRobert Watson static struct domain localdomain; 193e4445a03SRobert Watson static struct protosw localsw[] = { 194e4445a03SRobert Watson { 195e4445a03SRobert Watson .pr_type = SOCK_STREAM, 196e4445a03SRobert Watson .pr_domain = &localdomain, 197e4445a03SRobert Watson .pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_RIGHTS, 198e4445a03SRobert Watson .pr_ctloutput = &uipc_ctloutput, 199e4445a03SRobert Watson .pr_usrreqs = &uipc_usrreqs 200e4445a03SRobert Watson }, 201e4445a03SRobert Watson { 202e4445a03SRobert Watson .pr_type = SOCK_DGRAM, 203e4445a03SRobert Watson .pr_domain = &localdomain, 204e4445a03SRobert Watson .pr_flags = PR_ATOMIC|PR_ADDR|PR_RIGHTS, 205e4445a03SRobert Watson .pr_usrreqs = &uipc_usrreqs 206e4445a03SRobert Watson }, 207e4445a03SRobert Watson }; 208e4445a03SRobert Watson 209e4445a03SRobert Watson static struct domain localdomain = { 210e4445a03SRobert Watson .dom_family = AF_LOCAL, 211e4445a03SRobert Watson .dom_name = "local", 212e4445a03SRobert Watson .dom_init = unp_init, 213e4445a03SRobert Watson .dom_externalize = unp_externalize, 214e4445a03SRobert Watson .dom_dispose = unp_dispose, 215e4445a03SRobert Watson .dom_protosw = localsw, 216e4445a03SRobert Watson .dom_protoswNPROTOSW = &localsw[sizeof(localsw)/sizeof(localsw[0])] 217e4445a03SRobert Watson }; 218e4445a03SRobert Watson DOMAIN_SET(local); 219e4445a03SRobert Watson 220ac45e92fSRobert Watson static void 221a29f300eSGarrett Wollman uipc_abort(struct socket *so) 222df8bae1dSRodney W. Grimes { 22340f2ac28SRobert Watson struct unpcb *unp; 224df8bae1dSRodney W. Grimes 22540f2ac28SRobert Watson unp = sotounpcb(so); 2264d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_abort: unp == NULL")); 2274d4b555eSRobert Watson UNP_LOCK(); 228a29f300eSGarrett Wollman unp_drop(unp, ECONNABORTED); 229a152f8a3SRobert Watson UNP_UNLOCK(); 230df8bae1dSRodney W. Grimes } 231df8bae1dSRodney W. Grimes 232a29f300eSGarrett Wollman static int 23357bf258eSGarrett Wollman uipc_accept(struct socket *so, struct sockaddr **nam) 234a29f300eSGarrett Wollman { 23540f2ac28SRobert Watson struct unpcb *unp; 2360d9ce3a1SRobert Watson const struct sockaddr *sa; 237df8bae1dSRodney W. Grimes 238df8bae1dSRodney W. Grimes /* 2391c381b19SRobert Watson * Pass back name of connected socket, if it was bound and we are 2401c381b19SRobert Watson * still connected (our peer may have closed already!). 241df8bae1dSRodney W. Grimes */ 2424d4b555eSRobert Watson unp = sotounpcb(so); 2434d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_accept: unp == NULL")); 2440d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 2450d9ce3a1SRobert Watson UNP_LOCK(); 2460d9ce3a1SRobert Watson if (unp->unp_conn != NULL && unp->unp_conn->unp_addr != NULL) 2470d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_conn->unp_addr; 2480d9ce3a1SRobert Watson else 2490d9ce3a1SRobert Watson sa = &sun_noname; 2500d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 2510d9ce3a1SRobert Watson UNP_UNLOCK(); 252e5aeaa0cSDag-Erling Smørgrav return (0); 253a29f300eSGarrett Wollman } 254df8bae1dSRodney W. Grimes 255a29f300eSGarrett Wollman static int 256b40ce416SJulian Elischer uipc_attach(struct socket *so, int proto, struct thread *td) 257a29f300eSGarrett Wollman { 2586d32873cSRobert Watson struct unpcb *unp; 2596d32873cSRobert Watson int error; 260df8bae1dSRodney W. Grimes 2616d32873cSRobert Watson KASSERT(so->so_pcb == NULL, ("uipc_attach: so_pcb != NULL")); 2626d32873cSRobert Watson if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) { 2636d32873cSRobert Watson switch (so->so_type) { 2646d32873cSRobert Watson case SOCK_STREAM: 2656d32873cSRobert Watson error = soreserve(so, unpst_sendspace, unpst_recvspace); 2666d32873cSRobert Watson break; 2676d32873cSRobert Watson 2686d32873cSRobert Watson case SOCK_DGRAM: 2696d32873cSRobert Watson error = soreserve(so, unpdg_sendspace, unpdg_recvspace); 2706d32873cSRobert Watson break; 2716d32873cSRobert Watson 2726d32873cSRobert Watson default: 2736d32873cSRobert Watson panic("unp_attach"); 2746d32873cSRobert Watson } 2756d32873cSRobert Watson if (error) 2766d32873cSRobert Watson return (error); 2776d32873cSRobert Watson } 27846a1d9bfSRobert Watson unp = uma_zalloc(unp_zone, M_NOWAIT | M_ZERO); 2796d32873cSRobert Watson if (unp == NULL) 2806d32873cSRobert Watson return (ENOBUFS); 2816d32873cSRobert Watson LIST_INIT(&unp->unp_refs); 2826d32873cSRobert Watson unp->unp_socket = so; 2836d32873cSRobert Watson so->so_pcb = unp; 2846d32873cSRobert Watson 2859ae328fcSJohn Baldwin unp->unp_refcount = 1; 2866d32873cSRobert Watson UNP_LOCK(); 2876d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 2886d32873cSRobert Watson unp_count++; 289b7e2f3ecSRobert Watson LIST_INSERT_HEAD(so->so_type == SOCK_DGRAM ? &unp_dhead : &unp_shead, 290b7e2f3ecSRobert Watson unp, unp_link); 2916d32873cSRobert Watson UNP_UNLOCK(); 2926d32873cSRobert Watson 2936d32873cSRobert Watson return (0); 294a29f300eSGarrett Wollman } 295a29f300eSGarrett Wollman 296a29f300eSGarrett Wollman static int 297b40ce416SJulian Elischer uipc_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 298a29f300eSGarrett Wollman { 299dd47f5caSRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 300dd47f5caSRobert Watson struct vattr vattr; 301dd47f5caSRobert Watson int error, namelen; 302dd47f5caSRobert Watson struct nameidata nd; 30340f2ac28SRobert Watson struct unpcb *unp; 304dd47f5caSRobert Watson struct vnode *vp; 305dd47f5caSRobert Watson struct mount *mp; 306dd47f5caSRobert Watson char *buf; 307a29f300eSGarrett Wollman 30840f2ac28SRobert Watson unp = sotounpcb(so); 3094d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_bind: unp == NULL")); 3104f1f0ef5SRobert Watson 3114f1f0ef5SRobert Watson namelen = soun->sun_len - offsetof(struct sockaddr_un, sun_path); 3124f1f0ef5SRobert Watson if (namelen <= 0) 3134f1f0ef5SRobert Watson return (EINVAL); 314dd47f5caSRobert Watson 315dd47f5caSRobert Watson /* 3164f1f0ef5SRobert Watson * We don't allow simultaneous bind() calls on a single UNIX domain 3174f1f0ef5SRobert Watson * socket, so flag in-progress operations, and return an error if an 3184f1f0ef5SRobert Watson * operation is already in progress. 3194f1f0ef5SRobert Watson * 3204f1f0ef5SRobert Watson * Historically, we have not allowed a socket to be rebound, so this 3214f1f0ef5SRobert Watson * also returns an error. Not allowing re-binding certainly 3224f1f0ef5SRobert Watson * simplifies the implementation and avoids a great many possible 3234f1f0ef5SRobert Watson * failure modes. 324dd47f5caSRobert Watson */ 3254f1f0ef5SRobert Watson UNP_LOCK(); 326dd47f5caSRobert Watson if (unp->unp_vnode != NULL) { 32740f2ac28SRobert Watson UNP_UNLOCK(); 328dd47f5caSRobert Watson return (EINVAL); 329dd47f5caSRobert Watson } 3304f1f0ef5SRobert Watson if (unp->unp_flags & UNP_BINDING) { 331dd47f5caSRobert Watson UNP_UNLOCK(); 3324f1f0ef5SRobert Watson return (EALREADY); 333dd47f5caSRobert Watson } 3344f1f0ef5SRobert Watson unp->unp_flags |= UNP_BINDING; 335dd47f5caSRobert Watson UNP_UNLOCK(); 336dd47f5caSRobert Watson 337dd47f5caSRobert Watson buf = malloc(namelen + 1, M_TEMP, M_WAITOK); 338dd47f5caSRobert Watson strlcpy(buf, soun->sun_path, namelen + 1); 339dd47f5caSRobert Watson 340dd47f5caSRobert Watson mtx_lock(&Giant); 341dd47f5caSRobert Watson restart: 342dd47f5caSRobert Watson mtx_assert(&Giant, MA_OWNED); 343dd47f5caSRobert Watson NDINIT(&nd, CREATE, NOFOLLOW | LOCKPARENT | SAVENAME, UIO_SYSSPACE, 344dd47f5caSRobert Watson buf, td); 345dd47f5caSRobert Watson /* SHOULD BE ABLE TO ADOPT EXISTING AND wakeup() ALA FIFO's */ 346dd47f5caSRobert Watson error = namei(&nd); 347dd47f5caSRobert Watson if (error) 3484f1f0ef5SRobert Watson goto error; 349dd47f5caSRobert Watson vp = nd.ni_vp; 350dd47f5caSRobert Watson if (vp != NULL || vn_start_write(nd.ni_dvp, &mp, V_NOWAIT) != 0) { 351dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 352dd47f5caSRobert Watson if (nd.ni_dvp == vp) 353dd47f5caSRobert Watson vrele(nd.ni_dvp); 354dd47f5caSRobert Watson else 355dd47f5caSRobert Watson vput(nd.ni_dvp); 356dd47f5caSRobert Watson if (vp != NULL) { 357dd47f5caSRobert Watson vrele(vp); 358dd47f5caSRobert Watson error = EADDRINUSE; 3594f1f0ef5SRobert Watson goto error; 360dd47f5caSRobert Watson } 361dd47f5caSRobert Watson error = vn_start_write(NULL, &mp, V_XSLEEP | PCATCH); 362dd47f5caSRobert Watson if (error) 3634f1f0ef5SRobert Watson goto error; 364dd47f5caSRobert Watson goto restart; 365dd47f5caSRobert Watson } 366dd47f5caSRobert Watson VATTR_NULL(&vattr); 367dd47f5caSRobert Watson vattr.va_type = VSOCK; 368dd47f5caSRobert Watson vattr.va_mode = (ACCESSPERMS & ~td->td_proc->p_fd->fd_cmask); 369dd47f5caSRobert Watson #ifdef MAC 370dd47f5caSRobert Watson error = mac_check_vnode_create(td->td_ucred, nd.ni_dvp, &nd.ni_cnd, 371dd47f5caSRobert Watson &vattr); 372dd47f5caSRobert Watson #endif 373dd47f5caSRobert Watson if (error == 0) { 374dd47f5caSRobert Watson VOP_LEASE(nd.ni_dvp, td, td->td_ucred, LEASE_WRITE); 375dd47f5caSRobert Watson error = VOP_CREATE(nd.ni_dvp, &nd.ni_vp, &nd.ni_cnd, &vattr); 376dd47f5caSRobert Watson } 377dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 378dd47f5caSRobert Watson vput(nd.ni_dvp); 379dd47f5caSRobert Watson if (error) { 380dd47f5caSRobert Watson vn_finished_write(mp); 3814f1f0ef5SRobert Watson goto error; 382dd47f5caSRobert Watson } 383dd47f5caSRobert Watson vp = nd.ni_vp; 3844f1f0ef5SRobert Watson ASSERT_VOP_LOCKED(vp, "uipc_bind"); 385dd47f5caSRobert Watson soun = (struct sockaddr_un *)sodupsockaddr(nam, M_WAITOK); 386dd47f5caSRobert Watson UNP_LOCK(); 387dd47f5caSRobert Watson vp->v_socket = unp->unp_socket; 388dd47f5caSRobert Watson unp->unp_vnode = vp; 389dd47f5caSRobert Watson unp->unp_addr = soun; 3904f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 391dd47f5caSRobert Watson UNP_UNLOCK(); 392dd47f5caSRobert Watson VOP_UNLOCK(vp, 0, td); 393dd47f5caSRobert Watson vn_finished_write(mp); 3944f1f0ef5SRobert Watson mtx_unlock(&Giant); 3954f1f0ef5SRobert Watson free(buf, M_TEMP); 3964f1f0ef5SRobert Watson return (0); 3974f1f0ef5SRobert Watson error: 3984f1f0ef5SRobert Watson UNP_LOCK(); 3994f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 4004f1f0ef5SRobert Watson UNP_UNLOCK(); 401dd47f5caSRobert Watson mtx_unlock(&Giant); 402dd47f5caSRobert Watson free(buf, M_TEMP); 40340f2ac28SRobert Watson return (error); 404a29f300eSGarrett Wollman } 405a29f300eSGarrett Wollman 406a29f300eSGarrett Wollman static int 407b40ce416SJulian Elischer uipc_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 408a29f300eSGarrett Wollman { 4090d9ce3a1SRobert Watson int error; 410a29f300eSGarrett Wollman 411fd179ee9SRobert Watson KASSERT(td == curthread, ("uipc_connect: td != curthread")); 4124d4b555eSRobert Watson UNP_LOCK(); 413fd179ee9SRobert Watson error = unp_connect(so, nam, td); 4140d9ce3a1SRobert Watson UNP_UNLOCK(); 4150d9ce3a1SRobert Watson return (error); 416a29f300eSGarrett Wollman } 417a29f300eSGarrett Wollman 418a152f8a3SRobert Watson /* 419a152f8a3SRobert Watson * XXXRW: Should also unbind? 420a152f8a3SRobert Watson */ 421a152f8a3SRobert Watson static void 422a152f8a3SRobert Watson uipc_close(struct socket *so) 423a152f8a3SRobert Watson { 424a152f8a3SRobert Watson struct unpcb *unp; 425a152f8a3SRobert Watson 426a152f8a3SRobert Watson unp = sotounpcb(so); 427a152f8a3SRobert Watson KASSERT(unp != NULL, ("uipc_close: unp == NULL")); 428a152f8a3SRobert Watson UNP_LOCK(); 429a152f8a3SRobert Watson unp_disconnect(unp); 430a152f8a3SRobert Watson UNP_UNLOCK(); 431a152f8a3SRobert Watson } 432a152f8a3SRobert Watson 433db48c0d2SRobert Watson int 434a29f300eSGarrett Wollman uipc_connect2(struct socket *so1, struct socket *so2) 435a29f300eSGarrett Wollman { 43640f2ac28SRobert Watson struct unpcb *unp; 4370d9ce3a1SRobert Watson int error; 438a29f300eSGarrett Wollman 43940f2ac28SRobert Watson unp = sotounpcb(so1); 4404d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_connect2: unp == NULL")); 4414d4b555eSRobert Watson UNP_LOCK(); 4426a2989fdSMatthew N. Dodd error = unp_connect2(so1, so2, PRU_CONNECT2); 4430d9ce3a1SRobert Watson UNP_UNLOCK(); 4440d9ce3a1SRobert Watson return (error); 445a29f300eSGarrett Wollman } 446a29f300eSGarrett Wollman 447a29f300eSGarrett Wollman /* control is EOPNOTSUPP */ 448a29f300eSGarrett Wollman 449bc725eafSRobert Watson static void 450a29f300eSGarrett Wollman uipc_detach(struct socket *so) 451a29f300eSGarrett Wollman { 4529ae328fcSJohn Baldwin struct sockaddr_un *saved_unp_addr; 45340f2ac28SRobert Watson struct unpcb *unp; 4546d32873cSRobert Watson struct vnode *vp; 4559ae328fcSJohn Baldwin int freeunp, local_unp_rights; 456a29f300eSGarrett Wollman 45740f2ac28SRobert Watson unp = sotounpcb(so); 4584d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_detach: unp == NULL")); 4594d4b555eSRobert Watson UNP_LOCK(); 4606d32873cSRobert Watson LIST_REMOVE(unp, unp_link); 4616d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 4626d32873cSRobert Watson --unp_count; 4636d32873cSRobert Watson if ((vp = unp->unp_vnode) != NULL) { 4646d32873cSRobert Watson /* 4656d32873cSRobert Watson * XXXRW: should v_socket be frobbed only while holding 4666d32873cSRobert Watson * Giant? 4676d32873cSRobert Watson */ 4686d32873cSRobert Watson unp->unp_vnode->v_socket = NULL; 4696d32873cSRobert Watson unp->unp_vnode = NULL; 4706d32873cSRobert Watson } 4716d32873cSRobert Watson if (unp->unp_conn != NULL) 4726d32873cSRobert Watson unp_disconnect(unp); 4736d32873cSRobert Watson while (!LIST_EMPTY(&unp->unp_refs)) { 4746d32873cSRobert Watson struct unpcb *ref = LIST_FIRST(&unp->unp_refs); 4756d32873cSRobert Watson unp_drop(ref, ECONNRESET); 4766d32873cSRobert Watson } 4776d32873cSRobert Watson unp->unp_socket->so_pcb = NULL; 4786d32873cSRobert Watson local_unp_rights = unp_rights; 4799ae328fcSJohn Baldwin saved_unp_addr = unp->unp_addr; 4809ae328fcSJohn Baldwin unp->unp_addr = NULL; 4819ae328fcSJohn Baldwin unp->unp_refcount--; 4829ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 4836d32873cSRobert Watson UNP_UNLOCK(); 4849ae328fcSJohn Baldwin if (saved_unp_addr != NULL) 4859ae328fcSJohn Baldwin FREE(saved_unp_addr, M_SONAME); 4869ae328fcSJohn Baldwin if (freeunp) 4876d32873cSRobert Watson uma_zfree(unp_zone, unp); 4886d32873cSRobert Watson if (vp) { 4896d32873cSRobert Watson int vfslocked; 4906d32873cSRobert Watson 4916d32873cSRobert Watson vfslocked = VFS_LOCK_GIANT(vp->v_mount); 4926d32873cSRobert Watson vrele(vp); 4936d32873cSRobert Watson VFS_UNLOCK_GIANT(vfslocked); 4946d32873cSRobert Watson } 4956d32873cSRobert Watson if (local_unp_rights) 4966d32873cSRobert Watson taskqueue_enqueue(taskqueue_thread, &unp_gc_task); 497a29f300eSGarrett Wollman } 498a29f300eSGarrett Wollman 499a29f300eSGarrett Wollman static int 500a29f300eSGarrett Wollman uipc_disconnect(struct socket *so) 501a29f300eSGarrett Wollman { 50240f2ac28SRobert Watson struct unpcb *unp; 503a29f300eSGarrett Wollman 50440f2ac28SRobert Watson unp = sotounpcb(so); 5054d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_disconnect: unp == NULL")); 5064d4b555eSRobert Watson UNP_LOCK(); 507a29f300eSGarrett Wollman unp_disconnect(unp); 5080d9ce3a1SRobert Watson UNP_UNLOCK(); 509e5aeaa0cSDag-Erling Smørgrav return (0); 510a29f300eSGarrett Wollman } 511a29f300eSGarrett Wollman 512a29f300eSGarrett Wollman static int 513d374e81eSRobert Watson uipc_listen(struct socket *so, int backlog, struct thread *td) 514a29f300eSGarrett Wollman { 51540f2ac28SRobert Watson struct unpcb *unp; 5160d9ce3a1SRobert Watson int error; 517a29f300eSGarrett Wollman 51840f2ac28SRobert Watson unp = sotounpcb(so); 5194d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_listen: unp == NULL")); 5204d4b555eSRobert Watson UNP_LOCK(); 5214d4b555eSRobert Watson if (unp->unp_vnode == NULL) { 52240f2ac28SRobert Watson UNP_UNLOCK(); 52340f2ac28SRobert Watson return (EINVAL); 52440f2ac28SRobert Watson } 525d374e81eSRobert Watson error = unp_listen(so, unp, backlog, td); 5260d9ce3a1SRobert Watson UNP_UNLOCK(); 5270d9ce3a1SRobert Watson return (error); 528a29f300eSGarrett Wollman } 529a29f300eSGarrett Wollman 530a29f300eSGarrett Wollman static int 53157bf258eSGarrett Wollman uipc_peeraddr(struct socket *so, struct sockaddr **nam) 532a29f300eSGarrett Wollman { 53340f2ac28SRobert Watson struct unpcb *unp; 5340d9ce3a1SRobert Watson const struct sockaddr *sa; 535a29f300eSGarrett Wollman 5364d4b555eSRobert Watson unp = sotounpcb(so); 5374d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_peeraddr: unp == NULL")); 5380d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 5390d9ce3a1SRobert Watson UNP_LOCK(); 540fc3fcacfSRobert Watson if (unp->unp_conn != NULL && unp->unp_conn->unp_addr!= NULL) 5410d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_conn->unp_addr; 542bdc5f6a3SHajimu UMEMOTO else { 543bdc5f6a3SHajimu UMEMOTO /* 544bdc5f6a3SHajimu UMEMOTO * XXX: It seems that this test always fails even when 545bdc5f6a3SHajimu UMEMOTO * connection is established. So, this else clause is 546bdc5f6a3SHajimu UMEMOTO * added as workaround to return PF_LOCAL sockaddr. 547bdc5f6a3SHajimu UMEMOTO */ 5480d9ce3a1SRobert Watson sa = &sun_noname; 549bdc5f6a3SHajimu UMEMOTO } 5500d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 5510d9ce3a1SRobert Watson UNP_UNLOCK(); 552e5aeaa0cSDag-Erling Smørgrav return (0); 553a29f300eSGarrett Wollman } 554a29f300eSGarrett Wollman 555a29f300eSGarrett Wollman static int 556a29f300eSGarrett Wollman uipc_rcvd(struct socket *so, int flags) 557a29f300eSGarrett Wollman { 55840f2ac28SRobert Watson struct unpcb *unp; 559a29f300eSGarrett Wollman struct socket *so2; 560337cc6b6SRobert Watson u_int mbcnt, sbcc; 5616aef685fSBrian Feldman u_long newhiwat; 562a29f300eSGarrett Wollman 56340f2ac28SRobert Watson unp = sotounpcb(so); 5644d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_rcvd: unp == NULL")); 565df8bae1dSRodney W. Grimes switch (so->so_type) { 566df8bae1dSRodney W. Grimes case SOCK_DGRAM: 567a29f300eSGarrett Wollman panic("uipc_rcvd DGRAM?"); 568df8bae1dSRodney W. Grimes /*NOTREACHED*/ 569df8bae1dSRodney W. Grimes 570df8bae1dSRodney W. Grimes case SOCK_STREAM: 571df8bae1dSRodney W. Grimes /* 5721c381b19SRobert Watson * Adjust backpressure on sender and wakeup any waiting to 5731c381b19SRobert Watson * write. 574df8bae1dSRodney W. Grimes */ 575337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 576337cc6b6SRobert Watson mbcnt = so->so_rcv.sb_mbcnt; 577337cc6b6SRobert Watson sbcc = so->so_rcv.sb_cc; 578337cc6b6SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 579337cc6b6SRobert Watson UNP_LOCK(); 580337cc6b6SRobert Watson if (unp->unp_conn == NULL) { 581337cc6b6SRobert Watson UNP_UNLOCK(); 582337cc6b6SRobert Watson break; 583337cc6b6SRobert Watson } 584337cc6b6SRobert Watson so2 = unp->unp_conn->unp_socket; 585337cc6b6SRobert Watson SOCKBUF_LOCK(&so2->so_snd); 586337cc6b6SRobert Watson so2->so_snd.sb_mbmax += unp->unp_mbcnt - mbcnt; 587337cc6b6SRobert Watson newhiwat = so2->so_snd.sb_hiwat + unp->unp_cc - sbcc; 588f535380cSDon Lewis (void)chgsbsize(so2->so_cred->cr_uidinfo, &so2->so_snd.sb_hiwat, 5896aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 5901e4d7da7SRobert Watson sowwakeup_locked(so2); 591337cc6b6SRobert Watson unp->unp_mbcnt = mbcnt; 592337cc6b6SRobert Watson unp->unp_cc = sbcc; 593337cc6b6SRobert Watson UNP_UNLOCK(); 594df8bae1dSRodney W. Grimes break; 595df8bae1dSRodney W. Grimes 596df8bae1dSRodney W. Grimes default: 597a29f300eSGarrett Wollman panic("uipc_rcvd unknown socktype"); 598df8bae1dSRodney W. Grimes } 599e5aeaa0cSDag-Erling Smørgrav return (0); 600a29f300eSGarrett Wollman } 601df8bae1dSRodney W. Grimes 602a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */ 603a29f300eSGarrett Wollman 604a29f300eSGarrett Wollman static int 60557bf258eSGarrett Wollman uipc_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam, 606b40ce416SJulian Elischer struct mbuf *control, struct thread *td) 607a29f300eSGarrett Wollman { 608f3f49bbbSRobert Watson struct unpcb *unp, *unp2; 609a29f300eSGarrett Wollman struct socket *so2; 610337cc6b6SRobert Watson u_int mbcnt, sbcc; 6116aef685fSBrian Feldman u_long newhiwat; 612f3f49bbbSRobert Watson int error = 0; 613a29f300eSGarrett Wollman 61440f2ac28SRobert Watson unp = sotounpcb(so); 6154d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_send: unp == NULL")); 616a29f300eSGarrett Wollman if (flags & PRUS_OOB) { 617a29f300eSGarrett Wollman error = EOPNOTSUPP; 618a29f300eSGarrett Wollman goto release; 619a29f300eSGarrett Wollman } 620a29f300eSGarrett Wollman 621fc3fcacfSRobert Watson if (control != NULL && (error = unp_internalize(&control, td))) 622a29f300eSGarrett Wollman goto release; 623df8bae1dSRodney W. Grimes 6240d9ce3a1SRobert Watson UNP_LOCK(); 625a29f300eSGarrett Wollman switch (so->so_type) { 626a29f300eSGarrett Wollman case SOCK_DGRAM: 627a29f300eSGarrett Wollman { 628e7dd9a10SRobert Watson const struct sockaddr *from; 629df8bae1dSRodney W. Grimes 630fc3fcacfSRobert Watson if (nam != NULL) { 631fc3fcacfSRobert Watson if (unp->unp_conn != NULL) { 632df8bae1dSRodney W. Grimes error = EISCONN; 633df8bae1dSRodney W. Grimes break; 634df8bae1dSRodney W. Grimes } 635b40ce416SJulian Elischer error = unp_connect(so, nam, td); 636df8bae1dSRodney W. Grimes if (error) 637df8bae1dSRodney W. Grimes break; 638df8bae1dSRodney W. Grimes } 639b5ff0914SRobert Watson /* 640b5ff0914SRobert Watson * Because connect() and send() are non-atomic in a sendto() 641b5ff0914SRobert Watson * with a target address, it's possible that the socket will 642b5ff0914SRobert Watson * have disconnected before the send() can run. In that case 643b5ff0914SRobert Watson * return the slightly counter-intuitive but otherwise 644b5ff0914SRobert Watson * correct error that the socket is not connected. 645b5ff0914SRobert Watson */ 646f3f49bbbSRobert Watson unp2 = unp->unp_conn; 647b5ff0914SRobert Watson if (unp2 == NULL) { 648b5ff0914SRobert Watson error = ENOTCONN; 649b5ff0914SRobert Watson break; 650b5ff0914SRobert Watson } 651f3f49bbbSRobert Watson so2 = unp2->unp_socket; 652fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 65357bf258eSGarrett Wollman from = (struct sockaddr *)unp->unp_addr; 654df8bae1dSRodney W. Grimes else 655df8bae1dSRodney W. Grimes from = &sun_noname; 656f3f49bbbSRobert Watson if (unp2->unp_flags & UNP_WANTCRED) 6576a2989fdSMatthew N. Dodd control = unp_addsockcred(td, control); 658a34b7046SRobert Watson SOCKBUF_LOCK(&so2->so_rcv); 659a34b7046SRobert Watson if (sbappendaddr_locked(&so2->so_rcv, from, m, control)) { 6601e4d7da7SRobert Watson sorwakeup_locked(so2); 661fc3fcacfSRobert Watson m = NULL; 662fc3fcacfSRobert Watson control = NULL; 663e5aeaa0cSDag-Erling Smørgrav } else { 664a34b7046SRobert Watson SOCKBUF_UNLOCK(&so2->so_rcv); 665df8bae1dSRodney W. Grimes error = ENOBUFS; 666e5aeaa0cSDag-Erling Smørgrav } 667fc3fcacfSRobert Watson if (nam != NULL) 668df8bae1dSRodney W. Grimes unp_disconnect(unp); 669df8bae1dSRodney W. Grimes break; 670df8bae1dSRodney W. Grimes } 671df8bae1dSRodney W. Grimes 672df8bae1dSRodney W. Grimes case SOCK_STREAM: 6736b8fda4dSGarrett Wollman /* 6741c381b19SRobert Watson * Connect if not connected yet. 6751c381b19SRobert Watson * 6761c381b19SRobert Watson * Note: A better implementation would complain if not equal 6771c381b19SRobert Watson * to the peer's address. 6786b8fda4dSGarrett Wollman */ 679402cc72dSDavid Greenman if ((so->so_state & SS_ISCONNECTED) == 0) { 680fc3fcacfSRobert Watson if (nam != NULL) { 681b40ce416SJulian Elischer error = unp_connect(so, nam, td); 682402cc72dSDavid Greenman if (error) 6836b8fda4dSGarrett Wollman break; /* XXX */ 684402cc72dSDavid Greenman } else { 685402cc72dSDavid Greenman error = ENOTCONN; 686402cc72dSDavid Greenman break; 687402cc72dSDavid Greenman } 688402cc72dSDavid Greenman } 689402cc72dSDavid Greenman 690337cc6b6SRobert Watson /* Lockless read. */ 691c0b99ffaSRobert Watson if (so->so_snd.sb_state & SBS_CANTSENDMORE) { 692df8bae1dSRodney W. Grimes error = EPIPE; 693df8bae1dSRodney W. Grimes break; 694df8bae1dSRodney W. Grimes } 695b5ff0914SRobert Watson /* 696b5ff0914SRobert Watson * Because connect() and send() are non-atomic in a sendto() 697b5ff0914SRobert Watson * with a target address, it's possible that the socket will 698b5ff0914SRobert Watson * have disconnected before the send() can run. In that case 699b5ff0914SRobert Watson * return the slightly counter-intuitive but otherwise 700b5ff0914SRobert Watson * correct error that the socket is not connected. 701b5ff0914SRobert Watson */ 702f3f49bbbSRobert Watson unp2 = unp->unp_conn; 703b5ff0914SRobert Watson if (unp2 == NULL) { 704b5ff0914SRobert Watson error = ENOTCONN; 705b5ff0914SRobert Watson break; 706b5ff0914SRobert Watson } 707f3f49bbbSRobert Watson so2 = unp2->unp_socket; 708a34b7046SRobert Watson SOCKBUF_LOCK(&so2->so_rcv); 709f3f49bbbSRobert Watson if (unp2->unp_flags & UNP_WANTCRED) { 7106a2989fdSMatthew N. Dodd /* 7116a2989fdSMatthew N. Dodd * Credentials are passed only once on 7126a2989fdSMatthew N. Dodd * SOCK_STREAM. 7136a2989fdSMatthew N. Dodd */ 714f3f49bbbSRobert Watson unp2->unp_flags &= ~UNP_WANTCRED; 7156a2989fdSMatthew N. Dodd control = unp_addsockcred(td, control); 7166a2989fdSMatthew N. Dodd } 717df8bae1dSRodney W. Grimes /* 7181c381b19SRobert Watson * Send to paired receive port, and then reduce send buffer 7191c381b19SRobert Watson * hiwater marks to maintain backpressure. Wake up readers. 720df8bae1dSRodney W. Grimes */ 721fc3fcacfSRobert Watson if (control != NULL) { 722a34b7046SRobert Watson if (sbappendcontrol_locked(&so2->so_rcv, m, control)) 723fc3fcacfSRobert Watson control = NULL; 724e5aeaa0cSDag-Erling Smørgrav } else { 725a34b7046SRobert Watson sbappend_locked(&so2->so_rcv, m); 726e5aeaa0cSDag-Erling Smørgrav } 727f3f49bbbSRobert Watson mbcnt = so2->so_rcv.sb_mbcnt - unp2->unp_mbcnt; 728f3f49bbbSRobert Watson unp2->unp_mbcnt = so2->so_rcv.sb_mbcnt; 729337cc6b6SRobert Watson sbcc = so2->so_rcv.sb_cc; 730337cc6b6SRobert Watson sorwakeup_locked(so2); 731337cc6b6SRobert Watson 732337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_snd); 733f3f49bbbSRobert Watson newhiwat = so->so_snd.sb_hiwat - (sbcc - unp2->unp_cc); 734f535380cSDon Lewis (void)chgsbsize(so->so_cred->cr_uidinfo, &so->so_snd.sb_hiwat, 7356aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 736337cc6b6SRobert Watson so->so_snd.sb_mbmax -= mbcnt; 7377abe2ac2SAlan Cox SOCKBUF_UNLOCK(&so->so_snd); 738337cc6b6SRobert Watson 739f3f49bbbSRobert Watson unp2->unp_cc = sbcc; 740fc3fcacfSRobert Watson m = NULL; 741df8bae1dSRodney W. Grimes break; 742df8bae1dSRodney W. Grimes 743df8bae1dSRodney W. Grimes default: 744a29f300eSGarrett Wollman panic("uipc_send unknown socktype"); 745df8bae1dSRodney W. Grimes } 746a29f300eSGarrett Wollman 7476b8fda4dSGarrett Wollman /* 7486b8fda4dSGarrett Wollman * SEND_EOF is equivalent to a SEND followed by 7496b8fda4dSGarrett Wollman * a SHUTDOWN. 7506b8fda4dSGarrett Wollman */ 751a29f300eSGarrett Wollman if (flags & PRUS_EOF) { 7526b8fda4dSGarrett Wollman socantsendmore(so); 7536b8fda4dSGarrett Wollman unp_shutdown(unp); 7546b8fda4dSGarrett Wollman } 7550d9ce3a1SRobert Watson UNP_UNLOCK(); 756df8bae1dSRodney W. Grimes 757fc3fcacfSRobert Watson if (control != NULL && error != 0) 758bd508d39SDon Lewis unp_dispose(control); 759bd508d39SDon Lewis 760a29f300eSGarrett Wollman release: 761fc3fcacfSRobert Watson if (control != NULL) 762a29f300eSGarrett Wollman m_freem(control); 763fc3fcacfSRobert Watson if (m != NULL) 764a29f300eSGarrett Wollman m_freem(m); 765e5aeaa0cSDag-Erling Smørgrav return (error); 766a29f300eSGarrett Wollman } 767df8bae1dSRodney W. Grimes 768a29f300eSGarrett Wollman static int 769a29f300eSGarrett Wollman uipc_sense(struct socket *so, struct stat *sb) 770a29f300eSGarrett Wollman { 77140f2ac28SRobert Watson struct unpcb *unp; 772a29f300eSGarrett Wollman struct socket *so2; 773a29f300eSGarrett Wollman 77440f2ac28SRobert Watson unp = sotounpcb(so); 7754d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sense: unp == NULL")); 7764d4b555eSRobert Watson UNP_LOCK(); 777a29f300eSGarrett Wollman sb->st_blksize = so->so_snd.sb_hiwat; 778fc3fcacfSRobert Watson if (so->so_type == SOCK_STREAM && unp->unp_conn != NULL) { 779df8bae1dSRodney W. Grimes so2 = unp->unp_conn->unp_socket; 780a29f300eSGarrett Wollman sb->st_blksize += so2->so_rcv.sb_cc; 781df8bae1dSRodney W. Grimes } 782f3732fd1SPoul-Henning Kamp sb->st_dev = NODEV; 783df8bae1dSRodney W. Grimes if (unp->unp_ino == 0) 7846f782c46SJeffrey Hsu unp->unp_ino = (++unp_ino == 0) ? ++unp_ino : unp_ino; 785a29f300eSGarrett Wollman sb->st_ino = unp->unp_ino; 7860d9ce3a1SRobert Watson UNP_UNLOCK(); 787df8bae1dSRodney W. Grimes return (0); 788a29f300eSGarrett Wollman } 789df8bae1dSRodney W. Grimes 790a29f300eSGarrett Wollman static int 791a29f300eSGarrett Wollman uipc_shutdown(struct socket *so) 792a29f300eSGarrett Wollman { 79340f2ac28SRobert Watson struct unpcb *unp; 794df8bae1dSRodney W. Grimes 79540f2ac28SRobert Watson unp = sotounpcb(so); 7964d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_shutdown: unp == NULL")); 7974d4b555eSRobert Watson UNP_LOCK(); 798a29f300eSGarrett Wollman socantsendmore(so); 799a29f300eSGarrett Wollman unp_shutdown(unp); 8000d9ce3a1SRobert Watson UNP_UNLOCK(); 801e5aeaa0cSDag-Erling Smørgrav return (0); 802a29f300eSGarrett Wollman } 803df8bae1dSRodney W. Grimes 804a29f300eSGarrett Wollman static int 80557bf258eSGarrett Wollman uipc_sockaddr(struct socket *so, struct sockaddr **nam) 806a29f300eSGarrett Wollman { 80740f2ac28SRobert Watson struct unpcb *unp; 8080d9ce3a1SRobert Watson const struct sockaddr *sa; 809a29f300eSGarrett Wollman 8104d4b555eSRobert Watson unp = sotounpcb(so); 8114d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sockaddr: unp == NULL")); 8120d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 8130d9ce3a1SRobert Watson UNP_LOCK(); 814fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 8150d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_addr; 81683f3198bSThomas Moestl else 8170d9ce3a1SRobert Watson sa = &sun_noname; 8180d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 8190d9ce3a1SRobert Watson UNP_UNLOCK(); 820e5aeaa0cSDag-Erling Smørgrav return (0); 821df8bae1dSRodney W. Grimes } 822a29f300eSGarrett Wollman 823a29f300eSGarrett Wollman struct pr_usrreqs uipc_usrreqs = { 824756d52a1SPoul-Henning Kamp .pru_abort = uipc_abort, 825756d52a1SPoul-Henning Kamp .pru_accept = uipc_accept, 826756d52a1SPoul-Henning Kamp .pru_attach = uipc_attach, 827756d52a1SPoul-Henning Kamp .pru_bind = uipc_bind, 828756d52a1SPoul-Henning Kamp .pru_connect = uipc_connect, 829756d52a1SPoul-Henning Kamp .pru_connect2 = uipc_connect2, 830756d52a1SPoul-Henning Kamp .pru_detach = uipc_detach, 831756d52a1SPoul-Henning Kamp .pru_disconnect = uipc_disconnect, 832756d52a1SPoul-Henning Kamp .pru_listen = uipc_listen, 833756d52a1SPoul-Henning Kamp .pru_peeraddr = uipc_peeraddr, 834756d52a1SPoul-Henning Kamp .pru_rcvd = uipc_rcvd, 835756d52a1SPoul-Henning Kamp .pru_send = uipc_send, 836756d52a1SPoul-Henning Kamp .pru_sense = uipc_sense, 837756d52a1SPoul-Henning Kamp .pru_shutdown = uipc_shutdown, 838756d52a1SPoul-Henning Kamp .pru_sockaddr = uipc_sockaddr, 839a152f8a3SRobert Watson .pru_close = uipc_close, 840a29f300eSGarrett Wollman }; 841df8bae1dSRodney W. Grimes 8420c1bb4fbSDima Dorfman int 843892af6b9SRobert Watson uipc_ctloutput(struct socket *so, struct sockopt *sopt) 8440c1bb4fbSDima Dorfman { 84540f2ac28SRobert Watson struct unpcb *unp; 8460d9ce3a1SRobert Watson struct xucred xu; 8476a2989fdSMatthew N. Dodd int error, optval; 8486a2989fdSMatthew N. Dodd 84996a041b5SMatthew N. Dodd if (sopt->sopt_level != 0) 85096a041b5SMatthew N. Dodd return (EINVAL); 85196a041b5SMatthew N. Dodd 8526a2989fdSMatthew N. Dodd unp = sotounpcb(so); 8534d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_ctloutput: unp == NULL")); 8546a2989fdSMatthew N. Dodd error = 0; 8550c1bb4fbSDima Dorfman switch (sopt->sopt_dir) { 8560c1bb4fbSDima Dorfman case SOPT_GET: 8570c1bb4fbSDima Dorfman switch (sopt->sopt_name) { 8580c1bb4fbSDima Dorfman case LOCAL_PEERCRED: 8591f837c47SRobert Watson UNP_LOCK(); 8600c1bb4fbSDima Dorfman if (unp->unp_flags & UNP_HAVEPC) 8610d9ce3a1SRobert Watson xu = unp->unp_peercred; 8620c1bb4fbSDima Dorfman else { 8630c1bb4fbSDima Dorfman if (so->so_type == SOCK_STREAM) 8640c1bb4fbSDima Dorfman error = ENOTCONN; 8650c1bb4fbSDima Dorfman else 8660c1bb4fbSDima Dorfman error = EINVAL; 8670c1bb4fbSDima Dorfman } 8681f837c47SRobert Watson UNP_UNLOCK(); 8690d9ce3a1SRobert Watson if (error == 0) 8700d9ce3a1SRobert Watson error = sooptcopyout(sopt, &xu, sizeof(xu)); 8710c1bb4fbSDima Dorfman break; 8726a2989fdSMatthew N. Dodd case LOCAL_CREDS: 8731f837c47SRobert Watson /* Unocked read. */ 8746a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_WANTCRED ? 1 : 0; 8756a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 8766a2989fdSMatthew N. Dodd break; 8776a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 8781f837c47SRobert Watson /* Unocked read. */ 8796a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_CONNWAIT ? 1 : 0; 8806a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 8816a2989fdSMatthew N. Dodd break; 8820c1bb4fbSDima Dorfman default: 8830c1bb4fbSDima Dorfman error = EOPNOTSUPP; 8840c1bb4fbSDima Dorfman break; 8850c1bb4fbSDima Dorfman } 8860c1bb4fbSDima Dorfman break; 8870c1bb4fbSDima Dorfman case SOPT_SET: 8886a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 8896a2989fdSMatthew N. Dodd case LOCAL_CREDS: 8906a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 8916a2989fdSMatthew N. Dodd error = sooptcopyin(sopt, &optval, sizeof(optval), 8926a2989fdSMatthew N. Dodd sizeof(optval)); 8936a2989fdSMatthew N. Dodd if (error) 8946a2989fdSMatthew N. Dodd break; 8956a2989fdSMatthew N. Dodd 8966a2989fdSMatthew N. Dodd #define OPTSET(bit) \ 8976a2989fdSMatthew N. Dodd if (optval) \ 8986a2989fdSMatthew N. Dodd unp->unp_flags |= bit; \ 8996a2989fdSMatthew N. Dodd else \ 9006a2989fdSMatthew N. Dodd unp->unp_flags &= ~bit; 9016a2989fdSMatthew N. Dodd 9021f837c47SRobert Watson UNP_LOCK(); 9036a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 9046a2989fdSMatthew N. Dodd case LOCAL_CREDS: 9056a2989fdSMatthew N. Dodd OPTSET(UNP_WANTCRED); 9066a2989fdSMatthew N. Dodd break; 9076a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 9086a2989fdSMatthew N. Dodd OPTSET(UNP_CONNWAIT); 9096a2989fdSMatthew N. Dodd break; 9106a2989fdSMatthew N. Dodd default: 9116a2989fdSMatthew N. Dodd break; 9126a2989fdSMatthew N. Dodd } 9131f837c47SRobert Watson UNP_UNLOCK(); 9146a2989fdSMatthew N. Dodd break; 9156a2989fdSMatthew N. Dodd #undef OPTSET 9166a2989fdSMatthew N. Dodd default: 9176a2989fdSMatthew N. Dodd error = ENOPROTOOPT; 9186a2989fdSMatthew N. Dodd break; 9196a2989fdSMatthew N. Dodd } 920abb886faSMatthew N. Dodd break; 9210c1bb4fbSDima Dorfman default: 9220c1bb4fbSDima Dorfman error = EOPNOTSUPP; 9230c1bb4fbSDima Dorfman break; 9240c1bb4fbSDima Dorfman } 9250c1bb4fbSDima Dorfman return (error); 9260c1bb4fbSDima Dorfman } 9270c1bb4fbSDima Dorfman 928f708ef1bSPoul-Henning Kamp static int 929892af6b9SRobert Watson unp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 930df8bae1dSRodney W. Grimes { 931892af6b9SRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 932892af6b9SRobert Watson struct vnode *vp; 933892af6b9SRobert Watson struct socket *so2, *so3; 934b295bdcdSRobert Watson struct unpcb *unp, *unp2, *unp3; 93557bf258eSGarrett Wollman int error, len; 936df8bae1dSRodney W. Grimes struct nameidata nd; 93757bf258eSGarrett Wollman char buf[SOCK_MAXADDRLEN]; 9380d9ce3a1SRobert Watson struct sockaddr *sa; 9390d9ce3a1SRobert Watson 9400d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 941df8bae1dSRodney W. Grimes 9424d4b555eSRobert Watson unp = sotounpcb(so); 9434d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 94457bf258eSGarrett Wollman len = nam->sa_len - offsetof(struct sockaddr_un, sun_path); 94557bf258eSGarrett Wollman if (len <= 0) 946e5aeaa0cSDag-Erling Smørgrav return (EINVAL); 94755c85568SRobert Drehmel strlcpy(buf, soun->sun_path, len + 1); 9484f1f0ef5SRobert Watson if (unp->unp_flags & UNP_CONNECTING) { 9494f1f0ef5SRobert Watson UNP_UNLOCK(); 9504f1f0ef5SRobert Watson return (EALREADY); 9514f1f0ef5SRobert Watson } 95205102f04SRobert Watson unp->unp_flags |= UNP_CONNECTING; 9530d9ce3a1SRobert Watson UNP_UNLOCK(); 9540d9ce3a1SRobert Watson sa = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 9550d9ce3a1SRobert Watson mtx_lock(&Giant); 956b40ce416SJulian Elischer NDINIT(&nd, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, buf, td); 957797f2d22SPoul-Henning Kamp error = namei(&nd); 958797f2d22SPoul-Henning Kamp if (error) 9590d9ce3a1SRobert Watson vp = NULL; 9600d9ce3a1SRobert Watson else 961df8bae1dSRodney W. Grimes vp = nd.ni_vp; 9620d9ce3a1SRobert Watson ASSERT_VOP_LOCKED(vp, "unp_connect"); 963762e6b85SEivind Eklund NDFREE(&nd, NDF_ONLY_PNBUF); 9640d9ce3a1SRobert Watson if (error) 9650d9ce3a1SRobert Watson goto bad; 9660d9ce3a1SRobert Watson 967df8bae1dSRodney W. Grimes if (vp->v_type != VSOCK) { 968df8bae1dSRodney W. Grimes error = ENOTSOCK; 969df8bae1dSRodney W. Grimes goto bad; 970df8bae1dSRodney W. Grimes } 971a854ed98SJohn Baldwin error = VOP_ACCESS(vp, VWRITE, td->td_ucred, td); 972797f2d22SPoul-Henning Kamp if (error) 973df8bae1dSRodney W. Grimes goto bad; 9742260c03dSRobert Watson mtx_unlock(&Giant); 9752260c03dSRobert Watson UNP_LOCK(); 976b295bdcdSRobert Watson unp = sotounpcb(so); 9774d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 978df8bae1dSRodney W. Grimes so2 = vp->v_socket; 979fc3fcacfSRobert Watson if (so2 == NULL) { 980df8bae1dSRodney W. Grimes error = ECONNREFUSED; 9812260c03dSRobert Watson goto bad2; 982df8bae1dSRodney W. Grimes } 983df8bae1dSRodney W. Grimes if (so->so_type != so2->so_type) { 984df8bae1dSRodney W. Grimes error = EPROTOTYPE; 9852260c03dSRobert Watson goto bad2; 986df8bae1dSRodney W. Grimes } 987df8bae1dSRodney W. Grimes if (so->so_proto->pr_flags & PR_CONNREQUIRED) { 98846a1d9bfSRobert Watson if (so2->so_options & SO_ACCEPTCONN) 9890d9ce3a1SRobert Watson so3 = sonewconn(so2, 0); 99046a1d9bfSRobert Watson else 9910d9ce3a1SRobert Watson so3 = NULL; 9920d9ce3a1SRobert Watson if (so3 == NULL) { 993df8bae1dSRodney W. Grimes error = ECONNREFUSED; 9940d9ce3a1SRobert Watson goto bad2; 995df8bae1dSRodney W. Grimes } 9960c1bb4fbSDima Dorfman unp = sotounpcb(so); 997df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 998df8bae1dSRodney W. Grimes unp3 = sotounpcb(so3); 9990d9ce3a1SRobert Watson if (unp2->unp_addr != NULL) { 10000d9ce3a1SRobert Watson bcopy(unp2->unp_addr, sa, unp2->unp_addr->sun_len); 10010d9ce3a1SRobert Watson unp3->unp_addr = (struct sockaddr_un *) sa; 10020d9ce3a1SRobert Watson sa = NULL; 10030d9ce3a1SRobert Watson } 10040c1bb4fbSDima Dorfman /* 10050c1bb4fbSDima Dorfman * unp_peercred management: 10060c1bb4fbSDima Dorfman * 10071c381b19SRobert Watson * The connecter's (client's) credentials are copied from its 10081c381b19SRobert Watson * process structure at the time of connect() (which is now). 10090c1bb4fbSDima Dorfman */ 1010a854ed98SJohn Baldwin cru2x(td->td_ucred, &unp3->unp_peercred); 10110c1bb4fbSDima Dorfman unp3->unp_flags |= UNP_HAVEPC; 10120c1bb4fbSDima Dorfman /* 10131c381b19SRobert Watson * The receiver's (server's) credentials are copied from the 10141c381b19SRobert Watson * unp_peercred member of socket on which the former called 10151c381b19SRobert Watson * listen(); unp_listen() cached that process's credentials 10161c381b19SRobert Watson * at that time so we can use them now. 10170c1bb4fbSDima Dorfman */ 10180c1bb4fbSDima Dorfman KASSERT(unp2->unp_flags & UNP_HAVEPCCACHED, 10190c1bb4fbSDima Dorfman ("unp_connect: listener without cached peercred")); 10200c1bb4fbSDima Dorfman memcpy(&unp->unp_peercred, &unp2->unp_peercred, 10210c1bb4fbSDima Dorfman sizeof(unp->unp_peercred)); 10220c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPC; 1023481f8fe8SMaxim Konovalov if (unp2->unp_flags & UNP_WANTCRED) 1024481f8fe8SMaxim Konovalov unp3->unp_flags |= UNP_WANTCRED; 1025335654d7SRobert Watson #ifdef MAC 1026310e7cebSRobert Watson SOCK_LOCK(so); 1027335654d7SRobert Watson mac_set_socket_peer_from_socket(so, so3); 1028335654d7SRobert Watson mac_set_socket_peer_from_socket(so3, so); 1029310e7cebSRobert Watson SOCK_UNLOCK(so); 1030335654d7SRobert Watson #endif 10310c1bb4fbSDima Dorfman 1032df8bae1dSRodney W. Grimes so2 = so3; 1033df8bae1dSRodney W. Grimes } 10346a2989fdSMatthew N. Dodd error = unp_connect2(so, so2, PRU_CONNECT); 10350d9ce3a1SRobert Watson bad2: 10360d9ce3a1SRobert Watson UNP_UNLOCK(); 10370d9ce3a1SRobert Watson mtx_lock(&Giant); 1038df8bae1dSRodney W. Grimes bad: 10390d9ce3a1SRobert Watson mtx_assert(&Giant, MA_OWNED); 10400d9ce3a1SRobert Watson if (vp != NULL) 1041df8bae1dSRodney W. Grimes vput(vp); 10420d9ce3a1SRobert Watson mtx_unlock(&Giant); 10430d9ce3a1SRobert Watson free(sa, M_SONAME); 10440d9ce3a1SRobert Watson UNP_LOCK(); 10454f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_CONNECTING; 1046df8bae1dSRodney W. Grimes return (error); 1047df8bae1dSRodney W. Grimes } 1048df8bae1dSRodney W. Grimes 1049db48c0d2SRobert Watson static int 10506a2989fdSMatthew N. Dodd unp_connect2(struct socket *so, struct socket *so2, int req) 1051df8bae1dSRodney W. Grimes { 1052892af6b9SRobert Watson struct unpcb *unp = sotounpcb(so); 1053892af6b9SRobert Watson struct unpcb *unp2; 1054df8bae1dSRodney W. Grimes 10550d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 10560d9ce3a1SRobert Watson 1057df8bae1dSRodney W. Grimes if (so2->so_type != so->so_type) 1058df8bae1dSRodney W. Grimes return (EPROTOTYPE); 1059df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 10604d4b555eSRobert Watson KASSERT(unp2 != NULL, ("unp_connect2: unp2 == NULL")); 1061df8bae1dSRodney W. Grimes unp->unp_conn = unp2; 1062df8bae1dSRodney W. Grimes switch (so->so_type) { 1063df8bae1dSRodney W. Grimes case SOCK_DGRAM: 106498271db4SGarrett Wollman LIST_INSERT_HEAD(&unp2->unp_refs, unp, unp_reflink); 1065df8bae1dSRodney W. Grimes soisconnected(so); 1066df8bae1dSRodney W. Grimes break; 1067df8bae1dSRodney W. Grimes 1068df8bae1dSRodney W. Grimes case SOCK_STREAM: 1069df8bae1dSRodney W. Grimes unp2->unp_conn = unp; 10706a2989fdSMatthew N. Dodd if (req == PRU_CONNECT && 10716a2989fdSMatthew N. Dodd ((unp->unp_flags | unp2->unp_flags) & UNP_CONNWAIT)) 10726a2989fdSMatthew N. Dodd soisconnecting(so); 10736a2989fdSMatthew N. Dodd else 1074df8bae1dSRodney W. Grimes soisconnected(so); 1075df8bae1dSRodney W. Grimes soisconnected(so2); 1076df8bae1dSRodney W. Grimes break; 1077df8bae1dSRodney W. Grimes 1078df8bae1dSRodney W. Grimes default: 1079df8bae1dSRodney W. Grimes panic("unp_connect2"); 1080df8bae1dSRodney W. Grimes } 1081df8bae1dSRodney W. Grimes return (0); 1082df8bae1dSRodney W. Grimes } 1083df8bae1dSRodney W. Grimes 1084f708ef1bSPoul-Henning Kamp static void 1085892af6b9SRobert Watson unp_disconnect(struct unpcb *unp) 1086df8bae1dSRodney W. Grimes { 1087892af6b9SRobert Watson struct unpcb *unp2 = unp->unp_conn; 10881b2e3b4bSRobert Watson struct socket *so; 1089df8bae1dSRodney W. Grimes 10900d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 10910d9ce3a1SRobert Watson 1092fc3fcacfSRobert Watson if (unp2 == NULL) 1093df8bae1dSRodney W. Grimes return; 1094fc3fcacfSRobert Watson unp->unp_conn = NULL; 1095df8bae1dSRodney W. Grimes switch (unp->unp_socket->so_type) { 1096df8bae1dSRodney W. Grimes case SOCK_DGRAM: 109798271db4SGarrett Wollman LIST_REMOVE(unp, unp_reflink); 10981b2e3b4bSRobert Watson so = unp->unp_socket; 10991b2e3b4bSRobert Watson SOCK_LOCK(so); 11001b2e3b4bSRobert Watson so->so_state &= ~SS_ISCONNECTED; 11011b2e3b4bSRobert Watson SOCK_UNLOCK(so); 1102df8bae1dSRodney W. Grimes break; 1103df8bae1dSRodney W. Grimes 1104df8bae1dSRodney W. Grimes case SOCK_STREAM: 1105df8bae1dSRodney W. Grimes soisdisconnected(unp->unp_socket); 1106fc3fcacfSRobert Watson unp2->unp_conn = NULL; 1107df8bae1dSRodney W. Grimes soisdisconnected(unp2->unp_socket); 1108df8bae1dSRodney W. Grimes break; 1109df8bae1dSRodney W. Grimes } 1110df8bae1dSRodney W. Grimes } 1111df8bae1dSRodney W. Grimes 11120d9ce3a1SRobert Watson /* 11131c381b19SRobert Watson * unp_pcblist() assumes that UNIX domain socket memory is never reclaimed by 11141c381b19SRobert Watson * the zone (UMA_ZONE_NOFREE), and as such potentially stale pointers are 11151c381b19SRobert Watson * safe to reference. It first scans the list of struct unpcb's to generate 11161c381b19SRobert Watson * a pointer list, then it rescans its list one entry at a time to 11170d9ce3a1SRobert Watson * externalize and copyout. It checks the generation number to see if a 11180d9ce3a1SRobert Watson * struct unpcb has been reused, and will skip it if so. 11190d9ce3a1SRobert Watson */ 112098271db4SGarrett Wollman static int 112182d9ae4eSPoul-Henning Kamp unp_pcblist(SYSCTL_HANDLER_ARGS) 112298271db4SGarrett Wollman { 1123f5ef029eSPoul-Henning Kamp int error, i, n; 11249ae328fcSJohn Baldwin int freeunp; 112598271db4SGarrett Wollman struct unpcb *unp, **unp_list; 112698271db4SGarrett Wollman unp_gen_t gencnt; 11278f364875SJulian Elischer struct xunpgen *xug; 112898271db4SGarrett Wollman struct unp_head *head; 11298f364875SJulian Elischer struct xunpcb *xu; 113098271db4SGarrett Wollman 1131a23d65bfSBruce Evans head = ((intptr_t)arg1 == SOCK_DGRAM ? &unp_dhead : &unp_shead); 113298271db4SGarrett Wollman 113398271db4SGarrett Wollman /* 113498271db4SGarrett Wollman * The process of preparing the PCB list is too time-consuming and 113598271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 113698271db4SGarrett Wollman */ 1137fc3fcacfSRobert Watson if (req->oldptr == NULL) { 113898271db4SGarrett Wollman n = unp_count; 11398f364875SJulian Elischer req->oldidx = 2 * (sizeof *xug) 114098271db4SGarrett Wollman + (n + n/8) * sizeof(struct xunpcb); 1141e5aeaa0cSDag-Erling Smørgrav return (0); 114298271db4SGarrett Wollman } 114398271db4SGarrett Wollman 1144fc3fcacfSRobert Watson if (req->newptr != NULL) 1145e5aeaa0cSDag-Erling Smørgrav return (EPERM); 114698271db4SGarrett Wollman 114798271db4SGarrett Wollman /* 114898271db4SGarrett Wollman * OK, now we're committed to doing something. 114998271db4SGarrett Wollman */ 1150a163d034SWarner Losh xug = malloc(sizeof(*xug), M_TEMP, M_WAITOK); 11510d9ce3a1SRobert Watson UNP_LOCK(); 115298271db4SGarrett Wollman gencnt = unp_gencnt; 115398271db4SGarrett Wollman n = unp_count; 11540d9ce3a1SRobert Watson UNP_UNLOCK(); 115598271db4SGarrett Wollman 11568f364875SJulian Elischer xug->xug_len = sizeof *xug; 11578f364875SJulian Elischer xug->xug_count = n; 11588f364875SJulian Elischer xug->xug_gen = gencnt; 11598f364875SJulian Elischer xug->xug_sogen = so_gencnt; 11608f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 11618f364875SJulian Elischer if (error) { 11628f364875SJulian Elischer free(xug, M_TEMP); 1163e5aeaa0cSDag-Erling Smørgrav return (error); 11648f364875SJulian Elischer } 116598271db4SGarrett Wollman 1166a163d034SWarner Losh unp_list = malloc(n * sizeof *unp_list, M_TEMP, M_WAITOK); 116798271db4SGarrett Wollman 11680d9ce3a1SRobert Watson UNP_LOCK(); 11692e3c8fcbSPoul-Henning Kamp for (unp = LIST_FIRST(head), i = 0; unp && i < n; 11702e3c8fcbSPoul-Henning Kamp unp = LIST_NEXT(unp, unp_link)) { 11718a7d8cc6SRobert Watson if (unp->unp_gencnt <= gencnt) { 1172a854ed98SJohn Baldwin if (cr_cansee(req->td->td_ucred, 11738a7d8cc6SRobert Watson unp->unp_socket->so_cred)) 11744787fd37SPaul Saab continue; 117598271db4SGarrett Wollman unp_list[i++] = unp; 11769ae328fcSJohn Baldwin unp->unp_refcount++; 117798271db4SGarrett Wollman } 11784787fd37SPaul Saab } 11790d9ce3a1SRobert Watson UNP_UNLOCK(); 11801c381b19SRobert Watson n = i; /* In case we lost some during malloc. */ 118198271db4SGarrett Wollman 118298271db4SGarrett Wollman error = 0; 1183fe2eee82SColin Percival xu = malloc(sizeof(*xu), M_TEMP, M_WAITOK | M_ZERO); 118498271db4SGarrett Wollman for (i = 0; i < n; i++) { 118598271db4SGarrett Wollman unp = unp_list[i]; 11869ae328fcSJohn Baldwin UNP_LOCK(); 11879ae328fcSJohn Baldwin unp->unp_refcount--; 11889ae328fcSJohn Baldwin if (unp->unp_refcount != 0 && unp->unp_gencnt <= gencnt) { 11898f364875SJulian Elischer xu->xu_len = sizeof *xu; 11908f364875SJulian Elischer xu->xu_unpp = unp; 119198271db4SGarrett Wollman /* 119298271db4SGarrett Wollman * XXX - need more locking here to protect against 119398271db4SGarrett Wollman * connect/disconnect races for SMP. 119498271db4SGarrett Wollman */ 1195fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 11968f364875SJulian Elischer bcopy(unp->unp_addr, &xu->xu_addr, 119798271db4SGarrett Wollman unp->unp_addr->sun_len); 1198fc3fcacfSRobert Watson if (unp->unp_conn != NULL && 1199fc3fcacfSRobert Watson unp->unp_conn->unp_addr != NULL) 120098271db4SGarrett Wollman bcopy(unp->unp_conn->unp_addr, 12018f364875SJulian Elischer &xu->xu_caddr, 120298271db4SGarrett Wollman unp->unp_conn->unp_addr->sun_len); 12038f364875SJulian Elischer bcopy(unp, &xu->xu_unp, sizeof *unp); 12048f364875SJulian Elischer sotoxsocket(unp->unp_socket, &xu->xu_socket); 12059ae328fcSJohn Baldwin UNP_UNLOCK(); 12068f364875SJulian Elischer error = SYSCTL_OUT(req, xu, sizeof *xu); 12079ae328fcSJohn Baldwin } else { 12089ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 12099ae328fcSJohn Baldwin UNP_UNLOCK(); 12109ae328fcSJohn Baldwin if (freeunp) 12119ae328fcSJohn Baldwin uma_zfree(unp_zone, unp); 121298271db4SGarrett Wollman } 121398271db4SGarrett Wollman } 12148f364875SJulian Elischer free(xu, M_TEMP); 121598271db4SGarrett Wollman if (!error) { 121698271db4SGarrett Wollman /* 12171c381b19SRobert Watson * Give the user an updated idea of our state. If the 12181c381b19SRobert Watson * generation differs from what we told her before, she knows 12191c381b19SRobert Watson * that something happened while we were processing this 12201c381b19SRobert Watson * request, and it might be necessary to retry. 122198271db4SGarrett Wollman */ 12228f364875SJulian Elischer xug->xug_gen = unp_gencnt; 12238f364875SJulian Elischer xug->xug_sogen = so_gencnt; 12248f364875SJulian Elischer xug->xug_count = unp_count; 12258f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 122698271db4SGarrett Wollman } 122798271db4SGarrett Wollman free(unp_list, M_TEMP); 12288f364875SJulian Elischer free(xug, M_TEMP); 1229e5aeaa0cSDag-Erling Smørgrav return (error); 123098271db4SGarrett Wollman } 123198271db4SGarrett Wollman 123298271db4SGarrett Wollman SYSCTL_PROC(_net_local_dgram, OID_AUTO, pcblist, CTLFLAG_RD, 123398271db4SGarrett Wollman (caddr_t)(long)SOCK_DGRAM, 0, unp_pcblist, "S,xunpcb", 123498271db4SGarrett Wollman "List of active local datagram sockets"); 123598271db4SGarrett Wollman SYSCTL_PROC(_net_local_stream, OID_AUTO, pcblist, CTLFLAG_RD, 123698271db4SGarrett Wollman (caddr_t)(long)SOCK_STREAM, 0, unp_pcblist, "S,xunpcb", 123798271db4SGarrett Wollman "List of active local stream sockets"); 123898271db4SGarrett Wollman 1239f708ef1bSPoul-Henning Kamp static void 1240892af6b9SRobert Watson unp_shutdown(struct unpcb *unp) 1241df8bae1dSRodney W. Grimes { 1242df8bae1dSRodney W. Grimes struct socket *so; 1243df8bae1dSRodney W. Grimes 12440d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 12450d9ce3a1SRobert Watson 1246df8bae1dSRodney W. Grimes if (unp->unp_socket->so_type == SOCK_STREAM && unp->unp_conn && 1247df8bae1dSRodney W. Grimes (so = unp->unp_conn->unp_socket)) 1248df8bae1dSRodney W. Grimes socantrcvmore(so); 1249df8bae1dSRodney W. Grimes } 1250df8bae1dSRodney W. Grimes 1251f708ef1bSPoul-Henning Kamp static void 1252892af6b9SRobert Watson unp_drop(struct unpcb *unp, int errno) 1253df8bae1dSRodney W. Grimes { 1254df8bae1dSRodney W. Grimes struct socket *so = unp->unp_socket; 1255df8bae1dSRodney W. Grimes 12560d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 12570d9ce3a1SRobert Watson 1258df8bae1dSRodney W. Grimes so->so_error = errno; 1259df8bae1dSRodney W. Grimes unp_disconnect(unp); 1260df8bae1dSRodney W. Grimes } 1261df8bae1dSRodney W. Grimes 12622bc21ed9SDavid Malone static void 1263892af6b9SRobert Watson unp_freerights(struct file **rp, int fdcount) 1264df8bae1dSRodney W. Grimes { 12652bc21ed9SDavid Malone int i; 12662bc21ed9SDavid Malone struct file *fp; 1267df8bae1dSRodney W. Grimes 12682bc21ed9SDavid Malone for (i = 0; i < fdcount; i++) { 1269df8bae1dSRodney W. Grimes fp = *rp; 12708692c025SYoshinobu Inoue /* 12711c381b19SRobert Watson * Zero the pointer before calling unp_discard since it may 12721c381b19SRobert Watson * end up in unp_gc().. 1273d7dca903SRobert Watson * 1274d7dca903SRobert Watson * XXXRW: This is less true than it used to be. 12758692c025SYoshinobu Inoue */ 1276df8bae1dSRodney W. Grimes *rp++ = 0; 12778692c025SYoshinobu Inoue unp_discard(fp); 1278df8bae1dSRodney W. Grimes } 12792bc21ed9SDavid Malone } 12802bc21ed9SDavid Malone 12812bc21ed9SDavid Malone int 1282892af6b9SRobert Watson unp_externalize(struct mbuf *control, struct mbuf **controlp) 12832bc21ed9SDavid Malone { 12842bc21ed9SDavid Malone struct thread *td = curthread; /* XXX */ 12852bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 12862bc21ed9SDavid Malone int i; 12872bc21ed9SDavid Malone int *fdp; 12882bc21ed9SDavid Malone struct file **rp; 12892bc21ed9SDavid Malone struct file *fp; 12902bc21ed9SDavid Malone void *data; 12912bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 12922bc21ed9SDavid Malone int error, newfds; 12932bc21ed9SDavid Malone int f; 12942bc21ed9SDavid Malone u_int newlen; 12952bc21ed9SDavid Malone 12964c5bc1caSRobert Watson UNP_UNLOCK_ASSERT(); 12974c5bc1caSRobert Watson 12982bc21ed9SDavid Malone error = 0; 12992bc21ed9SDavid Malone if (controlp != NULL) /* controlp == NULL => free control messages */ 13002bc21ed9SDavid Malone *controlp = NULL; 13012bc21ed9SDavid Malone 13022bc21ed9SDavid Malone while (cm != NULL) { 13032bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) { 13042bc21ed9SDavid Malone error = EINVAL; 13052bc21ed9SDavid Malone break; 13062bc21ed9SDavid Malone } 13072bc21ed9SDavid Malone 13082bc21ed9SDavid Malone data = CMSG_DATA(cm); 13092bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 13102bc21ed9SDavid Malone 13112bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET 13122bc21ed9SDavid Malone && cm->cmsg_type == SCM_RIGHTS) { 13132bc21ed9SDavid Malone newfds = datalen / sizeof(struct file *); 13142bc21ed9SDavid Malone rp = data; 13152bc21ed9SDavid Malone 1316e2f9a08bSOlivier Houchard /* If we're not outputting the descriptors free them. */ 13172bc21ed9SDavid Malone if (error || controlp == NULL) { 13182bc21ed9SDavid Malone unp_freerights(rp, newfds); 13192bc21ed9SDavid Malone goto next; 13202bc21ed9SDavid Malone } 1321426da3bcSAlfred Perlstein FILEDESC_LOCK(td->td_proc->p_fd); 13222bc21ed9SDavid Malone /* if the new FD's will not fit free them. */ 13232bc21ed9SDavid Malone if (!fdavail(td, newfds)) { 1324426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13252bc21ed9SDavid Malone error = EMSGSIZE; 13262bc21ed9SDavid Malone unp_freerights(rp, newfds); 13272bc21ed9SDavid Malone goto next; 1328df8bae1dSRodney W. Grimes } 1329ed5b7817SJulian Elischer /* 13301c381b19SRobert Watson * Now change each pointer to an fd in the global 13311c381b19SRobert Watson * table to an integer that is the index to the local 13321c381b19SRobert Watson * fd table entry that we set up to point to the 13331c381b19SRobert Watson * global one we are transferring. 1334ed5b7817SJulian Elischer */ 13352bc21ed9SDavid Malone newlen = newfds * sizeof(int); 13362bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 13372bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 13382bc21ed9SDavid Malone if (*controlp == NULL) { 1339426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13402bc21ed9SDavid Malone error = E2BIG; 13412bc21ed9SDavid Malone unp_freerights(rp, newfds); 13422bc21ed9SDavid Malone goto next; 13432bc21ed9SDavid Malone } 13442bc21ed9SDavid Malone 13452bc21ed9SDavid Malone fdp = (int *) 13462bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 1347df8bae1dSRodney W. Grimes for (i = 0; i < newfds; i++) { 1348a6d4491cSDag-Erling Smørgrav if (fdalloc(td, 0, &f)) 13492bc21ed9SDavid Malone panic("unp_externalize fdalloc failed"); 13508692c025SYoshinobu Inoue fp = *rp++; 1351b40ce416SJulian Elischer td->td_proc->p_fd->fd_ofiles[f] = fp; 1352426da3bcSAlfred Perlstein FILE_LOCK(fp); 1353df8bae1dSRodney W. Grimes fp->f_msgcount--; 1354426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1355df8bae1dSRodney W. Grimes unp_rights--; 13568692c025SYoshinobu Inoue *fdp++ = f; 1357df8bae1dSRodney W. Grimes } 1358426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13591c381b19SRobert Watson } else { 13601c381b19SRobert Watson /* We can just copy anything else across. */ 13612bc21ed9SDavid Malone if (error || controlp == NULL) 13622bc21ed9SDavid Malone goto next; 13632bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, datalen, 13642bc21ed9SDavid Malone cm->cmsg_type, cm->cmsg_level); 13652bc21ed9SDavid Malone if (*controlp == NULL) { 13662bc21ed9SDavid Malone error = ENOBUFS; 13672bc21ed9SDavid Malone goto next; 13682bc21ed9SDavid Malone } 13692bc21ed9SDavid Malone bcopy(data, 13702bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)), 13712bc21ed9SDavid Malone datalen); 13722bc21ed9SDavid Malone } 13732bc21ed9SDavid Malone 13742bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 13752bc21ed9SDavid Malone 13762bc21ed9SDavid Malone next: 13772bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 13782bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 13792bc21ed9SDavid Malone cm = (struct cmsghdr *) 13802bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 13818692c025SYoshinobu Inoue } else { 13822bc21ed9SDavid Malone clen = 0; 13832bc21ed9SDavid Malone cm = NULL; 13848692c025SYoshinobu Inoue } 13858692c025SYoshinobu Inoue } 13868692c025SYoshinobu Inoue 13872bc21ed9SDavid Malone m_freem(control); 13882bc21ed9SDavid Malone 13892bc21ed9SDavid Malone return (error); 1390df8bae1dSRodney W. Grimes } 1391df8bae1dSRodney W. Grimes 13924f590175SPaul Saab static void 13934f590175SPaul Saab unp_zone_change(void *tag) 13944f590175SPaul Saab { 13954f590175SPaul Saab 13964f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 13974f590175SPaul Saab } 13984f590175SPaul Saab 139998271db4SGarrett Wollman void 140098271db4SGarrett Wollman unp_init(void) 140198271db4SGarrett Wollman { 14021c381b19SRobert Watson 14039e9d298aSJeff Roberson unp_zone = uma_zcreate("unpcb", sizeof(struct unpcb), NULL, NULL, 14049ae328fcSJohn Baldwin NULL, NULL, UMA_ALIGN_PTR, 0); 1405fc3fcacfSRobert Watson if (unp_zone == NULL) 140698271db4SGarrett Wollman panic("unp_init"); 14074f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 14084f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, unp_zone_change, 14094f590175SPaul Saab NULL, EVENTHANDLER_PRI_ANY); 141098271db4SGarrett Wollman LIST_INIT(&unp_dhead); 141198271db4SGarrett Wollman LIST_INIT(&unp_shead); 1412a0ec558aSRobert Watson TASK_INIT(&unp_gc_task, 0, unp_gc, NULL); 14130d9ce3a1SRobert Watson UNP_LOCK_INIT(); 141498271db4SGarrett Wollman } 141598271db4SGarrett Wollman 1416f708ef1bSPoul-Henning Kamp static int 1417892af6b9SRobert Watson unp_internalize(struct mbuf **controlp, struct thread *td) 1418df8bae1dSRodney W. Grimes { 14192bc21ed9SDavid Malone struct mbuf *control = *controlp; 1420b40ce416SJulian Elischer struct proc *p = td->td_proc; 14218692c025SYoshinobu Inoue struct filedesc *fdescp = p->p_fd; 14222bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 14232bc21ed9SDavid Malone struct cmsgcred *cmcred; 14242bc21ed9SDavid Malone struct file **rp; 14252bc21ed9SDavid Malone struct file *fp; 14262bc21ed9SDavid Malone struct timeval *tv; 14272bc21ed9SDavid Malone int i, fd, *fdp; 14282bc21ed9SDavid Malone void *data; 14292bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 14302bc21ed9SDavid Malone int error, oldfds; 14318692c025SYoshinobu Inoue u_int newlen; 1432df8bae1dSRodney W. Grimes 14334c5bc1caSRobert Watson UNP_UNLOCK_ASSERT(); 14344c5bc1caSRobert Watson 14352bc21ed9SDavid Malone error = 0; 14362bc21ed9SDavid Malone *controlp = NULL; 14370b788fa1SBill Paul 14382bc21ed9SDavid Malone while (cm != NULL) { 14392bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_level != SOL_SOCKET 14402bc21ed9SDavid Malone || cm->cmsg_len > clen) { 14412bc21ed9SDavid Malone error = EINVAL; 14422bc21ed9SDavid Malone goto out; 14432bc21ed9SDavid Malone } 14442bc21ed9SDavid Malone 14452bc21ed9SDavid Malone data = CMSG_DATA(cm); 14462bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 14472bc21ed9SDavid Malone 14482bc21ed9SDavid Malone switch (cm->cmsg_type) { 14490b788fa1SBill Paul /* 14500b788fa1SBill Paul * Fill in credential information. 14510b788fa1SBill Paul */ 14522bc21ed9SDavid Malone case SCM_CREDS: 14532bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*cmcred), 14542bc21ed9SDavid Malone SCM_CREDS, SOL_SOCKET); 14552bc21ed9SDavid Malone if (*controlp == NULL) { 14562bc21ed9SDavid Malone error = ENOBUFS; 14572bc21ed9SDavid Malone goto out; 14582bc21ed9SDavid Malone } 14592bc21ed9SDavid Malone 14602bc21ed9SDavid Malone cmcred = (struct cmsgcred *) 14612bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 14620b788fa1SBill Paul cmcred->cmcred_pid = p->p_pid; 1463a854ed98SJohn Baldwin cmcred->cmcred_uid = td->td_ucred->cr_ruid; 1464a854ed98SJohn Baldwin cmcred->cmcred_gid = td->td_ucred->cr_rgid; 1465a854ed98SJohn Baldwin cmcred->cmcred_euid = td->td_ucred->cr_uid; 1466a854ed98SJohn Baldwin cmcred->cmcred_ngroups = MIN(td->td_ucred->cr_ngroups, 14670b788fa1SBill Paul CMGROUP_MAX); 14680b788fa1SBill Paul for (i = 0; i < cmcred->cmcred_ngroups; i++) 14692bc21ed9SDavid Malone cmcred->cmcred_groups[i] = 1470a854ed98SJohn Baldwin td->td_ucred->cr_groups[i]; 14712bc21ed9SDavid Malone break; 14720b788fa1SBill Paul 14732bc21ed9SDavid Malone case SCM_RIGHTS: 14742bc21ed9SDavid Malone oldfds = datalen / sizeof (int); 1475ed5b7817SJulian Elischer /* 14761c381b19SRobert Watson * Check that all the FDs passed in refer to legal 14771c381b19SRobert Watson * files. If not, reject the entire operation. 1478ed5b7817SJulian Elischer */ 14792bc21ed9SDavid Malone fdp = data; 1480426da3bcSAlfred Perlstein FILEDESC_LOCK(fdescp); 1481df8bae1dSRodney W. Grimes for (i = 0; i < oldfds; i++) { 14828692c025SYoshinobu Inoue fd = *fdp++; 14838692c025SYoshinobu Inoue if ((unsigned)fd >= fdescp->fd_nfiles || 14842bc21ed9SDavid Malone fdescp->fd_ofiles[fd] == NULL) { 1485426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 14862bc21ed9SDavid Malone error = EBADF; 14872bc21ed9SDavid Malone goto out; 14882bc21ed9SDavid Malone } 1489e7d6662fSAlfred Perlstein fp = fdescp->fd_ofiles[fd]; 1490e7d6662fSAlfred Perlstein if (!(fp->f_ops->fo_flags & DFLAG_PASSABLE)) { 1491e7d6662fSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 1492e7d6662fSAlfred Perlstein error = EOPNOTSUPP; 1493e7d6662fSAlfred Perlstein goto out; 1494e7d6662fSAlfred Perlstein } 1495e7d6662fSAlfred Perlstein 1496df8bae1dSRodney W. Grimes } 1497ed5b7817SJulian Elischer /* 14981c381b19SRobert Watson * Now replace the integer FDs with pointers to the 14991c381b19SRobert Watson * associated global file table entry.. 1500ed5b7817SJulian Elischer */ 15012bc21ed9SDavid Malone newlen = oldfds * sizeof(struct file *); 15022bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 15032bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 15042bc21ed9SDavid Malone if (*controlp == NULL) { 1505426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 15062bc21ed9SDavid Malone error = E2BIG; 15072bc21ed9SDavid Malone goto out; 15088692c025SYoshinobu Inoue } 15098692c025SYoshinobu Inoue 15102bc21ed9SDavid Malone fdp = data; 15112bc21ed9SDavid Malone rp = (struct file **) 15122bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 15138692c025SYoshinobu Inoue for (i = 0; i < oldfds; i++) { 15148692c025SYoshinobu Inoue fp = fdescp->fd_ofiles[*fdp++]; 1515df8bae1dSRodney W. Grimes *rp++ = fp; 1516426da3bcSAlfred Perlstein FILE_LOCK(fp); 1517df8bae1dSRodney W. Grimes fp->f_count++; 1518df8bae1dSRodney W. Grimes fp->f_msgcount++; 1519426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1520df8bae1dSRodney W. Grimes unp_rights++; 1521df8bae1dSRodney W. Grimes } 1522426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 15232bc21ed9SDavid Malone break; 15242bc21ed9SDavid Malone 15252bc21ed9SDavid Malone case SCM_TIMESTAMP: 15262bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*tv), 15272bc21ed9SDavid Malone SCM_TIMESTAMP, SOL_SOCKET); 15282bc21ed9SDavid Malone if (*controlp == NULL) { 15292bc21ed9SDavid Malone error = ENOBUFS; 15302bc21ed9SDavid Malone goto out; 15318692c025SYoshinobu Inoue } 15322bc21ed9SDavid Malone tv = (struct timeval *) 15332bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 15342bc21ed9SDavid Malone microtime(tv); 15352bc21ed9SDavid Malone break; 15362bc21ed9SDavid Malone 15372bc21ed9SDavid Malone default: 15382bc21ed9SDavid Malone error = EINVAL; 15392bc21ed9SDavid Malone goto out; 15402bc21ed9SDavid Malone } 15412bc21ed9SDavid Malone 15422bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 15432bc21ed9SDavid Malone 15442bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 15452bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 15462bc21ed9SDavid Malone cm = (struct cmsghdr *) 15472bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 15482bc21ed9SDavid Malone } else { 15492bc21ed9SDavid Malone clen = 0; 15502bc21ed9SDavid Malone cm = NULL; 15512bc21ed9SDavid Malone } 15522bc21ed9SDavid Malone } 15532bc21ed9SDavid Malone 15542bc21ed9SDavid Malone out: 15552bc21ed9SDavid Malone m_freem(control); 15562bc21ed9SDavid Malone 15572bc21ed9SDavid Malone return (error); 1558df8bae1dSRodney W. Grimes } 1559df8bae1dSRodney W. Grimes 15606a2989fdSMatthew N. Dodd struct mbuf * 15616a2989fdSMatthew N. Dodd unp_addsockcred(struct thread *td, struct mbuf *control) 15626a2989fdSMatthew N. Dodd { 156370df31f4SMaxim Konovalov struct mbuf *m, *n, *n_prev; 15646a2989fdSMatthew N. Dodd struct sockcred *sc; 156570df31f4SMaxim Konovalov const struct cmsghdr *cm; 15666a2989fdSMatthew N. Dodd int ngroups; 15676a2989fdSMatthew N. Dodd int i; 15686a2989fdSMatthew N. Dodd 15696a2989fdSMatthew N. Dodd ngroups = MIN(td->td_ucred->cr_ngroups, CMGROUP_MAX); 15706a2989fdSMatthew N. Dodd 15716a2989fdSMatthew N. Dodd m = sbcreatecontrol(NULL, SOCKCREDSIZE(ngroups), SCM_CREDS, SOL_SOCKET); 15726a2989fdSMatthew N. Dodd if (m == NULL) 15736a2989fdSMatthew N. Dodd return (control); 15746a2989fdSMatthew N. Dodd 15756a2989fdSMatthew N. Dodd sc = (struct sockcred *) CMSG_DATA(mtod(m, struct cmsghdr *)); 15766a2989fdSMatthew N. Dodd sc->sc_uid = td->td_ucred->cr_ruid; 15776a2989fdSMatthew N. Dodd sc->sc_euid = td->td_ucred->cr_uid; 15786a2989fdSMatthew N. Dodd sc->sc_gid = td->td_ucred->cr_rgid; 15796a2989fdSMatthew N. Dodd sc->sc_egid = td->td_ucred->cr_gid; 15806a2989fdSMatthew N. Dodd sc->sc_ngroups = ngroups; 15816a2989fdSMatthew N. Dodd for (i = 0; i < sc->sc_ngroups; i++) 15826a2989fdSMatthew N. Dodd sc->sc_groups[i] = td->td_ucred->cr_groups[i]; 15836a2989fdSMatthew N. Dodd 15846a2989fdSMatthew N. Dodd /* 15851c381b19SRobert Watson * Unlink SCM_CREDS control messages (struct cmsgcred), since just 15861c381b19SRobert Watson * created SCM_CREDS control message (struct sockcred) has another 15871c381b19SRobert Watson * format. 15886a2989fdSMatthew N. Dodd */ 158970df31f4SMaxim Konovalov if (control != NULL) 159070df31f4SMaxim Konovalov for (n = control, n_prev = NULL; n != NULL;) { 159170df31f4SMaxim Konovalov cm = mtod(n, struct cmsghdr *); 159270df31f4SMaxim Konovalov if (cm->cmsg_level == SOL_SOCKET && 159370df31f4SMaxim Konovalov cm->cmsg_type == SCM_CREDS) { 159470df31f4SMaxim Konovalov if (n_prev == NULL) 159570df31f4SMaxim Konovalov control = n->m_next; 159670df31f4SMaxim Konovalov else 159770df31f4SMaxim Konovalov n_prev->m_next = n->m_next; 159870df31f4SMaxim Konovalov n = m_free(n); 159970df31f4SMaxim Konovalov } else { 160070df31f4SMaxim Konovalov n_prev = n; 160170df31f4SMaxim Konovalov n = n->m_next; 160270df31f4SMaxim Konovalov } 160370df31f4SMaxim Konovalov } 16046a2989fdSMatthew N. Dodd 160570df31f4SMaxim Konovalov /* Prepend it to the head. */ 160670df31f4SMaxim Konovalov m->m_next = control; 160770df31f4SMaxim Konovalov 160870df31f4SMaxim Konovalov return (m); 16096a2989fdSMatthew N. Dodd } 16106a2989fdSMatthew N. Dodd 1611161a0c7cSRobert Watson /* 1612a0ec558aSRobert Watson * unp_defer indicates whether additional work has been defered for a future 1613a0ec558aSRobert Watson * pass through unp_gc(). It is thread local and does not require explicit 1614a0ec558aSRobert Watson * synchronization. 1615161a0c7cSRobert Watson */ 1616a0ec558aSRobert Watson static int unp_defer; 1617a0ec558aSRobert Watson 1618a0ec558aSRobert Watson static int unp_taskcount; 1619a0ec558aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, taskcount, CTLFLAG_RD, &unp_taskcount, 0, ""); 1620a0ec558aSRobert Watson 1621a0ec558aSRobert Watson static int unp_recycled; 1622a0ec558aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, recycled, CTLFLAG_RD, &unp_recycled, 0, ""); 1623df8bae1dSRodney W. Grimes 1624f708ef1bSPoul-Henning Kamp static void 1625a0ec558aSRobert Watson unp_gc(__unused void *arg, int pending) 1626df8bae1dSRodney W. Grimes { 1627892af6b9SRobert Watson struct file *fp, *nextfp; 1628892af6b9SRobert Watson struct socket *so; 1629df8bae1dSRodney W. Grimes struct file **extra_ref, **fpp; 1630df8bae1dSRodney W. Grimes int nunref, i; 163195f004dcSAlfred Perlstein int nfiles_snap; 163295f004dcSAlfred Perlstein int nfiles_slack = 20; 1633df8bae1dSRodney W. Grimes 1634a0ec558aSRobert Watson unp_taskcount++; 1635df8bae1dSRodney W. Grimes unp_defer = 0; 1636ed5b7817SJulian Elischer /* 16379ae328fcSJohn Baldwin * Before going through all this, set all FDs to be NOT deferred and 16381c381b19SRobert Watson * NOT externally accessible. 1639ed5b7817SJulian Elischer */ 1640426da3bcSAlfred Perlstein sx_slock(&filelist_lock); 16412e3c8fcbSPoul-Henning Kamp LIST_FOREACH(fp, &filehead, f_list) 1642426da3bcSAlfred Perlstein fp->f_gcflag &= ~(FMARK|FDEFER); 1643df8bae1dSRodney W. Grimes do { 16445bb84bc8SRobert Watson KASSERT(unp_defer >= 0, ("unp_gc: unp_defer %d", unp_defer)); 16452e3c8fcbSPoul-Henning Kamp LIST_FOREACH(fp, &filehead, f_list) { 1646426da3bcSAlfred Perlstein FILE_LOCK(fp); 1647ed5b7817SJulian Elischer /* 1648a0ec558aSRobert Watson * If the file is not open, skip it -- could be a 1649a0ec558aSRobert Watson * file in the process of being opened, or in the 1650a0ec558aSRobert Watson * process of being closed. If the file is 1651a0ec558aSRobert Watson * "closing", it may have been marked for deferred 1652a0ec558aSRobert Watson * consideration. Clear the flag now if so. 1653ed5b7817SJulian Elischer */ 1654426da3bcSAlfred Perlstein if (fp->f_count == 0) { 1655a0ec558aSRobert Watson if (fp->f_gcflag & FDEFER) 1656a0ec558aSRobert Watson unp_defer--; 1657a0ec558aSRobert Watson fp->f_gcflag &= ~(FMARK|FDEFER); 1658426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1659df8bae1dSRodney W. Grimes continue; 1660426da3bcSAlfred Perlstein } 1661ed5b7817SJulian Elischer /* 16629ae328fcSJohn Baldwin * If we already marked it as 'defer' in a 16639ae328fcSJohn Baldwin * previous pass, then try to process it this 16649ae328fcSJohn Baldwin * time and un-mark it. 1665ed5b7817SJulian Elischer */ 1666426da3bcSAlfred Perlstein if (fp->f_gcflag & FDEFER) { 1667426da3bcSAlfred Perlstein fp->f_gcflag &= ~FDEFER; 1668df8bae1dSRodney W. Grimes unp_defer--; 1669df8bae1dSRodney W. Grimes } else { 1670ed5b7817SJulian Elischer /* 16719ae328fcSJohn Baldwin * if it's not deferred, then check if it's 1672ed5b7817SJulian Elischer * already marked.. if so skip it 1673ed5b7817SJulian Elischer */ 1674426da3bcSAlfred Perlstein if (fp->f_gcflag & FMARK) { 1675426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1676df8bae1dSRodney W. Grimes continue; 1677426da3bcSAlfred Perlstein } 1678ed5b7817SJulian Elischer /* 16791c381b19SRobert Watson * If all references are from messages in 16801c381b19SRobert Watson * transit, then skip it. it's not externally 16811c381b19SRobert Watson * accessible. 1682ed5b7817SJulian Elischer */ 1683426da3bcSAlfred Perlstein if (fp->f_count == fp->f_msgcount) { 1684426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1685df8bae1dSRodney W. Grimes continue; 1686426da3bcSAlfred Perlstein } 1687ed5b7817SJulian Elischer /* 1688ed5b7817SJulian Elischer * If it got this far then it must be 1689ed5b7817SJulian Elischer * externally accessible. 1690ed5b7817SJulian Elischer */ 1691426da3bcSAlfred Perlstein fp->f_gcflag |= FMARK; 1692df8bae1dSRodney W. Grimes } 1693ed5b7817SJulian Elischer /* 16949ae328fcSJohn Baldwin * Either it was deferred, or it is externally 16951c381b19SRobert Watson * accessible and not already marked so. Now check 16961c381b19SRobert Watson * if it is possibly one of OUR sockets. 1697ed5b7817SJulian Elischer */ 1698df8bae1dSRodney W. Grimes if (fp->f_type != DTYPE_SOCKET || 169948e3128bSMatthew Dillon (so = fp->f_data) == NULL) { 1700426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1701df8bae1dSRodney W. Grimes continue; 1702426da3bcSAlfred Perlstein } 1703748e0b0aSGarrett Wollman if (so->so_proto->pr_domain != &localdomain || 17049ae328fcSJohn Baldwin (so->so_proto->pr_flags & PR_RIGHTS) == 0) { 17059ae328fcSJohn Baldwin FILE_UNLOCK(fp); 1706df8bae1dSRodney W. Grimes continue; 17079ae328fcSJohn Baldwin } 17089ae328fcSJohn Baldwin 17099ae328fcSJohn Baldwin /* 17109ae328fcSJohn Baldwin * Tell any other threads that do a subsequent 17119ae328fcSJohn Baldwin * fdrop() that we are scanning the message 17129ae328fcSJohn Baldwin * buffers. 17139ae328fcSJohn Baldwin */ 17149ae328fcSJohn Baldwin fp->f_gcflag |= FWAIT; 17159ae328fcSJohn Baldwin FILE_UNLOCK(fp); 17169ae328fcSJohn Baldwin 1717ed5b7817SJulian Elischer /* 17181c381b19SRobert Watson * So, Ok, it's one of our sockets and it IS 17199ae328fcSJohn Baldwin * externally accessible (or was deferred). Now we 17201c381b19SRobert Watson * look to see if we hold any file descriptors in its 1721ed5b7817SJulian Elischer * message buffers. Follow those links and mark them 1722ed5b7817SJulian Elischer * as accessible too. 1723ed5b7817SJulian Elischer */ 17247717cf07SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 1725df8bae1dSRodney W. Grimes unp_scan(so->so_rcv.sb_mb, unp_mark); 17267717cf07SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 17279ae328fcSJohn Baldwin 17289ae328fcSJohn Baldwin /* 17299ae328fcSJohn Baldwin * Wake up any threads waiting in fdrop(). 17309ae328fcSJohn Baldwin */ 17319ae328fcSJohn Baldwin FILE_LOCK(fp); 17329ae328fcSJohn Baldwin fp->f_gcflag &= ~FWAIT; 17339ae328fcSJohn Baldwin wakeup(&fp->f_gcflag); 17349ae328fcSJohn Baldwin FILE_UNLOCK(fp); 1735df8bae1dSRodney W. Grimes } 1736df8bae1dSRodney W. Grimes } while (unp_defer); 1737426da3bcSAlfred Perlstein sx_sunlock(&filelist_lock); 1738df8bae1dSRodney W. Grimes /* 1739a0ec558aSRobert Watson * XXXRW: The following comments need updating for a post-SMPng and 1740a0ec558aSRobert Watson * deferred unp_gc() world, but are still generally accurate. 1741a0ec558aSRobert Watson * 17421c381b19SRobert Watson * We grab an extra reference to each of the file table entries that 17431c381b19SRobert Watson * are not otherwise accessible and then free the rights that are 17441c381b19SRobert Watson * stored in messages on them. 1745df8bae1dSRodney W. Grimes * 1746df8bae1dSRodney W. Grimes * The bug in the orginal code is a little tricky, so I'll describe 1747df8bae1dSRodney W. Grimes * what's wrong with it here. 1748df8bae1dSRodney W. Grimes * 1749df8bae1dSRodney W. Grimes * It is incorrect to simply unp_discard each entry for f_msgcount 1750df8bae1dSRodney W. Grimes * times -- consider the case of sockets A and B that contain 1751df8bae1dSRodney W. Grimes * references to each other. On a last close of some other socket, 1752df8bae1dSRodney W. Grimes * we trigger a gc since the number of outstanding rights (unp_rights) 1753a0ec558aSRobert Watson * is non-zero. If during the sweep phase the gc code unp_discards, 1754df8bae1dSRodney W. Grimes * we end up doing a (full) closef on the descriptor. A closef on A 1755df8bae1dSRodney W. Grimes * results in the following chain. Closef calls soo_close, which 1756df8bae1dSRodney W. Grimes * calls soclose. Soclose calls first (through the switch 1757df8bae1dSRodney W. Grimes * uipc_usrreq) unp_detach, which re-invokes unp_gc. Unp_gc simply 17581c381b19SRobert Watson * returns because the previous instance had set unp_gcing, and we 17591c381b19SRobert Watson * return all the way back to soclose, which marks the socket with 17601c381b19SRobert Watson * SS_NOFDREF, and then calls sofree. Sofree calls sorflush to free 17611c381b19SRobert Watson * up the rights that are queued in messages on the socket A, i.e., 17621c381b19SRobert Watson * the reference on B. The sorflush calls via the dom_dispose switch 17631c381b19SRobert Watson * unp_dispose, which unp_scans with unp_discard. This second 1764df8bae1dSRodney W. Grimes * instance of unp_discard just calls closef on B. 1765df8bae1dSRodney W. Grimes * 1766df8bae1dSRodney W. Grimes * Well, a similar chain occurs on B, resulting in a sorflush on B, 1767df8bae1dSRodney W. Grimes * which results in another closef on A. Unfortunately, A is already 1768df8bae1dSRodney W. Grimes * being closed, and the descriptor has already been marked with 1769df8bae1dSRodney W. Grimes * SS_NOFDREF, and soclose panics at this point. 1770df8bae1dSRodney W. Grimes * 1771df8bae1dSRodney W. Grimes * Here, we first take an extra reference to each inaccessible 17721c381b19SRobert Watson * descriptor. Then, we call sorflush ourself, since we know it is a 17731c381b19SRobert Watson * Unix domain socket anyhow. After we destroy all the rights 17741c381b19SRobert Watson * carried in messages, we do a last closef to get rid of our extra 17751c381b19SRobert Watson * reference. This is the last close, and the unp_detach etc will 17761c381b19SRobert Watson * shut down the socket. 1777df8bae1dSRodney W. Grimes * 1778df8bae1dSRodney W. Grimes * 91/09/19, bsy@cs.cmu.edu 1779df8bae1dSRodney W. Grimes */ 178095f004dcSAlfred Perlstein again: 1781e4643c73SPoul-Henning Kamp nfiles_snap = openfiles + nfiles_slack; /* some slack */ 178295f004dcSAlfred Perlstein extra_ref = malloc(nfiles_snap * sizeof(struct file *), M_TEMP, 178395f004dcSAlfred Perlstein M_WAITOK); 1784426da3bcSAlfred Perlstein sx_slock(&filelist_lock); 1785e4643c73SPoul-Henning Kamp if (nfiles_snap < openfiles) { 178695f004dcSAlfred Perlstein sx_sunlock(&filelist_lock); 178795f004dcSAlfred Perlstein free(extra_ref, M_TEMP); 178895f004dcSAlfred Perlstein nfiles_slack += 20; 178995f004dcSAlfred Perlstein goto again; 179095f004dcSAlfred Perlstein } 1791fc3fcacfSRobert Watson for (nunref = 0, fp = LIST_FIRST(&filehead), fpp = extra_ref; 1792fc3fcacfSRobert Watson fp != NULL; fp = nextfp) { 17932e3c8fcbSPoul-Henning Kamp nextfp = LIST_NEXT(fp, f_list); 1794426da3bcSAlfred Perlstein FILE_LOCK(fp); 1795ed5b7817SJulian Elischer /* 1796ed5b7817SJulian Elischer * If it's not open, skip it 1797ed5b7817SJulian Elischer */ 1798426da3bcSAlfred Perlstein if (fp->f_count == 0) { 1799426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1800df8bae1dSRodney W. Grimes continue; 1801426da3bcSAlfred Perlstein } 1802ed5b7817SJulian Elischer /* 1803ed5b7817SJulian Elischer * If all refs are from msgs, and it's not marked accessible 18041c381b19SRobert Watson * then it must be referenced from some unreachable cycle of 18051c381b19SRobert Watson * (shut-down) FDs, so include it in our list of FDs to 18061c381b19SRobert Watson * remove. 1807ed5b7817SJulian Elischer */ 1808426da3bcSAlfred Perlstein if (fp->f_count == fp->f_msgcount && !(fp->f_gcflag & FMARK)) { 1809df8bae1dSRodney W. Grimes *fpp++ = fp; 1810df8bae1dSRodney W. Grimes nunref++; 1811df8bae1dSRodney W. Grimes fp->f_count++; 1812df8bae1dSRodney W. Grimes } 1813426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1814df8bae1dSRodney W. Grimes } 1815426da3bcSAlfred Perlstein sx_sunlock(&filelist_lock); 1816ed5b7817SJulian Elischer /* 18171c381b19SRobert Watson * For each FD on our hit list, do the following two things: 1818ed5b7817SJulian Elischer */ 18191c7c3c6aSMatthew Dillon for (i = nunref, fpp = extra_ref; --i >= 0; ++fpp) { 18201c7c3c6aSMatthew Dillon struct file *tfp = *fpp; 1821426da3bcSAlfred Perlstein FILE_LOCK(tfp); 1822cd72f218SMatthew Dillon if (tfp->f_type == DTYPE_SOCKET && 182348e3128bSMatthew Dillon tfp->f_data != NULL) { 1824426da3bcSAlfred Perlstein FILE_UNLOCK(tfp); 182548e3128bSMatthew Dillon sorflush(tfp->f_data); 1826e5aeaa0cSDag-Erling Smørgrav } else { 1827426da3bcSAlfred Perlstein FILE_UNLOCK(tfp); 18281c7c3c6aSMatthew Dillon } 1829e5aeaa0cSDag-Erling Smørgrav } 1830a0ec558aSRobert Watson for (i = nunref, fpp = extra_ref; --i >= 0; ++fpp) { 1831b40ce416SJulian Elischer closef(*fpp, (struct thread *) NULL); 1832a0ec558aSRobert Watson unp_recycled++; 1833a0ec558aSRobert Watson } 1834210a5a71SAlfred Perlstein free(extra_ref, M_TEMP); 1835df8bae1dSRodney W. Grimes } 1836df8bae1dSRodney W. Grimes 183726f9a767SRodney W. Grimes void 1838892af6b9SRobert Watson unp_dispose(struct mbuf *m) 1839df8bae1dSRodney W. Grimes { 1840996c772fSJohn Dyson 1841df8bae1dSRodney W. Grimes if (m) 1842df8bae1dSRodney W. Grimes unp_scan(m, unp_discard); 1843df8bae1dSRodney W. Grimes } 1844df8bae1dSRodney W. Grimes 18450c1bb4fbSDima Dorfman static int 1846d374e81eSRobert Watson unp_listen(struct socket *so, struct unpcb *unp, int backlog, 1847d374e81eSRobert Watson struct thread *td) 18480c1bb4fbSDima Dorfman { 18490daccb9cSRobert Watson int error; 18500daccb9cSRobert Watson 18510d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 18520c1bb4fbSDima Dorfman 18530daccb9cSRobert Watson SOCK_LOCK(so); 18540daccb9cSRobert Watson error = solisten_proto_check(so); 18550daccb9cSRobert Watson if (error == 0) { 18566f105b34SJohn Baldwin cru2x(td->td_ucred, &unp->unp_peercred); 18570c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPCCACHED; 1858d374e81eSRobert Watson solisten_proto(so, backlog); 18590daccb9cSRobert Watson } 18600daccb9cSRobert Watson SOCK_UNLOCK(so); 18610daccb9cSRobert Watson return (error); 18620c1bb4fbSDima Dorfman } 18630c1bb4fbSDima Dorfman 1864f708ef1bSPoul-Henning Kamp static void 1865892af6b9SRobert Watson unp_scan(struct mbuf *m0, void (*op)(struct file *)) 1866df8bae1dSRodney W. Grimes { 18672bc21ed9SDavid Malone struct mbuf *m; 18682bc21ed9SDavid Malone struct file **rp; 18692bc21ed9SDavid Malone struct cmsghdr *cm; 18702bc21ed9SDavid Malone void *data; 18712bc21ed9SDavid Malone int i; 18722bc21ed9SDavid Malone socklen_t clen, datalen; 1873df8bae1dSRodney W. Grimes int qfds; 1874df8bae1dSRodney W. Grimes 1875fc3fcacfSRobert Watson while (m0 != NULL) { 18762bc21ed9SDavid Malone for (m = m0; m; m = m->m_next) { 187712396bdcSDavid Malone if (m->m_type != MT_CONTROL) 1878df8bae1dSRodney W. Grimes continue; 18792bc21ed9SDavid Malone 18802bc21ed9SDavid Malone cm = mtod(m, struct cmsghdr *); 18812bc21ed9SDavid Malone clen = m->m_len; 18822bc21ed9SDavid Malone 18832bc21ed9SDavid Malone while (cm != NULL) { 18842bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) 18852bc21ed9SDavid Malone break; 18862bc21ed9SDavid Malone 18872bc21ed9SDavid Malone data = CMSG_DATA(cm); 18882bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len 18892bc21ed9SDavid Malone - (caddr_t)data; 18902bc21ed9SDavid Malone 18912bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET && 18922bc21ed9SDavid Malone cm->cmsg_type == SCM_RIGHTS) { 18932bc21ed9SDavid Malone qfds = datalen / sizeof (struct file *); 18942bc21ed9SDavid Malone rp = data; 1895df8bae1dSRodney W. Grimes for (i = 0; i < qfds; i++) 1896df8bae1dSRodney W. Grimes (*op)(*rp++); 18972bc21ed9SDavid Malone } 18982bc21ed9SDavid Malone 18992bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 19002bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 19012bc21ed9SDavid Malone cm = (struct cmsghdr *) 19022bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 19032bc21ed9SDavid Malone } else { 19042bc21ed9SDavid Malone clen = 0; 19052bc21ed9SDavid Malone cm = NULL; 19062bc21ed9SDavid Malone } 19072bc21ed9SDavid Malone } 1908df8bae1dSRodney W. Grimes } 1909df8bae1dSRodney W. Grimes m0 = m0->m_act; 1910df8bae1dSRodney W. Grimes } 1911df8bae1dSRodney W. Grimes } 1912df8bae1dSRodney W. Grimes 1913f708ef1bSPoul-Henning Kamp static void 1914892af6b9SRobert Watson unp_mark(struct file *fp) 1915df8bae1dSRodney W. Grimes { 1916426da3bcSAlfred Perlstein if (fp->f_gcflag & FMARK) 1917df8bae1dSRodney W. Grimes return; 1918df8bae1dSRodney W. Grimes unp_defer++; 1919426da3bcSAlfred Perlstein fp->f_gcflag |= (FMARK|FDEFER); 1920df8bae1dSRodney W. Grimes } 1921df8bae1dSRodney W. Grimes 1922f708ef1bSPoul-Henning Kamp static void 1923892af6b9SRobert Watson unp_discard(struct file *fp) 1924df8bae1dSRodney W. Grimes { 1925a0ec558aSRobert Watson UNP_LOCK(); 1926426da3bcSAlfred Perlstein FILE_LOCK(fp); 1927df8bae1dSRodney W. Grimes fp->f_msgcount--; 1928df8bae1dSRodney W. Grimes unp_rights--; 1929426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1930a0ec558aSRobert Watson UNP_UNLOCK(); 1931b40ce416SJulian Elischer (void) closef(fp, (struct thread *)NULL); 1932df8bae1dSRodney W. Grimes } 1933