19454b2d8SWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1982, 1986, 1989, 1991, 1993 3e1ac28e2SRobert Watson * The Regents of the University of California. 4abdeb3b0SRobert Watson * Copyright (c) 2004-2006 Robert N. M. Watson 5e1ac28e2SRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 31748e0b0aSGarrett Wollman * From: @(#)uipc_usrreq.c 8.3 (Berkeley) 1/4/94 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 34f23929fbSRobert Watson /* 35f23929fbSRobert Watson * UNIX Domain (Local) Sockets 36f23929fbSRobert Watson * 37f23929fbSRobert Watson * This is an implementation of UNIX (local) domain sockets. Each socket has 38f23929fbSRobert Watson * an associated struct unpcb (UNIX protocol control block). Stream sockets 39f23929fbSRobert Watson * may be connected to 0 or 1 other socket. Datagram sockets may be 40f23929fbSRobert Watson * connected to 0, 1, or many other sockets. Sockets may be created and 41f23929fbSRobert Watson * connected in pairs (socketpair(2)), or bound/connected to using the file 42f23929fbSRobert Watson * system name space. For most purposes, only the receive socket buffer is 43f23929fbSRobert Watson * used, as sending on one socket delivers directly to the receive socket 44f23929fbSRobert Watson * buffer of a second socket. The implementation is substantially 45f23929fbSRobert Watson * complicated by the fact that "ancillary data", such as file descriptors or 46ca948c5eSRobert Watson * credentials, may be passed across UNIX domain sockets. The potential for 47ca948c5eSRobert Watson * passing UNIX domain sockets over other UNIX domain sockets requires the 48ca948c5eSRobert Watson * implementation of a simple garbage collector to find and tear down cycles 49ca948c5eSRobert Watson * of disconnected sockets. 50f23929fbSRobert Watson */ 51f23929fbSRobert Watson 52677b542eSDavid E. O'Brien #include <sys/cdefs.h> 53677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 54677b542eSDavid E. O'Brien 55335654d7SRobert Watson #include "opt_mac.h" 56335654d7SRobert Watson 57df8bae1dSRodney W. Grimes #include <sys/param.h> 58fb919e4dSMark Murray #include <sys/domain.h> 59960ed29cSSeigo Tanimura #include <sys/fcntl.h> 60d826c479SBruce Evans #include <sys/malloc.h> /* XXX must be before <sys/file.h> */ 614f590175SPaul Saab #include <sys/eventhandler.h> 62639acc13SGarrett Wollman #include <sys/file.h> 63960ed29cSSeigo Tanimura #include <sys/filedesc.h> 64960ed29cSSeigo Tanimura #include <sys/jail.h> 65960ed29cSSeigo Tanimura #include <sys/kernel.h> 66960ed29cSSeigo Tanimura #include <sys/lock.h> 67639acc13SGarrett Wollman #include <sys/mbuf.h> 68033eb86eSJeff Roberson #include <sys/mount.h> 69960ed29cSSeigo Tanimura #include <sys/mutex.h> 70639acc13SGarrett Wollman #include <sys/namei.h> 71639acc13SGarrett Wollman #include <sys/proc.h> 72df8bae1dSRodney W. Grimes #include <sys/protosw.h> 73960ed29cSSeigo Tanimura #include <sys/resourcevar.h> 74df8bae1dSRodney W. Grimes #include <sys/socket.h> 75df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 76960ed29cSSeigo Tanimura #include <sys/signalvar.h> 77df8bae1dSRodney W. Grimes #include <sys/stat.h> 78960ed29cSSeigo Tanimura #include <sys/sx.h> 79639acc13SGarrett Wollman #include <sys/sysctl.h> 80960ed29cSSeigo Tanimura #include <sys/systm.h> 81a0ec558aSRobert Watson #include <sys/taskqueue.h> 82639acc13SGarrett Wollman #include <sys/un.h> 8398271db4SGarrett Wollman #include <sys/unpcb.h> 84639acc13SGarrett Wollman #include <sys/vnode.h> 85df8bae1dSRodney W. Grimes 86aed55708SRobert Watson #include <security/mac/mac_framework.h> 87aed55708SRobert Watson 889e9d298aSJeff Roberson #include <vm/uma.h> 8998271db4SGarrett Wollman 909e9d298aSJeff Roberson static uma_zone_t unp_zone; 9198271db4SGarrett Wollman static unp_gen_t unp_gencnt; 9298271db4SGarrett Wollman static u_int unp_count; 9398271db4SGarrett Wollman 9498271db4SGarrett Wollman static struct unp_head unp_shead, unp_dhead; 9598271db4SGarrett Wollman 96df8bae1dSRodney W. Grimes /* 97df8bae1dSRodney W. Grimes * Unix communications domain. 98df8bae1dSRodney W. Grimes * 99df8bae1dSRodney W. Grimes * TODO: 100df8bae1dSRodney W. Grimes * SEQPACKET, RDM 101df8bae1dSRodney W. Grimes * rethink name space problems 102df8bae1dSRodney W. Grimes * need a proper out-of-band 10398271db4SGarrett Wollman * lock pushdown 104df8bae1dSRodney W. Grimes */ 105e7dd9a10SRobert Watson static const struct sockaddr sun_noname = { sizeof(sun_noname), AF_LOCAL }; 106f708ef1bSPoul-Henning Kamp static ino_t unp_ino; /* prototype for fake inode numbers */ 1076a2989fdSMatthew N. Dodd struct mbuf *unp_addsockcred(struct thread *, struct mbuf *); 108f708ef1bSPoul-Henning Kamp 109ce5f32deSRobert Watson /* 1107e711c3aSRobert Watson * Both send and receive buffers are allocated PIPSIZ bytes of buffering for 1117e711c3aSRobert Watson * stream sockets, although the total for sender and receiver is actually 1127e711c3aSRobert Watson * only PIPSIZ. 1137e711c3aSRobert Watson * 1147e711c3aSRobert Watson * Datagram sockets really use the sendspace as the maximum datagram size, 1157e711c3aSRobert Watson * and don't really want to reserve the sendspace. Their recvspace should be 1167e711c3aSRobert Watson * large enough for at least one max-size datagram plus address. 1177e711c3aSRobert Watson */ 1187e711c3aSRobert Watson #ifndef PIPSIZ 1197e711c3aSRobert Watson #define PIPSIZ 8192 1207e711c3aSRobert Watson #endif 1217e711c3aSRobert Watson static u_long unpst_sendspace = PIPSIZ; 1227e711c3aSRobert Watson static u_long unpst_recvspace = PIPSIZ; 1237e711c3aSRobert Watson static u_long unpdg_sendspace = 2*1024; /* really max datagram size */ 1247e711c3aSRobert Watson static u_long unpdg_recvspace = 4*1024; 1257e711c3aSRobert Watson 1267e711c3aSRobert Watson static int unp_rights; /* file descriptors in flight */ 1277e711c3aSRobert Watson 128e4445a03SRobert Watson SYSCTL_NODE(_net, PF_LOCAL, local, CTLFLAG_RW, 0, "Local domain"); 129e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_STREAM, stream, CTLFLAG_RW, 0, "SOCK_STREAM"); 130e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_DGRAM, dgram, CTLFLAG_RW, 0, "SOCK_DGRAM"); 131e4445a03SRobert Watson 1327e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, sendspace, CTLFLAG_RW, 1337e711c3aSRobert Watson &unpst_sendspace, 0, ""); 1347e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, recvspace, CTLFLAG_RW, 1357e711c3aSRobert Watson &unpst_recvspace, 0, ""); 1367e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, maxdgram, CTLFLAG_RW, 1377e711c3aSRobert Watson &unpdg_sendspace, 0, ""); 1387e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, recvspace, CTLFLAG_RW, 1397e711c3aSRobert Watson &unpdg_recvspace, 0, ""); 1407e711c3aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, inflight, CTLFLAG_RD, &unp_rights, 0, ""); 1417e711c3aSRobert Watson 1427e711c3aSRobert Watson /* 143ce5f32deSRobert Watson * Currently, UNIX domain sockets are protected by a single subsystem lock, 144ce5f32deSRobert Watson * which covers global data structures and variables, the contents of each 145ce5f32deSRobert Watson * per-socket unpcb structure, and the so_pcb field in sockets attached to 146ce5f32deSRobert Watson * the UNIX domain. This provides for a moderate degree of paralellism, as 147ce5f32deSRobert Watson * receive operations on UNIX domain sockets do not need to acquire the 148ce5f32deSRobert Watson * subsystem lock. Finer grained locking to permit send() without acquiring 149ce5f32deSRobert Watson * a global lock would be a logical next step. 150ce5f32deSRobert Watson * 151ce5f32deSRobert Watson * The UNIX domain socket lock preceds all socket layer locks, including the 152ce5f32deSRobert Watson * socket lock and socket buffer lock, permitting UNIX domain socket code to 153ce5f32deSRobert Watson * call into socket support routines without releasing its locks. 154ce5f32deSRobert Watson * 155ce5f32deSRobert Watson * Some caution is required in areas where the UNIX domain socket code enters 156ce5f32deSRobert Watson * VFS in order to create or find rendezvous points. This results in 157ce5f32deSRobert Watson * dropping of the UNIX domain socket subsystem lock, acquisition of the 158ce5f32deSRobert Watson * Giant lock, and potential sleeping. This increases the chances of races, 159ce5f32deSRobert Watson * and exposes weaknesses in the socket->protocol API by offering poor 160ce5f32deSRobert Watson * failure modes. 161ce5f32deSRobert Watson */ 1620d9ce3a1SRobert Watson static struct mtx unp_mtx; 1630d9ce3a1SRobert Watson #define UNP_LOCK_INIT() \ 1640d9ce3a1SRobert Watson mtx_init(&unp_mtx, "unp", NULL, MTX_DEF) 1650d9ce3a1SRobert Watson #define UNP_LOCK() mtx_lock(&unp_mtx) 1660d9ce3a1SRobert Watson #define UNP_UNLOCK() mtx_unlock(&unp_mtx) 1670d9ce3a1SRobert Watson #define UNP_LOCK_ASSERT() mtx_assert(&unp_mtx, MA_OWNED) 1684c5bc1caSRobert Watson #define UNP_UNLOCK_ASSERT() mtx_assert(&unp_mtx, MA_NOTOWNED) 1690d9ce3a1SRobert Watson 170a0ec558aSRobert Watson /* 171a0ec558aSRobert Watson * Garbage collection of cyclic file descriptor/socket references occurs 172a0ec558aSRobert Watson * asynchronously in a taskqueue context in order to avoid recursion and 173a0ec558aSRobert Watson * reentrance in the UNIX domain socket, file descriptor, and socket layer 174a0ec558aSRobert Watson * code. See unp_gc() for a full description. 175a0ec558aSRobert Watson */ 176a0ec558aSRobert Watson static struct task unp_gc_task; 177a0ec558aSRobert Watson 17870f52b48SBruce Evans static int unp_connect(struct socket *,struct sockaddr *, struct thread *); 1796a2989fdSMatthew N. Dodd static int unp_connect2(struct socket *so, struct socket *so2, int); 1804d77a549SAlfred Perlstein static void unp_disconnect(struct unpcb *); 1814d77a549SAlfred Perlstein static void unp_shutdown(struct unpcb *); 1824d77a549SAlfred Perlstein static void unp_drop(struct unpcb *, int); 183a0ec558aSRobert Watson static void unp_gc(__unused void *, int); 1844d77a549SAlfred Perlstein static void unp_scan(struct mbuf *, void (*)(struct file *)); 1854d77a549SAlfred Perlstein static void unp_mark(struct file *); 1864d77a549SAlfred Perlstein static void unp_discard(struct file *); 1874d77a549SAlfred Perlstein static void unp_freerights(struct file **, int); 1884d77a549SAlfred Perlstein static int unp_internalize(struct mbuf **, struct thread *); 189d374e81eSRobert Watson static int unp_listen(struct socket *, struct unpcb *, int, 190d374e81eSRobert Watson struct thread *); 191f708ef1bSPoul-Henning Kamp 192e4445a03SRobert Watson /* 193e4445a03SRobert Watson * Definitions of protocols supported in the LOCAL domain. 194e4445a03SRobert Watson */ 195e4445a03SRobert Watson static struct domain localdomain; 196e4445a03SRobert Watson static struct protosw localsw[] = { 197e4445a03SRobert Watson { 198e4445a03SRobert Watson .pr_type = SOCK_STREAM, 199e4445a03SRobert Watson .pr_domain = &localdomain, 200e4445a03SRobert Watson .pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_RIGHTS, 201e4445a03SRobert Watson .pr_ctloutput = &uipc_ctloutput, 202e4445a03SRobert Watson .pr_usrreqs = &uipc_usrreqs 203e4445a03SRobert Watson }, 204e4445a03SRobert Watson { 205e4445a03SRobert Watson .pr_type = SOCK_DGRAM, 206e4445a03SRobert Watson .pr_domain = &localdomain, 207e4445a03SRobert Watson .pr_flags = PR_ATOMIC|PR_ADDR|PR_RIGHTS, 208e4445a03SRobert Watson .pr_usrreqs = &uipc_usrreqs 209e4445a03SRobert Watson }, 210e4445a03SRobert Watson }; 211e4445a03SRobert Watson 212e4445a03SRobert Watson static struct domain localdomain = { 213e4445a03SRobert Watson .dom_family = AF_LOCAL, 214e4445a03SRobert Watson .dom_name = "local", 215e4445a03SRobert Watson .dom_init = unp_init, 216e4445a03SRobert Watson .dom_externalize = unp_externalize, 217e4445a03SRobert Watson .dom_dispose = unp_dispose, 218e4445a03SRobert Watson .dom_protosw = localsw, 219e4445a03SRobert Watson .dom_protoswNPROTOSW = &localsw[sizeof(localsw)/sizeof(localsw[0])] 220e4445a03SRobert Watson }; 221e4445a03SRobert Watson DOMAIN_SET(local); 222e4445a03SRobert Watson 223ac45e92fSRobert Watson static void 224a29f300eSGarrett Wollman uipc_abort(struct socket *so) 225df8bae1dSRodney W. Grimes { 22640f2ac28SRobert Watson struct unpcb *unp; 227df8bae1dSRodney W. Grimes 22840f2ac28SRobert Watson unp = sotounpcb(so); 2294d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_abort: unp == NULL")); 2304d4b555eSRobert Watson UNP_LOCK(); 231a29f300eSGarrett Wollman unp_drop(unp, ECONNABORTED); 232a152f8a3SRobert Watson UNP_UNLOCK(); 233df8bae1dSRodney W. Grimes } 234df8bae1dSRodney W. Grimes 235a29f300eSGarrett Wollman static int 23657bf258eSGarrett Wollman uipc_accept(struct socket *so, struct sockaddr **nam) 237a29f300eSGarrett Wollman { 23840f2ac28SRobert Watson struct unpcb *unp; 2390d9ce3a1SRobert Watson const struct sockaddr *sa; 240df8bae1dSRodney W. Grimes 241df8bae1dSRodney W. Grimes /* 2421c381b19SRobert Watson * Pass back name of connected socket, if it was bound and we are 2431c381b19SRobert Watson * still connected (our peer may have closed already!). 244df8bae1dSRodney W. Grimes */ 2454d4b555eSRobert Watson unp = sotounpcb(so); 2464d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_accept: unp == NULL")); 2470d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 2480d9ce3a1SRobert Watson UNP_LOCK(); 2490d9ce3a1SRobert Watson if (unp->unp_conn != NULL && unp->unp_conn->unp_addr != NULL) 2500d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_conn->unp_addr; 2510d9ce3a1SRobert Watson else 2520d9ce3a1SRobert Watson sa = &sun_noname; 2530d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 2540d9ce3a1SRobert Watson UNP_UNLOCK(); 255e5aeaa0cSDag-Erling Smørgrav return (0); 256a29f300eSGarrett Wollman } 257df8bae1dSRodney W. Grimes 258a29f300eSGarrett Wollman static int 259b40ce416SJulian Elischer uipc_attach(struct socket *so, int proto, struct thread *td) 260a29f300eSGarrett Wollman { 2616d32873cSRobert Watson struct unpcb *unp; 2626d32873cSRobert Watson int error; 263df8bae1dSRodney W. Grimes 2646d32873cSRobert Watson KASSERT(so->so_pcb == NULL, ("uipc_attach: so_pcb != NULL")); 2656d32873cSRobert Watson if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) { 2666d32873cSRobert Watson switch (so->so_type) { 2676d32873cSRobert Watson case SOCK_STREAM: 2686d32873cSRobert Watson error = soreserve(so, unpst_sendspace, unpst_recvspace); 2696d32873cSRobert Watson break; 2706d32873cSRobert Watson 2716d32873cSRobert Watson case SOCK_DGRAM: 2726d32873cSRobert Watson error = soreserve(so, unpdg_sendspace, unpdg_recvspace); 2736d32873cSRobert Watson break; 2746d32873cSRobert Watson 2756d32873cSRobert Watson default: 2766d32873cSRobert Watson panic("unp_attach"); 2776d32873cSRobert Watson } 2786d32873cSRobert Watson if (error) 2796d32873cSRobert Watson return (error); 2806d32873cSRobert Watson } 2816d32873cSRobert Watson unp = uma_zalloc(unp_zone, M_WAITOK | M_ZERO); 2826d32873cSRobert Watson if (unp == NULL) 2836d32873cSRobert Watson return (ENOBUFS); 2846d32873cSRobert Watson LIST_INIT(&unp->unp_refs); 2856d32873cSRobert Watson unp->unp_socket = so; 2866d32873cSRobert Watson so->so_pcb = unp; 2876d32873cSRobert Watson 2889ae328fcSJohn Baldwin unp->unp_refcount = 1; 2896d32873cSRobert Watson UNP_LOCK(); 2906d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 2916d32873cSRobert Watson unp_count++; 292b7e2f3ecSRobert Watson LIST_INSERT_HEAD(so->so_type == SOCK_DGRAM ? &unp_dhead : &unp_shead, 293b7e2f3ecSRobert Watson unp, unp_link); 2946d32873cSRobert Watson UNP_UNLOCK(); 2956d32873cSRobert Watson 2966d32873cSRobert Watson return (0); 297a29f300eSGarrett Wollman } 298a29f300eSGarrett Wollman 299a29f300eSGarrett Wollman static int 300b40ce416SJulian Elischer uipc_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 301a29f300eSGarrett Wollman { 302dd47f5caSRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 303dd47f5caSRobert Watson struct vattr vattr; 304dd47f5caSRobert Watson int error, namelen; 305dd47f5caSRobert Watson struct nameidata nd; 30640f2ac28SRobert Watson struct unpcb *unp; 307dd47f5caSRobert Watson struct vnode *vp; 308dd47f5caSRobert Watson struct mount *mp; 309dd47f5caSRobert Watson char *buf; 310a29f300eSGarrett Wollman 31140f2ac28SRobert Watson unp = sotounpcb(so); 3124d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_bind: unp == NULL")); 3134f1f0ef5SRobert Watson 3144f1f0ef5SRobert Watson namelen = soun->sun_len - offsetof(struct sockaddr_un, sun_path); 3154f1f0ef5SRobert Watson if (namelen <= 0) 3164f1f0ef5SRobert Watson return (EINVAL); 317dd47f5caSRobert Watson 318dd47f5caSRobert Watson /* 3194f1f0ef5SRobert Watson * We don't allow simultaneous bind() calls on a single UNIX domain 3204f1f0ef5SRobert Watson * socket, so flag in-progress operations, and return an error if an 3214f1f0ef5SRobert Watson * operation is already in progress. 3224f1f0ef5SRobert Watson * 3234f1f0ef5SRobert Watson * Historically, we have not allowed a socket to be rebound, so this 3244f1f0ef5SRobert Watson * also returns an error. Not allowing re-binding certainly 3254f1f0ef5SRobert Watson * simplifies the implementation and avoids a great many possible 3264f1f0ef5SRobert Watson * failure modes. 327dd47f5caSRobert Watson */ 3284f1f0ef5SRobert Watson UNP_LOCK(); 329dd47f5caSRobert Watson if (unp->unp_vnode != NULL) { 33040f2ac28SRobert Watson UNP_UNLOCK(); 331dd47f5caSRobert Watson return (EINVAL); 332dd47f5caSRobert Watson } 3334f1f0ef5SRobert Watson if (unp->unp_flags & UNP_BINDING) { 334dd47f5caSRobert Watson UNP_UNLOCK(); 3354f1f0ef5SRobert Watson return (EALREADY); 336dd47f5caSRobert Watson } 3374f1f0ef5SRobert Watson unp->unp_flags |= UNP_BINDING; 338dd47f5caSRobert Watson UNP_UNLOCK(); 339dd47f5caSRobert Watson 340dd47f5caSRobert Watson buf = malloc(namelen + 1, M_TEMP, M_WAITOK); 341dd47f5caSRobert Watson strlcpy(buf, soun->sun_path, namelen + 1); 342dd47f5caSRobert Watson 343dd47f5caSRobert Watson mtx_lock(&Giant); 344dd47f5caSRobert Watson restart: 345dd47f5caSRobert Watson mtx_assert(&Giant, MA_OWNED); 346dd47f5caSRobert Watson NDINIT(&nd, CREATE, NOFOLLOW | LOCKPARENT | SAVENAME, UIO_SYSSPACE, 347dd47f5caSRobert Watson buf, td); 348dd47f5caSRobert Watson /* SHOULD BE ABLE TO ADOPT EXISTING AND wakeup() ALA FIFO's */ 349dd47f5caSRobert Watson error = namei(&nd); 350dd47f5caSRobert Watson if (error) 3514f1f0ef5SRobert Watson goto error; 352dd47f5caSRobert Watson vp = nd.ni_vp; 353dd47f5caSRobert Watson if (vp != NULL || vn_start_write(nd.ni_dvp, &mp, V_NOWAIT) != 0) { 354dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 355dd47f5caSRobert Watson if (nd.ni_dvp == vp) 356dd47f5caSRobert Watson vrele(nd.ni_dvp); 357dd47f5caSRobert Watson else 358dd47f5caSRobert Watson vput(nd.ni_dvp); 359dd47f5caSRobert Watson if (vp != NULL) { 360dd47f5caSRobert Watson vrele(vp); 361dd47f5caSRobert Watson error = EADDRINUSE; 3624f1f0ef5SRobert Watson goto error; 363dd47f5caSRobert Watson } 364dd47f5caSRobert Watson error = vn_start_write(NULL, &mp, V_XSLEEP | PCATCH); 365dd47f5caSRobert Watson if (error) 3664f1f0ef5SRobert Watson goto error; 367dd47f5caSRobert Watson goto restart; 368dd47f5caSRobert Watson } 369dd47f5caSRobert Watson VATTR_NULL(&vattr); 370dd47f5caSRobert Watson vattr.va_type = VSOCK; 371dd47f5caSRobert Watson vattr.va_mode = (ACCESSPERMS & ~td->td_proc->p_fd->fd_cmask); 372dd47f5caSRobert Watson #ifdef MAC 373dd47f5caSRobert Watson error = mac_check_vnode_create(td->td_ucred, nd.ni_dvp, &nd.ni_cnd, 374dd47f5caSRobert Watson &vattr); 375dd47f5caSRobert Watson #endif 376dd47f5caSRobert Watson if (error == 0) { 377dd47f5caSRobert Watson VOP_LEASE(nd.ni_dvp, td, td->td_ucred, LEASE_WRITE); 378dd47f5caSRobert Watson error = VOP_CREATE(nd.ni_dvp, &nd.ni_vp, &nd.ni_cnd, &vattr); 379dd47f5caSRobert Watson } 380dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 381dd47f5caSRobert Watson vput(nd.ni_dvp); 382dd47f5caSRobert Watson if (error) { 383dd47f5caSRobert Watson vn_finished_write(mp); 3844f1f0ef5SRobert Watson goto error; 385dd47f5caSRobert Watson } 386dd47f5caSRobert Watson vp = nd.ni_vp; 3874f1f0ef5SRobert Watson ASSERT_VOP_LOCKED(vp, "uipc_bind"); 388dd47f5caSRobert Watson soun = (struct sockaddr_un *)sodupsockaddr(nam, M_WAITOK); 389dd47f5caSRobert Watson UNP_LOCK(); 390dd47f5caSRobert Watson vp->v_socket = unp->unp_socket; 391dd47f5caSRobert Watson unp->unp_vnode = vp; 392dd47f5caSRobert Watson unp->unp_addr = soun; 3934f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 394dd47f5caSRobert Watson UNP_UNLOCK(); 395dd47f5caSRobert Watson VOP_UNLOCK(vp, 0, td); 396dd47f5caSRobert Watson vn_finished_write(mp); 3974f1f0ef5SRobert Watson mtx_unlock(&Giant); 3984f1f0ef5SRobert Watson free(buf, M_TEMP); 3994f1f0ef5SRobert Watson return (0); 4004f1f0ef5SRobert Watson error: 4014f1f0ef5SRobert Watson UNP_LOCK(); 4024f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 4034f1f0ef5SRobert Watson UNP_UNLOCK(); 404dd47f5caSRobert Watson mtx_unlock(&Giant); 405dd47f5caSRobert Watson free(buf, M_TEMP); 40640f2ac28SRobert Watson return (error); 407a29f300eSGarrett Wollman } 408a29f300eSGarrett Wollman 409a29f300eSGarrett Wollman static int 410b40ce416SJulian Elischer uipc_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 411a29f300eSGarrett Wollman { 4120d9ce3a1SRobert Watson int error; 413a29f300eSGarrett Wollman 414fd179ee9SRobert Watson KASSERT(td == curthread, ("uipc_connect: td != curthread")); 4154d4b555eSRobert Watson UNP_LOCK(); 416fd179ee9SRobert Watson error = unp_connect(so, nam, td); 4170d9ce3a1SRobert Watson UNP_UNLOCK(); 4180d9ce3a1SRobert Watson return (error); 419a29f300eSGarrett Wollman } 420a29f300eSGarrett Wollman 421a152f8a3SRobert Watson /* 422a152f8a3SRobert Watson * XXXRW: Should also unbind? 423a152f8a3SRobert Watson */ 424a152f8a3SRobert Watson static void 425a152f8a3SRobert Watson uipc_close(struct socket *so) 426a152f8a3SRobert Watson { 427a152f8a3SRobert Watson struct unpcb *unp; 428a152f8a3SRobert Watson 429a152f8a3SRobert Watson unp = sotounpcb(so); 430a152f8a3SRobert Watson KASSERT(unp != NULL, ("uipc_close: unp == NULL")); 431a152f8a3SRobert Watson UNP_LOCK(); 432a152f8a3SRobert Watson unp_disconnect(unp); 433a152f8a3SRobert Watson UNP_UNLOCK(); 434a152f8a3SRobert Watson } 435a152f8a3SRobert Watson 436db48c0d2SRobert Watson int 437a29f300eSGarrett Wollman uipc_connect2(struct socket *so1, struct socket *so2) 438a29f300eSGarrett Wollman { 43940f2ac28SRobert Watson struct unpcb *unp; 4400d9ce3a1SRobert Watson int error; 441a29f300eSGarrett Wollman 44240f2ac28SRobert Watson unp = sotounpcb(so1); 4434d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_connect2: unp == NULL")); 4444d4b555eSRobert Watson UNP_LOCK(); 4456a2989fdSMatthew N. Dodd error = unp_connect2(so1, so2, PRU_CONNECT2); 4460d9ce3a1SRobert Watson UNP_UNLOCK(); 4470d9ce3a1SRobert Watson return (error); 448a29f300eSGarrett Wollman } 449a29f300eSGarrett Wollman 450a29f300eSGarrett Wollman /* control is EOPNOTSUPP */ 451a29f300eSGarrett Wollman 452bc725eafSRobert Watson static void 453a29f300eSGarrett Wollman uipc_detach(struct socket *so) 454a29f300eSGarrett Wollman { 4559ae328fcSJohn Baldwin struct sockaddr_un *saved_unp_addr; 45640f2ac28SRobert Watson struct unpcb *unp; 4576d32873cSRobert Watson struct vnode *vp; 4589ae328fcSJohn Baldwin int freeunp, local_unp_rights; 459a29f300eSGarrett Wollman 46040f2ac28SRobert Watson unp = sotounpcb(so); 4614d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_detach: unp == NULL")); 4624d4b555eSRobert Watson UNP_LOCK(); 4636d32873cSRobert Watson LIST_REMOVE(unp, unp_link); 4646d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 4656d32873cSRobert Watson --unp_count; 4666d32873cSRobert Watson if ((vp = unp->unp_vnode) != NULL) { 4676d32873cSRobert Watson /* 4686d32873cSRobert Watson * XXXRW: should v_socket be frobbed only while holding 4696d32873cSRobert Watson * Giant? 4706d32873cSRobert Watson */ 4716d32873cSRobert Watson unp->unp_vnode->v_socket = NULL; 4726d32873cSRobert Watson unp->unp_vnode = NULL; 4736d32873cSRobert Watson } 4746d32873cSRobert Watson if (unp->unp_conn != NULL) 4756d32873cSRobert Watson unp_disconnect(unp); 4766d32873cSRobert Watson while (!LIST_EMPTY(&unp->unp_refs)) { 4776d32873cSRobert Watson struct unpcb *ref = LIST_FIRST(&unp->unp_refs); 4786d32873cSRobert Watson unp_drop(ref, ECONNRESET); 4796d32873cSRobert Watson } 4806d32873cSRobert Watson unp->unp_socket->so_pcb = NULL; 4816d32873cSRobert Watson local_unp_rights = unp_rights; 4829ae328fcSJohn Baldwin saved_unp_addr = unp->unp_addr; 4839ae328fcSJohn Baldwin unp->unp_addr = NULL; 4849ae328fcSJohn Baldwin unp->unp_refcount--; 4859ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 4866d32873cSRobert Watson UNP_UNLOCK(); 4879ae328fcSJohn Baldwin if (saved_unp_addr != NULL) 4889ae328fcSJohn Baldwin FREE(saved_unp_addr, M_SONAME); 4899ae328fcSJohn Baldwin if (freeunp) 4906d32873cSRobert Watson uma_zfree(unp_zone, unp); 4916d32873cSRobert Watson if (vp) { 4926d32873cSRobert Watson int vfslocked; 4936d32873cSRobert Watson 4946d32873cSRobert Watson vfslocked = VFS_LOCK_GIANT(vp->v_mount); 4956d32873cSRobert Watson vrele(vp); 4966d32873cSRobert Watson VFS_UNLOCK_GIANT(vfslocked); 4976d32873cSRobert Watson } 4986d32873cSRobert Watson if (local_unp_rights) 4996d32873cSRobert Watson taskqueue_enqueue(taskqueue_thread, &unp_gc_task); 500a29f300eSGarrett Wollman } 501a29f300eSGarrett Wollman 502a29f300eSGarrett Wollman static int 503a29f300eSGarrett Wollman uipc_disconnect(struct socket *so) 504a29f300eSGarrett Wollman { 50540f2ac28SRobert Watson struct unpcb *unp; 506a29f300eSGarrett Wollman 50740f2ac28SRobert Watson unp = sotounpcb(so); 5084d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_disconnect: unp == NULL")); 5094d4b555eSRobert Watson UNP_LOCK(); 510a29f300eSGarrett Wollman unp_disconnect(unp); 5110d9ce3a1SRobert Watson UNP_UNLOCK(); 512e5aeaa0cSDag-Erling Smørgrav return (0); 513a29f300eSGarrett Wollman } 514a29f300eSGarrett Wollman 515a29f300eSGarrett Wollman static int 516d374e81eSRobert Watson uipc_listen(struct socket *so, int backlog, struct thread *td) 517a29f300eSGarrett Wollman { 51840f2ac28SRobert Watson struct unpcb *unp; 5190d9ce3a1SRobert Watson int error; 520a29f300eSGarrett Wollman 52140f2ac28SRobert Watson unp = sotounpcb(so); 5224d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_listen: unp == NULL")); 5234d4b555eSRobert Watson UNP_LOCK(); 5244d4b555eSRobert Watson if (unp->unp_vnode == NULL) { 52540f2ac28SRobert Watson UNP_UNLOCK(); 52640f2ac28SRobert Watson return (EINVAL); 52740f2ac28SRobert Watson } 528d374e81eSRobert Watson error = unp_listen(so, unp, backlog, td); 5290d9ce3a1SRobert Watson UNP_UNLOCK(); 5300d9ce3a1SRobert Watson return (error); 531a29f300eSGarrett Wollman } 532a29f300eSGarrett Wollman 533a29f300eSGarrett Wollman static int 53457bf258eSGarrett Wollman uipc_peeraddr(struct socket *so, struct sockaddr **nam) 535a29f300eSGarrett Wollman { 53640f2ac28SRobert Watson struct unpcb *unp; 5370d9ce3a1SRobert Watson const struct sockaddr *sa; 538a29f300eSGarrett Wollman 5394d4b555eSRobert Watson unp = sotounpcb(so); 5404d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_peeraddr: unp == NULL")); 5410d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 5420d9ce3a1SRobert Watson UNP_LOCK(); 543fc3fcacfSRobert Watson if (unp->unp_conn != NULL && unp->unp_conn->unp_addr!= NULL) 5440d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_conn->unp_addr; 545bdc5f6a3SHajimu UMEMOTO else { 546bdc5f6a3SHajimu UMEMOTO /* 547bdc5f6a3SHajimu UMEMOTO * XXX: It seems that this test always fails even when 548bdc5f6a3SHajimu UMEMOTO * connection is established. So, this else clause is 549bdc5f6a3SHajimu UMEMOTO * added as workaround to return PF_LOCAL sockaddr. 550bdc5f6a3SHajimu UMEMOTO */ 5510d9ce3a1SRobert Watson sa = &sun_noname; 552bdc5f6a3SHajimu UMEMOTO } 5530d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 5540d9ce3a1SRobert Watson UNP_UNLOCK(); 555e5aeaa0cSDag-Erling Smørgrav return (0); 556a29f300eSGarrett Wollman } 557a29f300eSGarrett Wollman 558a29f300eSGarrett Wollman static int 559a29f300eSGarrett Wollman uipc_rcvd(struct socket *so, int flags) 560a29f300eSGarrett Wollman { 56140f2ac28SRobert Watson struct unpcb *unp; 562a29f300eSGarrett Wollman struct socket *so2; 563337cc6b6SRobert Watson u_int mbcnt, sbcc; 5646aef685fSBrian Feldman u_long newhiwat; 565a29f300eSGarrett Wollman 56640f2ac28SRobert Watson unp = sotounpcb(so); 5674d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_rcvd: unp == NULL")); 568df8bae1dSRodney W. Grimes switch (so->so_type) { 569df8bae1dSRodney W. Grimes case SOCK_DGRAM: 570a29f300eSGarrett Wollman panic("uipc_rcvd DGRAM?"); 571df8bae1dSRodney W. Grimes /*NOTREACHED*/ 572df8bae1dSRodney W. Grimes 573df8bae1dSRodney W. Grimes case SOCK_STREAM: 574df8bae1dSRodney W. Grimes /* 5751c381b19SRobert Watson * Adjust backpressure on sender and wakeup any waiting to 5761c381b19SRobert Watson * write. 577df8bae1dSRodney W. Grimes */ 578337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 579337cc6b6SRobert Watson mbcnt = so->so_rcv.sb_mbcnt; 580337cc6b6SRobert Watson sbcc = so->so_rcv.sb_cc; 581337cc6b6SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 582337cc6b6SRobert Watson UNP_LOCK(); 583337cc6b6SRobert Watson if (unp->unp_conn == NULL) { 584337cc6b6SRobert Watson UNP_UNLOCK(); 585337cc6b6SRobert Watson break; 586337cc6b6SRobert Watson } 587337cc6b6SRobert Watson so2 = unp->unp_conn->unp_socket; 588337cc6b6SRobert Watson SOCKBUF_LOCK(&so2->so_snd); 589337cc6b6SRobert Watson so2->so_snd.sb_mbmax += unp->unp_mbcnt - mbcnt; 590337cc6b6SRobert Watson newhiwat = so2->so_snd.sb_hiwat + unp->unp_cc - sbcc; 591f535380cSDon Lewis (void)chgsbsize(so2->so_cred->cr_uidinfo, &so2->so_snd.sb_hiwat, 5926aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 5931e4d7da7SRobert Watson sowwakeup_locked(so2); 594337cc6b6SRobert Watson unp->unp_mbcnt = mbcnt; 595337cc6b6SRobert Watson unp->unp_cc = sbcc; 596337cc6b6SRobert Watson UNP_UNLOCK(); 597df8bae1dSRodney W. Grimes break; 598df8bae1dSRodney W. Grimes 599df8bae1dSRodney W. Grimes default: 600a29f300eSGarrett Wollman panic("uipc_rcvd unknown socktype"); 601df8bae1dSRodney W. Grimes } 602e5aeaa0cSDag-Erling Smørgrav return (0); 603a29f300eSGarrett Wollman } 604df8bae1dSRodney W. Grimes 605a29f300eSGarrett Wollman /* pru_rcvoob is EOPNOTSUPP */ 606a29f300eSGarrett Wollman 607a29f300eSGarrett Wollman static int 60857bf258eSGarrett Wollman uipc_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam, 609b40ce416SJulian Elischer struct mbuf *control, struct thread *td) 610a29f300eSGarrett Wollman { 611f3f49bbbSRobert Watson struct unpcb *unp, *unp2; 612a29f300eSGarrett Wollman struct socket *so2; 613337cc6b6SRobert Watson u_int mbcnt, sbcc; 6146aef685fSBrian Feldman u_long newhiwat; 615f3f49bbbSRobert Watson int error = 0; 616a29f300eSGarrett Wollman 61740f2ac28SRobert Watson unp = sotounpcb(so); 6184d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_send: unp == NULL")); 619a29f300eSGarrett Wollman if (flags & PRUS_OOB) { 620a29f300eSGarrett Wollman error = EOPNOTSUPP; 621a29f300eSGarrett Wollman goto release; 622a29f300eSGarrett Wollman } 623a29f300eSGarrett Wollman 624fc3fcacfSRobert Watson if (control != NULL && (error = unp_internalize(&control, td))) 625a29f300eSGarrett Wollman goto release; 626df8bae1dSRodney W. Grimes 6270d9ce3a1SRobert Watson UNP_LOCK(); 628a29f300eSGarrett Wollman switch (so->so_type) { 629a29f300eSGarrett Wollman case SOCK_DGRAM: 630a29f300eSGarrett Wollman { 631e7dd9a10SRobert Watson const struct sockaddr *from; 632df8bae1dSRodney W. Grimes 633fc3fcacfSRobert Watson if (nam != NULL) { 634fc3fcacfSRobert Watson if (unp->unp_conn != NULL) { 635df8bae1dSRodney W. Grimes error = EISCONN; 636df8bae1dSRodney W. Grimes break; 637df8bae1dSRodney W. Grimes } 638b40ce416SJulian Elischer error = unp_connect(so, nam, td); 639df8bae1dSRodney W. Grimes if (error) 640df8bae1dSRodney W. Grimes break; 641df8bae1dSRodney W. Grimes } 642b5ff0914SRobert Watson /* 643b5ff0914SRobert Watson * Because connect() and send() are non-atomic in a sendto() 644b5ff0914SRobert Watson * with a target address, it's possible that the socket will 645b5ff0914SRobert Watson * have disconnected before the send() can run. In that case 646b5ff0914SRobert Watson * return the slightly counter-intuitive but otherwise 647b5ff0914SRobert Watson * correct error that the socket is not connected. 648b5ff0914SRobert Watson */ 649f3f49bbbSRobert Watson unp2 = unp->unp_conn; 650b5ff0914SRobert Watson if (unp2 == NULL) { 651b5ff0914SRobert Watson error = ENOTCONN; 652b5ff0914SRobert Watson break; 653b5ff0914SRobert Watson } 654f3f49bbbSRobert Watson so2 = unp2->unp_socket; 655fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 65657bf258eSGarrett Wollman from = (struct sockaddr *)unp->unp_addr; 657df8bae1dSRodney W. Grimes else 658df8bae1dSRodney W. Grimes from = &sun_noname; 659f3f49bbbSRobert Watson if (unp2->unp_flags & UNP_WANTCRED) 6606a2989fdSMatthew N. Dodd control = unp_addsockcred(td, control); 661a34b7046SRobert Watson SOCKBUF_LOCK(&so2->so_rcv); 662a34b7046SRobert Watson if (sbappendaddr_locked(&so2->so_rcv, from, m, control)) { 6631e4d7da7SRobert Watson sorwakeup_locked(so2); 664fc3fcacfSRobert Watson m = NULL; 665fc3fcacfSRobert Watson control = NULL; 666e5aeaa0cSDag-Erling Smørgrav } else { 667a34b7046SRobert Watson SOCKBUF_UNLOCK(&so2->so_rcv); 668df8bae1dSRodney W. Grimes error = ENOBUFS; 669e5aeaa0cSDag-Erling Smørgrav } 670fc3fcacfSRobert Watson if (nam != NULL) 671df8bae1dSRodney W. Grimes unp_disconnect(unp); 672df8bae1dSRodney W. Grimes break; 673df8bae1dSRodney W. Grimes } 674df8bae1dSRodney W. Grimes 675df8bae1dSRodney W. Grimes case SOCK_STREAM: 6766b8fda4dSGarrett Wollman /* 6771c381b19SRobert Watson * Connect if not connected yet. 6781c381b19SRobert Watson * 6791c381b19SRobert Watson * Note: A better implementation would complain if not equal 6801c381b19SRobert Watson * to the peer's address. 6816b8fda4dSGarrett Wollman */ 682402cc72dSDavid Greenman if ((so->so_state & SS_ISCONNECTED) == 0) { 683fc3fcacfSRobert Watson if (nam != NULL) { 684b40ce416SJulian Elischer error = unp_connect(so, nam, td); 685402cc72dSDavid Greenman if (error) 6866b8fda4dSGarrett Wollman break; /* XXX */ 687402cc72dSDavid Greenman } else { 688402cc72dSDavid Greenman error = ENOTCONN; 689402cc72dSDavid Greenman break; 690402cc72dSDavid Greenman } 691402cc72dSDavid Greenman } 692402cc72dSDavid Greenman 693337cc6b6SRobert Watson /* Lockless read. */ 694c0b99ffaSRobert Watson if (so->so_snd.sb_state & SBS_CANTSENDMORE) { 695df8bae1dSRodney W. Grimes error = EPIPE; 696df8bae1dSRodney W. Grimes break; 697df8bae1dSRodney W. Grimes } 698b5ff0914SRobert Watson /* 699b5ff0914SRobert Watson * Because connect() and send() are non-atomic in a sendto() 700b5ff0914SRobert Watson * with a target address, it's possible that the socket will 701b5ff0914SRobert Watson * have disconnected before the send() can run. In that case 702b5ff0914SRobert Watson * return the slightly counter-intuitive but otherwise 703b5ff0914SRobert Watson * correct error that the socket is not connected. 704b5ff0914SRobert Watson */ 705f3f49bbbSRobert Watson unp2 = unp->unp_conn; 706b5ff0914SRobert Watson if (unp2 == NULL) { 707b5ff0914SRobert Watson error = ENOTCONN; 708b5ff0914SRobert Watson break; 709b5ff0914SRobert Watson } 710f3f49bbbSRobert Watson so2 = unp2->unp_socket; 711a34b7046SRobert Watson SOCKBUF_LOCK(&so2->so_rcv); 712f3f49bbbSRobert Watson if (unp2->unp_flags & UNP_WANTCRED) { 7136a2989fdSMatthew N. Dodd /* 7146a2989fdSMatthew N. Dodd * Credentials are passed only once on 7156a2989fdSMatthew N. Dodd * SOCK_STREAM. 7166a2989fdSMatthew N. Dodd */ 717f3f49bbbSRobert Watson unp2->unp_flags &= ~UNP_WANTCRED; 7186a2989fdSMatthew N. Dodd control = unp_addsockcred(td, control); 7196a2989fdSMatthew N. Dodd } 720df8bae1dSRodney W. Grimes /* 7211c381b19SRobert Watson * Send to paired receive port, and then reduce send buffer 7221c381b19SRobert Watson * hiwater marks to maintain backpressure. Wake up readers. 723df8bae1dSRodney W. Grimes */ 724fc3fcacfSRobert Watson if (control != NULL) { 725a34b7046SRobert Watson if (sbappendcontrol_locked(&so2->so_rcv, m, control)) 726fc3fcacfSRobert Watson control = NULL; 727e5aeaa0cSDag-Erling Smørgrav } else { 728a34b7046SRobert Watson sbappend_locked(&so2->so_rcv, m); 729e5aeaa0cSDag-Erling Smørgrav } 730f3f49bbbSRobert Watson mbcnt = so2->so_rcv.sb_mbcnt - unp2->unp_mbcnt; 731f3f49bbbSRobert Watson unp2->unp_mbcnt = so2->so_rcv.sb_mbcnt; 732337cc6b6SRobert Watson sbcc = so2->so_rcv.sb_cc; 733337cc6b6SRobert Watson sorwakeup_locked(so2); 734337cc6b6SRobert Watson 735337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_snd); 736f3f49bbbSRobert Watson newhiwat = so->so_snd.sb_hiwat - (sbcc - unp2->unp_cc); 737f535380cSDon Lewis (void)chgsbsize(so->so_cred->cr_uidinfo, &so->so_snd.sb_hiwat, 7386aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 739337cc6b6SRobert Watson so->so_snd.sb_mbmax -= mbcnt; 7407abe2ac2SAlan Cox SOCKBUF_UNLOCK(&so->so_snd); 741337cc6b6SRobert Watson 742f3f49bbbSRobert Watson unp2->unp_cc = sbcc; 743fc3fcacfSRobert Watson m = NULL; 744df8bae1dSRodney W. Grimes break; 745df8bae1dSRodney W. Grimes 746df8bae1dSRodney W. Grimes default: 747a29f300eSGarrett Wollman panic("uipc_send unknown socktype"); 748df8bae1dSRodney W. Grimes } 749a29f300eSGarrett Wollman 7506b8fda4dSGarrett Wollman /* 7516b8fda4dSGarrett Wollman * SEND_EOF is equivalent to a SEND followed by 7526b8fda4dSGarrett Wollman * a SHUTDOWN. 7536b8fda4dSGarrett Wollman */ 754a29f300eSGarrett Wollman if (flags & PRUS_EOF) { 7556b8fda4dSGarrett Wollman socantsendmore(so); 7566b8fda4dSGarrett Wollman unp_shutdown(unp); 7576b8fda4dSGarrett Wollman } 7580d9ce3a1SRobert Watson UNP_UNLOCK(); 759df8bae1dSRodney W. Grimes 760fc3fcacfSRobert Watson if (control != NULL && error != 0) 761bd508d39SDon Lewis unp_dispose(control); 762bd508d39SDon Lewis 763a29f300eSGarrett Wollman release: 764fc3fcacfSRobert Watson if (control != NULL) 765a29f300eSGarrett Wollman m_freem(control); 766fc3fcacfSRobert Watson if (m != NULL) 767a29f300eSGarrett Wollman m_freem(m); 768e5aeaa0cSDag-Erling Smørgrav return (error); 769a29f300eSGarrett Wollman } 770df8bae1dSRodney W. Grimes 771a29f300eSGarrett Wollman static int 772a29f300eSGarrett Wollman uipc_sense(struct socket *so, struct stat *sb) 773a29f300eSGarrett Wollman { 77440f2ac28SRobert Watson struct unpcb *unp; 775a29f300eSGarrett Wollman struct socket *so2; 776a29f300eSGarrett Wollman 77740f2ac28SRobert Watson unp = sotounpcb(so); 7784d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sense: unp == NULL")); 7794d4b555eSRobert Watson UNP_LOCK(); 780a29f300eSGarrett Wollman sb->st_blksize = so->so_snd.sb_hiwat; 781fc3fcacfSRobert Watson if (so->so_type == SOCK_STREAM && unp->unp_conn != NULL) { 782df8bae1dSRodney W. Grimes so2 = unp->unp_conn->unp_socket; 783a29f300eSGarrett Wollman sb->st_blksize += so2->so_rcv.sb_cc; 784df8bae1dSRodney W. Grimes } 785f3732fd1SPoul-Henning Kamp sb->st_dev = NODEV; 786df8bae1dSRodney W. Grimes if (unp->unp_ino == 0) 7876f782c46SJeffrey Hsu unp->unp_ino = (++unp_ino == 0) ? ++unp_ino : unp_ino; 788a29f300eSGarrett Wollman sb->st_ino = unp->unp_ino; 7890d9ce3a1SRobert Watson UNP_UNLOCK(); 790df8bae1dSRodney W. Grimes return (0); 791a29f300eSGarrett Wollman } 792df8bae1dSRodney W. Grimes 793a29f300eSGarrett Wollman static int 794a29f300eSGarrett Wollman uipc_shutdown(struct socket *so) 795a29f300eSGarrett Wollman { 79640f2ac28SRobert Watson struct unpcb *unp; 797df8bae1dSRodney W. Grimes 79840f2ac28SRobert Watson unp = sotounpcb(so); 7994d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_shutdown: unp == NULL")); 8004d4b555eSRobert Watson UNP_LOCK(); 801a29f300eSGarrett Wollman socantsendmore(so); 802a29f300eSGarrett Wollman unp_shutdown(unp); 8030d9ce3a1SRobert Watson UNP_UNLOCK(); 804e5aeaa0cSDag-Erling Smørgrav return (0); 805a29f300eSGarrett Wollman } 806df8bae1dSRodney W. Grimes 807a29f300eSGarrett Wollman static int 80857bf258eSGarrett Wollman uipc_sockaddr(struct socket *so, struct sockaddr **nam) 809a29f300eSGarrett Wollman { 81040f2ac28SRobert Watson struct unpcb *unp; 8110d9ce3a1SRobert Watson const struct sockaddr *sa; 812a29f300eSGarrett Wollman 8134d4b555eSRobert Watson unp = sotounpcb(so); 8144d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sockaddr: unp == NULL")); 8150d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 8160d9ce3a1SRobert Watson UNP_LOCK(); 817fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 8180d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_addr; 81983f3198bSThomas Moestl else 8200d9ce3a1SRobert Watson sa = &sun_noname; 8210d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 8220d9ce3a1SRobert Watson UNP_UNLOCK(); 823e5aeaa0cSDag-Erling Smørgrav return (0); 824df8bae1dSRodney W. Grimes } 825a29f300eSGarrett Wollman 826a29f300eSGarrett Wollman struct pr_usrreqs uipc_usrreqs = { 827756d52a1SPoul-Henning Kamp .pru_abort = uipc_abort, 828756d52a1SPoul-Henning Kamp .pru_accept = uipc_accept, 829756d52a1SPoul-Henning Kamp .pru_attach = uipc_attach, 830756d52a1SPoul-Henning Kamp .pru_bind = uipc_bind, 831756d52a1SPoul-Henning Kamp .pru_connect = uipc_connect, 832756d52a1SPoul-Henning Kamp .pru_connect2 = uipc_connect2, 833756d52a1SPoul-Henning Kamp .pru_detach = uipc_detach, 834756d52a1SPoul-Henning Kamp .pru_disconnect = uipc_disconnect, 835756d52a1SPoul-Henning Kamp .pru_listen = uipc_listen, 836756d52a1SPoul-Henning Kamp .pru_peeraddr = uipc_peeraddr, 837756d52a1SPoul-Henning Kamp .pru_rcvd = uipc_rcvd, 838756d52a1SPoul-Henning Kamp .pru_send = uipc_send, 839756d52a1SPoul-Henning Kamp .pru_sense = uipc_sense, 840756d52a1SPoul-Henning Kamp .pru_shutdown = uipc_shutdown, 841756d52a1SPoul-Henning Kamp .pru_sockaddr = uipc_sockaddr, 842a152f8a3SRobert Watson .pru_close = uipc_close, 843a29f300eSGarrett Wollman }; 844df8bae1dSRodney W. Grimes 8450c1bb4fbSDima Dorfman int 846892af6b9SRobert Watson uipc_ctloutput(struct socket *so, struct sockopt *sopt) 8470c1bb4fbSDima Dorfman { 84840f2ac28SRobert Watson struct unpcb *unp; 8490d9ce3a1SRobert Watson struct xucred xu; 8506a2989fdSMatthew N. Dodd int error, optval; 8516a2989fdSMatthew N. Dodd 85296a041b5SMatthew N. Dodd if (sopt->sopt_level != 0) 85396a041b5SMatthew N. Dodd return (EINVAL); 85496a041b5SMatthew N. Dodd 8556a2989fdSMatthew N. Dodd unp = sotounpcb(so); 8564d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_ctloutput: unp == NULL")); 8576a2989fdSMatthew N. Dodd error = 0; 8580c1bb4fbSDima Dorfman switch (sopt->sopt_dir) { 8590c1bb4fbSDima Dorfman case SOPT_GET: 8600c1bb4fbSDima Dorfman switch (sopt->sopt_name) { 8610c1bb4fbSDima Dorfman case LOCAL_PEERCRED: 8621f837c47SRobert Watson UNP_LOCK(); 8630c1bb4fbSDima Dorfman if (unp->unp_flags & UNP_HAVEPC) 8640d9ce3a1SRobert Watson xu = unp->unp_peercred; 8650c1bb4fbSDima Dorfman else { 8660c1bb4fbSDima Dorfman if (so->so_type == SOCK_STREAM) 8670c1bb4fbSDima Dorfman error = ENOTCONN; 8680c1bb4fbSDima Dorfman else 8690c1bb4fbSDima Dorfman error = EINVAL; 8700c1bb4fbSDima Dorfman } 8711f837c47SRobert Watson UNP_UNLOCK(); 8720d9ce3a1SRobert Watson if (error == 0) 8730d9ce3a1SRobert Watson error = sooptcopyout(sopt, &xu, sizeof(xu)); 8740c1bb4fbSDima Dorfman break; 8756a2989fdSMatthew N. Dodd case LOCAL_CREDS: 8761f837c47SRobert Watson /* Unocked read. */ 8776a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_WANTCRED ? 1 : 0; 8786a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 8796a2989fdSMatthew N. Dodd break; 8806a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 8811f837c47SRobert Watson /* Unocked read. */ 8826a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_CONNWAIT ? 1 : 0; 8836a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 8846a2989fdSMatthew N. Dodd break; 8850c1bb4fbSDima Dorfman default: 8860c1bb4fbSDima Dorfman error = EOPNOTSUPP; 8870c1bb4fbSDima Dorfman break; 8880c1bb4fbSDima Dorfman } 8890c1bb4fbSDima Dorfman break; 8900c1bb4fbSDima Dorfman case SOPT_SET: 8916a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 8926a2989fdSMatthew N. Dodd case LOCAL_CREDS: 8936a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 8946a2989fdSMatthew N. Dodd error = sooptcopyin(sopt, &optval, sizeof(optval), 8956a2989fdSMatthew N. Dodd sizeof(optval)); 8966a2989fdSMatthew N. Dodd if (error) 8976a2989fdSMatthew N. Dodd break; 8986a2989fdSMatthew N. Dodd 8996a2989fdSMatthew N. Dodd #define OPTSET(bit) \ 9006a2989fdSMatthew N. Dodd if (optval) \ 9016a2989fdSMatthew N. Dodd unp->unp_flags |= bit; \ 9026a2989fdSMatthew N. Dodd else \ 9036a2989fdSMatthew N. Dodd unp->unp_flags &= ~bit; 9046a2989fdSMatthew N. Dodd 9051f837c47SRobert Watson UNP_LOCK(); 9066a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 9076a2989fdSMatthew N. Dodd case LOCAL_CREDS: 9086a2989fdSMatthew N. Dodd OPTSET(UNP_WANTCRED); 9096a2989fdSMatthew N. Dodd break; 9106a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 9116a2989fdSMatthew N. Dodd OPTSET(UNP_CONNWAIT); 9126a2989fdSMatthew N. Dodd break; 9136a2989fdSMatthew N. Dodd default: 9146a2989fdSMatthew N. Dodd break; 9156a2989fdSMatthew N. Dodd } 9161f837c47SRobert Watson UNP_UNLOCK(); 9176a2989fdSMatthew N. Dodd break; 9186a2989fdSMatthew N. Dodd #undef OPTSET 9196a2989fdSMatthew N. Dodd default: 9206a2989fdSMatthew N. Dodd error = ENOPROTOOPT; 9216a2989fdSMatthew N. Dodd break; 9226a2989fdSMatthew N. Dodd } 923abb886faSMatthew N. Dodd break; 9240c1bb4fbSDima Dorfman default: 9250c1bb4fbSDima Dorfman error = EOPNOTSUPP; 9260c1bb4fbSDima Dorfman break; 9270c1bb4fbSDima Dorfman } 9280c1bb4fbSDima Dorfman return (error); 9290c1bb4fbSDima Dorfman } 9300c1bb4fbSDima Dorfman 931f708ef1bSPoul-Henning Kamp static int 932892af6b9SRobert Watson unp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 933df8bae1dSRodney W. Grimes { 934892af6b9SRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 935892af6b9SRobert Watson struct vnode *vp; 936892af6b9SRobert Watson struct socket *so2, *so3; 937b295bdcdSRobert Watson struct unpcb *unp, *unp2, *unp3; 93857bf258eSGarrett Wollman int error, len; 939df8bae1dSRodney W. Grimes struct nameidata nd; 94057bf258eSGarrett Wollman char buf[SOCK_MAXADDRLEN]; 9410d9ce3a1SRobert Watson struct sockaddr *sa; 9420d9ce3a1SRobert Watson 9430d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 944df8bae1dSRodney W. Grimes 9454d4b555eSRobert Watson unp = sotounpcb(so); 9464d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 94757bf258eSGarrett Wollman len = nam->sa_len - offsetof(struct sockaddr_un, sun_path); 94857bf258eSGarrett Wollman if (len <= 0) 949e5aeaa0cSDag-Erling Smørgrav return (EINVAL); 95055c85568SRobert Drehmel strlcpy(buf, soun->sun_path, len + 1); 9514f1f0ef5SRobert Watson if (unp->unp_flags & UNP_CONNECTING) { 9524f1f0ef5SRobert Watson UNP_UNLOCK(); 9534f1f0ef5SRobert Watson return (EALREADY); 9544f1f0ef5SRobert Watson } 95505102f04SRobert Watson unp->unp_flags |= UNP_CONNECTING; 9560d9ce3a1SRobert Watson UNP_UNLOCK(); 9570d9ce3a1SRobert Watson sa = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 9580d9ce3a1SRobert Watson mtx_lock(&Giant); 959b40ce416SJulian Elischer NDINIT(&nd, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, buf, td); 960797f2d22SPoul-Henning Kamp error = namei(&nd); 961797f2d22SPoul-Henning Kamp if (error) 9620d9ce3a1SRobert Watson vp = NULL; 9630d9ce3a1SRobert Watson else 964df8bae1dSRodney W. Grimes vp = nd.ni_vp; 9650d9ce3a1SRobert Watson ASSERT_VOP_LOCKED(vp, "unp_connect"); 966762e6b85SEivind Eklund NDFREE(&nd, NDF_ONLY_PNBUF); 9670d9ce3a1SRobert Watson if (error) 9680d9ce3a1SRobert Watson goto bad; 9690d9ce3a1SRobert Watson 970df8bae1dSRodney W. Grimes if (vp->v_type != VSOCK) { 971df8bae1dSRodney W. Grimes error = ENOTSOCK; 972df8bae1dSRodney W. Grimes goto bad; 973df8bae1dSRodney W. Grimes } 974a854ed98SJohn Baldwin error = VOP_ACCESS(vp, VWRITE, td->td_ucred, td); 975797f2d22SPoul-Henning Kamp if (error) 976df8bae1dSRodney W. Grimes goto bad; 9772260c03dSRobert Watson mtx_unlock(&Giant); 9782260c03dSRobert Watson UNP_LOCK(); 979b295bdcdSRobert Watson unp = sotounpcb(so); 9804d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 981df8bae1dSRodney W. Grimes so2 = vp->v_socket; 982fc3fcacfSRobert Watson if (so2 == NULL) { 983df8bae1dSRodney W. Grimes error = ECONNREFUSED; 9842260c03dSRobert Watson goto bad2; 985df8bae1dSRodney W. Grimes } 986df8bae1dSRodney W. Grimes if (so->so_type != so2->so_type) { 987df8bae1dSRodney W. Grimes error = EPROTOTYPE; 9882260c03dSRobert Watson goto bad2; 989df8bae1dSRodney W. Grimes } 990df8bae1dSRodney W. Grimes if (so->so_proto->pr_flags & PR_CONNREQUIRED) { 9910d9ce3a1SRobert Watson if (so2->so_options & SO_ACCEPTCONN) { 9920d9ce3a1SRobert Watson /* 9931c381b19SRobert Watson * NB: drop locks here so unp_attach is entered w/o 9941c381b19SRobert Watson * locks; this avoids a recursive lock of the head 9951c381b19SRobert Watson * and holding sleep locks across a (potentially) 9961c381b19SRobert Watson * blocking malloc. 9970d9ce3a1SRobert Watson */ 9980d9ce3a1SRobert Watson UNP_UNLOCK(); 9990d9ce3a1SRobert Watson so3 = sonewconn(so2, 0); 10000d9ce3a1SRobert Watson UNP_LOCK(); 10010d9ce3a1SRobert Watson } else 10020d9ce3a1SRobert Watson so3 = NULL; 10030d9ce3a1SRobert Watson if (so3 == NULL) { 1004df8bae1dSRodney W. Grimes error = ECONNREFUSED; 10050d9ce3a1SRobert Watson goto bad2; 1006df8bae1dSRodney W. Grimes } 10070c1bb4fbSDima Dorfman unp = sotounpcb(so); 1008df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 1009df8bae1dSRodney W. Grimes unp3 = sotounpcb(so3); 10100d9ce3a1SRobert Watson if (unp2->unp_addr != NULL) { 10110d9ce3a1SRobert Watson bcopy(unp2->unp_addr, sa, unp2->unp_addr->sun_len); 10120d9ce3a1SRobert Watson unp3->unp_addr = (struct sockaddr_un *) sa; 10130d9ce3a1SRobert Watson sa = NULL; 10140d9ce3a1SRobert Watson } 10150c1bb4fbSDima Dorfman /* 10160c1bb4fbSDima Dorfman * unp_peercred management: 10170c1bb4fbSDima Dorfman * 10181c381b19SRobert Watson * The connecter's (client's) credentials are copied from its 10191c381b19SRobert Watson * process structure at the time of connect() (which is now). 10200c1bb4fbSDima Dorfman */ 1021a854ed98SJohn Baldwin cru2x(td->td_ucred, &unp3->unp_peercred); 10220c1bb4fbSDima Dorfman unp3->unp_flags |= UNP_HAVEPC; 10230c1bb4fbSDima Dorfman /* 10241c381b19SRobert Watson * The receiver's (server's) credentials are copied from the 10251c381b19SRobert Watson * unp_peercred member of socket on which the former called 10261c381b19SRobert Watson * listen(); unp_listen() cached that process's credentials 10271c381b19SRobert Watson * at that time so we can use them now. 10280c1bb4fbSDima Dorfman */ 10290c1bb4fbSDima Dorfman KASSERT(unp2->unp_flags & UNP_HAVEPCCACHED, 10300c1bb4fbSDima Dorfman ("unp_connect: listener without cached peercred")); 10310c1bb4fbSDima Dorfman memcpy(&unp->unp_peercred, &unp2->unp_peercred, 10320c1bb4fbSDima Dorfman sizeof(unp->unp_peercred)); 10330c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPC; 1034481f8fe8SMaxim Konovalov if (unp2->unp_flags & UNP_WANTCRED) 1035481f8fe8SMaxim Konovalov unp3->unp_flags |= UNP_WANTCRED; 1036335654d7SRobert Watson #ifdef MAC 1037310e7cebSRobert Watson SOCK_LOCK(so); 1038335654d7SRobert Watson mac_set_socket_peer_from_socket(so, so3); 1039335654d7SRobert Watson mac_set_socket_peer_from_socket(so3, so); 1040310e7cebSRobert Watson SOCK_UNLOCK(so); 1041335654d7SRobert Watson #endif 10420c1bb4fbSDima Dorfman 1043df8bae1dSRodney W. Grimes so2 = so3; 1044df8bae1dSRodney W. Grimes } 10456a2989fdSMatthew N. Dodd error = unp_connect2(so, so2, PRU_CONNECT); 10460d9ce3a1SRobert Watson bad2: 10470d9ce3a1SRobert Watson UNP_UNLOCK(); 10480d9ce3a1SRobert Watson mtx_lock(&Giant); 1049df8bae1dSRodney W. Grimes bad: 10500d9ce3a1SRobert Watson mtx_assert(&Giant, MA_OWNED); 10510d9ce3a1SRobert Watson if (vp != NULL) 1052df8bae1dSRodney W. Grimes vput(vp); 10530d9ce3a1SRobert Watson mtx_unlock(&Giant); 10540d9ce3a1SRobert Watson free(sa, M_SONAME); 10550d9ce3a1SRobert Watson UNP_LOCK(); 10564f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_CONNECTING; 1057df8bae1dSRodney W. Grimes return (error); 1058df8bae1dSRodney W. Grimes } 1059df8bae1dSRodney W. Grimes 1060db48c0d2SRobert Watson static int 10616a2989fdSMatthew N. Dodd unp_connect2(struct socket *so, struct socket *so2, int req) 1062df8bae1dSRodney W. Grimes { 1063892af6b9SRobert Watson struct unpcb *unp = sotounpcb(so); 1064892af6b9SRobert Watson struct unpcb *unp2; 1065df8bae1dSRodney W. Grimes 10660d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 10670d9ce3a1SRobert Watson 1068df8bae1dSRodney W. Grimes if (so2->so_type != so->so_type) 1069df8bae1dSRodney W. Grimes return (EPROTOTYPE); 1070df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 10714d4b555eSRobert Watson KASSERT(unp2 != NULL, ("unp_connect2: unp2 == NULL")); 1072df8bae1dSRodney W. Grimes unp->unp_conn = unp2; 1073df8bae1dSRodney W. Grimes switch (so->so_type) { 1074df8bae1dSRodney W. Grimes case SOCK_DGRAM: 107598271db4SGarrett Wollman LIST_INSERT_HEAD(&unp2->unp_refs, unp, unp_reflink); 1076df8bae1dSRodney W. Grimes soisconnected(so); 1077df8bae1dSRodney W. Grimes break; 1078df8bae1dSRodney W. Grimes 1079df8bae1dSRodney W. Grimes case SOCK_STREAM: 1080df8bae1dSRodney W. Grimes unp2->unp_conn = unp; 10816a2989fdSMatthew N. Dodd if (req == PRU_CONNECT && 10826a2989fdSMatthew N. Dodd ((unp->unp_flags | unp2->unp_flags) & UNP_CONNWAIT)) 10836a2989fdSMatthew N. Dodd soisconnecting(so); 10846a2989fdSMatthew N. Dodd else 1085df8bae1dSRodney W. Grimes soisconnected(so); 1086df8bae1dSRodney W. Grimes soisconnected(so2); 1087df8bae1dSRodney W. Grimes break; 1088df8bae1dSRodney W. Grimes 1089df8bae1dSRodney W. Grimes default: 1090df8bae1dSRodney W. Grimes panic("unp_connect2"); 1091df8bae1dSRodney W. Grimes } 1092df8bae1dSRodney W. Grimes return (0); 1093df8bae1dSRodney W. Grimes } 1094df8bae1dSRodney W. Grimes 1095f708ef1bSPoul-Henning Kamp static void 1096892af6b9SRobert Watson unp_disconnect(struct unpcb *unp) 1097df8bae1dSRodney W. Grimes { 1098892af6b9SRobert Watson struct unpcb *unp2 = unp->unp_conn; 10991b2e3b4bSRobert Watson struct socket *so; 1100df8bae1dSRodney W. Grimes 11010d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 11020d9ce3a1SRobert Watson 1103fc3fcacfSRobert Watson if (unp2 == NULL) 1104df8bae1dSRodney W. Grimes return; 1105fc3fcacfSRobert Watson unp->unp_conn = NULL; 1106df8bae1dSRodney W. Grimes switch (unp->unp_socket->so_type) { 1107df8bae1dSRodney W. Grimes case SOCK_DGRAM: 110898271db4SGarrett Wollman LIST_REMOVE(unp, unp_reflink); 11091b2e3b4bSRobert Watson so = unp->unp_socket; 11101b2e3b4bSRobert Watson SOCK_LOCK(so); 11111b2e3b4bSRobert Watson so->so_state &= ~SS_ISCONNECTED; 11121b2e3b4bSRobert Watson SOCK_UNLOCK(so); 1113df8bae1dSRodney W. Grimes break; 1114df8bae1dSRodney W. Grimes 1115df8bae1dSRodney W. Grimes case SOCK_STREAM: 1116df8bae1dSRodney W. Grimes soisdisconnected(unp->unp_socket); 1117fc3fcacfSRobert Watson unp2->unp_conn = NULL; 1118df8bae1dSRodney W. Grimes soisdisconnected(unp2->unp_socket); 1119df8bae1dSRodney W. Grimes break; 1120df8bae1dSRodney W. Grimes } 1121df8bae1dSRodney W. Grimes } 1122df8bae1dSRodney W. Grimes 11230d9ce3a1SRobert Watson /* 11241c381b19SRobert Watson * unp_pcblist() assumes that UNIX domain socket memory is never reclaimed by 11251c381b19SRobert Watson * the zone (UMA_ZONE_NOFREE), and as such potentially stale pointers are 11261c381b19SRobert Watson * safe to reference. It first scans the list of struct unpcb's to generate 11271c381b19SRobert Watson * a pointer list, then it rescans its list one entry at a time to 11280d9ce3a1SRobert Watson * externalize and copyout. It checks the generation number to see if a 11290d9ce3a1SRobert Watson * struct unpcb has been reused, and will skip it if so. 11300d9ce3a1SRobert Watson */ 113198271db4SGarrett Wollman static int 113282d9ae4eSPoul-Henning Kamp unp_pcblist(SYSCTL_HANDLER_ARGS) 113398271db4SGarrett Wollman { 1134f5ef029eSPoul-Henning Kamp int error, i, n; 11359ae328fcSJohn Baldwin int freeunp; 113698271db4SGarrett Wollman struct unpcb *unp, **unp_list; 113798271db4SGarrett Wollman unp_gen_t gencnt; 11388f364875SJulian Elischer struct xunpgen *xug; 113998271db4SGarrett Wollman struct unp_head *head; 11408f364875SJulian Elischer struct xunpcb *xu; 114198271db4SGarrett Wollman 1142a23d65bfSBruce Evans head = ((intptr_t)arg1 == SOCK_DGRAM ? &unp_dhead : &unp_shead); 114398271db4SGarrett Wollman 114498271db4SGarrett Wollman /* 114598271db4SGarrett Wollman * The process of preparing the PCB list is too time-consuming and 114698271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 114798271db4SGarrett Wollman */ 1148fc3fcacfSRobert Watson if (req->oldptr == NULL) { 114998271db4SGarrett Wollman n = unp_count; 11508f364875SJulian Elischer req->oldidx = 2 * (sizeof *xug) 115198271db4SGarrett Wollman + (n + n/8) * sizeof(struct xunpcb); 1152e5aeaa0cSDag-Erling Smørgrav return (0); 115398271db4SGarrett Wollman } 115498271db4SGarrett Wollman 1155fc3fcacfSRobert Watson if (req->newptr != NULL) 1156e5aeaa0cSDag-Erling Smørgrav return (EPERM); 115798271db4SGarrett Wollman 115898271db4SGarrett Wollman /* 115998271db4SGarrett Wollman * OK, now we're committed to doing something. 116098271db4SGarrett Wollman */ 1161a163d034SWarner Losh xug = malloc(sizeof(*xug), M_TEMP, M_WAITOK); 11620d9ce3a1SRobert Watson UNP_LOCK(); 116398271db4SGarrett Wollman gencnt = unp_gencnt; 116498271db4SGarrett Wollman n = unp_count; 11650d9ce3a1SRobert Watson UNP_UNLOCK(); 116698271db4SGarrett Wollman 11678f364875SJulian Elischer xug->xug_len = sizeof *xug; 11688f364875SJulian Elischer xug->xug_count = n; 11698f364875SJulian Elischer xug->xug_gen = gencnt; 11708f364875SJulian Elischer xug->xug_sogen = so_gencnt; 11718f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 11728f364875SJulian Elischer if (error) { 11738f364875SJulian Elischer free(xug, M_TEMP); 1174e5aeaa0cSDag-Erling Smørgrav return (error); 11758f364875SJulian Elischer } 117698271db4SGarrett Wollman 1177a163d034SWarner Losh unp_list = malloc(n * sizeof *unp_list, M_TEMP, M_WAITOK); 117898271db4SGarrett Wollman 11790d9ce3a1SRobert Watson UNP_LOCK(); 11802e3c8fcbSPoul-Henning Kamp for (unp = LIST_FIRST(head), i = 0; unp && i < n; 11812e3c8fcbSPoul-Henning Kamp unp = LIST_NEXT(unp, unp_link)) { 11828a7d8cc6SRobert Watson if (unp->unp_gencnt <= gencnt) { 1183a854ed98SJohn Baldwin if (cr_cansee(req->td->td_ucred, 11848a7d8cc6SRobert Watson unp->unp_socket->so_cred)) 11854787fd37SPaul Saab continue; 118698271db4SGarrett Wollman unp_list[i++] = unp; 11879ae328fcSJohn Baldwin unp->unp_refcount++; 118898271db4SGarrett Wollman } 11894787fd37SPaul Saab } 11900d9ce3a1SRobert Watson UNP_UNLOCK(); 11911c381b19SRobert Watson n = i; /* In case we lost some during malloc. */ 119298271db4SGarrett Wollman 119398271db4SGarrett Wollman error = 0; 1194fe2eee82SColin Percival xu = malloc(sizeof(*xu), M_TEMP, M_WAITOK | M_ZERO); 119598271db4SGarrett Wollman for (i = 0; i < n; i++) { 119698271db4SGarrett Wollman unp = unp_list[i]; 11979ae328fcSJohn Baldwin UNP_LOCK(); 11989ae328fcSJohn Baldwin unp->unp_refcount--; 11999ae328fcSJohn Baldwin if (unp->unp_refcount != 0 && unp->unp_gencnt <= gencnt) { 12008f364875SJulian Elischer xu->xu_len = sizeof *xu; 12018f364875SJulian Elischer xu->xu_unpp = unp; 120298271db4SGarrett Wollman /* 120398271db4SGarrett Wollman * XXX - need more locking here to protect against 120498271db4SGarrett Wollman * connect/disconnect races for SMP. 120598271db4SGarrett Wollman */ 1206fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 12078f364875SJulian Elischer bcopy(unp->unp_addr, &xu->xu_addr, 120898271db4SGarrett Wollman unp->unp_addr->sun_len); 1209fc3fcacfSRobert Watson if (unp->unp_conn != NULL && 1210fc3fcacfSRobert Watson unp->unp_conn->unp_addr != NULL) 121198271db4SGarrett Wollman bcopy(unp->unp_conn->unp_addr, 12128f364875SJulian Elischer &xu->xu_caddr, 121398271db4SGarrett Wollman unp->unp_conn->unp_addr->sun_len); 12148f364875SJulian Elischer bcopy(unp, &xu->xu_unp, sizeof *unp); 12158f364875SJulian Elischer sotoxsocket(unp->unp_socket, &xu->xu_socket); 12169ae328fcSJohn Baldwin UNP_UNLOCK(); 12178f364875SJulian Elischer error = SYSCTL_OUT(req, xu, sizeof *xu); 12189ae328fcSJohn Baldwin } else { 12199ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 12209ae328fcSJohn Baldwin UNP_UNLOCK(); 12219ae328fcSJohn Baldwin if (freeunp) 12229ae328fcSJohn Baldwin uma_zfree(unp_zone, unp); 122398271db4SGarrett Wollman } 122498271db4SGarrett Wollman } 12258f364875SJulian Elischer free(xu, M_TEMP); 122698271db4SGarrett Wollman if (!error) { 122798271db4SGarrett Wollman /* 12281c381b19SRobert Watson * Give the user an updated idea of our state. If the 12291c381b19SRobert Watson * generation differs from what we told her before, she knows 12301c381b19SRobert Watson * that something happened while we were processing this 12311c381b19SRobert Watson * request, and it might be necessary to retry. 123298271db4SGarrett Wollman */ 12338f364875SJulian Elischer xug->xug_gen = unp_gencnt; 12348f364875SJulian Elischer xug->xug_sogen = so_gencnt; 12358f364875SJulian Elischer xug->xug_count = unp_count; 12368f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 123798271db4SGarrett Wollman } 123898271db4SGarrett Wollman free(unp_list, M_TEMP); 12398f364875SJulian Elischer free(xug, M_TEMP); 1240e5aeaa0cSDag-Erling Smørgrav return (error); 124198271db4SGarrett Wollman } 124298271db4SGarrett Wollman 124398271db4SGarrett Wollman SYSCTL_PROC(_net_local_dgram, OID_AUTO, pcblist, CTLFLAG_RD, 124498271db4SGarrett Wollman (caddr_t)(long)SOCK_DGRAM, 0, unp_pcblist, "S,xunpcb", 124598271db4SGarrett Wollman "List of active local datagram sockets"); 124698271db4SGarrett Wollman SYSCTL_PROC(_net_local_stream, OID_AUTO, pcblist, CTLFLAG_RD, 124798271db4SGarrett Wollman (caddr_t)(long)SOCK_STREAM, 0, unp_pcblist, "S,xunpcb", 124898271db4SGarrett Wollman "List of active local stream sockets"); 124998271db4SGarrett Wollman 1250f708ef1bSPoul-Henning Kamp static void 1251892af6b9SRobert Watson unp_shutdown(struct unpcb *unp) 1252df8bae1dSRodney W. Grimes { 1253df8bae1dSRodney W. Grimes struct socket *so; 1254df8bae1dSRodney W. Grimes 12550d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 12560d9ce3a1SRobert Watson 1257df8bae1dSRodney W. Grimes if (unp->unp_socket->so_type == SOCK_STREAM && unp->unp_conn && 1258df8bae1dSRodney W. Grimes (so = unp->unp_conn->unp_socket)) 1259df8bae1dSRodney W. Grimes socantrcvmore(so); 1260df8bae1dSRodney W. Grimes } 1261df8bae1dSRodney W. Grimes 1262f708ef1bSPoul-Henning Kamp static void 1263892af6b9SRobert Watson unp_drop(struct unpcb *unp, int errno) 1264df8bae1dSRodney W. Grimes { 1265df8bae1dSRodney W. Grimes struct socket *so = unp->unp_socket; 1266df8bae1dSRodney W. Grimes 12670d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 12680d9ce3a1SRobert Watson 1269df8bae1dSRodney W. Grimes so->so_error = errno; 1270df8bae1dSRodney W. Grimes unp_disconnect(unp); 1271df8bae1dSRodney W. Grimes } 1272df8bae1dSRodney W. Grimes 12732bc21ed9SDavid Malone static void 1274892af6b9SRobert Watson unp_freerights(struct file **rp, int fdcount) 1275df8bae1dSRodney W. Grimes { 12762bc21ed9SDavid Malone int i; 12772bc21ed9SDavid Malone struct file *fp; 1278df8bae1dSRodney W. Grimes 12792bc21ed9SDavid Malone for (i = 0; i < fdcount; i++) { 1280df8bae1dSRodney W. Grimes fp = *rp; 12818692c025SYoshinobu Inoue /* 12821c381b19SRobert Watson * Zero the pointer before calling unp_discard since it may 12831c381b19SRobert Watson * end up in unp_gc().. 1284d7dca903SRobert Watson * 1285d7dca903SRobert Watson * XXXRW: This is less true than it used to be. 12868692c025SYoshinobu Inoue */ 1287df8bae1dSRodney W. Grimes *rp++ = 0; 12888692c025SYoshinobu Inoue unp_discard(fp); 1289df8bae1dSRodney W. Grimes } 12902bc21ed9SDavid Malone } 12912bc21ed9SDavid Malone 12922bc21ed9SDavid Malone int 1293892af6b9SRobert Watson unp_externalize(struct mbuf *control, struct mbuf **controlp) 12942bc21ed9SDavid Malone { 12952bc21ed9SDavid Malone struct thread *td = curthread; /* XXX */ 12962bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 12972bc21ed9SDavid Malone int i; 12982bc21ed9SDavid Malone int *fdp; 12992bc21ed9SDavid Malone struct file **rp; 13002bc21ed9SDavid Malone struct file *fp; 13012bc21ed9SDavid Malone void *data; 13022bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 13032bc21ed9SDavid Malone int error, newfds; 13042bc21ed9SDavid Malone int f; 13052bc21ed9SDavid Malone u_int newlen; 13062bc21ed9SDavid Malone 13074c5bc1caSRobert Watson UNP_UNLOCK_ASSERT(); 13084c5bc1caSRobert Watson 13092bc21ed9SDavid Malone error = 0; 13102bc21ed9SDavid Malone if (controlp != NULL) /* controlp == NULL => free control messages */ 13112bc21ed9SDavid Malone *controlp = NULL; 13122bc21ed9SDavid Malone 13132bc21ed9SDavid Malone while (cm != NULL) { 13142bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) { 13152bc21ed9SDavid Malone error = EINVAL; 13162bc21ed9SDavid Malone break; 13172bc21ed9SDavid Malone } 13182bc21ed9SDavid Malone 13192bc21ed9SDavid Malone data = CMSG_DATA(cm); 13202bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 13212bc21ed9SDavid Malone 13222bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET 13232bc21ed9SDavid Malone && cm->cmsg_type == SCM_RIGHTS) { 13242bc21ed9SDavid Malone newfds = datalen / sizeof(struct file *); 13252bc21ed9SDavid Malone rp = data; 13262bc21ed9SDavid Malone 1327e2f9a08bSOlivier Houchard /* If we're not outputting the descriptors free them. */ 13282bc21ed9SDavid Malone if (error || controlp == NULL) { 13292bc21ed9SDavid Malone unp_freerights(rp, newfds); 13302bc21ed9SDavid Malone goto next; 13312bc21ed9SDavid Malone } 1332426da3bcSAlfred Perlstein FILEDESC_LOCK(td->td_proc->p_fd); 13332bc21ed9SDavid Malone /* if the new FD's will not fit free them. */ 13342bc21ed9SDavid Malone if (!fdavail(td, newfds)) { 1335426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13362bc21ed9SDavid Malone error = EMSGSIZE; 13372bc21ed9SDavid Malone unp_freerights(rp, newfds); 13382bc21ed9SDavid Malone goto next; 1339df8bae1dSRodney W. Grimes } 1340ed5b7817SJulian Elischer /* 13411c381b19SRobert Watson * Now change each pointer to an fd in the global 13421c381b19SRobert Watson * table to an integer that is the index to the local 13431c381b19SRobert Watson * fd table entry that we set up to point to the 13441c381b19SRobert Watson * global one we are transferring. 1345ed5b7817SJulian Elischer */ 13462bc21ed9SDavid Malone newlen = newfds * sizeof(int); 13472bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 13482bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 13492bc21ed9SDavid Malone if (*controlp == NULL) { 1350426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13512bc21ed9SDavid Malone error = E2BIG; 13522bc21ed9SDavid Malone unp_freerights(rp, newfds); 13532bc21ed9SDavid Malone goto next; 13542bc21ed9SDavid Malone } 13552bc21ed9SDavid Malone 13562bc21ed9SDavid Malone fdp = (int *) 13572bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 1358df8bae1dSRodney W. Grimes for (i = 0; i < newfds; i++) { 1359a6d4491cSDag-Erling Smørgrav if (fdalloc(td, 0, &f)) 13602bc21ed9SDavid Malone panic("unp_externalize fdalloc failed"); 13618692c025SYoshinobu Inoue fp = *rp++; 1362b40ce416SJulian Elischer td->td_proc->p_fd->fd_ofiles[f] = fp; 1363426da3bcSAlfred Perlstein FILE_LOCK(fp); 1364df8bae1dSRodney W. Grimes fp->f_msgcount--; 1365426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1366df8bae1dSRodney W. Grimes unp_rights--; 13678692c025SYoshinobu Inoue *fdp++ = f; 1368df8bae1dSRodney W. Grimes } 1369426da3bcSAlfred Perlstein FILEDESC_UNLOCK(td->td_proc->p_fd); 13701c381b19SRobert Watson } else { 13711c381b19SRobert Watson /* We can just copy anything else across. */ 13722bc21ed9SDavid Malone if (error || controlp == NULL) 13732bc21ed9SDavid Malone goto next; 13742bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, datalen, 13752bc21ed9SDavid Malone cm->cmsg_type, cm->cmsg_level); 13762bc21ed9SDavid Malone if (*controlp == NULL) { 13772bc21ed9SDavid Malone error = ENOBUFS; 13782bc21ed9SDavid Malone goto next; 13792bc21ed9SDavid Malone } 13802bc21ed9SDavid Malone bcopy(data, 13812bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)), 13822bc21ed9SDavid Malone datalen); 13832bc21ed9SDavid Malone } 13842bc21ed9SDavid Malone 13852bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 13862bc21ed9SDavid Malone 13872bc21ed9SDavid Malone next: 13882bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 13892bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 13902bc21ed9SDavid Malone cm = (struct cmsghdr *) 13912bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 13928692c025SYoshinobu Inoue } else { 13932bc21ed9SDavid Malone clen = 0; 13942bc21ed9SDavid Malone cm = NULL; 13958692c025SYoshinobu Inoue } 13968692c025SYoshinobu Inoue } 13978692c025SYoshinobu Inoue 13982bc21ed9SDavid Malone m_freem(control); 13992bc21ed9SDavid Malone 14002bc21ed9SDavid Malone return (error); 1401df8bae1dSRodney W. Grimes } 1402df8bae1dSRodney W. Grimes 14034f590175SPaul Saab static void 14044f590175SPaul Saab unp_zone_change(void *tag) 14054f590175SPaul Saab { 14064f590175SPaul Saab 14074f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 14084f590175SPaul Saab } 14094f590175SPaul Saab 141098271db4SGarrett Wollman void 141198271db4SGarrett Wollman unp_init(void) 141298271db4SGarrett Wollman { 14131c381b19SRobert Watson 14149e9d298aSJeff Roberson unp_zone = uma_zcreate("unpcb", sizeof(struct unpcb), NULL, NULL, 14159ae328fcSJohn Baldwin NULL, NULL, UMA_ALIGN_PTR, 0); 1416fc3fcacfSRobert Watson if (unp_zone == NULL) 141798271db4SGarrett Wollman panic("unp_init"); 14184f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 14194f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, unp_zone_change, 14204f590175SPaul Saab NULL, EVENTHANDLER_PRI_ANY); 142198271db4SGarrett Wollman LIST_INIT(&unp_dhead); 142298271db4SGarrett Wollman LIST_INIT(&unp_shead); 1423a0ec558aSRobert Watson TASK_INIT(&unp_gc_task, 0, unp_gc, NULL); 14240d9ce3a1SRobert Watson UNP_LOCK_INIT(); 142598271db4SGarrett Wollman } 142698271db4SGarrett Wollman 1427f708ef1bSPoul-Henning Kamp static int 1428892af6b9SRobert Watson unp_internalize(struct mbuf **controlp, struct thread *td) 1429df8bae1dSRodney W. Grimes { 14302bc21ed9SDavid Malone struct mbuf *control = *controlp; 1431b40ce416SJulian Elischer struct proc *p = td->td_proc; 14328692c025SYoshinobu Inoue struct filedesc *fdescp = p->p_fd; 14332bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 14342bc21ed9SDavid Malone struct cmsgcred *cmcred; 14352bc21ed9SDavid Malone struct file **rp; 14362bc21ed9SDavid Malone struct file *fp; 14372bc21ed9SDavid Malone struct timeval *tv; 14382bc21ed9SDavid Malone int i, fd, *fdp; 14392bc21ed9SDavid Malone void *data; 14402bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 14412bc21ed9SDavid Malone int error, oldfds; 14428692c025SYoshinobu Inoue u_int newlen; 1443df8bae1dSRodney W. Grimes 14444c5bc1caSRobert Watson UNP_UNLOCK_ASSERT(); 14454c5bc1caSRobert Watson 14462bc21ed9SDavid Malone error = 0; 14472bc21ed9SDavid Malone *controlp = NULL; 14480b788fa1SBill Paul 14492bc21ed9SDavid Malone while (cm != NULL) { 14502bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_level != SOL_SOCKET 14512bc21ed9SDavid Malone || cm->cmsg_len > clen) { 14522bc21ed9SDavid Malone error = EINVAL; 14532bc21ed9SDavid Malone goto out; 14542bc21ed9SDavid Malone } 14552bc21ed9SDavid Malone 14562bc21ed9SDavid Malone data = CMSG_DATA(cm); 14572bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 14582bc21ed9SDavid Malone 14592bc21ed9SDavid Malone switch (cm->cmsg_type) { 14600b788fa1SBill Paul /* 14610b788fa1SBill Paul * Fill in credential information. 14620b788fa1SBill Paul */ 14632bc21ed9SDavid Malone case SCM_CREDS: 14642bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*cmcred), 14652bc21ed9SDavid Malone SCM_CREDS, SOL_SOCKET); 14662bc21ed9SDavid Malone if (*controlp == NULL) { 14672bc21ed9SDavid Malone error = ENOBUFS; 14682bc21ed9SDavid Malone goto out; 14692bc21ed9SDavid Malone } 14702bc21ed9SDavid Malone 14712bc21ed9SDavid Malone cmcred = (struct cmsgcred *) 14722bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 14730b788fa1SBill Paul cmcred->cmcred_pid = p->p_pid; 1474a854ed98SJohn Baldwin cmcred->cmcred_uid = td->td_ucred->cr_ruid; 1475a854ed98SJohn Baldwin cmcred->cmcred_gid = td->td_ucred->cr_rgid; 1476a854ed98SJohn Baldwin cmcred->cmcred_euid = td->td_ucred->cr_uid; 1477a854ed98SJohn Baldwin cmcred->cmcred_ngroups = MIN(td->td_ucred->cr_ngroups, 14780b788fa1SBill Paul CMGROUP_MAX); 14790b788fa1SBill Paul for (i = 0; i < cmcred->cmcred_ngroups; i++) 14802bc21ed9SDavid Malone cmcred->cmcred_groups[i] = 1481a854ed98SJohn Baldwin td->td_ucred->cr_groups[i]; 14822bc21ed9SDavid Malone break; 14830b788fa1SBill Paul 14842bc21ed9SDavid Malone case SCM_RIGHTS: 14852bc21ed9SDavid Malone oldfds = datalen / sizeof (int); 1486ed5b7817SJulian Elischer /* 14871c381b19SRobert Watson * Check that all the FDs passed in refer to legal 14881c381b19SRobert Watson * files. If not, reject the entire operation. 1489ed5b7817SJulian Elischer */ 14902bc21ed9SDavid Malone fdp = data; 1491426da3bcSAlfred Perlstein FILEDESC_LOCK(fdescp); 1492df8bae1dSRodney W. Grimes for (i = 0; i < oldfds; i++) { 14938692c025SYoshinobu Inoue fd = *fdp++; 14948692c025SYoshinobu Inoue if ((unsigned)fd >= fdescp->fd_nfiles || 14952bc21ed9SDavid Malone fdescp->fd_ofiles[fd] == NULL) { 1496426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 14972bc21ed9SDavid Malone error = EBADF; 14982bc21ed9SDavid Malone goto out; 14992bc21ed9SDavid Malone } 1500e7d6662fSAlfred Perlstein fp = fdescp->fd_ofiles[fd]; 1501e7d6662fSAlfred Perlstein if (!(fp->f_ops->fo_flags & DFLAG_PASSABLE)) { 1502e7d6662fSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 1503e7d6662fSAlfred Perlstein error = EOPNOTSUPP; 1504e7d6662fSAlfred Perlstein goto out; 1505e7d6662fSAlfred Perlstein } 1506e7d6662fSAlfred Perlstein 1507df8bae1dSRodney W. Grimes } 1508ed5b7817SJulian Elischer /* 15091c381b19SRobert Watson * Now replace the integer FDs with pointers to the 15101c381b19SRobert Watson * associated global file table entry.. 1511ed5b7817SJulian Elischer */ 15122bc21ed9SDavid Malone newlen = oldfds * sizeof(struct file *); 15132bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 15142bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 15152bc21ed9SDavid Malone if (*controlp == NULL) { 1516426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 15172bc21ed9SDavid Malone error = E2BIG; 15182bc21ed9SDavid Malone goto out; 15198692c025SYoshinobu Inoue } 15208692c025SYoshinobu Inoue 15212bc21ed9SDavid Malone fdp = data; 15222bc21ed9SDavid Malone rp = (struct file **) 15232bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 15248692c025SYoshinobu Inoue for (i = 0; i < oldfds; i++) { 15258692c025SYoshinobu Inoue fp = fdescp->fd_ofiles[*fdp++]; 1526df8bae1dSRodney W. Grimes *rp++ = fp; 1527426da3bcSAlfred Perlstein FILE_LOCK(fp); 1528df8bae1dSRodney W. Grimes fp->f_count++; 1529df8bae1dSRodney W. Grimes fp->f_msgcount++; 1530426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1531df8bae1dSRodney W. Grimes unp_rights++; 1532df8bae1dSRodney W. Grimes } 1533426da3bcSAlfred Perlstein FILEDESC_UNLOCK(fdescp); 15342bc21ed9SDavid Malone break; 15352bc21ed9SDavid Malone 15362bc21ed9SDavid Malone case SCM_TIMESTAMP: 15372bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*tv), 15382bc21ed9SDavid Malone SCM_TIMESTAMP, SOL_SOCKET); 15392bc21ed9SDavid Malone if (*controlp == NULL) { 15402bc21ed9SDavid Malone error = ENOBUFS; 15412bc21ed9SDavid Malone goto out; 15428692c025SYoshinobu Inoue } 15432bc21ed9SDavid Malone tv = (struct timeval *) 15442bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 15452bc21ed9SDavid Malone microtime(tv); 15462bc21ed9SDavid Malone break; 15472bc21ed9SDavid Malone 15482bc21ed9SDavid Malone default: 15492bc21ed9SDavid Malone error = EINVAL; 15502bc21ed9SDavid Malone goto out; 15512bc21ed9SDavid Malone } 15522bc21ed9SDavid Malone 15532bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 15542bc21ed9SDavid Malone 15552bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 15562bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 15572bc21ed9SDavid Malone cm = (struct cmsghdr *) 15582bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 15592bc21ed9SDavid Malone } else { 15602bc21ed9SDavid Malone clen = 0; 15612bc21ed9SDavid Malone cm = NULL; 15622bc21ed9SDavid Malone } 15632bc21ed9SDavid Malone } 15642bc21ed9SDavid Malone 15652bc21ed9SDavid Malone out: 15662bc21ed9SDavid Malone m_freem(control); 15672bc21ed9SDavid Malone 15682bc21ed9SDavid Malone return (error); 1569df8bae1dSRodney W. Grimes } 1570df8bae1dSRodney W. Grimes 15716a2989fdSMatthew N. Dodd struct mbuf * 15726a2989fdSMatthew N. Dodd unp_addsockcred(struct thread *td, struct mbuf *control) 15736a2989fdSMatthew N. Dodd { 157470df31f4SMaxim Konovalov struct mbuf *m, *n, *n_prev; 15756a2989fdSMatthew N. Dodd struct sockcred *sc; 157670df31f4SMaxim Konovalov const struct cmsghdr *cm; 15776a2989fdSMatthew N. Dodd int ngroups; 15786a2989fdSMatthew N. Dodd int i; 15796a2989fdSMatthew N. Dodd 15806a2989fdSMatthew N. Dodd ngroups = MIN(td->td_ucred->cr_ngroups, CMGROUP_MAX); 15816a2989fdSMatthew N. Dodd 15826a2989fdSMatthew N. Dodd m = sbcreatecontrol(NULL, SOCKCREDSIZE(ngroups), SCM_CREDS, SOL_SOCKET); 15836a2989fdSMatthew N. Dodd if (m == NULL) 15846a2989fdSMatthew N. Dodd return (control); 15856a2989fdSMatthew N. Dodd 15866a2989fdSMatthew N. Dodd sc = (struct sockcred *) CMSG_DATA(mtod(m, struct cmsghdr *)); 15876a2989fdSMatthew N. Dodd sc->sc_uid = td->td_ucred->cr_ruid; 15886a2989fdSMatthew N. Dodd sc->sc_euid = td->td_ucred->cr_uid; 15896a2989fdSMatthew N. Dodd sc->sc_gid = td->td_ucred->cr_rgid; 15906a2989fdSMatthew N. Dodd sc->sc_egid = td->td_ucred->cr_gid; 15916a2989fdSMatthew N. Dodd sc->sc_ngroups = ngroups; 15926a2989fdSMatthew N. Dodd for (i = 0; i < sc->sc_ngroups; i++) 15936a2989fdSMatthew N. Dodd sc->sc_groups[i] = td->td_ucred->cr_groups[i]; 15946a2989fdSMatthew N. Dodd 15956a2989fdSMatthew N. Dodd /* 15961c381b19SRobert Watson * Unlink SCM_CREDS control messages (struct cmsgcred), since just 15971c381b19SRobert Watson * created SCM_CREDS control message (struct sockcred) has another 15981c381b19SRobert Watson * format. 15996a2989fdSMatthew N. Dodd */ 160070df31f4SMaxim Konovalov if (control != NULL) 160170df31f4SMaxim Konovalov for (n = control, n_prev = NULL; n != NULL;) { 160270df31f4SMaxim Konovalov cm = mtod(n, struct cmsghdr *); 160370df31f4SMaxim Konovalov if (cm->cmsg_level == SOL_SOCKET && 160470df31f4SMaxim Konovalov cm->cmsg_type == SCM_CREDS) { 160570df31f4SMaxim Konovalov if (n_prev == NULL) 160670df31f4SMaxim Konovalov control = n->m_next; 160770df31f4SMaxim Konovalov else 160870df31f4SMaxim Konovalov n_prev->m_next = n->m_next; 160970df31f4SMaxim Konovalov n = m_free(n); 161070df31f4SMaxim Konovalov } else { 161170df31f4SMaxim Konovalov n_prev = n; 161270df31f4SMaxim Konovalov n = n->m_next; 161370df31f4SMaxim Konovalov } 161470df31f4SMaxim Konovalov } 16156a2989fdSMatthew N. Dodd 161670df31f4SMaxim Konovalov /* Prepend it to the head. */ 161770df31f4SMaxim Konovalov m->m_next = control; 161870df31f4SMaxim Konovalov 161970df31f4SMaxim Konovalov return (m); 16206a2989fdSMatthew N. Dodd } 16216a2989fdSMatthew N. Dodd 1622161a0c7cSRobert Watson /* 1623a0ec558aSRobert Watson * unp_defer indicates whether additional work has been defered for a future 1624a0ec558aSRobert Watson * pass through unp_gc(). It is thread local and does not require explicit 1625a0ec558aSRobert Watson * synchronization. 1626161a0c7cSRobert Watson */ 1627a0ec558aSRobert Watson static int unp_defer; 1628a0ec558aSRobert Watson 1629a0ec558aSRobert Watson static int unp_taskcount; 1630a0ec558aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, taskcount, CTLFLAG_RD, &unp_taskcount, 0, ""); 1631a0ec558aSRobert Watson 1632a0ec558aSRobert Watson static int unp_recycled; 1633a0ec558aSRobert Watson SYSCTL_INT(_net_local, OID_AUTO, recycled, CTLFLAG_RD, &unp_recycled, 0, ""); 1634df8bae1dSRodney W. Grimes 1635f708ef1bSPoul-Henning Kamp static void 1636a0ec558aSRobert Watson unp_gc(__unused void *arg, int pending) 1637df8bae1dSRodney W. Grimes { 1638892af6b9SRobert Watson struct file *fp, *nextfp; 1639892af6b9SRobert Watson struct socket *so; 1640df8bae1dSRodney W. Grimes struct file **extra_ref, **fpp; 1641df8bae1dSRodney W. Grimes int nunref, i; 164295f004dcSAlfred Perlstein int nfiles_snap; 164395f004dcSAlfred Perlstein int nfiles_slack = 20; 1644df8bae1dSRodney W. Grimes 1645a0ec558aSRobert Watson unp_taskcount++; 1646df8bae1dSRodney W. Grimes unp_defer = 0; 1647ed5b7817SJulian Elischer /* 16489ae328fcSJohn Baldwin * Before going through all this, set all FDs to be NOT deferred and 16491c381b19SRobert Watson * NOT externally accessible. 1650ed5b7817SJulian Elischer */ 1651426da3bcSAlfred Perlstein sx_slock(&filelist_lock); 16522e3c8fcbSPoul-Henning Kamp LIST_FOREACH(fp, &filehead, f_list) 1653426da3bcSAlfred Perlstein fp->f_gcflag &= ~(FMARK|FDEFER); 1654df8bae1dSRodney W. Grimes do { 16555bb84bc8SRobert Watson KASSERT(unp_defer >= 0, ("unp_gc: unp_defer %d", unp_defer)); 16562e3c8fcbSPoul-Henning Kamp LIST_FOREACH(fp, &filehead, f_list) { 1657426da3bcSAlfred Perlstein FILE_LOCK(fp); 1658ed5b7817SJulian Elischer /* 1659a0ec558aSRobert Watson * If the file is not open, skip it -- could be a 1660a0ec558aSRobert Watson * file in the process of being opened, or in the 1661a0ec558aSRobert Watson * process of being closed. If the file is 1662a0ec558aSRobert Watson * "closing", it may have been marked for deferred 1663a0ec558aSRobert Watson * consideration. Clear the flag now if so. 1664ed5b7817SJulian Elischer */ 1665426da3bcSAlfred Perlstein if (fp->f_count == 0) { 1666a0ec558aSRobert Watson if (fp->f_gcflag & FDEFER) 1667a0ec558aSRobert Watson unp_defer--; 1668a0ec558aSRobert Watson fp->f_gcflag &= ~(FMARK|FDEFER); 1669426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1670df8bae1dSRodney W. Grimes continue; 1671426da3bcSAlfred Perlstein } 1672ed5b7817SJulian Elischer /* 16739ae328fcSJohn Baldwin * If we already marked it as 'defer' in a 16749ae328fcSJohn Baldwin * previous pass, then try to process it this 16759ae328fcSJohn Baldwin * time and un-mark it. 1676ed5b7817SJulian Elischer */ 1677426da3bcSAlfred Perlstein if (fp->f_gcflag & FDEFER) { 1678426da3bcSAlfred Perlstein fp->f_gcflag &= ~FDEFER; 1679df8bae1dSRodney W. Grimes unp_defer--; 1680df8bae1dSRodney W. Grimes } else { 1681ed5b7817SJulian Elischer /* 16829ae328fcSJohn Baldwin * if it's not deferred, then check if it's 1683ed5b7817SJulian Elischer * already marked.. if so skip it 1684ed5b7817SJulian Elischer */ 1685426da3bcSAlfred Perlstein if (fp->f_gcflag & FMARK) { 1686426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1687df8bae1dSRodney W. Grimes continue; 1688426da3bcSAlfred Perlstein } 1689ed5b7817SJulian Elischer /* 16901c381b19SRobert Watson * If all references are from messages in 16911c381b19SRobert Watson * transit, then skip it. it's not externally 16921c381b19SRobert Watson * accessible. 1693ed5b7817SJulian Elischer */ 1694426da3bcSAlfred Perlstein if (fp->f_count == fp->f_msgcount) { 1695426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1696df8bae1dSRodney W. Grimes continue; 1697426da3bcSAlfred Perlstein } 1698ed5b7817SJulian Elischer /* 1699ed5b7817SJulian Elischer * If it got this far then it must be 1700ed5b7817SJulian Elischer * externally accessible. 1701ed5b7817SJulian Elischer */ 1702426da3bcSAlfred Perlstein fp->f_gcflag |= FMARK; 1703df8bae1dSRodney W. Grimes } 1704ed5b7817SJulian Elischer /* 17059ae328fcSJohn Baldwin * Either it was deferred, or it is externally 17061c381b19SRobert Watson * accessible and not already marked so. Now check 17071c381b19SRobert Watson * if it is possibly one of OUR sockets. 1708ed5b7817SJulian Elischer */ 1709df8bae1dSRodney W. Grimes if (fp->f_type != DTYPE_SOCKET || 171048e3128bSMatthew Dillon (so = fp->f_data) == NULL) { 1711426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1712df8bae1dSRodney W. Grimes continue; 1713426da3bcSAlfred Perlstein } 1714748e0b0aSGarrett Wollman if (so->so_proto->pr_domain != &localdomain || 17159ae328fcSJohn Baldwin (so->so_proto->pr_flags & PR_RIGHTS) == 0) { 17169ae328fcSJohn Baldwin FILE_UNLOCK(fp); 1717df8bae1dSRodney W. Grimes continue; 17189ae328fcSJohn Baldwin } 17199ae328fcSJohn Baldwin 17209ae328fcSJohn Baldwin /* 17219ae328fcSJohn Baldwin * Tell any other threads that do a subsequent 17229ae328fcSJohn Baldwin * fdrop() that we are scanning the message 17239ae328fcSJohn Baldwin * buffers. 17249ae328fcSJohn Baldwin */ 17259ae328fcSJohn Baldwin fp->f_gcflag |= FWAIT; 17269ae328fcSJohn Baldwin FILE_UNLOCK(fp); 17279ae328fcSJohn Baldwin 1728ed5b7817SJulian Elischer /* 17291c381b19SRobert Watson * So, Ok, it's one of our sockets and it IS 17309ae328fcSJohn Baldwin * externally accessible (or was deferred). Now we 17311c381b19SRobert Watson * look to see if we hold any file descriptors in its 1732ed5b7817SJulian Elischer * message buffers. Follow those links and mark them 1733ed5b7817SJulian Elischer * as accessible too. 1734ed5b7817SJulian Elischer */ 17357717cf07SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 1736df8bae1dSRodney W. Grimes unp_scan(so->so_rcv.sb_mb, unp_mark); 17377717cf07SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 17389ae328fcSJohn Baldwin 17399ae328fcSJohn Baldwin /* 17409ae328fcSJohn Baldwin * Wake up any threads waiting in fdrop(). 17419ae328fcSJohn Baldwin */ 17429ae328fcSJohn Baldwin FILE_LOCK(fp); 17439ae328fcSJohn Baldwin fp->f_gcflag &= ~FWAIT; 17449ae328fcSJohn Baldwin wakeup(&fp->f_gcflag); 17459ae328fcSJohn Baldwin FILE_UNLOCK(fp); 1746df8bae1dSRodney W. Grimes } 1747df8bae1dSRodney W. Grimes } while (unp_defer); 1748426da3bcSAlfred Perlstein sx_sunlock(&filelist_lock); 1749df8bae1dSRodney W. Grimes /* 1750a0ec558aSRobert Watson * XXXRW: The following comments need updating for a post-SMPng and 1751a0ec558aSRobert Watson * deferred unp_gc() world, but are still generally accurate. 1752a0ec558aSRobert Watson * 17531c381b19SRobert Watson * We grab an extra reference to each of the file table entries that 17541c381b19SRobert Watson * are not otherwise accessible and then free the rights that are 17551c381b19SRobert Watson * stored in messages on them. 1756df8bae1dSRodney W. Grimes * 1757df8bae1dSRodney W. Grimes * The bug in the orginal code is a little tricky, so I'll describe 1758df8bae1dSRodney W. Grimes * what's wrong with it here. 1759df8bae1dSRodney W. Grimes * 1760df8bae1dSRodney W. Grimes * It is incorrect to simply unp_discard each entry for f_msgcount 1761df8bae1dSRodney W. Grimes * times -- consider the case of sockets A and B that contain 1762df8bae1dSRodney W. Grimes * references to each other. On a last close of some other socket, 1763df8bae1dSRodney W. Grimes * we trigger a gc since the number of outstanding rights (unp_rights) 1764a0ec558aSRobert Watson * is non-zero. If during the sweep phase the gc code unp_discards, 1765df8bae1dSRodney W. Grimes * we end up doing a (full) closef on the descriptor. A closef on A 1766df8bae1dSRodney W. Grimes * results in the following chain. Closef calls soo_close, which 1767df8bae1dSRodney W. Grimes * calls soclose. Soclose calls first (through the switch 1768df8bae1dSRodney W. Grimes * uipc_usrreq) unp_detach, which re-invokes unp_gc. Unp_gc simply 17691c381b19SRobert Watson * returns because the previous instance had set unp_gcing, and we 17701c381b19SRobert Watson * return all the way back to soclose, which marks the socket with 17711c381b19SRobert Watson * SS_NOFDREF, and then calls sofree. Sofree calls sorflush to free 17721c381b19SRobert Watson * up the rights that are queued in messages on the socket A, i.e., 17731c381b19SRobert Watson * the reference on B. The sorflush calls via the dom_dispose switch 17741c381b19SRobert Watson * unp_dispose, which unp_scans with unp_discard. This second 1775df8bae1dSRodney W. Grimes * instance of unp_discard just calls closef on B. 1776df8bae1dSRodney W. Grimes * 1777df8bae1dSRodney W. Grimes * Well, a similar chain occurs on B, resulting in a sorflush on B, 1778df8bae1dSRodney W. Grimes * which results in another closef on A. Unfortunately, A is already 1779df8bae1dSRodney W. Grimes * being closed, and the descriptor has already been marked with 1780df8bae1dSRodney W. Grimes * SS_NOFDREF, and soclose panics at this point. 1781df8bae1dSRodney W. Grimes * 1782df8bae1dSRodney W. Grimes * Here, we first take an extra reference to each inaccessible 17831c381b19SRobert Watson * descriptor. Then, we call sorflush ourself, since we know it is a 17841c381b19SRobert Watson * Unix domain socket anyhow. After we destroy all the rights 17851c381b19SRobert Watson * carried in messages, we do a last closef to get rid of our extra 17861c381b19SRobert Watson * reference. This is the last close, and the unp_detach etc will 17871c381b19SRobert Watson * shut down the socket. 1788df8bae1dSRodney W. Grimes * 1789df8bae1dSRodney W. Grimes * 91/09/19, bsy@cs.cmu.edu 1790df8bae1dSRodney W. Grimes */ 179195f004dcSAlfred Perlstein again: 1792e4643c73SPoul-Henning Kamp nfiles_snap = openfiles + nfiles_slack; /* some slack */ 179395f004dcSAlfred Perlstein extra_ref = malloc(nfiles_snap * sizeof(struct file *), M_TEMP, 179495f004dcSAlfred Perlstein M_WAITOK); 1795426da3bcSAlfred Perlstein sx_slock(&filelist_lock); 1796e4643c73SPoul-Henning Kamp if (nfiles_snap < openfiles) { 179795f004dcSAlfred Perlstein sx_sunlock(&filelist_lock); 179895f004dcSAlfred Perlstein free(extra_ref, M_TEMP); 179995f004dcSAlfred Perlstein nfiles_slack += 20; 180095f004dcSAlfred Perlstein goto again; 180195f004dcSAlfred Perlstein } 1802fc3fcacfSRobert Watson for (nunref = 0, fp = LIST_FIRST(&filehead), fpp = extra_ref; 1803fc3fcacfSRobert Watson fp != NULL; fp = nextfp) { 18042e3c8fcbSPoul-Henning Kamp nextfp = LIST_NEXT(fp, f_list); 1805426da3bcSAlfred Perlstein FILE_LOCK(fp); 1806ed5b7817SJulian Elischer /* 1807ed5b7817SJulian Elischer * If it's not open, skip it 1808ed5b7817SJulian Elischer */ 1809426da3bcSAlfred Perlstein if (fp->f_count == 0) { 1810426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1811df8bae1dSRodney W. Grimes continue; 1812426da3bcSAlfred Perlstein } 1813ed5b7817SJulian Elischer /* 1814ed5b7817SJulian Elischer * If all refs are from msgs, and it's not marked accessible 18151c381b19SRobert Watson * then it must be referenced from some unreachable cycle of 18161c381b19SRobert Watson * (shut-down) FDs, so include it in our list of FDs to 18171c381b19SRobert Watson * remove. 1818ed5b7817SJulian Elischer */ 1819426da3bcSAlfred Perlstein if (fp->f_count == fp->f_msgcount && !(fp->f_gcflag & FMARK)) { 1820df8bae1dSRodney W. Grimes *fpp++ = fp; 1821df8bae1dSRodney W. Grimes nunref++; 1822df8bae1dSRodney W. Grimes fp->f_count++; 1823df8bae1dSRodney W. Grimes } 1824426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1825df8bae1dSRodney W. Grimes } 1826426da3bcSAlfred Perlstein sx_sunlock(&filelist_lock); 1827ed5b7817SJulian Elischer /* 18281c381b19SRobert Watson * For each FD on our hit list, do the following two things: 1829ed5b7817SJulian Elischer */ 18301c7c3c6aSMatthew Dillon for (i = nunref, fpp = extra_ref; --i >= 0; ++fpp) { 18311c7c3c6aSMatthew Dillon struct file *tfp = *fpp; 1832426da3bcSAlfred Perlstein FILE_LOCK(tfp); 1833cd72f218SMatthew Dillon if (tfp->f_type == DTYPE_SOCKET && 183448e3128bSMatthew Dillon tfp->f_data != NULL) { 1835426da3bcSAlfred Perlstein FILE_UNLOCK(tfp); 183648e3128bSMatthew Dillon sorflush(tfp->f_data); 1837e5aeaa0cSDag-Erling Smørgrav } else { 1838426da3bcSAlfred Perlstein FILE_UNLOCK(tfp); 18391c7c3c6aSMatthew Dillon } 1840e5aeaa0cSDag-Erling Smørgrav } 1841a0ec558aSRobert Watson for (i = nunref, fpp = extra_ref; --i >= 0; ++fpp) { 1842b40ce416SJulian Elischer closef(*fpp, (struct thread *) NULL); 1843a0ec558aSRobert Watson unp_recycled++; 1844a0ec558aSRobert Watson } 1845210a5a71SAlfred Perlstein free(extra_ref, M_TEMP); 1846df8bae1dSRodney W. Grimes } 1847df8bae1dSRodney W. Grimes 184826f9a767SRodney W. Grimes void 1849892af6b9SRobert Watson unp_dispose(struct mbuf *m) 1850df8bae1dSRodney W. Grimes { 1851996c772fSJohn Dyson 1852df8bae1dSRodney W. Grimes if (m) 1853df8bae1dSRodney W. Grimes unp_scan(m, unp_discard); 1854df8bae1dSRodney W. Grimes } 1855df8bae1dSRodney W. Grimes 18560c1bb4fbSDima Dorfman static int 1857d374e81eSRobert Watson unp_listen(struct socket *so, struct unpcb *unp, int backlog, 1858d374e81eSRobert Watson struct thread *td) 18590c1bb4fbSDima Dorfman { 18600daccb9cSRobert Watson int error; 18610daccb9cSRobert Watson 18620d9ce3a1SRobert Watson UNP_LOCK_ASSERT(); 18630c1bb4fbSDima Dorfman 18640daccb9cSRobert Watson SOCK_LOCK(so); 18650daccb9cSRobert Watson error = solisten_proto_check(so); 18660daccb9cSRobert Watson if (error == 0) { 18676f105b34SJohn Baldwin cru2x(td->td_ucred, &unp->unp_peercred); 18680c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPCCACHED; 1869d374e81eSRobert Watson solisten_proto(so, backlog); 18700daccb9cSRobert Watson } 18710daccb9cSRobert Watson SOCK_UNLOCK(so); 18720daccb9cSRobert Watson return (error); 18730c1bb4fbSDima Dorfman } 18740c1bb4fbSDima Dorfman 1875f708ef1bSPoul-Henning Kamp static void 1876892af6b9SRobert Watson unp_scan(struct mbuf *m0, void (*op)(struct file *)) 1877df8bae1dSRodney W. Grimes { 18782bc21ed9SDavid Malone struct mbuf *m; 18792bc21ed9SDavid Malone struct file **rp; 18802bc21ed9SDavid Malone struct cmsghdr *cm; 18812bc21ed9SDavid Malone void *data; 18822bc21ed9SDavid Malone int i; 18832bc21ed9SDavid Malone socklen_t clen, datalen; 1884df8bae1dSRodney W. Grimes int qfds; 1885df8bae1dSRodney W. Grimes 1886fc3fcacfSRobert Watson while (m0 != NULL) { 18872bc21ed9SDavid Malone for (m = m0; m; m = m->m_next) { 188812396bdcSDavid Malone if (m->m_type != MT_CONTROL) 1889df8bae1dSRodney W. Grimes continue; 18902bc21ed9SDavid Malone 18912bc21ed9SDavid Malone cm = mtod(m, struct cmsghdr *); 18922bc21ed9SDavid Malone clen = m->m_len; 18932bc21ed9SDavid Malone 18942bc21ed9SDavid Malone while (cm != NULL) { 18952bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) 18962bc21ed9SDavid Malone break; 18972bc21ed9SDavid Malone 18982bc21ed9SDavid Malone data = CMSG_DATA(cm); 18992bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len 19002bc21ed9SDavid Malone - (caddr_t)data; 19012bc21ed9SDavid Malone 19022bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET && 19032bc21ed9SDavid Malone cm->cmsg_type == SCM_RIGHTS) { 19042bc21ed9SDavid Malone qfds = datalen / sizeof (struct file *); 19052bc21ed9SDavid Malone rp = data; 1906df8bae1dSRodney W. Grimes for (i = 0; i < qfds; i++) 1907df8bae1dSRodney W. Grimes (*op)(*rp++); 19082bc21ed9SDavid Malone } 19092bc21ed9SDavid Malone 19102bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 19112bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 19122bc21ed9SDavid Malone cm = (struct cmsghdr *) 19132bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 19142bc21ed9SDavid Malone } else { 19152bc21ed9SDavid Malone clen = 0; 19162bc21ed9SDavid Malone cm = NULL; 19172bc21ed9SDavid Malone } 19182bc21ed9SDavid Malone } 1919df8bae1dSRodney W. Grimes } 1920df8bae1dSRodney W. Grimes m0 = m0->m_act; 1921df8bae1dSRodney W. Grimes } 1922df8bae1dSRodney W. Grimes } 1923df8bae1dSRodney W. Grimes 1924f708ef1bSPoul-Henning Kamp static void 1925892af6b9SRobert Watson unp_mark(struct file *fp) 1926df8bae1dSRodney W. Grimes { 1927426da3bcSAlfred Perlstein if (fp->f_gcflag & FMARK) 1928df8bae1dSRodney W. Grimes return; 1929df8bae1dSRodney W. Grimes unp_defer++; 1930426da3bcSAlfred Perlstein fp->f_gcflag |= (FMARK|FDEFER); 1931df8bae1dSRodney W. Grimes } 1932df8bae1dSRodney W. Grimes 1933f708ef1bSPoul-Henning Kamp static void 1934892af6b9SRobert Watson unp_discard(struct file *fp) 1935df8bae1dSRodney W. Grimes { 1936a0ec558aSRobert Watson UNP_LOCK(); 1937426da3bcSAlfred Perlstein FILE_LOCK(fp); 1938df8bae1dSRodney W. Grimes fp->f_msgcount--; 1939df8bae1dSRodney W. Grimes unp_rights--; 1940426da3bcSAlfred Perlstein FILE_UNLOCK(fp); 1941a0ec558aSRobert Watson UNP_UNLOCK(); 1942b40ce416SJulian Elischer (void) closef(fp, (struct thread *)NULL); 1943df8bae1dSRodney W. Grimes } 1944