19454b2d8SWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1982, 1986, 1989, 1991, 1993 3e1ac28e2SRobert Watson * The Regents of the University of California. 43dab55bcSRobert Watson * Copyright (c) 2004-2009 Robert N. M. Watson 5e1ac28e2SRobert Watson * All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 8df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 9df8bae1dSRodney W. Grimes * are met: 10df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 12df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 13df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 14df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 15df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 16df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 17df8bae1dSRodney W. Grimes * without specific prior written permission. 18df8bae1dSRodney W. Grimes * 19df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25df8bae1dSRodney W. 
Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29df8bae1dSRodney W. Grimes * SUCH DAMAGE. 30df8bae1dSRodney W. Grimes * 31748e0b0aSGarrett Wollman * From: @(#)uipc_usrreq.c 8.3 (Berkeley) 1/4/94 32df8bae1dSRodney W. Grimes */ 33df8bae1dSRodney W. Grimes 34f23929fbSRobert Watson /* 35f23929fbSRobert Watson * UNIX Domain (Local) Sockets 36f23929fbSRobert Watson * 37f23929fbSRobert Watson * This is an implementation of UNIX (local) domain sockets. Each socket has 38f23929fbSRobert Watson * an associated struct unpcb (UNIX protocol control block). Stream sockets 39f23929fbSRobert Watson * may be connected to 0 or 1 other socket. Datagram sockets may be 40f23929fbSRobert Watson * connected to 0, 1, or many other sockets. Sockets may be created and 41f23929fbSRobert Watson * connected in pairs (socketpair(2)), or bound/connected to using the file 42f23929fbSRobert Watson * system name space. For most purposes, only the receive socket buffer is 43f23929fbSRobert Watson * used, as sending on one socket delivers directly to the receive socket 445b950deaSRobert Watson * buffer of a second socket. 455b950deaSRobert Watson * 465b950deaSRobert Watson * The implementation is substantially complicated by the fact that 475b950deaSRobert Watson * "ancillary data", such as file descriptors or credentials, may be passed 485b950deaSRobert Watson * across UNIX domain sockets. The potential for passing UNIX domain sockets 495b950deaSRobert Watson * over other UNIX domain sockets requires the implementation of a simple 505b950deaSRobert Watson * garbage collector to find and tear down cycles of disconnected sockets. 
51aea52f1bSRobert Watson * 52aea52f1bSRobert Watson * TODO: 5384d61770SRobert Watson * RDM 5484d61770SRobert Watson * distinguish datagram size limits from flow control limits in SEQPACKET 55aea52f1bSRobert Watson * rethink name space problems 56aea52f1bSRobert Watson * need a proper out-of-band 57f23929fbSRobert Watson */ 58f23929fbSRobert Watson 59677b542eSDavid E. O'Brien #include <sys/cdefs.h> 60677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 61677b542eSDavid E. O'Brien 6203c96c31SRobert Watson #include "opt_ddb.h" 63335654d7SRobert Watson 64df8bae1dSRodney W. Grimes #include <sys/param.h> 65fb919e4dSMark Murray #include <sys/domain.h> 66960ed29cSSeigo Tanimura #include <sys/fcntl.h> 67d826c479SBruce Evans #include <sys/malloc.h> /* XXX must be before <sys/file.h> */ 684f590175SPaul Saab #include <sys/eventhandler.h> 69639acc13SGarrett Wollman #include <sys/file.h> 70960ed29cSSeigo Tanimura #include <sys/filedesc.h> 71960ed29cSSeigo Tanimura #include <sys/kernel.h> 72960ed29cSSeigo Tanimura #include <sys/lock.h> 73639acc13SGarrett Wollman #include <sys/mbuf.h> 74033eb86eSJeff Roberson #include <sys/mount.h> 75960ed29cSSeigo Tanimura #include <sys/mutex.h> 76639acc13SGarrett Wollman #include <sys/namei.h> 77639acc13SGarrett Wollman #include <sys/proc.h> 78df8bae1dSRodney W. Grimes #include <sys/protosw.h> 790cb64678SKonstantin Belousov #include <sys/queue.h> 80960ed29cSSeigo Tanimura #include <sys/resourcevar.h> 81e7c33e29SRobert Watson #include <sys/rwlock.h> 82df8bae1dSRodney W. Grimes #include <sys/socket.h> 83df8bae1dSRodney W. Grimes #include <sys/socketvar.h> 84960ed29cSSeigo Tanimura #include <sys/signalvar.h> 85df8bae1dSRodney W. 
Grimes #include <sys/stat.h> 86960ed29cSSeigo Tanimura #include <sys/sx.h> 87639acc13SGarrett Wollman #include <sys/sysctl.h> 88960ed29cSSeigo Tanimura #include <sys/systm.h> 89a0ec558aSRobert Watson #include <sys/taskqueue.h> 90639acc13SGarrett Wollman #include <sys/un.h> 9198271db4SGarrett Wollman #include <sys/unpcb.h> 92639acc13SGarrett Wollman #include <sys/vnode.h> 93530c0060SRobert Watson 94530c0060SRobert Watson #include <net/vnet.h> 95df8bae1dSRodney W. Grimes 9603c96c31SRobert Watson #ifdef DDB 9703c96c31SRobert Watson #include <ddb/ddb.h> 9803c96c31SRobert Watson #endif 9903c96c31SRobert Watson 100aed55708SRobert Watson #include <security/mac/mac_framework.h> 101aed55708SRobert Watson 1029e9d298aSJeff Roberson #include <vm/uma.h> 10398271db4SGarrett Wollman 1043dab55bcSRobert Watson /* 1053dab55bcSRobert Watson * Locking key: 1063dab55bcSRobert Watson * (l) Locked using list lock 1073dab55bcSRobert Watson * (g) Locked using linkage lock 1083dab55bcSRobert Watson */ 1093dab55bcSRobert Watson 1109e9d298aSJeff Roberson static uma_zone_t unp_zone; 1113dab55bcSRobert Watson static unp_gen_t unp_gencnt; /* (l) */ 1123dab55bcSRobert Watson static u_int unp_count; /* (l) Count of local sockets. */ 113aea52f1bSRobert Watson static ino_t unp_ino; /* Prototype for fake inode numbers. */ 1143dab55bcSRobert Watson static int unp_rights; /* (g) File descriptors in flight. */ 1153dab55bcSRobert Watson static struct unp_head unp_shead; /* (l) List of stream sockets. */ 1163dab55bcSRobert Watson static struct unp_head unp_dhead; /* (l) List of datagram sockets. */ 11784d61770SRobert Watson static struct unp_head unp_sphead; /* (l) List of seqpacket sockets. 
*/ 11898271db4SGarrett Wollman 1190cb64678SKonstantin Belousov struct unp_defer { 1200cb64678SKonstantin Belousov SLIST_ENTRY(unp_defer) ud_link; 1210cb64678SKonstantin Belousov struct file *ud_fp; 1220cb64678SKonstantin Belousov }; 1230cb64678SKonstantin Belousov static SLIST_HEAD(, unp_defer) unp_defers; 1240cb64678SKonstantin Belousov static int unp_defers_count; 1250cb64678SKonstantin Belousov 126aea52f1bSRobert Watson static const struct sockaddr sun_noname = { sizeof(sun_noname), AF_LOCAL }; 12798271db4SGarrett Wollman 128df8bae1dSRodney W. Grimes /* 129aea52f1bSRobert Watson * Garbage collection of cyclic file descriptor/socket references occurs 130aea52f1bSRobert Watson * asynchronously in a taskqueue context in order to avoid recursion and 131aea52f1bSRobert Watson * reentrance in the UNIX domain socket, file descriptor, and socket layer 132aea52f1bSRobert Watson * code. See unp_gc() for a full description. 133df8bae1dSRodney W. Grimes */ 134aea52f1bSRobert Watson static struct task unp_gc_task; 135f708ef1bSPoul-Henning Kamp 136ce5f32deSRobert Watson /* 1370cb64678SKonstantin Belousov * The close of unix domain sockets attached as SCM_RIGHTS is 1380cb64678SKonstantin Belousov * postponed to the taskqueue, to avoid arbitrary recursion depth. 1390cb64678SKonstantin Belousov * The attached sockets might have other sockets attached. 1400cb64678SKonstantin Belousov */ 1410cb64678SKonstantin Belousov static struct task unp_defer_task; 1420cb64678SKonstantin Belousov 1430cb64678SKonstantin Belousov /* 1447e711c3aSRobert Watson * Both send and receive buffers are allocated PIPSIZ bytes of buffering for 1457e711c3aSRobert Watson * stream sockets, although the total for sender and receiver is actually 1467e711c3aSRobert Watson * only PIPSIZ. 1477e711c3aSRobert Watson * 1487e711c3aSRobert Watson * Datagram sockets really use the sendspace as the maximum datagram size, 1497e711c3aSRobert Watson * and don't really want to reserve the sendspace. 
Their recvspace should be 1507e711c3aSRobert Watson * large enough for at least one max-size datagram plus address. 1517e711c3aSRobert Watson */ 1527e711c3aSRobert Watson #ifndef PIPSIZ 1537e711c3aSRobert Watson #define PIPSIZ 8192 1547e711c3aSRobert Watson #endif 1557e711c3aSRobert Watson static u_long unpst_sendspace = PIPSIZ; 1567e711c3aSRobert Watson static u_long unpst_recvspace = PIPSIZ; 1577e711c3aSRobert Watson static u_long unpdg_sendspace = 2*1024; /* really max datagram size */ 1587e711c3aSRobert Watson static u_long unpdg_recvspace = 4*1024; 15984d61770SRobert Watson static u_long unpsp_sendspace = PIPSIZ; /* really max datagram size */ 16084d61770SRobert Watson static u_long unpsp_recvspace = PIPSIZ; 1617e711c3aSRobert Watson 162e4445a03SRobert Watson SYSCTL_NODE(_net, PF_LOCAL, local, CTLFLAG_RW, 0, "Local domain"); 163e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_STREAM, stream, CTLFLAG_RW, 0, "SOCK_STREAM"); 164e4445a03SRobert Watson SYSCTL_NODE(_net_local, SOCK_DGRAM, dgram, CTLFLAG_RW, 0, "SOCK_DGRAM"); 16584d61770SRobert Watson SYSCTL_NODE(_net_local, SOCK_SEQPACKET, seqpacket, CTLFLAG_RW, 0, 16684d61770SRobert Watson "SOCK_SEQPACKET"); 167e4445a03SRobert Watson 1687e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, sendspace, CTLFLAG_RW, 169be6b1304STom Rhodes &unpst_sendspace, 0, "Default stream send space."); 1707e711c3aSRobert Watson SYSCTL_ULONG(_net_local_stream, OID_AUTO, recvspace, CTLFLAG_RW, 171be6b1304STom Rhodes &unpst_recvspace, 0, "Default stream receive space."); 1727e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, maxdgram, CTLFLAG_RW, 173be6b1304STom Rhodes &unpdg_sendspace, 0, "Default datagram send space."); 1747e711c3aSRobert Watson SYSCTL_ULONG(_net_local_dgram, OID_AUTO, recvspace, CTLFLAG_RW, 175be6b1304STom Rhodes &unpdg_recvspace, 0, "Default datagram receive space."); 17684d61770SRobert Watson SYSCTL_ULONG(_net_local_seqpacket, OID_AUTO, maxseqpacket, CTLFLAG_RW, 17784d61770SRobert Watson 
&unpsp_sendspace, 0, "Default seqpacket send space."); 17884d61770SRobert Watson SYSCTL_ULONG(_net_local_seqpacket, OID_AUTO, recvspace, CTLFLAG_RW, 17984d61770SRobert Watson &unpsp_recvspace, 0, "Default seqpacket receive space."); 180be6b1304STom Rhodes SYSCTL_INT(_net_local, OID_AUTO, inflight, CTLFLAG_RD, &unp_rights, 0, 181be6b1304STom Rhodes "File descriptors in flight."); 1820cb64678SKonstantin Belousov SYSCTL_INT(_net_local, OID_AUTO, deferred, CTLFLAG_RD, 1830cb64678SKonstantin Belousov &unp_defers_count, 0, 1840cb64678SKonstantin Belousov "File descriptors deferred to taskqueue for close."); 1857e711c3aSRobert Watson 186175389cfSEdward Tomasz Napierala /* 187e7c33e29SRobert Watson * Locking and synchronization: 188ce5f32deSRobert Watson * 1893dab55bcSRobert Watson * Three types of locks exist in the local domain socket implementation: a 1903dab55bcSRobert Watson * global list mutex, a global linkage rwlock, and per-unpcb mutexes. Of the 1913dab55bcSRobert Watson * global locks, the list lock protects the socket count, global generation 1923dab55bcSRobert Watson * number, and stream/datagram/seqpacket global lists. The linkage lock protects the 1933dab55bcSRobert Watson * interconnection of unpcbs, the v_socket and unp_vnode pointers, and can be 1943dab55bcSRobert Watson * held exclusively over the acquisition of multiple unpcb locks to prevent 1953dab55bcSRobert Watson * deadlock. 196ce5f32deSRobert Watson * 197e7c33e29SRobert Watson * UNIX domain sockets each have an unpcb hung off of their so_pcb pointer, 198e7c33e29SRobert Watson * allocated in pru_attach() and freed in pru_detach(). The validity of that 199e7c33e29SRobert Watson * pointer is an invariant, so no lock is required to dereference the so_pcb 200e7c33e29SRobert Watson * pointer if a valid socket reference is held by the caller. In practice, 201e7c33e29SRobert Watson * this is always true during operations performed on a socket. 
Each unpcb 202e7c33e29SRobert Watson * has a back-pointer to its socket, unp_socket, which will be stable under 203e7c33e29SRobert Watson * the same circumstances. 204e7c33e29SRobert Watson * 205e7c33e29SRobert Watson * This pointer may only be safely dereferenced as long as a valid reference 206e7c33e29SRobert Watson * to the unpcb is held. Typically, this reference will be from the socket, 207e7c33e29SRobert Watson * or from another unpcb when the referring unpcb's lock is held (in order 208e7c33e29SRobert Watson * that the reference not be invalidated during use). For example, to follow 209e7c33e29SRobert Watson * unp->unp_conn->unp_socket, you need to hold the lock on unp, not unp_conn, 210e7c33e29SRobert Watson * as unp_socket remains valid as long as the reference to unp_conn is valid. 211e7c33e29SRobert Watson * 212e7c33e29SRobert Watson * Fields of unpcbs are locked using a per-unpcb lock, unp_mtx. Individual 213e7c33e29SRobert Watson * atomic reads without the lock may be performed "lockless", but more 214e7c33e29SRobert Watson * complex reads and read-modify-writes require the mutex to be held. No 215e7c33e29SRobert Watson * lock order is defined between unpcb locks -- multiple unpcb locks may be 2163dab55bcSRobert Watson * acquired at the same time only when holding the linkage rwlock 2173dab55bcSRobert Watson * exclusively, which prevents deadlocks. 218e7c33e29SRobert Watson * 219e7c33e29SRobert Watson * Blocking with UNIX domain sockets is a tricky issue: unlike most network 220e7c33e29SRobert Watson * protocols, bind() is a non-atomic operation, and connect() requires 221e7c33e29SRobert Watson * potential sleeping in the protocol, due to potentially waiting on local or 222e7c33e29SRobert Watson * distributed file systems. 
We try to separate "lookup" operations, which 223e7c33e29SRobert Watson * may sleep, and the IPC operations themselves, which typically can occur 224e7c33e29SRobert Watson * with relative atomicity as locks can be held over the entire operation. 225e7c33e29SRobert Watson * 226e7c33e29SRobert Watson * Another tricky issue is simultaneous multi-threaded or multi-process 227e7c33e29SRobert Watson * access to a single UNIX domain socket. These are handled by the flags 228e7c33e29SRobert Watson * UNP_CONNECTING and UNP_BINDING, which prevent concurrent connecting or 229e7c33e29SRobert Watson * binding, both of which involve dropping UNIX domain socket locks in order 230e7c33e29SRobert Watson * to perform namei() and other file system operations. 231ce5f32deSRobert Watson */ 2323dab55bcSRobert Watson static struct rwlock unp_link_rwlock; 2333dab55bcSRobert Watson static struct mtx unp_list_lock; 2340cb64678SKonstantin Belousov static struct mtx unp_defers_lock; 235e7c33e29SRobert Watson 2363dab55bcSRobert Watson #define UNP_LINK_LOCK_INIT() rw_init(&unp_link_rwlock, \ 2373dab55bcSRobert Watson "unp_link_rwlock") 238e7c33e29SRobert Watson 2393dab55bcSRobert Watson #define UNP_LINK_LOCK_ASSERT() rw_assert(&unp_link_rwlock, \ 240e7c33e29SRobert Watson RA_LOCKED) 2413dab55bcSRobert Watson #define UNP_LINK_UNLOCK_ASSERT() rw_assert(&unp_link_rwlock, \ 242e7c33e29SRobert Watson RA_UNLOCKED) 243e7c33e29SRobert Watson 2443dab55bcSRobert Watson #define UNP_LINK_RLOCK() rw_rlock(&unp_link_rwlock) 2453dab55bcSRobert Watson #define UNP_LINK_RUNLOCK() rw_runlock(&unp_link_rwlock) 2463dab55bcSRobert Watson #define UNP_LINK_WLOCK() rw_wlock(&unp_link_rwlock) 2473dab55bcSRobert Watson #define UNP_LINK_WUNLOCK() rw_wunlock(&unp_link_rwlock) 2483dab55bcSRobert Watson #define UNP_LINK_WLOCK_ASSERT() rw_assert(&unp_link_rwlock, \ 249e7c33e29SRobert Watson RA_WLOCKED) 250e7c33e29SRobert Watson 2513dab55bcSRobert Watson #define UNP_LIST_LOCK_INIT() mtx_init(&unp_list_lock, \ 
2523dab55bcSRobert Watson "unp_list_lock", NULL, MTX_DEF) 2533dab55bcSRobert Watson #define UNP_LIST_LOCK() mtx_lock(&unp_list_lock) 2543dab55bcSRobert Watson #define UNP_LIST_UNLOCK() mtx_unlock(&unp_list_lock) 255e7c33e29SRobert Watson 2560cb64678SKonstantin Belousov #define UNP_DEFERRED_LOCK_INIT() mtx_init(&unp_defers_lock, \ 2570cb64678SKonstantin Belousov "unp_defer", NULL, MTX_DEF) 2580cb64678SKonstantin Belousov #define UNP_DEFERRED_LOCK() mtx_lock(&unp_defers_lock) 2590cb64678SKonstantin Belousov #define UNP_DEFERRED_UNLOCK() mtx_unlock(&unp_defers_lock) 2600cb64678SKonstantin Belousov 261e7c33e29SRobert Watson #define UNP_PCB_LOCK_INIT(unp) mtx_init(&(unp)->unp_mtx, \ 262e7c33e29SRobert Watson "unp_mtx", "unp_mtx", \ 263e7c33e29SRobert Watson MTX_DUPOK|MTX_DEF|MTX_RECURSE) 264e7c33e29SRobert Watson #define UNP_PCB_LOCK_DESTROY(unp) mtx_destroy(&(unp)->unp_mtx) 265e7c33e29SRobert Watson #define UNP_PCB_LOCK(unp) mtx_lock(&(unp)->unp_mtx) 266e7c33e29SRobert Watson #define UNP_PCB_UNLOCK(unp) mtx_unlock(&(unp)->unp_mtx) 267e7c33e29SRobert Watson #define UNP_PCB_LOCK_ASSERT(unp) mtx_assert(&(unp)->unp_mtx, MA_OWNED) 2680d9ce3a1SRobert Watson 2692c899584SRobert Watson static int uipc_connect2(struct socket *, struct socket *); 2700b36cd25SRobert Watson static int uipc_ctloutput(struct socket *, struct sockopt *); 271aea52f1bSRobert Watson static int unp_connect(struct socket *, struct sockaddr *, 272aea52f1bSRobert Watson struct thread *); 2736a2989fdSMatthew N. 
Dodd static int unp_connect2(struct socket *so, struct socket *so2, int); 274e7c33e29SRobert Watson static void unp_disconnect(struct unpcb *unp, struct unpcb *unp2); 2750b36cd25SRobert Watson static void unp_dispose(struct mbuf *); 2764d77a549SAlfred Perlstein static void unp_shutdown(struct unpcb *); 2774d77a549SAlfred Perlstein static void unp_drop(struct unpcb *, int); 278a0ec558aSRobert Watson static void unp_gc(__unused void *, int); 2794d77a549SAlfred Perlstein static void unp_scan(struct mbuf *, void (*)(struct file *)); 2804d77a549SAlfred Perlstein static void unp_discard(struct file *); 2814d77a549SAlfred Perlstein static void unp_freerights(struct file **, int); 2820b36cd25SRobert Watson static void unp_init(void); 2834d77a549SAlfred Perlstein static int unp_internalize(struct mbuf **, struct thread *); 284397c19d1SJeff Roberson static void unp_internalize_fp(struct file *); 2850b36cd25SRobert Watson static int unp_externalize(struct mbuf *, struct mbuf **); 2860cb64678SKonstantin Belousov static int unp_externalize_fp(struct file *); 2875b950deaSRobert Watson static struct mbuf *unp_addsockcred(struct thread *, struct mbuf *); 2880cb64678SKonstantin Belousov static void unp_process_defers(void * __unused, int); 289f708ef1bSPoul-Henning Kamp 290e4445a03SRobert Watson /* 291e4445a03SRobert Watson * Definitions of protocols supported in the LOCAL domain. 
292e4445a03SRobert Watson */ 293e4445a03SRobert Watson static struct domain localdomain; 294fa9402f2SRobert Watson static struct pr_usrreqs uipc_usrreqs_dgram, uipc_usrreqs_stream; 29584d61770SRobert Watson static struct pr_usrreqs uipc_usrreqs_seqpacket; 296e4445a03SRobert Watson static struct protosw localsw[] = { 297e4445a03SRobert Watson { 298e4445a03SRobert Watson .pr_type = SOCK_STREAM, 299e4445a03SRobert Watson .pr_domain = &localdomain, 300e4445a03SRobert Watson .pr_flags = PR_CONNREQUIRED|PR_WANTRCVD|PR_RIGHTS, 301e4445a03SRobert Watson .pr_ctloutput = &uipc_ctloutput, 302fa9402f2SRobert Watson .pr_usrreqs = &uipc_usrreqs_stream 303e4445a03SRobert Watson }, 304e4445a03SRobert Watson { 305e4445a03SRobert Watson .pr_type = SOCK_DGRAM, 306e4445a03SRobert Watson .pr_domain = &localdomain, 307e4445a03SRobert Watson .pr_flags = PR_ATOMIC|PR_ADDR|PR_RIGHTS, 308fa9402f2SRobert Watson .pr_usrreqs = &uipc_usrreqs_dgram 309e4445a03SRobert Watson }, 31084d61770SRobert Watson { 31184d61770SRobert Watson .pr_type = SOCK_SEQPACKET, 31284d61770SRobert Watson .pr_domain = &localdomain, 31384d61770SRobert Watson 31484d61770SRobert Watson /* 31584d61770SRobert Watson * XXXRW: For now, PR_ADDR because soreceive will bump into them 31684d61770SRobert Watson * due to our use of sbappendaddr. A new sbappend variants is needed 31784d61770SRobert Watson * that supports both atomic record writes and control data. 
31884d61770SRobert Watson */ 31984d61770SRobert Watson .pr_flags = PR_ADDR|PR_ATOMIC|PR_CONNREQUIRED|PR_WANTRCVD| 32084d61770SRobert Watson PR_RIGHTS, 32184d61770SRobert Watson .pr_usrreqs = &uipc_usrreqs_seqpacket, 32284d61770SRobert Watson }, 323e4445a03SRobert Watson }; 324e4445a03SRobert Watson 325e4445a03SRobert Watson static struct domain localdomain = { 326e4445a03SRobert Watson .dom_family = AF_LOCAL, 327e4445a03SRobert Watson .dom_name = "local", 328e4445a03SRobert Watson .dom_init = unp_init, 329e4445a03SRobert Watson .dom_externalize = unp_externalize, 330e4445a03SRobert Watson .dom_dispose = unp_dispose, 331e4445a03SRobert Watson .dom_protosw = localsw, 332e4445a03SRobert Watson .dom_protoswNPROTOSW = &localsw[sizeof(localsw)/sizeof(localsw[0])] 333e4445a03SRobert Watson }; 334e4445a03SRobert Watson DOMAIN_SET(local); 335e4445a03SRobert Watson 336ac45e92fSRobert Watson static void 337a29f300eSGarrett Wollman uipc_abort(struct socket *so) 338df8bae1dSRodney W. Grimes { 339e7c33e29SRobert Watson struct unpcb *unp, *unp2; 340df8bae1dSRodney W. Grimes 34140f2ac28SRobert Watson unp = sotounpcb(so); 3424d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_abort: unp == NULL")); 343e7c33e29SRobert Watson 3443dab55bcSRobert Watson UNP_LINK_WLOCK(); 345e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 346e7c33e29SRobert Watson unp2 = unp->unp_conn; 347e7c33e29SRobert Watson if (unp2 != NULL) { 348e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 349e7c33e29SRobert Watson unp_drop(unp2, ECONNABORTED); 350e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 351e7c33e29SRobert Watson } 352e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 3533dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 354df8bae1dSRodney W. Grimes } 355df8bae1dSRodney W. 
Grimes 356a29f300eSGarrett Wollman static int 35757bf258eSGarrett Wollman uipc_accept(struct socket *so, struct sockaddr **nam) 358a29f300eSGarrett Wollman { 359e7c33e29SRobert Watson struct unpcb *unp, *unp2; 3600d9ce3a1SRobert Watson const struct sockaddr *sa; 361df8bae1dSRodney W. Grimes 362df8bae1dSRodney W. Grimes /* 3631c381b19SRobert Watson * Pass back name of connected socket, if it was bound and we are 3641c381b19SRobert Watson * still connected (our peer may have closed already!). 365df8bae1dSRodney W. Grimes */ 3664d4b555eSRobert Watson unp = sotounpcb(so); 3674d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_accept: unp == NULL")); 368e7c33e29SRobert Watson 3690d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 3703dab55bcSRobert Watson UNP_LINK_RLOCK(); 371e7c33e29SRobert Watson unp2 = unp->unp_conn; 372e7c33e29SRobert Watson if (unp2 != NULL && unp2->unp_addr != NULL) { 373e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 374e7c33e29SRobert Watson sa = (struct sockaddr *) unp2->unp_addr; 375e7c33e29SRobert Watson bcopy(sa, *nam, sa->sa_len); 376e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 377e7c33e29SRobert Watson } else { 3780d9ce3a1SRobert Watson sa = &sun_noname; 3790d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 380e7c33e29SRobert Watson } 3813dab55bcSRobert Watson UNP_LINK_RUNLOCK(); 382e5aeaa0cSDag-Erling Smørgrav return (0); 383a29f300eSGarrett Wollman } 384df8bae1dSRodney W. Grimes 385a29f300eSGarrett Wollman static int 386b40ce416SJulian Elischer uipc_attach(struct socket *so, int proto, struct thread *td) 387a29f300eSGarrett Wollman { 388e7c33e29SRobert Watson u_long sendspace, recvspace; 3896d32873cSRobert Watson struct unpcb *unp; 3903dab55bcSRobert Watson int error; 391df8bae1dSRodney W. 
Grimes 3926d32873cSRobert Watson KASSERT(so->so_pcb == NULL, ("uipc_attach: so_pcb != NULL")); 3936d32873cSRobert Watson if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) { 3946d32873cSRobert Watson switch (so->so_type) { 3956d32873cSRobert Watson case SOCK_STREAM: 396e7c33e29SRobert Watson sendspace = unpst_sendspace; 397e7c33e29SRobert Watson recvspace = unpst_recvspace; 3986d32873cSRobert Watson break; 3996d32873cSRobert Watson 4006d32873cSRobert Watson case SOCK_DGRAM: 401e7c33e29SRobert Watson sendspace = unpdg_sendspace; 402e7c33e29SRobert Watson recvspace = unpdg_recvspace; 4036d32873cSRobert Watson break; 4046d32873cSRobert Watson 40584d61770SRobert Watson case SOCK_SEQPACKET: 40684d61770SRobert Watson sendspace = unpsp_sendspace; 40784d61770SRobert Watson recvspace = unpsp_recvspace; 40884d61770SRobert Watson break; 40984d61770SRobert Watson 4106d32873cSRobert Watson default: 411e7c33e29SRobert Watson panic("uipc_attach"); 4126d32873cSRobert Watson } 413e7c33e29SRobert Watson error = soreserve(so, sendspace, recvspace); 4146d32873cSRobert Watson if (error) 4156d32873cSRobert Watson return (error); 4166d32873cSRobert Watson } 41746a1d9bfSRobert Watson unp = uma_zalloc(unp_zone, M_NOWAIT | M_ZERO); 4186d32873cSRobert Watson if (unp == NULL) 4196d32873cSRobert Watson return (ENOBUFS); 4206d32873cSRobert Watson LIST_INIT(&unp->unp_refs); 421e7c33e29SRobert Watson UNP_PCB_LOCK_INIT(unp); 4226d32873cSRobert Watson unp->unp_socket = so; 4236d32873cSRobert Watson so->so_pcb = unp; 4249ae328fcSJohn Baldwin unp->unp_refcount = 1; 425e7c33e29SRobert Watson 4263dab55bcSRobert Watson UNP_LIST_LOCK(); 4276d32873cSRobert Watson unp->unp_gencnt = ++unp_gencnt; 4286d32873cSRobert Watson unp_count++; 42984d61770SRobert Watson switch (so->so_type) { 43084d61770SRobert Watson case SOCK_STREAM: 43184d61770SRobert Watson LIST_INSERT_HEAD(&unp_shead, unp, unp_link); 43284d61770SRobert Watson break; 43384d61770SRobert Watson 43484d61770SRobert Watson case SOCK_DGRAM: 
43584d61770SRobert Watson LIST_INSERT_HEAD(&unp_dhead, unp, unp_link); 43684d61770SRobert Watson break; 43784d61770SRobert Watson 43884d61770SRobert Watson case SOCK_SEQPACKET: 43984d61770SRobert Watson LIST_INSERT_HEAD(&unp_sphead, unp, unp_link); 44084d61770SRobert Watson break; 44184d61770SRobert Watson 44284d61770SRobert Watson default: 44384d61770SRobert Watson panic("uipc_attach"); 44484d61770SRobert Watson } 4453dab55bcSRobert Watson UNP_LIST_UNLOCK(); 4466d32873cSRobert Watson 4476d32873cSRobert Watson return (0); 448a29f300eSGarrett Wollman } 449a29f300eSGarrett Wollman 450a29f300eSGarrett Wollman static int 451b40ce416SJulian Elischer uipc_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 452a29f300eSGarrett Wollman { 453dd47f5caSRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 454dd47f5caSRobert Watson struct vattr vattr; 4559e289446SWojciech A. Koszek int error, namelen, vfslocked; 456dd47f5caSRobert Watson struct nameidata nd; 45740f2ac28SRobert Watson struct unpcb *unp; 458dd47f5caSRobert Watson struct vnode *vp; 459dd47f5caSRobert Watson struct mount *mp; 460dd47f5caSRobert Watson char *buf; 461a29f300eSGarrett Wollman 46240f2ac28SRobert Watson unp = sotounpcb(so); 4634d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_bind: unp == NULL")); 4644f1f0ef5SRobert Watson 4654f1f0ef5SRobert Watson namelen = soun->sun_len - offsetof(struct sockaddr_un, sun_path); 4664f1f0ef5SRobert Watson if (namelen <= 0) 4674f1f0ef5SRobert Watson return (EINVAL); 468dd47f5caSRobert Watson 469dd47f5caSRobert Watson /* 4704f1f0ef5SRobert Watson * We don't allow simultaneous bind() calls on a single UNIX domain 4714f1f0ef5SRobert Watson * socket, so flag in-progress operations, and return an error if an 4724f1f0ef5SRobert Watson * operation is already in progress. 4734f1f0ef5SRobert Watson * 4744f1f0ef5SRobert Watson * Historically, we have not allowed a socket to be rebound, so this 475d7924b70SRobert Watson * also returns an error. 
Not allowing re-binding simplifies the 476d7924b70SRobert Watson * implementation and avoids a great many possible failure modes. 477dd47f5caSRobert Watson */ 478e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 479dd47f5caSRobert Watson if (unp->unp_vnode != NULL) { 480e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 481dd47f5caSRobert Watson return (EINVAL); 482dd47f5caSRobert Watson } 4834f1f0ef5SRobert Watson if (unp->unp_flags & UNP_BINDING) { 484e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 4854f1f0ef5SRobert Watson return (EALREADY); 486dd47f5caSRobert Watson } 4874f1f0ef5SRobert Watson unp->unp_flags |= UNP_BINDING; 488e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 489dd47f5caSRobert Watson 490dd47f5caSRobert Watson buf = malloc(namelen + 1, M_TEMP, M_WAITOK); 4917928893dSEd Maste bcopy(soun->sun_path, buf, namelen); 4927928893dSEd Maste buf[namelen] = 0; 493dd47f5caSRobert Watson 494dd47f5caSRobert Watson restart: 4959e289446SWojciech A. Koszek vfslocked = 0; 4969e289446SWojciech A. Koszek NDINIT(&nd, CREATE, MPSAFE | NOFOLLOW | LOCKPARENT | SAVENAME, 4979e289446SWojciech A. Koszek UIO_SYSSPACE, buf, td); 498dd47f5caSRobert Watson /* SHOULD BE ABLE TO ADOPT EXISTING AND wakeup() ALA FIFO's */ 499dd47f5caSRobert Watson error = namei(&nd); 500dd47f5caSRobert Watson if (error) 5014f1f0ef5SRobert Watson goto error; 502dd47f5caSRobert Watson vp = nd.ni_vp; 5039e289446SWojciech A. 
Koszek vfslocked = NDHASGIANT(&nd); 504dd47f5caSRobert Watson if (vp != NULL || vn_start_write(nd.ni_dvp, &mp, V_NOWAIT) != 0) { 505dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 506dd47f5caSRobert Watson if (nd.ni_dvp == vp) 507dd47f5caSRobert Watson vrele(nd.ni_dvp); 508dd47f5caSRobert Watson else 509dd47f5caSRobert Watson vput(nd.ni_dvp); 510dd47f5caSRobert Watson if (vp != NULL) { 511dd47f5caSRobert Watson vrele(vp); 512dd47f5caSRobert Watson error = EADDRINUSE; 5134f1f0ef5SRobert Watson goto error; 514dd47f5caSRobert Watson } 515dd47f5caSRobert Watson error = vn_start_write(NULL, &mp, V_XSLEEP | PCATCH); 516dd47f5caSRobert Watson if (error) 5174f1f0ef5SRobert Watson goto error; 5189e289446SWojciech A. Koszek VFS_UNLOCK_GIANT(vfslocked); 519dd47f5caSRobert Watson goto restart; 520dd47f5caSRobert Watson } 521dd47f5caSRobert Watson VATTR_NULL(&vattr); 522dd47f5caSRobert Watson vattr.va_type = VSOCK; 523dd47f5caSRobert Watson vattr.va_mode = (ACCESSPERMS & ~td->td_proc->p_fd->fd_cmask); 524dd47f5caSRobert Watson #ifdef MAC 52530d239bcSRobert Watson error = mac_vnode_check_create(td->td_ucred, nd.ni_dvp, &nd.ni_cnd, 526dd47f5caSRobert Watson &vattr); 527dd47f5caSRobert Watson #endif 528885868cdSRobert Watson if (error == 0) 529dd47f5caSRobert Watson error = VOP_CREATE(nd.ni_dvp, &nd.ni_vp, &nd.ni_cnd, &vattr); 530dd47f5caSRobert Watson NDFREE(&nd, NDF_ONLY_PNBUF); 531dd47f5caSRobert Watson vput(nd.ni_dvp); 532dd47f5caSRobert Watson if (error) { 533dd47f5caSRobert Watson vn_finished_write(mp); 5344f1f0ef5SRobert Watson goto error; 535dd47f5caSRobert Watson } 536dd47f5caSRobert Watson vp = nd.ni_vp; 53757fd3d55SPawel Jakub Dawidek ASSERT_VOP_ELOCKED(vp, "uipc_bind"); 538dd47f5caSRobert Watson soun = (struct sockaddr_un *)sodupsockaddr(nam, M_WAITOK); 539e7c33e29SRobert Watson 5403dab55bcSRobert Watson UNP_LINK_WLOCK(); 541e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 542dd47f5caSRobert Watson vp->v_socket = unp->unp_socket; 543dd47f5caSRobert Watson unp->unp_vnode = 
vp; 544dd47f5caSRobert Watson unp->unp_addr = soun; 5454f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 546e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 5473dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 54822db15c0SAttilio Rao VOP_UNLOCK(vp, 0); 549dd47f5caSRobert Watson vn_finished_write(mp); 5509e289446SWojciech A. Koszek VFS_UNLOCK_GIANT(vfslocked); 5514f1f0ef5SRobert Watson free(buf, M_TEMP); 5524f1f0ef5SRobert Watson return (0); 553e7c33e29SRobert Watson 5544f1f0ef5SRobert Watson error: 5559e289446SWojciech A. Koszek VFS_UNLOCK_GIANT(vfslocked); 556e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 5574f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_BINDING; 558e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 559dd47f5caSRobert Watson free(buf, M_TEMP); 56040f2ac28SRobert Watson return (error); 561a29f300eSGarrett Wollman } 562a29f300eSGarrett Wollman 563a29f300eSGarrett Wollman static int 564b40ce416SJulian Elischer uipc_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 565a29f300eSGarrett Wollman { 5660d9ce3a1SRobert Watson int error; 567a29f300eSGarrett Wollman 568fd179ee9SRobert Watson KASSERT(td == curthread, ("uipc_connect: td != curthread")); 5693dab55bcSRobert Watson UNP_LINK_WLOCK(); 570fd179ee9SRobert Watson error = unp_connect(so, nam, td); 5713dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 5720d9ce3a1SRobert Watson return (error); 573a29f300eSGarrett Wollman } 574a29f300eSGarrett Wollman 575a152f8a3SRobert Watson static void 576a152f8a3SRobert Watson uipc_close(struct socket *so) 577a152f8a3SRobert Watson { 578e7c33e29SRobert Watson struct unpcb *unp, *unp2; 579a152f8a3SRobert Watson 580a152f8a3SRobert Watson unp = sotounpcb(so); 581a152f8a3SRobert Watson KASSERT(unp != NULL, ("uipc_close: unp == NULL")); 582e7c33e29SRobert Watson 5833dab55bcSRobert Watson UNP_LINK_WLOCK(); 584e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 585e7c33e29SRobert Watson unp2 = unp->unp_conn; 586e7c33e29SRobert Watson if (unp2 != NULL) { 587e7c33e29SRobert Watson 
UNP_PCB_LOCK(unp2); 588e7c33e29SRobert Watson unp_disconnect(unp, unp2); 589e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 590e7c33e29SRobert Watson } 591e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 5923dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 593a152f8a3SRobert Watson } 594a152f8a3SRobert Watson 5952c899584SRobert Watson static int 596a29f300eSGarrett Wollman uipc_connect2(struct socket *so1, struct socket *so2) 597a29f300eSGarrett Wollman { 598e7c33e29SRobert Watson struct unpcb *unp, *unp2; 5990d9ce3a1SRobert Watson int error; 600a29f300eSGarrett Wollman 6013dab55bcSRobert Watson UNP_LINK_WLOCK(); 602e7c33e29SRobert Watson unp = so1->so_pcb; 6034d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_connect2: unp == NULL")); 604e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 605e7c33e29SRobert Watson unp2 = so2->so_pcb; 606e7c33e29SRobert Watson KASSERT(unp2 != NULL, ("uipc_connect2: unp2 == NULL")); 607e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 6086a2989fdSMatthew N. Dodd error = unp_connect2(so1, so2, PRU_CONNECT2); 609e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 610e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 6113dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 6120d9ce3a1SRobert Watson return (error); 613a29f300eSGarrett Wollman } 614a29f300eSGarrett Wollman 615bc725eafSRobert Watson static void 616a29f300eSGarrett Wollman uipc_detach(struct socket *so) 617a29f300eSGarrett Wollman { 618e7c33e29SRobert Watson struct unpcb *unp, *unp2; 6199ae328fcSJohn Baldwin struct sockaddr_un *saved_unp_addr; 6206d32873cSRobert Watson struct vnode *vp; 6219ae328fcSJohn Baldwin int freeunp, local_unp_rights; 622a29f300eSGarrett Wollman 62340f2ac28SRobert Watson unp = sotounpcb(so); 6244d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_detach: unp == NULL")); 625e7c33e29SRobert Watson 6263dab55bcSRobert Watson UNP_LINK_WLOCK(); 6273dab55bcSRobert Watson UNP_LIST_LOCK(); 628e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 6296d32873cSRobert Watson LIST_REMOVE(unp, unp_link); 6306d32873cSRobert Watson 
unp->unp_gencnt = ++unp_gencnt; 6316d32873cSRobert Watson --unp_count; 6323dab55bcSRobert Watson UNP_LIST_UNLOCK(); 633e7c33e29SRobert Watson 634e7c33e29SRobert Watson /* 635e7c33e29SRobert Watson * XXXRW: Should assert vp->v_socket == so. 636e7c33e29SRobert Watson */ 6376d32873cSRobert Watson if ((vp = unp->unp_vnode) != NULL) { 6386d32873cSRobert Watson unp->unp_vnode->v_socket = NULL; 6396d32873cSRobert Watson unp->unp_vnode = NULL; 6406d32873cSRobert Watson } 641e7c33e29SRobert Watson unp2 = unp->unp_conn; 642e7c33e29SRobert Watson if (unp2 != NULL) { 643e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 644e7c33e29SRobert Watson unp_disconnect(unp, unp2); 645e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 646e7c33e29SRobert Watson } 647e7c33e29SRobert Watson 648e7c33e29SRobert Watson /* 6493dab55bcSRobert Watson * We hold the linkage lock exclusively, so it's OK to acquire 65060a5ef26SRobert Watson * multiple pcb locks at a time. 651e7c33e29SRobert Watson */ 6526d32873cSRobert Watson while (!LIST_EMPTY(&unp->unp_refs)) { 6536d32873cSRobert Watson struct unpcb *ref = LIST_FIRST(&unp->unp_refs); 654e7c33e29SRobert Watson 655e7c33e29SRobert Watson UNP_PCB_LOCK(ref); 6566d32873cSRobert Watson unp_drop(ref, ECONNRESET); 657e7c33e29SRobert Watson UNP_PCB_UNLOCK(ref); 6586d32873cSRobert Watson } 659397c19d1SJeff Roberson local_unp_rights = unp_rights; 6603dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 6616d32873cSRobert Watson unp->unp_socket->so_pcb = NULL; 6629ae328fcSJohn Baldwin saved_unp_addr = unp->unp_addr; 6639ae328fcSJohn Baldwin unp->unp_addr = NULL; 6649ae328fcSJohn Baldwin unp->unp_refcount--; 6659ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 6669ae328fcSJohn Baldwin if (saved_unp_addr != NULL) 6671ede983cSDag-Erling Smørgrav free(saved_unp_addr, M_SONAME); 668e7c33e29SRobert Watson if (freeunp) { 669e7c33e29SRobert Watson UNP_PCB_LOCK_DESTROY(unp); 6706d32873cSRobert Watson uma_zfree(unp_zone, unp); 6716e2faa24SRobert Watson } else 6726e2faa24SRobert Watson 
UNP_PCB_UNLOCK(unp); 6736d32873cSRobert Watson if (vp) { 6746d32873cSRobert Watson int vfslocked; 6756d32873cSRobert Watson 6766d32873cSRobert Watson vfslocked = VFS_LOCK_GIANT(vp->v_mount); 6776d32873cSRobert Watson vrele(vp); 6786d32873cSRobert Watson VFS_UNLOCK_GIANT(vfslocked); 6796d32873cSRobert Watson } 6806d32873cSRobert Watson if (local_unp_rights) 6816d32873cSRobert Watson taskqueue_enqueue(taskqueue_thread, &unp_gc_task); 682a29f300eSGarrett Wollman } 683a29f300eSGarrett Wollman 684a29f300eSGarrett Wollman static int 685a29f300eSGarrett Wollman uipc_disconnect(struct socket *so) 686a29f300eSGarrett Wollman { 687e7c33e29SRobert Watson struct unpcb *unp, *unp2; 688a29f300eSGarrett Wollman 68940f2ac28SRobert Watson unp = sotounpcb(so); 6904d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_disconnect: unp == NULL")); 691e7c33e29SRobert Watson 6923dab55bcSRobert Watson UNP_LINK_WLOCK(); 693e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 694e7c33e29SRobert Watson unp2 = unp->unp_conn; 695e7c33e29SRobert Watson if (unp2 != NULL) { 696e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 697e7c33e29SRobert Watson unp_disconnect(unp, unp2); 698e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 699e7c33e29SRobert Watson } 700e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 7013dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 702e5aeaa0cSDag-Erling Smørgrav return (0); 703a29f300eSGarrett Wollman } 704a29f300eSGarrett Wollman 705a29f300eSGarrett Wollman static int 706d374e81eSRobert Watson uipc_listen(struct socket *so, int backlog, struct thread *td) 707a29f300eSGarrett Wollman { 70840f2ac28SRobert Watson struct unpcb *unp; 7090d9ce3a1SRobert Watson int error; 710a29f300eSGarrett Wollman 71140f2ac28SRobert Watson unp = sotounpcb(so); 7124d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_listen: unp == NULL")); 713e7c33e29SRobert Watson 714e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 7154d4b555eSRobert Watson if (unp->unp_vnode == NULL) { 716e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 71740f2ac28SRobert 
Watson return (EINVAL); 71840f2ac28SRobert Watson } 719e7c33e29SRobert Watson 720e7c33e29SRobert Watson SOCK_LOCK(so); 721e7c33e29SRobert Watson error = solisten_proto_check(so); 722e7c33e29SRobert Watson if (error == 0) { 723e7c33e29SRobert Watson cru2x(td->td_ucred, &unp->unp_peercred); 724e7c33e29SRobert Watson unp->unp_flags |= UNP_HAVEPCCACHED; 725e7c33e29SRobert Watson solisten_proto(so, backlog); 726e7c33e29SRobert Watson } 727e7c33e29SRobert Watson SOCK_UNLOCK(so); 728e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 7290d9ce3a1SRobert Watson return (error); 730a29f300eSGarrett Wollman } 731a29f300eSGarrett Wollman 732a29f300eSGarrett Wollman static int 73357bf258eSGarrett Wollman uipc_peeraddr(struct socket *so, struct sockaddr **nam) 734a29f300eSGarrett Wollman { 735e7c33e29SRobert Watson struct unpcb *unp, *unp2; 7360d9ce3a1SRobert Watson const struct sockaddr *sa; 737a29f300eSGarrett Wollman 7384d4b555eSRobert Watson unp = sotounpcb(so); 7394d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_peeraddr: unp == NULL")); 740e7c33e29SRobert Watson 7410d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 742afd9f91cSJohn Baldwin UNP_LINK_RLOCK(); 743bdc5f6a3SHajimu UMEMOTO /* 744e7c33e29SRobert Watson * XXX: It seems that this test always fails even when connection is 745e7c33e29SRobert Watson * established. So, this else clause is added as workaround to 746e7c33e29SRobert Watson * return PF_LOCAL sockaddr. 
747bdc5f6a3SHajimu UMEMOTO */ 748e7c33e29SRobert Watson unp2 = unp->unp_conn; 749e7c33e29SRobert Watson if (unp2 != NULL) { 750e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 751e7c33e29SRobert Watson if (unp2->unp_addr != NULL) 752afd9f91cSJohn Baldwin sa = (struct sockaddr *) unp2->unp_addr; 753e7c33e29SRobert Watson else 7540d9ce3a1SRobert Watson sa = &sun_noname; 7550d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 756e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 757e7c33e29SRobert Watson } else { 758e7c33e29SRobert Watson sa = &sun_noname; 759e7c33e29SRobert Watson bcopy(sa, *nam, sa->sa_len); 760e7c33e29SRobert Watson } 761afd9f91cSJohn Baldwin UNP_LINK_RUNLOCK(); 762e5aeaa0cSDag-Erling Smørgrav return (0); 763a29f300eSGarrett Wollman } 764a29f300eSGarrett Wollman 765a29f300eSGarrett Wollman static int 766a29f300eSGarrett Wollman uipc_rcvd(struct socket *so, int flags) 767a29f300eSGarrett Wollman { 768e7c33e29SRobert Watson struct unpcb *unp, *unp2; 769a29f300eSGarrett Wollman struct socket *so2; 770337cc6b6SRobert Watson u_int mbcnt, sbcc; 7716aef685fSBrian Feldman u_long newhiwat; 772a29f300eSGarrett Wollman 77340f2ac28SRobert Watson unp = sotounpcb(so); 7744d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_rcvd: unp == NULL")); 775df8bae1dSRodney W. Grimes 77684d61770SRobert Watson if (so->so_type != SOCK_STREAM && so->so_type != SOCK_SEQPACKET) 77784d61770SRobert Watson panic("uipc_rcvd socktype %d", so->so_type); 778e7c33e29SRobert Watson 779df8bae1dSRodney W. Grimes /* 780e7c33e29SRobert Watson * Adjust backpressure on sender and wakeup any waiting to write. 781e7c33e29SRobert Watson * 782d7924b70SRobert Watson * The unp lock is acquired to maintain the validity of the unp_conn 783d7924b70SRobert Watson * pointer; no lock on unp2 is required as unp2->unp_socket will be 784d7924b70SRobert Watson * static as long as we don't permit unp2 to disconnect from unp, 785d7924b70SRobert Watson * which is prevented by the lock on unp. 
We cache values from 786d7924b70SRobert Watson * so_rcv to avoid holding the so_rcv lock over the entire 787d7924b70SRobert Watson * transaction on the remote so_snd. 788df8bae1dSRodney W. Grimes */ 789337cc6b6SRobert Watson SOCKBUF_LOCK(&so->so_rcv); 790337cc6b6SRobert Watson mbcnt = so->so_rcv.sb_mbcnt; 791337cc6b6SRobert Watson sbcc = so->so_rcv.sb_cc; 792337cc6b6SRobert Watson SOCKBUF_UNLOCK(&so->so_rcv); 793e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 794e7c33e29SRobert Watson unp2 = unp->unp_conn; 795e7c33e29SRobert Watson if (unp2 == NULL) { 796e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 797e7c33e29SRobert Watson return (0); 798337cc6b6SRobert Watson } 799e7c33e29SRobert Watson so2 = unp2->unp_socket; 800337cc6b6SRobert Watson SOCKBUF_LOCK(&so2->so_snd); 801337cc6b6SRobert Watson so2->so_snd.sb_mbmax += unp->unp_mbcnt - mbcnt; 802337cc6b6SRobert Watson newhiwat = so2->so_snd.sb_hiwat + unp->unp_cc - sbcc; 803f535380cSDon Lewis (void)chgsbsize(so2->so_cred->cr_uidinfo, &so2->so_snd.sb_hiwat, 8046aef685fSBrian Feldman newhiwat, RLIM_INFINITY); 8051e4d7da7SRobert Watson sowwakeup_locked(so2); 806337cc6b6SRobert Watson unp->unp_mbcnt = mbcnt; 807337cc6b6SRobert Watson unp->unp_cc = sbcc; 808e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 809e5aeaa0cSDag-Erling Smørgrav return (0); 810a29f300eSGarrett Wollman } 811df8bae1dSRodney W. 
/*
 * pru_send handler for UNIX domain sockets.
 *
 * Appends the data chain 'm' (and the optional ancillary chain 'control')
 * directly to the receive socket buffer of the peer that 'so' is connected
 * to.  If 'nam' is non-NULL the socket is first connected to that address
 * via unp_connect(); for SOCK_DGRAM the connection is torn down again once
 * the datagram has been queued.
 *
 * Parameters:
 *	so	- sending socket; its unpcb must exist (asserted).
 *	flags	- PRUS_OOB is rejected with EOPNOTSUPP; PRUS_EOF additionally
 *		  performs the equivalent of a shutdown after the send.
 *	m	- data to send.  Whatever is still referenced by 'm' at the
 *		  'release' label is freed with m_freem().
 *	nam	- optional destination address, or NULL to use the existing
 *		  connection.
 *	control	- optional ancillary data.  It is passed through
 *		  unp_internalize() before use; whatever is still referenced
 *		  at the 'release' label is freed with m_freem().
 *	td	- calling thread, forwarded to unp_internalize(),
 *		  unp_connect() and unp_addsockcred().
 *
 * Returns 0 on success or an errno value.  Errors set directly here are
 * EOPNOTSUPP, EISCONN, ENOTCONN, ENOBUFS and EPIPE; failures from
 * unp_internalize() and unp_connect() are returned unchanged.
 *
 * Locking: the linkage lock is taken exclusively when 'nam' is supplied or
 * PRUS_EOF is set, and in read mode otherwise.  The two early 'goto release'
 * exits happen before any lock is taken; every later exit leaves the switch
 * with 'break' so that the linkage lock is dropped in the matching mode.
 */
static int
uipc_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam,
    struct mbuf *control, struct thread *td)
{
	struct unpcb *unp, *unp2;
	struct socket *so2;
	u_int mbcnt_delta, sbcc;
	u_long newhiwat;
	int error = 0;

	unp = sotounpcb(so);
	KASSERT(unp != NULL, ("uipc_send: unp == NULL"));

	/* Out-of-band data is not supported on this protocol. */
	if (flags & PRUS_OOB) {
		error = EOPNOTSUPP;
		goto release;
	}
	/*
	 * unp_internalize() may replace 'control' (it is handed the address
	 * of the pointer); on failure the current chain is freed at release.
	 */
	if (control != NULL && (error = unp_internalize(&control, td)))
		goto release;
	/*
	 * The connect/disconnect paths below assert the write lock, so it
	 * must be held exclusively whenever 'nam' is given.  The PRUS_EOF
	 * path calls unp_shutdown(), which is also run under the exclusive
	 * lock here.  This condition must stay identical to the one used for
	 * the unlock at the bottom of the function.
	 */
	if ((nam != NULL) || (flags & PRUS_EOF))
		UNP_LINK_WLOCK();
	else
		UNP_LINK_RLOCK();
	switch (so->so_type) {
	case SOCK_DGRAM:
	{
		const struct sockaddr *from;

		unp2 = unp->unp_conn;
		if (nam != NULL) {
			UNP_LINK_WLOCK_ASSERT();
			/* An explicit destination on a connected socket. */
			if (unp2 != NULL) {
				error = EISCONN;
				break;
			}
			error = unp_connect(so, nam, td);
			if (error)
				break;
			/* Re-read the peer established by unp_connect(). */
			unp2 = unp->unp_conn;
		}

		/*
		 * Because connect() and send() are non-atomic in a sendto()
		 * with a target address, it's possible that the socket will
		 * have disconnected before the send() can run.  In that case
		 * return the slightly counter-intuitive but otherwise
		 * correct error that the socket is not connected.
		 */
		if (unp2 == NULL) {
			error = ENOTCONN;
			break;
		}
		/* Lockless read. */
		if (unp2->unp_flags & UNP_WANTCRED)
			control = unp_addsockcred(td, control);
		UNP_PCB_LOCK(unp);
		/* Report our bound address as the source, if we have one. */
		if (unp->unp_addr != NULL)
			from = (struct sockaddr *)unp->unp_addr;
		else
			from = &sun_noname;
		so2 = unp2->unp_socket;
		SOCKBUF_LOCK(&so2->so_rcv);
		if (sbappendaddr_locked(&so2->so_rcv, from, m, control)) {
			/*
			 * Queued: clear our references so that the release
			 * path does not free the chains.  There is no
			 * explicit SOCKBUF_UNLOCK() on this path;
			 * sorwakeup_locked() is presumably responsible for
			 * dropping the lock -- TODO confirm.
			 */
			sorwakeup_locked(so2);
			m = NULL;
			control = NULL;
		} else {
			SOCKBUF_UNLOCK(&so2->so_rcv);
			error = ENOBUFS;
		}
		/*
		 * Undo the temporary connection made above, whether or not
		 * the append succeeded.
		 */
		if (nam != NULL) {
			UNP_LINK_WLOCK_ASSERT();
			UNP_PCB_LOCK(unp2);
			unp_disconnect(unp, unp2);
			UNP_PCB_UNLOCK(unp2);
		}
		UNP_PCB_UNLOCK(unp);
		break;
	}

	case SOCK_SEQPACKET:
	case SOCK_STREAM:
		/*
		 * An unconnected socket may still send if a destination was
		 * supplied; otherwise there is nobody to deliver to.
		 */
		if ((so->so_state & SS_ISCONNECTED) == 0) {
			if (nam != NULL) {
				UNP_LINK_WLOCK_ASSERT();
				error = unp_connect(so, nam, td);
				if (error)
					break;	/* XXX */
			} else {
				error = ENOTCONN;
				break;
			}
		}

		/* Lockless read. */
		if (so->so_snd.sb_state & SBS_CANTSENDMORE) {
			error = EPIPE;
			break;
		}

		/*
		 * Because connect() and send() are non-atomic in a sendto()
		 * with a target address, it's possible that the socket will
		 * have disconnected before the send() can run.  In that case
		 * return the slightly counter-intuitive but otherwise
		 * correct error that the socket is not connected.
		 *
		 * Locking here must be done carefully: the linkage lock
		 * prevents interconnections between unpcbs from changing, so
		 * we can traverse from unp to unp2 without acquiring unp's
		 * lock.  Socket buffer locks follow unpcb locks, so we can
		 * acquire both remote and local socket buffer locks.
		 */
		unp2 = unp->unp_conn;
		if (unp2 == NULL) {
			error = ENOTCONN;
			break;
		}
		so2 = unp2->unp_socket;
		UNP_PCB_LOCK(unp2);
		SOCKBUF_LOCK(&so2->so_rcv);
		if (unp2->unp_flags & UNP_WANTCRED) {
			/*
			 * Credentials are passed only once on SOCK_STREAM.
			 */
			unp2->unp_flags &= ~UNP_WANTCRED;
			control = unp_addsockcred(td, control);
		}
		/*
		 * Send to paired receive port, and then reduce send buffer
		 * hiwater marks to maintain backpressure.  Wake up readers.
		 */
		switch (so->so_type) {
		case SOCK_STREAM:
			if (control != NULL) {
				if (sbappendcontrol_locked(&so2->so_rcv, m,
				    control))
					control = NULL;
			} else
				sbappend_locked(&so2->so_rcv, m);
			break;

		case SOCK_SEQPACKET: {
			const struct sockaddr *from;

			/* Records are queued with the anonymous address. */
			from = &sun_noname;
			if (sbappendaddr_locked(&so2->so_rcv, from, m,
			    control))
				control = NULL;
			break;
			}
		}

		/*
		 * XXXRW: While fine for SOCK_STREAM, this conflates maximum
		 * datagram size and back-pressure for SOCK_SEQPACKET, which
		 * can lead to undesired return of EMSGSIZE on send instead
		 * of more desirable blocking.
		 */
		/*
		 * Snapshot the peer's receive buffer usage while its lock is
		 * still held: mbcnt_delta is the growth in sb_mbcnt since the
		 * value last recorded in unp2->unp_mbcnt, and sbcc is the
		 * current byte count.  As in the SOCK_DGRAM case, there is no
		 * explicit unlock of so2->so_rcv after sorwakeup_locked().
		 */
		mbcnt_delta = so2->so_rcv.sb_mbcnt - unp2->unp_mbcnt;
		unp2->unp_mbcnt = so2->so_rcv.sb_mbcnt;
		sbcc = so2->so_rcv.sb_cc;
		sorwakeup_locked(so2);

		/*
		 * Shrink our own send buffer limits by the amount the peer's
		 * receive buffer grew; uipc_rcvd() applies the opposite
		 * adjustment using the same unp_cc/unp_mbcnt bookkeeping.
		 */
		SOCKBUF_LOCK(&so->so_snd);
		newhiwat = so->so_snd.sb_hiwat - (sbcc - unp2->unp_cc);
		(void)chgsbsize(so->so_cred->cr_uidinfo, &so->so_snd.sb_hiwat,
		    newhiwat, RLIM_INFINITY);
		so->so_snd.sb_mbmax -= mbcnt_delta;
		SOCKBUF_UNLOCK(&so->so_snd);
		unp2->unp_cc = sbcc;
		UNP_PCB_UNLOCK(unp2);
		/*
		 * NOTE(review): 'm' is cleared unconditionally and 'error'
		 * stays 0 even when sbappendcontrol_locked() or
		 * sbappendaddr_locked() returned 0 above.  In that case
		 * 'control' is still non-NULL and is freed at release without
		 * unp_dispose().  Confirm how the append routines treat 'm'
		 * on failure.
		 */
		m = NULL;
		break;

	default:
		panic("uipc_send unknown socktype");
	}

	/*
	 * PRUS_EOF is equivalent to pru_send followed by pru_shutdown.
	 */
	if (flags & PRUS_EOF) {
		UNP_PCB_LOCK(unp);
		socantsendmore(so);
		unp_shutdown(unp);
		UNP_PCB_UNLOCK(unp);
	}

	/* Drop the linkage lock in the same mode it was acquired in. */
	if ((nam != NULL) || (flags & PRUS_EOF))
		UNP_LINK_WUNLOCK();
	else
		UNP_LINK_RUNLOCK();

	/*
	 * Control data that was internalized but never queued is handed to
	 * unp_dispose() before being freed -- presumably to release whatever
	 * unp_internalize() attached to it; verify against unp_dispose().
	 */
	if (control != NULL && error != 0)
		unp_dispose(control);

release:
	if (control != NULL)
		m_freem(control);
	if (m != NULL)
		m_freem(m);
	return (error);
}

/*
 * pru_sense handler: fill in the stat fields this protocol provides.
 *
 * st_blksize is the socket's send buffer high-water mark; for a connected
 * SOCK_STREAM or SOCK_SEQPACKET socket the number of bytes currently queued
 * in the peer's receive buffer is added to it.  st_dev is set to NODEV and
 * st_ino to a per-pcb number that is assigned lazily on first use.
 *
 * Always returns 0.
 */
static int
uipc_sense(struct socket *so, struct stat *sb)
{
	struct unpcb *unp, *unp2;
	struct socket *so2;

	unp = sotounpcb(so);
	KASSERT(unp != NULL, ("uipc_sense: unp == NULL"));

	sb->st_blksize = so->so_snd.sb_hiwat;
	UNP_LINK_RLOCK();
	UNP_PCB_LOCK(unp);
	unp2 = unp->unp_conn;
	if ((so->so_type == SOCK_STREAM || so->so_type == SOCK_SEQPACKET) &&
	    unp2 != NULL) {
		so2 = unp2->unp_socket;
		/* Read without taking so2's receive buffer lock. */
		sb->st_blksize += so2->so_rcv.sb_cc;
	}
	sb->st_dev = NODEV;
	/*
	 * Zero means "not yet assigned", so the counter skips 0 if it wraps.
	 *
	 * NOTE(review): unp_ino is a counter shared by all sockets and is
	 * modified here while holding only the linkage lock in read mode and
	 * this pcb's lock.  Confirm whether concurrent callers on different
	 * sockets can race on it.
	 */
	if (unp->unp_ino == 0)
		unp->unp_ino = (++unp_ino == 0) ? ++unp_ino : unp_ino;
	sb->st_ino = unp->unp_ino;
	UNP_PCB_UNLOCK(unp);
	UNP_LINK_RUNLOCK();
	return (0);
}
Grimes 1044a29f300eSGarrett Wollman static int 1045a29f300eSGarrett Wollman uipc_shutdown(struct socket *so) 1046a29f300eSGarrett Wollman { 104740f2ac28SRobert Watson struct unpcb *unp; 1048df8bae1dSRodney W. Grimes 104940f2ac28SRobert Watson unp = sotounpcb(so); 10504d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_shutdown: unp == NULL")); 1051e7c33e29SRobert Watson 10523dab55bcSRobert Watson UNP_LINK_WLOCK(); 1053e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 1054a29f300eSGarrett Wollman socantsendmore(so); 1055a29f300eSGarrett Wollman unp_shutdown(unp); 1056e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 10573dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 1058e5aeaa0cSDag-Erling Smørgrav return (0); 1059a29f300eSGarrett Wollman } 1060df8bae1dSRodney W. Grimes 1061a29f300eSGarrett Wollman static int 106257bf258eSGarrett Wollman uipc_sockaddr(struct socket *so, struct sockaddr **nam) 1063a29f300eSGarrett Wollman { 106440f2ac28SRobert Watson struct unpcb *unp; 10650d9ce3a1SRobert Watson const struct sockaddr *sa; 1066a29f300eSGarrett Wollman 10674d4b555eSRobert Watson unp = sotounpcb(so); 10684d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_sockaddr: unp == NULL")); 1069e7c33e29SRobert Watson 10700d9ce3a1SRobert Watson *nam = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 1071e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 1072fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 10730d9ce3a1SRobert Watson sa = (struct sockaddr *) unp->unp_addr; 107483f3198bSThomas Moestl else 10750d9ce3a1SRobert Watson sa = &sun_noname; 10760d9ce3a1SRobert Watson bcopy(sa, *nam, sa->sa_len); 1077e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 1078e5aeaa0cSDag-Erling Smørgrav return (0); 1079df8bae1dSRodney W. 
Grimes } 1080a29f300eSGarrett Wollman 1081fa9402f2SRobert Watson static struct pr_usrreqs uipc_usrreqs_dgram = { 1082756d52a1SPoul-Henning Kamp .pru_abort = uipc_abort, 1083756d52a1SPoul-Henning Kamp .pru_accept = uipc_accept, 1084756d52a1SPoul-Henning Kamp .pru_attach = uipc_attach, 1085756d52a1SPoul-Henning Kamp .pru_bind = uipc_bind, 1086756d52a1SPoul-Henning Kamp .pru_connect = uipc_connect, 1087756d52a1SPoul-Henning Kamp .pru_connect2 = uipc_connect2, 1088756d52a1SPoul-Henning Kamp .pru_detach = uipc_detach, 1089756d52a1SPoul-Henning Kamp .pru_disconnect = uipc_disconnect, 1090756d52a1SPoul-Henning Kamp .pru_listen = uipc_listen, 1091756d52a1SPoul-Henning Kamp .pru_peeraddr = uipc_peeraddr, 1092756d52a1SPoul-Henning Kamp .pru_rcvd = uipc_rcvd, 1093756d52a1SPoul-Henning Kamp .pru_send = uipc_send, 1094756d52a1SPoul-Henning Kamp .pru_sense = uipc_sense, 1095756d52a1SPoul-Henning Kamp .pru_shutdown = uipc_shutdown, 1096756d52a1SPoul-Henning Kamp .pru_sockaddr = uipc_sockaddr, 1097fa9402f2SRobert Watson .pru_soreceive = soreceive_dgram, 1098fa9402f2SRobert Watson .pru_close = uipc_close, 1099fa9402f2SRobert Watson }; 1100fa9402f2SRobert Watson 110184d61770SRobert Watson static struct pr_usrreqs uipc_usrreqs_seqpacket = { 110284d61770SRobert Watson .pru_abort = uipc_abort, 110384d61770SRobert Watson .pru_accept = uipc_accept, 110484d61770SRobert Watson .pru_attach = uipc_attach, 110584d61770SRobert Watson .pru_bind = uipc_bind, 110684d61770SRobert Watson .pru_connect = uipc_connect, 110784d61770SRobert Watson .pru_connect2 = uipc_connect2, 110884d61770SRobert Watson .pru_detach = uipc_detach, 110984d61770SRobert Watson .pru_disconnect = uipc_disconnect, 111084d61770SRobert Watson .pru_listen = uipc_listen, 111184d61770SRobert Watson .pru_peeraddr = uipc_peeraddr, 111284d61770SRobert Watson .pru_rcvd = uipc_rcvd, 111384d61770SRobert Watson .pru_send = uipc_send, 111484d61770SRobert Watson .pru_sense = uipc_sense, 111584d61770SRobert Watson .pru_shutdown = 
uipc_shutdown, 111684d61770SRobert Watson .pru_sockaddr = uipc_sockaddr, 111784d61770SRobert Watson .pru_soreceive = soreceive_generic, /* XXX: or...? */ 111884d61770SRobert Watson .pru_close = uipc_close, 111984d61770SRobert Watson }; 112084d61770SRobert Watson 1121fa9402f2SRobert Watson static struct pr_usrreqs uipc_usrreqs_stream = { 1122fa9402f2SRobert Watson .pru_abort = uipc_abort, 1123fa9402f2SRobert Watson .pru_accept = uipc_accept, 1124fa9402f2SRobert Watson .pru_attach = uipc_attach, 1125fa9402f2SRobert Watson .pru_bind = uipc_bind, 1126fa9402f2SRobert Watson .pru_connect = uipc_connect, 1127fa9402f2SRobert Watson .pru_connect2 = uipc_connect2, 1128fa9402f2SRobert Watson .pru_detach = uipc_detach, 1129fa9402f2SRobert Watson .pru_disconnect = uipc_disconnect, 1130fa9402f2SRobert Watson .pru_listen = uipc_listen, 1131fa9402f2SRobert Watson .pru_peeraddr = uipc_peeraddr, 1132fa9402f2SRobert Watson .pru_rcvd = uipc_rcvd, 1133fa9402f2SRobert Watson .pru_send = uipc_send, 1134fa9402f2SRobert Watson .pru_sense = uipc_sense, 1135fa9402f2SRobert Watson .pru_shutdown = uipc_shutdown, 1136fa9402f2SRobert Watson .pru_sockaddr = uipc_sockaddr, 1137fa9402f2SRobert Watson .pru_soreceive = soreceive_generic, 1138a152f8a3SRobert Watson .pru_close = uipc_close, 1139a29f300eSGarrett Wollman }; 1140df8bae1dSRodney W. Grimes 11410b36cd25SRobert Watson static int 1142892af6b9SRobert Watson uipc_ctloutput(struct socket *so, struct sockopt *sopt) 11430c1bb4fbSDima Dorfman { 114440f2ac28SRobert Watson struct unpcb *unp; 11450d9ce3a1SRobert Watson struct xucred xu; 11466a2989fdSMatthew N. Dodd int error, optval; 11476a2989fdSMatthew N. Dodd 114896a041b5SMatthew N. Dodd if (sopt->sopt_level != 0) 114996a041b5SMatthew N. Dodd return (EINVAL); 115096a041b5SMatthew N. Dodd 11516a2989fdSMatthew N. Dodd unp = sotounpcb(so); 11524d4b555eSRobert Watson KASSERT(unp != NULL, ("uipc_ctloutput: unp == NULL")); 11536a2989fdSMatthew N. 
Dodd error = 0; 11540c1bb4fbSDima Dorfman switch (sopt->sopt_dir) { 11550c1bb4fbSDima Dorfman case SOPT_GET: 11560c1bb4fbSDima Dorfman switch (sopt->sopt_name) { 11570c1bb4fbSDima Dorfman case LOCAL_PEERCRED: 1158e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 11590c1bb4fbSDima Dorfman if (unp->unp_flags & UNP_HAVEPC) 11600d9ce3a1SRobert Watson xu = unp->unp_peercred; 11610c1bb4fbSDima Dorfman else { 11620c1bb4fbSDima Dorfman if (so->so_type == SOCK_STREAM) 11630c1bb4fbSDima Dorfman error = ENOTCONN; 11640c1bb4fbSDima Dorfman else 11650c1bb4fbSDima Dorfman error = EINVAL; 11660c1bb4fbSDima Dorfman } 1167e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 11680d9ce3a1SRobert Watson if (error == 0) 11690d9ce3a1SRobert Watson error = sooptcopyout(sopt, &xu, sizeof(xu)); 11700c1bb4fbSDima Dorfman break; 1171e7c33e29SRobert Watson 11726a2989fdSMatthew N. Dodd case LOCAL_CREDS: 1173a6357845SRobert Watson /* Unlocked read. */ 11746a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_WANTCRED ? 1 : 0; 11756a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 11766a2989fdSMatthew N. Dodd break; 1177e7c33e29SRobert Watson 11786a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 1179a6357845SRobert Watson /* Unlocked read. */ 11806a2989fdSMatthew N. Dodd optval = unp->unp_flags & UNP_CONNWAIT ? 1 : 0; 11816a2989fdSMatthew N. Dodd error = sooptcopyout(sopt, &optval, sizeof(optval)); 11826a2989fdSMatthew N. Dodd break; 1183e7c33e29SRobert Watson 11840c1bb4fbSDima Dorfman default: 11850c1bb4fbSDima Dorfman error = EOPNOTSUPP; 11860c1bb4fbSDima Dorfman break; 11870c1bb4fbSDima Dorfman } 11880c1bb4fbSDima Dorfman break; 1189e7c33e29SRobert Watson 11900c1bb4fbSDima Dorfman case SOPT_SET: 11916a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 11926a2989fdSMatthew N. Dodd case LOCAL_CREDS: 11936a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 11946a2989fdSMatthew N. Dodd error = sooptcopyin(sopt, &optval, sizeof(optval), 11956a2989fdSMatthew N. 
Dodd sizeof(optval)); 11966a2989fdSMatthew N. Dodd if (error) 11976a2989fdSMatthew N. Dodd break; 11986a2989fdSMatthew N. Dodd 1199e7c33e29SRobert Watson #define OPTSET(bit) do { \ 1200e7c33e29SRobert Watson UNP_PCB_LOCK(unp); \ 12016a2989fdSMatthew N. Dodd if (optval) \ 12026a2989fdSMatthew N. Dodd unp->unp_flags |= bit; \ 12036a2989fdSMatthew N. Dodd else \ 1204e7c33e29SRobert Watson unp->unp_flags &= ~bit; \ 1205e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); \ 1206e7c33e29SRobert Watson } while (0) 12076a2989fdSMatthew N. Dodd 12086a2989fdSMatthew N. Dodd switch (sopt->sopt_name) { 12096a2989fdSMatthew N. Dodd case LOCAL_CREDS: 12106a2989fdSMatthew N. Dodd OPTSET(UNP_WANTCRED); 12116a2989fdSMatthew N. Dodd break; 1212e7c33e29SRobert Watson 12136a2989fdSMatthew N. Dodd case LOCAL_CONNWAIT: 12146a2989fdSMatthew N. Dodd OPTSET(UNP_CONNWAIT); 12156a2989fdSMatthew N. Dodd break; 1216e7c33e29SRobert Watson 12176a2989fdSMatthew N. Dodd default: 12186a2989fdSMatthew N. Dodd break; 12196a2989fdSMatthew N. Dodd } 12206a2989fdSMatthew N. Dodd break; 12216a2989fdSMatthew N. Dodd #undef OPTSET 12226a2989fdSMatthew N. Dodd default: 12236a2989fdSMatthew N. Dodd error = ENOPROTOOPT; 12246a2989fdSMatthew N. Dodd break; 12256a2989fdSMatthew N. Dodd } 1226abb886faSMatthew N. Dodd break; 1227e7c33e29SRobert Watson 12280c1bb4fbSDima Dorfman default: 12290c1bb4fbSDima Dorfman error = EOPNOTSUPP; 12300c1bb4fbSDima Dorfman break; 12310c1bb4fbSDima Dorfman } 12320c1bb4fbSDima Dorfman return (error); 12330c1bb4fbSDima Dorfman } 12340c1bb4fbSDima Dorfman 1235f708ef1bSPoul-Henning Kamp static int 1236892af6b9SRobert Watson unp_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 1237df8bae1dSRodney W. Grimes { 1238892af6b9SRobert Watson struct sockaddr_un *soun = (struct sockaddr_un *)nam; 1239892af6b9SRobert Watson struct vnode *vp; 1240892af6b9SRobert Watson struct socket *so2, *so3; 1241b295bdcdSRobert Watson struct unpcb *unp, *unp2, *unp3; 12429e289446SWojciech A. 
Koszek int error, len, vfslocked; 1243df8bae1dSRodney W. Grimes struct nameidata nd; 124457bf258eSGarrett Wollman char buf[SOCK_MAXADDRLEN]; 12450d9ce3a1SRobert Watson struct sockaddr *sa; 12460d9ce3a1SRobert Watson 12473dab55bcSRobert Watson UNP_LINK_WLOCK_ASSERT(); 1248df8bae1dSRodney W. Grimes 12494d4b555eSRobert Watson unp = sotounpcb(so); 12504d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 1251e7c33e29SRobert Watson 125257bf258eSGarrett Wollman len = nam->sa_len - offsetof(struct sockaddr_un, sun_path); 125357bf258eSGarrett Wollman if (len <= 0) 1254e5aeaa0cSDag-Erling Smørgrav return (EINVAL); 12557928893dSEd Maste bcopy(soun->sun_path, buf, len); 12567928893dSEd Maste buf[len] = 0; 1257e7c33e29SRobert Watson 1258e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 12594f1f0ef5SRobert Watson if (unp->unp_flags & UNP_CONNECTING) { 1260e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 12614f1f0ef5SRobert Watson return (EALREADY); 12624f1f0ef5SRobert Watson } 12633dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 126405102f04SRobert Watson unp->unp_flags |= UNP_CONNECTING; 1265e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 1266e7c33e29SRobert Watson 12670d9ce3a1SRobert Watson sa = malloc(sizeof(struct sockaddr_un), M_SONAME, M_WAITOK); 12689e289446SWojciech A. Koszek NDINIT(&nd, LOOKUP, MPSAFE | FOLLOW | LOCKLEAF, UIO_SYSSPACE, buf, 12699e289446SWojciech A. Koszek td); 1270797f2d22SPoul-Henning Kamp error = namei(&nd); 1271797f2d22SPoul-Henning Kamp if (error) 12720d9ce3a1SRobert Watson vp = NULL; 12730d9ce3a1SRobert Watson else 1274df8bae1dSRodney W. Grimes vp = nd.ni_vp; 12750d9ce3a1SRobert Watson ASSERT_VOP_LOCKED(vp, "unp_connect"); 12769e289446SWojciech A. Koszek vfslocked = NDHASGIANT(&nd); 1277762e6b85SEivind Eklund NDFREE(&nd, NDF_ONLY_PNBUF); 12780d9ce3a1SRobert Watson if (error) 12790d9ce3a1SRobert Watson goto bad; 12800d9ce3a1SRobert Watson 1281df8bae1dSRodney W. Grimes if (vp->v_type != VSOCK) { 1282df8bae1dSRodney W. 
Grimes error = ENOTSOCK; 1283df8bae1dSRodney W. Grimes goto bad; 1284df8bae1dSRodney W. Grimes } 12856fac927cSRobert Watson #ifdef MAC 128630d239bcSRobert Watson error = mac_vnode_check_open(td->td_ucred, vp, VWRITE | VREAD); 12876fac927cSRobert Watson if (error) 12886fac927cSRobert Watson goto bad; 12896fac927cSRobert Watson #endif 1290a854ed98SJohn Baldwin error = VOP_ACCESS(vp, VWRITE, td->td_ucred, td); 1291797f2d22SPoul-Henning Kamp if (error) 1292df8bae1dSRodney W. Grimes goto bad; 12939e289446SWojciech A. Koszek VFS_UNLOCK_GIANT(vfslocked); 1294e7c33e29SRobert Watson 1295b295bdcdSRobert Watson unp = sotounpcb(so); 12964d4b555eSRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 1297e7c33e29SRobert Watson 1298e7c33e29SRobert Watson /* 12993dab55bcSRobert Watson * Lock linkage lock for two reasons: make sure v_socket is stable, 1300e7c33e29SRobert Watson * and to protect simultaneous locking of multiple pcbs. 1301e7c33e29SRobert Watson */ 13023dab55bcSRobert Watson UNP_LINK_WLOCK(); 1303df8bae1dSRodney W. Grimes so2 = vp->v_socket; 1304fc3fcacfSRobert Watson if (so2 == NULL) { 1305df8bae1dSRodney W. Grimes error = ECONNREFUSED; 13062260c03dSRobert Watson goto bad2; 1307df8bae1dSRodney W. Grimes } 1308df8bae1dSRodney W. Grimes if (so->so_type != so2->so_type) { 1309df8bae1dSRodney W. Grimes error = EPROTOTYPE; 13102260c03dSRobert Watson goto bad2; 1311df8bae1dSRodney W. Grimes } 1312df8bae1dSRodney W. Grimes if (so->so_proto->pr_flags & PR_CONNREQUIRED) { 1313e7c33e29SRobert Watson if (so2->so_options & SO_ACCEPTCONN) { 13140d9ce3a1SRobert Watson so3 = sonewconn(so2, 0); 1315e7c33e29SRobert Watson } else 13160d9ce3a1SRobert Watson so3 = NULL; 13170d9ce3a1SRobert Watson if (so3 == NULL) { 1318df8bae1dSRodney W. Grimes error = ECONNREFUSED; 13190d9ce3a1SRobert Watson goto bad2; 1320df8bae1dSRodney W. Grimes } 13210c1bb4fbSDima Dorfman unp = sotounpcb(so); 1322df8bae1dSRodney W. Grimes unp2 = sotounpcb(so2); 1323df8bae1dSRodney W. 
Grimes unp3 = sotounpcb(so3); 1324e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 1325e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 1326e7c33e29SRobert Watson UNP_PCB_LOCK(unp3); 13270d9ce3a1SRobert Watson if (unp2->unp_addr != NULL) { 13280d9ce3a1SRobert Watson bcopy(unp2->unp_addr, sa, unp2->unp_addr->sun_len); 13290d9ce3a1SRobert Watson unp3->unp_addr = (struct sockaddr_un *) sa; 13300d9ce3a1SRobert Watson sa = NULL; 13310d9ce3a1SRobert Watson } 1332b523ec24SRobert Watson 13330c1bb4fbSDima Dorfman /* 13341c381b19SRobert Watson * The connecter's (client's) credentials are copied from its 13351c381b19SRobert Watson * process structure at the time of connect() (which is now). 13360c1bb4fbSDima Dorfman */ 1337a854ed98SJohn Baldwin cru2x(td->td_ucred, &unp3->unp_peercred); 13380c1bb4fbSDima Dorfman unp3->unp_flags |= UNP_HAVEPC; 1339b523ec24SRobert Watson 13400c1bb4fbSDima Dorfman /* 13411c381b19SRobert Watson * The receiver's (server's) credentials are copied from the 13421c381b19SRobert Watson * unp_peercred member of socket on which the former called 1343e7c33e29SRobert Watson * listen(); uipc_listen() cached that process's credentials 13441c381b19SRobert Watson * at that time so we can use them now. 
13450c1bb4fbSDima Dorfman */ 13460c1bb4fbSDima Dorfman KASSERT(unp2->unp_flags & UNP_HAVEPCCACHED, 13470c1bb4fbSDima Dorfman ("unp_connect: listener without cached peercred")); 13480c1bb4fbSDima Dorfman memcpy(&unp->unp_peercred, &unp2->unp_peercred, 13490c1bb4fbSDima Dorfman sizeof(unp->unp_peercred)); 13500c1bb4fbSDima Dorfman unp->unp_flags |= UNP_HAVEPC; 1351481f8fe8SMaxim Konovalov if (unp2->unp_flags & UNP_WANTCRED) 1352481f8fe8SMaxim Konovalov unp3->unp_flags |= UNP_WANTCRED; 1353e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp3); 1354e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 1355e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 1356335654d7SRobert Watson #ifdef MAC 135730d239bcSRobert Watson mac_socketpeer_set_from_socket(so, so3); 135830d239bcSRobert Watson mac_socketpeer_set_from_socket(so3, so); 1359335654d7SRobert Watson #endif 13600c1bb4fbSDima Dorfman 1361df8bae1dSRodney W. Grimes so2 = so3; 1362df8bae1dSRodney W. Grimes } 1363e7c33e29SRobert Watson unp = sotounpcb(so); 1364e7c33e29SRobert Watson KASSERT(unp != NULL, ("unp_connect: unp == NULL")); 1365e7c33e29SRobert Watson unp2 = sotounpcb(so2); 1366e7c33e29SRobert Watson KASSERT(unp2 != NULL, ("unp_connect: unp2 == NULL")); 1367e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 1368e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 13696a2989fdSMatthew N. Dodd error = unp_connect2(so, so2, PRU_CONNECT); 1370e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 1371e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 13720d9ce3a1SRobert Watson bad2: 13733dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 13749e289446SWojciech A. Koszek if (vfslocked) 13759e289446SWojciech A. Koszek /* 13769e289446SWojciech A. Koszek * Giant has been previously acquired. This means filesystem 13779e289446SWojciech A. Koszek * isn't MPSAFE. Do it once again. 13789e289446SWojciech A. Koszek */ 13790d9ce3a1SRobert Watson mtx_lock(&Giant); 1380df8bae1dSRodney W. Grimes bad: 13810d9ce3a1SRobert Watson if (vp != NULL) 1382df8bae1dSRodney W. 
Grimes vput(vp); 13839e289446SWojciech A. Koszek VFS_UNLOCK_GIANT(vfslocked); 13840d9ce3a1SRobert Watson free(sa, M_SONAME); 13853dab55bcSRobert Watson UNP_LINK_WLOCK(); 1386e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 13874f1f0ef5SRobert Watson unp->unp_flags &= ~UNP_CONNECTING; 1388e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 1389df8bae1dSRodney W. Grimes return (error); 1390df8bae1dSRodney W. Grimes } 1391df8bae1dSRodney W. Grimes 1392db48c0d2SRobert Watson static int 13936a2989fdSMatthew N. Dodd unp_connect2(struct socket *so, struct socket *so2, int req) 1394df8bae1dSRodney W. Grimes { 1395e7c33e29SRobert Watson struct unpcb *unp; 1396892af6b9SRobert Watson struct unpcb *unp2; 1397df8bae1dSRodney W. Grimes 1398e7c33e29SRobert Watson unp = sotounpcb(so); 1399e7c33e29SRobert Watson KASSERT(unp != NULL, ("unp_connect2: unp == NULL")); 1400e7c33e29SRobert Watson unp2 = sotounpcb(so2); 1401e7c33e29SRobert Watson KASSERT(unp2 != NULL, ("unp_connect2: unp2 == NULL")); 1402e7c33e29SRobert Watson 14033dab55bcSRobert Watson UNP_LINK_WLOCK_ASSERT(); 1404e7c33e29SRobert Watson UNP_PCB_LOCK_ASSERT(unp); 1405e7c33e29SRobert Watson UNP_PCB_LOCK_ASSERT(unp2); 14060d9ce3a1SRobert Watson 1407df8bae1dSRodney W. Grimes if (so2->so_type != so->so_type) 1408df8bae1dSRodney W. Grimes return (EPROTOTYPE); 1409df8bae1dSRodney W. Grimes unp->unp_conn = unp2; 1410e7c33e29SRobert Watson 1411df8bae1dSRodney W. Grimes switch (so->so_type) { 1412df8bae1dSRodney W. Grimes case SOCK_DGRAM: 141398271db4SGarrett Wollman LIST_INSERT_HEAD(&unp2->unp_refs, unp, unp_reflink); 1414df8bae1dSRodney W. Grimes soisconnected(so); 1415df8bae1dSRodney W. Grimes break; 1416df8bae1dSRodney W. Grimes 1417df8bae1dSRodney W. Grimes case SOCK_STREAM: 141884d61770SRobert Watson case SOCK_SEQPACKET: 1419df8bae1dSRodney W. Grimes unp2->unp_conn = unp; 14206a2989fdSMatthew N. Dodd if (req == PRU_CONNECT && 14216a2989fdSMatthew N. Dodd ((unp->unp_flags | unp2->unp_flags) & UNP_CONNWAIT)) 14226a2989fdSMatthew N. 
Dodd soisconnecting(so); 14236a2989fdSMatthew N. Dodd else 1424df8bae1dSRodney W. Grimes soisconnected(so); 1425df8bae1dSRodney W. Grimes soisconnected(so2); 1426df8bae1dSRodney W. Grimes break; 1427df8bae1dSRodney W. Grimes 1428df8bae1dSRodney W. Grimes default: 1429df8bae1dSRodney W. Grimes panic("unp_connect2"); 1430df8bae1dSRodney W. Grimes } 1431df8bae1dSRodney W. Grimes return (0); 1432df8bae1dSRodney W. Grimes } 1433df8bae1dSRodney W. Grimes 1434f708ef1bSPoul-Henning Kamp static void 1435e7c33e29SRobert Watson unp_disconnect(struct unpcb *unp, struct unpcb *unp2) 1436df8bae1dSRodney W. Grimes { 14371b2e3b4bSRobert Watson struct socket *so; 1438df8bae1dSRodney W. Grimes 1439e7c33e29SRobert Watson KASSERT(unp2 != NULL, ("unp_disconnect: unp2 == NULL")); 14400d9ce3a1SRobert Watson 14413dab55bcSRobert Watson UNP_LINK_WLOCK_ASSERT(); 1442e7c33e29SRobert Watson UNP_PCB_LOCK_ASSERT(unp); 1443e7c33e29SRobert Watson UNP_PCB_LOCK_ASSERT(unp2); 1444e7c33e29SRobert Watson 1445fc3fcacfSRobert Watson unp->unp_conn = NULL; 1446df8bae1dSRodney W. Grimes switch (unp->unp_socket->so_type) { 1447df8bae1dSRodney W. Grimes case SOCK_DGRAM: 144898271db4SGarrett Wollman LIST_REMOVE(unp, unp_reflink); 14491b2e3b4bSRobert Watson so = unp->unp_socket; 14501b2e3b4bSRobert Watson SOCK_LOCK(so); 14511b2e3b4bSRobert Watson so->so_state &= ~SS_ISCONNECTED; 14521b2e3b4bSRobert Watson SOCK_UNLOCK(so); 1453df8bae1dSRodney W. Grimes break; 1454df8bae1dSRodney W. Grimes 1455df8bae1dSRodney W. Grimes case SOCK_STREAM: 145684d61770SRobert Watson case SOCK_SEQPACKET: 1457df8bae1dSRodney W. Grimes soisdisconnected(unp->unp_socket); 1458fc3fcacfSRobert Watson unp2->unp_conn = NULL; 1459df8bae1dSRodney W. Grimes soisdisconnected(unp2->unp_socket); 1460df8bae1dSRodney W. Grimes break; 1461df8bae1dSRodney W. Grimes } 1462df8bae1dSRodney W. Grimes } 1463df8bae1dSRodney W. 
Grimes 14640d9ce3a1SRobert Watson /* 1465d7924b70SRobert Watson * unp_pcblist() walks the global list of struct unpcb's to generate a 1466d7924b70SRobert Watson * pointer list, bumping the refcount on each unpcb. It then copies them out 1467d7924b70SRobert Watson * sequentially, validating the generation number on each to see if it has 1468d7924b70SRobert Watson * been detached. All of this is necessary because copyout() may sleep on 1469d7924b70SRobert Watson * disk I/O. 14700d9ce3a1SRobert Watson */ 147198271db4SGarrett Wollman static int 147282d9ae4eSPoul-Henning Kamp unp_pcblist(SYSCTL_HANDLER_ARGS) 147398271db4SGarrett Wollman { 1474f5ef029eSPoul-Henning Kamp int error, i, n; 14759ae328fcSJohn Baldwin int freeunp; 147698271db4SGarrett Wollman struct unpcb *unp, **unp_list; 147798271db4SGarrett Wollman unp_gen_t gencnt; 14788f364875SJulian Elischer struct xunpgen *xug; 147998271db4SGarrett Wollman struct unp_head *head; 14808f364875SJulian Elischer struct xunpcb *xu; 148198271db4SGarrett Wollman 148284d61770SRobert Watson switch ((intptr_t)arg1) { 148384d61770SRobert Watson case SOCK_STREAM: 148484d61770SRobert Watson head = &unp_shead; 148584d61770SRobert Watson break; 148684d61770SRobert Watson 148784d61770SRobert Watson case SOCK_DGRAM: 148884d61770SRobert Watson head = &unp_dhead; 148984d61770SRobert Watson break; 149084d61770SRobert Watson 149184d61770SRobert Watson case SOCK_SEQPACKET: 149284d61770SRobert Watson head = &unp_sphead; 149384d61770SRobert Watson break; 149484d61770SRobert Watson 149584d61770SRobert Watson default: 1496604f19c9SRobert Watson panic("unp_pcblist: arg1 %d", (int)(intptr_t)arg1); 149784d61770SRobert Watson } 149898271db4SGarrett Wollman 149998271db4SGarrett Wollman /* 150098271db4SGarrett Wollman * The process of preparing the PCB list is too time-consuming and 150198271db4SGarrett Wollman * resource-intensive to repeat twice on every request. 
150298271db4SGarrett Wollman */ 1503fc3fcacfSRobert Watson if (req->oldptr == NULL) { 150498271db4SGarrett Wollman n = unp_count; 15058f364875SJulian Elischer req->oldidx = 2 * (sizeof *xug) 150698271db4SGarrett Wollman + (n + n/8) * sizeof(struct xunpcb); 1507e5aeaa0cSDag-Erling Smørgrav return (0); 150898271db4SGarrett Wollman } 150998271db4SGarrett Wollman 1510fc3fcacfSRobert Watson if (req->newptr != NULL) 1511e5aeaa0cSDag-Erling Smørgrav return (EPERM); 151298271db4SGarrett Wollman 151398271db4SGarrett Wollman /* 151498271db4SGarrett Wollman * OK, now we're committed to doing something. 151598271db4SGarrett Wollman */ 1516a163d034SWarner Losh xug = malloc(sizeof(*xug), M_TEMP, M_WAITOK); 15173dab55bcSRobert Watson UNP_LIST_LOCK(); 151898271db4SGarrett Wollman gencnt = unp_gencnt; 151998271db4SGarrett Wollman n = unp_count; 15203dab55bcSRobert Watson UNP_LIST_UNLOCK(); 152198271db4SGarrett Wollman 15228f364875SJulian Elischer xug->xug_len = sizeof *xug; 15238f364875SJulian Elischer xug->xug_count = n; 15248f364875SJulian Elischer xug->xug_gen = gencnt; 15258f364875SJulian Elischer xug->xug_sogen = so_gencnt; 15268f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 15278f364875SJulian Elischer if (error) { 15288f364875SJulian Elischer free(xug, M_TEMP); 1529e5aeaa0cSDag-Erling Smørgrav return (error); 15308f364875SJulian Elischer } 153198271db4SGarrett Wollman 1532a163d034SWarner Losh unp_list = malloc(n * sizeof *unp_list, M_TEMP, M_WAITOK); 153398271db4SGarrett Wollman 15343dab55bcSRobert Watson UNP_LIST_LOCK(); 15352e3c8fcbSPoul-Henning Kamp for (unp = LIST_FIRST(head), i = 0; unp && i < n; 15362e3c8fcbSPoul-Henning Kamp unp = LIST_NEXT(unp, unp_link)) { 1537e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 15388a7d8cc6SRobert Watson if (unp->unp_gencnt <= gencnt) { 1539a854ed98SJohn Baldwin if (cr_cansee(req->td->td_ucred, 1540e7c33e29SRobert Watson unp->unp_socket->so_cred)) { 1541e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 15424787fd37SPaul Saab 
continue; 1543e7c33e29SRobert Watson } 154498271db4SGarrett Wollman unp_list[i++] = unp; 15459ae328fcSJohn Baldwin unp->unp_refcount++; 154698271db4SGarrett Wollman } 1547e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 15484787fd37SPaul Saab } 15493dab55bcSRobert Watson UNP_LIST_UNLOCK(); 15501c381b19SRobert Watson n = i; /* In case we lost some during malloc. */ 155198271db4SGarrett Wollman 155298271db4SGarrett Wollman error = 0; 1553fe2eee82SColin Percival xu = malloc(sizeof(*xu), M_TEMP, M_WAITOK | M_ZERO); 155498271db4SGarrett Wollman for (i = 0; i < n; i++) { 155598271db4SGarrett Wollman unp = unp_list[i]; 1556e7c33e29SRobert Watson UNP_PCB_LOCK(unp); 15579ae328fcSJohn Baldwin unp->unp_refcount--; 15589ae328fcSJohn Baldwin if (unp->unp_refcount != 0 && unp->unp_gencnt <= gencnt) { 15598f364875SJulian Elischer xu->xu_len = sizeof *xu; 15608f364875SJulian Elischer xu->xu_unpp = unp; 156198271db4SGarrett Wollman /* 156298271db4SGarrett Wollman * XXX - need more locking here to protect against 156398271db4SGarrett Wollman * connect/disconnect races for SMP. 
156498271db4SGarrett Wollman */ 1565fc3fcacfSRobert Watson if (unp->unp_addr != NULL) 15668f364875SJulian Elischer bcopy(unp->unp_addr, &xu->xu_addr, 156798271db4SGarrett Wollman unp->unp_addr->sun_len); 1568fc3fcacfSRobert Watson if (unp->unp_conn != NULL && 1569fc3fcacfSRobert Watson unp->unp_conn->unp_addr != NULL) 157098271db4SGarrett Wollman bcopy(unp->unp_conn->unp_addr, 15718f364875SJulian Elischer &xu->xu_caddr, 157298271db4SGarrett Wollman unp->unp_conn->unp_addr->sun_len); 15738f364875SJulian Elischer bcopy(unp, &xu->xu_unp, sizeof *unp); 15748f364875SJulian Elischer sotoxsocket(unp->unp_socket, &xu->xu_socket); 1575e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 15768f364875SJulian Elischer error = SYSCTL_OUT(req, xu, sizeof *xu); 15779ae328fcSJohn Baldwin } else { 15789ae328fcSJohn Baldwin freeunp = (unp->unp_refcount == 0); 1579e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp); 1580e7c33e29SRobert Watson if (freeunp) { 1581e7c33e29SRobert Watson UNP_PCB_LOCK_DESTROY(unp); 15829ae328fcSJohn Baldwin uma_zfree(unp_zone, unp); 158398271db4SGarrett Wollman } 158498271db4SGarrett Wollman } 1585e7c33e29SRobert Watson } 15868f364875SJulian Elischer free(xu, M_TEMP); 158798271db4SGarrett Wollman if (!error) { 158898271db4SGarrett Wollman /* 15891c381b19SRobert Watson * Give the user an updated idea of our state. If the 15901c381b19SRobert Watson * generation differs from what we told her before, she knows 15911c381b19SRobert Watson * that something happened while we were processing this 15921c381b19SRobert Watson * request, and it might be necessary to retry. 
159398271db4SGarrett Wollman */ 15948f364875SJulian Elischer xug->xug_gen = unp_gencnt; 15958f364875SJulian Elischer xug->xug_sogen = so_gencnt; 15968f364875SJulian Elischer xug->xug_count = unp_count; 15978f364875SJulian Elischer error = SYSCTL_OUT(req, xug, sizeof *xug); 159898271db4SGarrett Wollman } 159998271db4SGarrett Wollman free(unp_list, M_TEMP); 16008f364875SJulian Elischer free(xug, M_TEMP); 1601e5aeaa0cSDag-Erling Smørgrav return (error); 160298271db4SGarrett Wollman } 160398271db4SGarrett Wollman 16042fee06f0SMatthew D Fleming SYSCTL_PROC(_net_local_dgram, OID_AUTO, pcblist, CTLTYPE_OPAQUE | CTLFLAG_RD, 16052fee06f0SMatthew D Fleming (void *)(intptr_t)SOCK_DGRAM, 0, unp_pcblist, "S,xunpcb", 160698271db4SGarrett Wollman "List of active local datagram sockets"); 16072fee06f0SMatthew D Fleming SYSCTL_PROC(_net_local_stream, OID_AUTO, pcblist, CTLTYPE_OPAQUE | CTLFLAG_RD, 16082fee06f0SMatthew D Fleming (void *)(intptr_t)SOCK_STREAM, 0, unp_pcblist, "S,xunpcb", 160998271db4SGarrett Wollman "List of active local stream sockets"); 16102fee06f0SMatthew D Fleming SYSCTL_PROC(_net_local_seqpacket, OID_AUTO, pcblist, 16112fee06f0SMatthew D Fleming CTLTYPE_OPAQUE | CTLFLAG_RD, 16122fee06f0SMatthew D Fleming (void *)(intptr_t)SOCK_SEQPACKET, 0, unp_pcblist, "S,xunpcb", 161384d61770SRobert Watson "List of active local seqpacket sockets"); 161498271db4SGarrett Wollman 1615f708ef1bSPoul-Henning Kamp static void 1616892af6b9SRobert Watson unp_shutdown(struct unpcb *unp) 1617df8bae1dSRodney W. Grimes { 1618e7c33e29SRobert Watson struct unpcb *unp2; 1619df8bae1dSRodney W. Grimes struct socket *so; 1620df8bae1dSRodney W. 
Grimes 16213dab55bcSRobert Watson UNP_LINK_WLOCK_ASSERT(); 1622e7c33e29SRobert Watson UNP_PCB_LOCK_ASSERT(unp); 16230d9ce3a1SRobert Watson 1624e7c33e29SRobert Watson unp2 = unp->unp_conn; 162584d61770SRobert Watson if ((unp->unp_socket->so_type == SOCK_STREAM || 162684d61770SRobert Watson (unp->unp_socket->so_type == SOCK_SEQPACKET)) && unp2 != NULL) { 1627e7c33e29SRobert Watson so = unp2->unp_socket; 1628e7c33e29SRobert Watson if (so != NULL) 1629df8bae1dSRodney W. Grimes socantrcvmore(so); 1630df8bae1dSRodney W. Grimes } 1631e7c33e29SRobert Watson } 1632df8bae1dSRodney W. Grimes 1633f708ef1bSPoul-Henning Kamp static void 1634892af6b9SRobert Watson unp_drop(struct unpcb *unp, int errno) 1635df8bae1dSRodney W. Grimes { 1636df8bae1dSRodney W. Grimes struct socket *so = unp->unp_socket; 1637e7c33e29SRobert Watson struct unpcb *unp2; 1638df8bae1dSRodney W. Grimes 16393dab55bcSRobert Watson UNP_LINK_WLOCK_ASSERT(); 1640e7c33e29SRobert Watson UNP_PCB_LOCK_ASSERT(unp); 16410d9ce3a1SRobert Watson 1642df8bae1dSRodney W. Grimes so->so_error = errno; 1643e7c33e29SRobert Watson unp2 = unp->unp_conn; 1644e7c33e29SRobert Watson if (unp2 == NULL) 1645e7c33e29SRobert Watson return; 1646e7c33e29SRobert Watson UNP_PCB_LOCK(unp2); 1647e7c33e29SRobert Watson unp_disconnect(unp, unp2); 1648e7c33e29SRobert Watson UNP_PCB_UNLOCK(unp2); 1649df8bae1dSRodney W. Grimes } 1650df8bae1dSRodney W. Grimes 16512bc21ed9SDavid Malone static void 1652892af6b9SRobert Watson unp_freerights(struct file **rp, int fdcount) 1653df8bae1dSRodney W. Grimes { 16542bc21ed9SDavid Malone int i; 16552bc21ed9SDavid Malone struct file *fp; 1656df8bae1dSRodney W. Grimes 16572bc21ed9SDavid Malone for (i = 0; i < fdcount; i++) { 1658e7c33e29SRobert Watson fp = *rp; 1659e7c33e29SRobert Watson *rp++ = NULL; 16608692c025SYoshinobu Inoue unp_discard(fp); 1661df8bae1dSRodney W. 
Grimes } 16622bc21ed9SDavid Malone } 16632bc21ed9SDavid Malone 16640b36cd25SRobert Watson static int 1665892af6b9SRobert Watson unp_externalize(struct mbuf *control, struct mbuf **controlp) 16662bc21ed9SDavid Malone { 16672bc21ed9SDavid Malone struct thread *td = curthread; /* XXX */ 16682bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 16692bc21ed9SDavid Malone int i; 16702bc21ed9SDavid Malone int *fdp; 16712bc21ed9SDavid Malone struct file **rp; 16722bc21ed9SDavid Malone struct file *fp; 16732bc21ed9SDavid Malone void *data; 16742bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 16752bc21ed9SDavid Malone int error, newfds; 16762bc21ed9SDavid Malone int f; 16772bc21ed9SDavid Malone u_int newlen; 16782bc21ed9SDavid Malone 16793dab55bcSRobert Watson UNP_LINK_UNLOCK_ASSERT(); 16804c5bc1caSRobert Watson 16812bc21ed9SDavid Malone error = 0; 16822bc21ed9SDavid Malone if (controlp != NULL) /* controlp == NULL => free control messages */ 16832bc21ed9SDavid Malone *controlp = NULL; 16842bc21ed9SDavid Malone while (cm != NULL) { 16852bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) { 16862bc21ed9SDavid Malone error = EINVAL; 16872bc21ed9SDavid Malone break; 16882bc21ed9SDavid Malone } 16892bc21ed9SDavid Malone data = CMSG_DATA(cm); 16902bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 16912bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET 16922bc21ed9SDavid Malone && cm->cmsg_type == SCM_RIGHTS) { 16932bc21ed9SDavid Malone newfds = datalen / sizeof(struct file *); 16942bc21ed9SDavid Malone rp = data; 16952bc21ed9SDavid Malone 1696e2f9a08bSOlivier Houchard /* If we're not outputting the descriptors free them. 
*/ 16972bc21ed9SDavid Malone if (error || controlp == NULL) { 16982bc21ed9SDavid Malone unp_freerights(rp, newfds); 16992bc21ed9SDavid Malone goto next; 17002bc21ed9SDavid Malone } 17015e3f7694SRobert Watson FILEDESC_XLOCK(td->td_proc->p_fd); 17022bc21ed9SDavid Malone /* if the new FD's will not fit free them. */ 17032bc21ed9SDavid Malone if (!fdavail(td, newfds)) { 17045e3f7694SRobert Watson FILEDESC_XUNLOCK(td->td_proc->p_fd); 17052bc21ed9SDavid Malone error = EMSGSIZE; 17062bc21ed9SDavid Malone unp_freerights(rp, newfds); 17072bc21ed9SDavid Malone goto next; 1708df8bae1dSRodney W. Grimes } 170960a5ef26SRobert Watson 1710ed5b7817SJulian Elischer /* 17111c381b19SRobert Watson * Now change each pointer to an fd in the global 17121c381b19SRobert Watson * table to an integer that is the index to the local 17131c381b19SRobert Watson * fd table entry that we set up to point to the 17141c381b19SRobert Watson * global one we are transferring. 1715ed5b7817SJulian Elischer */ 17162bc21ed9SDavid Malone newlen = newfds * sizeof(int); 17172bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 17182bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 17192bc21ed9SDavid Malone if (*controlp == NULL) { 17205e3f7694SRobert Watson FILEDESC_XUNLOCK(td->td_proc->p_fd); 17212bc21ed9SDavid Malone error = E2BIG; 17222bc21ed9SDavid Malone unp_freerights(rp, newfds); 17232bc21ed9SDavid Malone goto next; 17242bc21ed9SDavid Malone } 17252bc21ed9SDavid Malone 17262bc21ed9SDavid Malone fdp = (int *) 17272bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 1728df8bae1dSRodney W. Grimes for (i = 0; i < newfds; i++) { 1729a6d4491cSDag-Erling Smørgrav if (fdalloc(td, 0, &f)) 17302bc21ed9SDavid Malone panic("unp_externalize fdalloc failed"); 17318692c025SYoshinobu Inoue fp = *rp++; 1732b40ce416SJulian Elischer td->td_proc->p_fd->fd_ofiles[f] = fp; 1733397c19d1SJeff Roberson unp_externalize_fp(fp); 17348692c025SYoshinobu Inoue *fdp++ = f; 1735df8bae1dSRodney W. 
Grimes } 17365e3f7694SRobert Watson FILEDESC_XUNLOCK(td->td_proc->p_fd); 17371c381b19SRobert Watson } else { 17381c381b19SRobert Watson /* We can just copy anything else across. */ 17392bc21ed9SDavid Malone if (error || controlp == NULL) 17402bc21ed9SDavid Malone goto next; 17412bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, datalen, 17422bc21ed9SDavid Malone cm->cmsg_type, cm->cmsg_level); 17432bc21ed9SDavid Malone if (*controlp == NULL) { 17442bc21ed9SDavid Malone error = ENOBUFS; 17452bc21ed9SDavid Malone goto next; 17462bc21ed9SDavid Malone } 17472bc21ed9SDavid Malone bcopy(data, 17482bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)), 17492bc21ed9SDavid Malone datalen); 17502bc21ed9SDavid Malone } 17512bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 17522bc21ed9SDavid Malone 17532bc21ed9SDavid Malone next: 17542bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 17552bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 17562bc21ed9SDavid Malone cm = (struct cmsghdr *) 17572bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 17588692c025SYoshinobu Inoue } else { 17592bc21ed9SDavid Malone clen = 0; 17602bc21ed9SDavid Malone cm = NULL; 17618692c025SYoshinobu Inoue } 17628692c025SYoshinobu Inoue } 17638692c025SYoshinobu Inoue 17642bc21ed9SDavid Malone m_freem(control); 17652bc21ed9SDavid Malone return (error); 1766df8bae1dSRodney W. Grimes } 1767df8bae1dSRodney W. 
Grimes 17684f590175SPaul Saab static void 17694f590175SPaul Saab unp_zone_change(void *tag) 17704f590175SPaul Saab { 17714f590175SPaul Saab 17724f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 17734f590175SPaul Saab } 17744f590175SPaul Saab 17750b36cd25SRobert Watson static void 177698271db4SGarrett Wollman unp_init(void) 177798271db4SGarrett Wollman { 17781c381b19SRobert Watson 177921ca7b57SMarko Zec #ifdef VIMAGE 178021ca7b57SMarko Zec if (!IS_DEFAULT_VNET(curvnet)) 178121ca7b57SMarko Zec return; 178221ca7b57SMarko Zec #endif 17839e9d298aSJeff Roberson unp_zone = uma_zcreate("unpcb", sizeof(struct unpcb), NULL, NULL, 17849ae328fcSJohn Baldwin NULL, NULL, UMA_ALIGN_PTR, 0); 1785fc3fcacfSRobert Watson if (unp_zone == NULL) 178698271db4SGarrett Wollman panic("unp_init"); 17874f590175SPaul Saab uma_zone_set_max(unp_zone, maxsockets); 17884f590175SPaul Saab EVENTHANDLER_REGISTER(maxsockets_change, unp_zone_change, 17894f590175SPaul Saab NULL, EVENTHANDLER_PRI_ANY); 179098271db4SGarrett Wollman LIST_INIT(&unp_dhead); 179198271db4SGarrett Wollman LIST_INIT(&unp_shead); 179284d61770SRobert Watson LIST_INIT(&unp_sphead); 17930cb64678SKonstantin Belousov SLIST_INIT(&unp_defers); 1794a0ec558aSRobert Watson TASK_INIT(&unp_gc_task, 0, unp_gc, NULL); 17950cb64678SKonstantin Belousov TASK_INIT(&unp_defer_task, 0, unp_process_defers, NULL); 17963dab55bcSRobert Watson UNP_LINK_LOCK_INIT(); 17973dab55bcSRobert Watson UNP_LIST_LOCK_INIT(); 17980cb64678SKonstantin Belousov UNP_DEFERRED_LOCK_INIT(); 179998271db4SGarrett Wollman } 180098271db4SGarrett Wollman 1801f708ef1bSPoul-Henning Kamp static int 1802892af6b9SRobert Watson unp_internalize(struct mbuf **controlp, struct thread *td) 1803df8bae1dSRodney W. 
Grimes { 18042bc21ed9SDavid Malone struct mbuf *control = *controlp; 1805b40ce416SJulian Elischer struct proc *p = td->td_proc; 18068692c025SYoshinobu Inoue struct filedesc *fdescp = p->p_fd; 18072bc21ed9SDavid Malone struct cmsghdr *cm = mtod(control, struct cmsghdr *); 18082bc21ed9SDavid Malone struct cmsgcred *cmcred; 18092bc21ed9SDavid Malone struct file **rp; 18102bc21ed9SDavid Malone struct file *fp; 18112bc21ed9SDavid Malone struct timeval *tv; 18122bc21ed9SDavid Malone int i, fd, *fdp; 18132bc21ed9SDavid Malone void *data; 18142bc21ed9SDavid Malone socklen_t clen = control->m_len, datalen; 18152bc21ed9SDavid Malone int error, oldfds; 18168692c025SYoshinobu Inoue u_int newlen; 1817df8bae1dSRodney W. Grimes 18183dab55bcSRobert Watson UNP_LINK_UNLOCK_ASSERT(); 18194c5bc1caSRobert Watson 18202bc21ed9SDavid Malone error = 0; 18212bc21ed9SDavid Malone *controlp = NULL; 18222bc21ed9SDavid Malone while (cm != NULL) { 18232bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_level != SOL_SOCKET 18242bc21ed9SDavid Malone || cm->cmsg_len > clen) { 18252bc21ed9SDavid Malone error = EINVAL; 18262bc21ed9SDavid Malone goto out; 18272bc21ed9SDavid Malone } 18282bc21ed9SDavid Malone data = CMSG_DATA(cm); 18292bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len - (caddr_t)data; 18302bc21ed9SDavid Malone 18312bc21ed9SDavid Malone switch (cm->cmsg_type) { 18320b788fa1SBill Paul /* 18330b788fa1SBill Paul * Fill in credential information. 
18340b788fa1SBill Paul */ 18352bc21ed9SDavid Malone case SCM_CREDS: 18362bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*cmcred), 18372bc21ed9SDavid Malone SCM_CREDS, SOL_SOCKET); 18382bc21ed9SDavid Malone if (*controlp == NULL) { 18392bc21ed9SDavid Malone error = ENOBUFS; 18402bc21ed9SDavid Malone goto out; 18412bc21ed9SDavid Malone } 18422bc21ed9SDavid Malone cmcred = (struct cmsgcred *) 18432bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 18440b788fa1SBill Paul cmcred->cmcred_pid = p->p_pid; 1845a854ed98SJohn Baldwin cmcred->cmcred_uid = td->td_ucred->cr_ruid; 1846a854ed98SJohn Baldwin cmcred->cmcred_gid = td->td_ucred->cr_rgid; 1847a854ed98SJohn Baldwin cmcred->cmcred_euid = td->td_ucred->cr_uid; 1848a854ed98SJohn Baldwin cmcred->cmcred_ngroups = MIN(td->td_ucred->cr_ngroups, 18490b788fa1SBill Paul CMGROUP_MAX); 18500b788fa1SBill Paul for (i = 0; i < cmcred->cmcred_ngroups; i++) 18512bc21ed9SDavid Malone cmcred->cmcred_groups[i] = 1852a854ed98SJohn Baldwin td->td_ucred->cr_groups[i]; 18532bc21ed9SDavid Malone break; 18540b788fa1SBill Paul 18552bc21ed9SDavid Malone case SCM_RIGHTS: 18562bc21ed9SDavid Malone oldfds = datalen / sizeof (int); 1857ed5b7817SJulian Elischer /* 18581c381b19SRobert Watson * Check that all the FDs passed in refer to legal 18591c381b19SRobert Watson * files. If not, reject the entire operation. 1860ed5b7817SJulian Elischer */ 18612bc21ed9SDavid Malone fdp = data; 18625e3f7694SRobert Watson FILEDESC_SLOCK(fdescp); 1863df8bae1dSRodney W. 
Grimes for (i = 0; i < oldfds; i++) { 18648692c025SYoshinobu Inoue fd = *fdp++; 18658692c025SYoshinobu Inoue if ((unsigned)fd >= fdescp->fd_nfiles || 18662bc21ed9SDavid Malone fdescp->fd_ofiles[fd] == NULL) { 18675e3f7694SRobert Watson FILEDESC_SUNLOCK(fdescp); 18682bc21ed9SDavid Malone error = EBADF; 18692bc21ed9SDavid Malone goto out; 18702bc21ed9SDavid Malone } 1871e7d6662fSAlfred Perlstein fp = fdescp->fd_ofiles[fd]; 1872e7d6662fSAlfred Perlstein if (!(fp->f_ops->fo_flags & DFLAG_PASSABLE)) { 18735e3f7694SRobert Watson FILEDESC_SUNLOCK(fdescp); 1874e7d6662fSAlfred Perlstein error = EOPNOTSUPP; 1875e7d6662fSAlfred Perlstein goto out; 1876e7d6662fSAlfred Perlstein } 1877e7d6662fSAlfred Perlstein 1878df8bae1dSRodney W. Grimes } 18795e3f7694SRobert Watson 1880ed5b7817SJulian Elischer /* 18810b36cd25SRobert Watson * Now replace the integer FDs with pointers to the 18820b36cd25SRobert Watson * associated global file table entry.. 1883ed5b7817SJulian Elischer */ 18842bc21ed9SDavid Malone newlen = oldfds * sizeof(struct file *); 18852bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, newlen, 18862bc21ed9SDavid Malone SCM_RIGHTS, SOL_SOCKET); 18872bc21ed9SDavid Malone if (*controlp == NULL) { 18885e3f7694SRobert Watson FILEDESC_SUNLOCK(fdescp); 18892bc21ed9SDavid Malone error = E2BIG; 18902bc21ed9SDavid Malone goto out; 18918692c025SYoshinobu Inoue } 18922bc21ed9SDavid Malone fdp = data; 18932bc21ed9SDavid Malone rp = (struct file **) 18942bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 18958692c025SYoshinobu Inoue for (i = 0; i < oldfds; i++) { 18968692c025SYoshinobu Inoue fp = fdescp->fd_ofiles[*fdp++]; 1897df8bae1dSRodney W. Grimes *rp++ = fp; 1898397c19d1SJeff Roberson unp_internalize_fp(fp); 1899df8bae1dSRodney W. 
Grimes } 19005e3f7694SRobert Watson FILEDESC_SUNLOCK(fdescp); 19012bc21ed9SDavid Malone break; 19022bc21ed9SDavid Malone 19032bc21ed9SDavid Malone case SCM_TIMESTAMP: 19042bc21ed9SDavid Malone *controlp = sbcreatecontrol(NULL, sizeof(*tv), 19052bc21ed9SDavid Malone SCM_TIMESTAMP, SOL_SOCKET); 19062bc21ed9SDavid Malone if (*controlp == NULL) { 19072bc21ed9SDavid Malone error = ENOBUFS; 19082bc21ed9SDavid Malone goto out; 19098692c025SYoshinobu Inoue } 19102bc21ed9SDavid Malone tv = (struct timeval *) 19112bc21ed9SDavid Malone CMSG_DATA(mtod(*controlp, struct cmsghdr *)); 19122bc21ed9SDavid Malone microtime(tv); 19132bc21ed9SDavid Malone break; 19142bc21ed9SDavid Malone 19152bc21ed9SDavid Malone default: 19162bc21ed9SDavid Malone error = EINVAL; 19172bc21ed9SDavid Malone goto out; 19182bc21ed9SDavid Malone } 19192bc21ed9SDavid Malone 19202bc21ed9SDavid Malone controlp = &(*controlp)->m_next; 19212bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 19222bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 19232bc21ed9SDavid Malone cm = (struct cmsghdr *) 19242bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 19252bc21ed9SDavid Malone } else { 19262bc21ed9SDavid Malone clen = 0; 19272bc21ed9SDavid Malone cm = NULL; 19282bc21ed9SDavid Malone } 19292bc21ed9SDavid Malone } 19302bc21ed9SDavid Malone 19312bc21ed9SDavid Malone out: 19322bc21ed9SDavid Malone m_freem(control); 19332bc21ed9SDavid Malone return (error); 1934df8bae1dSRodney W. Grimes } 1935df8bae1dSRodney W. Grimes 19365b950deaSRobert Watson static struct mbuf * 19376a2989fdSMatthew N. Dodd unp_addsockcred(struct thread *td, struct mbuf *control) 19386a2989fdSMatthew N. Dodd { 193970df31f4SMaxim Konovalov struct mbuf *m, *n, *n_prev; 19406a2989fdSMatthew N. Dodd struct sockcred *sc; 194170df31f4SMaxim Konovalov const struct cmsghdr *cm; 19426a2989fdSMatthew N. Dodd int ngroups; 19436a2989fdSMatthew N. Dodd int i; 19446a2989fdSMatthew N. Dodd 19456a2989fdSMatthew N. 
Dodd ngroups = MIN(td->td_ucred->cr_ngroups, CMGROUP_MAX); 19466a2989fdSMatthew N. Dodd m = sbcreatecontrol(NULL, SOCKCREDSIZE(ngroups), SCM_CREDS, SOL_SOCKET); 19476a2989fdSMatthew N. Dodd if (m == NULL) 19486a2989fdSMatthew N. Dodd return (control); 19496a2989fdSMatthew N. Dodd 19506a2989fdSMatthew N. Dodd sc = (struct sockcred *) CMSG_DATA(mtod(m, struct cmsghdr *)); 19516a2989fdSMatthew N. Dodd sc->sc_uid = td->td_ucred->cr_ruid; 19526a2989fdSMatthew N. Dodd sc->sc_euid = td->td_ucred->cr_uid; 19536a2989fdSMatthew N. Dodd sc->sc_gid = td->td_ucred->cr_rgid; 19546a2989fdSMatthew N. Dodd sc->sc_egid = td->td_ucred->cr_gid; 19556a2989fdSMatthew N. Dodd sc->sc_ngroups = ngroups; 19566a2989fdSMatthew N. Dodd for (i = 0; i < sc->sc_ngroups; i++) 19576a2989fdSMatthew N. Dodd sc->sc_groups[i] = td->td_ucred->cr_groups[i]; 19586a2989fdSMatthew N. Dodd 19596a2989fdSMatthew N. Dodd /* 19601c381b19SRobert Watson * Unlink SCM_CREDS control messages (struct cmsgcred), since just 19611c381b19SRobert Watson * created SCM_CREDS control message (struct sockcred) has another 19621c381b19SRobert Watson * format. 19636a2989fdSMatthew N. Dodd */ 196470df31f4SMaxim Konovalov if (control != NULL) 196570df31f4SMaxim Konovalov for (n = control, n_prev = NULL; n != NULL;) { 196670df31f4SMaxim Konovalov cm = mtod(n, struct cmsghdr *); 196770df31f4SMaxim Konovalov if (cm->cmsg_level == SOL_SOCKET && 196870df31f4SMaxim Konovalov cm->cmsg_type == SCM_CREDS) { 196970df31f4SMaxim Konovalov if (n_prev == NULL) 197070df31f4SMaxim Konovalov control = n->m_next; 197170df31f4SMaxim Konovalov else 197270df31f4SMaxim Konovalov n_prev->m_next = n->m_next; 197370df31f4SMaxim Konovalov n = m_free(n); 197470df31f4SMaxim Konovalov } else { 197570df31f4SMaxim Konovalov n_prev = n; 197670df31f4SMaxim Konovalov n = n->m_next; 197770df31f4SMaxim Konovalov } 197870df31f4SMaxim Konovalov } 19796a2989fdSMatthew N. Dodd 198070df31f4SMaxim Konovalov /* Prepend it to the head. 
*/ 198170df31f4SMaxim Konovalov m->m_next = control; 198270df31f4SMaxim Konovalov return (m); 19836a2989fdSMatthew N. Dodd } 19846a2989fdSMatthew N. Dodd 1985397c19d1SJeff Roberson static struct unpcb * 1986397c19d1SJeff Roberson fptounp(struct file *fp) 1987397c19d1SJeff Roberson { 1988397c19d1SJeff Roberson struct socket *so; 1989397c19d1SJeff Roberson 1990397c19d1SJeff Roberson if (fp->f_type != DTYPE_SOCKET) 1991397c19d1SJeff Roberson return (NULL); 1992397c19d1SJeff Roberson if ((so = fp->f_data) == NULL) 1993397c19d1SJeff Roberson return (NULL); 1994397c19d1SJeff Roberson if (so->so_proto->pr_domain != &localdomain) 1995397c19d1SJeff Roberson return (NULL); 1996397c19d1SJeff Roberson return sotounpcb(so); 1997397c19d1SJeff Roberson } 1998397c19d1SJeff Roberson 1999397c19d1SJeff Roberson static void 2000397c19d1SJeff Roberson unp_discard(struct file *fp) 2001397c19d1SJeff Roberson { 20020cb64678SKonstantin Belousov struct unp_defer *dr; 2003397c19d1SJeff Roberson 20040cb64678SKonstantin Belousov if (unp_externalize_fp(fp)) { 20050cb64678SKonstantin Belousov dr = malloc(sizeof(*dr), M_TEMP, M_WAITOK); 20060cb64678SKonstantin Belousov dr->ud_fp = fp; 20070cb64678SKonstantin Belousov UNP_DEFERRED_LOCK(); 20080cb64678SKonstantin Belousov SLIST_INSERT_HEAD(&unp_defers, dr, ud_link); 20090cb64678SKonstantin Belousov UNP_DEFERRED_UNLOCK(); 20100cb64678SKonstantin Belousov atomic_add_int(&unp_defers_count, 1); 20110cb64678SKonstantin Belousov taskqueue_enqueue(taskqueue_thread, &unp_defer_task); 20120cb64678SKonstantin Belousov } else 2013397c19d1SJeff Roberson (void) closef(fp, (struct thread *)NULL); 2014397c19d1SJeff Roberson } 2015397c19d1SJeff Roberson 2016397c19d1SJeff Roberson static void 20170cb64678SKonstantin Belousov unp_process_defers(void *arg __unused, int pending) 20180cb64678SKonstantin Belousov { 20190cb64678SKonstantin Belousov struct unp_defer *dr; 20200cb64678SKonstantin Belousov SLIST_HEAD(, unp_defer) drl; 20210cb64678SKonstantin Belousov int 
count; 20220cb64678SKonstantin Belousov 20230cb64678SKonstantin Belousov SLIST_INIT(&drl); 20240cb64678SKonstantin Belousov for (;;) { 20250cb64678SKonstantin Belousov UNP_DEFERRED_LOCK(); 20260cb64678SKonstantin Belousov if (SLIST_FIRST(&unp_defers) == NULL) { 20270cb64678SKonstantin Belousov UNP_DEFERRED_UNLOCK(); 20280cb64678SKonstantin Belousov break; 20290cb64678SKonstantin Belousov } 20300cb64678SKonstantin Belousov SLIST_SWAP(&unp_defers, &drl, unp_defer); 20310cb64678SKonstantin Belousov UNP_DEFERRED_UNLOCK(); 20320cb64678SKonstantin Belousov count = 0; 20330cb64678SKonstantin Belousov while ((dr = SLIST_FIRST(&drl)) != NULL) { 20340cb64678SKonstantin Belousov SLIST_REMOVE_HEAD(&drl, ud_link); 20350cb64678SKonstantin Belousov closef(dr->ud_fp, NULL); 20360cb64678SKonstantin Belousov free(dr, M_TEMP); 20370cb64678SKonstantin Belousov count++; 20380cb64678SKonstantin Belousov } 20390cb64678SKonstantin Belousov atomic_add_int(&unp_defers_count, -count); 20400cb64678SKonstantin Belousov } 20410cb64678SKonstantin Belousov } 20420cb64678SKonstantin Belousov 20430cb64678SKonstantin Belousov static void 2044397c19d1SJeff Roberson unp_internalize_fp(struct file *fp) 2045397c19d1SJeff Roberson { 2046397c19d1SJeff Roberson struct unpcb *unp; 2047397c19d1SJeff Roberson 20483dab55bcSRobert Watson UNP_LINK_WLOCK(); 2049397c19d1SJeff Roberson if ((unp = fptounp(fp)) != NULL) { 2050397c19d1SJeff Roberson unp->unp_file = fp; 2051397c19d1SJeff Roberson unp->unp_msgcount++; 2052397c19d1SJeff Roberson } 205341e0f66dSJeff Roberson fhold(fp); 2054397c19d1SJeff Roberson unp_rights++; 20553dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 2056397c19d1SJeff Roberson } 2057397c19d1SJeff Roberson 20580cb64678SKonstantin Belousov static int 2059397c19d1SJeff Roberson unp_externalize_fp(struct file *fp) 2060397c19d1SJeff Roberson { 2061397c19d1SJeff Roberson struct unpcb *unp; 20620cb64678SKonstantin Belousov int ret; 2063397c19d1SJeff Roberson 20643dab55bcSRobert Watson UNP_LINK_WLOCK(); 
20650cb64678SKonstantin Belousov if ((unp = fptounp(fp)) != NULL) { 2066397c19d1SJeff Roberson unp->unp_msgcount--; 20670cb64678SKonstantin Belousov ret = 1; 20680cb64678SKonstantin Belousov } else 20690cb64678SKonstantin Belousov ret = 0; 2070397c19d1SJeff Roberson unp_rights--; 20713dab55bcSRobert Watson UNP_LINK_WUNLOCK(); 20720cb64678SKonstantin Belousov return (ret); 2073397c19d1SJeff Roberson } 2074397c19d1SJeff Roberson 2075161a0c7cSRobert Watson /* 2076a0ec558aSRobert Watson * unp_defer indicates whether additional work has been defered for a future 2077a0ec558aSRobert Watson * pass through unp_gc(). It is thread local and does not require explicit 2078a0ec558aSRobert Watson * synchronization. 2079161a0c7cSRobert Watson */ 2080397c19d1SJeff Roberson static int unp_marked; 2081397c19d1SJeff Roberson static int unp_unreachable; 2082a0ec558aSRobert Watson 2083397c19d1SJeff Roberson static void 2084397c19d1SJeff Roberson unp_accessable(struct file *fp) 2085397c19d1SJeff Roberson { 2086397c19d1SJeff Roberson struct unpcb *unp; 2087397c19d1SJeff Roberson 20886f552cb0SJeff Roberson if ((unp = fptounp(fp)) == NULL) 2089397c19d1SJeff Roberson return; 2090397c19d1SJeff Roberson if (unp->unp_gcflag & UNPGC_REF) 2091397c19d1SJeff Roberson return; 2092397c19d1SJeff Roberson unp->unp_gcflag &= ~UNPGC_DEAD; 2093397c19d1SJeff Roberson unp->unp_gcflag |= UNPGC_REF; 2094397c19d1SJeff Roberson unp_marked++; 2095397c19d1SJeff Roberson } 2096397c19d1SJeff Roberson 2097397c19d1SJeff Roberson static void 2098397c19d1SJeff Roberson unp_gc_process(struct unpcb *unp) 2099397c19d1SJeff Roberson { 2100397c19d1SJeff Roberson struct socket *soa; 2101397c19d1SJeff Roberson struct socket *so; 2102397c19d1SJeff Roberson struct file *fp; 2103397c19d1SJeff Roberson 2104397c19d1SJeff Roberson /* Already processed. 
*/ 2105397c19d1SJeff Roberson if (unp->unp_gcflag & UNPGC_SCANNED) 2106397c19d1SJeff Roberson return; 2107397c19d1SJeff Roberson fp = unp->unp_file; 210860a5ef26SRobert Watson 2109397c19d1SJeff Roberson /* 2110397c19d1SJeff Roberson * Check for a socket potentially in a cycle. It must be in a 2111397c19d1SJeff Roberson * queue as indicated by msgcount, and this must equal the file 2112397c19d1SJeff Roberson * reference count. Note that when msgcount is 0 the file is NULL. 2113397c19d1SJeff Roberson */ 211441e0f66dSJeff Roberson if ((unp->unp_gcflag & UNPGC_REF) == 0 && fp && 211541e0f66dSJeff Roberson unp->unp_msgcount != 0 && fp->f_count == unp->unp_msgcount) { 2116397c19d1SJeff Roberson unp->unp_gcflag |= UNPGC_DEAD; 2117397c19d1SJeff Roberson unp_unreachable++; 2118397c19d1SJeff Roberson return; 2119397c19d1SJeff Roberson } 212060a5ef26SRobert Watson 2121397c19d1SJeff Roberson /* 2122397c19d1SJeff Roberson * Mark all sockets we reference with RIGHTS. 2123397c19d1SJeff Roberson */ 2124397c19d1SJeff Roberson so = unp->unp_socket; 2125397c19d1SJeff Roberson SOCKBUF_LOCK(&so->so_rcv); 2126397c19d1SJeff Roberson unp_scan(so->so_rcv.sb_mb, unp_accessable); 2127397c19d1SJeff Roberson SOCKBUF_UNLOCK(&so->so_rcv); 212860a5ef26SRobert Watson 2129397c19d1SJeff Roberson /* 2130397c19d1SJeff Roberson * Mark all sockets in our accept queue. 
2131397c19d1SJeff Roberson */ 2132397c19d1SJeff Roberson ACCEPT_LOCK(); 2133397c19d1SJeff Roberson TAILQ_FOREACH(soa, &so->so_comp, so_list) { 2134397c19d1SJeff Roberson SOCKBUF_LOCK(&soa->so_rcv); 2135397c19d1SJeff Roberson unp_scan(soa->so_rcv.sb_mb, unp_accessable); 2136397c19d1SJeff Roberson SOCKBUF_UNLOCK(&soa->so_rcv); 2137397c19d1SJeff Roberson } 2138397c19d1SJeff Roberson ACCEPT_UNLOCK(); 2139397c19d1SJeff Roberson unp->unp_gcflag |= UNPGC_SCANNED; 2140397c19d1SJeff Roberson } 2141a0ec558aSRobert Watson 2142a0ec558aSRobert Watson static int unp_recycled; 2143be6b1304STom Rhodes SYSCTL_INT(_net_local, OID_AUTO, recycled, CTLFLAG_RD, &unp_recycled, 0, 2144be6b1304STom Rhodes "Number of unreachable sockets claimed by the garbage collector."); 2145df8bae1dSRodney W. Grimes 2146397c19d1SJeff Roberson static int unp_taskcount; 2147be6b1304STom Rhodes SYSCTL_INT(_net_local, OID_AUTO, taskcount, CTLFLAG_RD, &unp_taskcount, 0, 2148be6b1304STom Rhodes "Number of times the garbage collector has run."); 2149397c19d1SJeff Roberson 2150f708ef1bSPoul-Henning Kamp static void 2151a0ec558aSRobert Watson unp_gc(__unused void *arg, int pending) 2152df8bae1dSRodney W. Grimes { 215384d61770SRobert Watson struct unp_head *heads[] = { &unp_dhead, &unp_shead, &unp_sphead, 215484d61770SRobert Watson NULL }; 2155397c19d1SJeff Roberson struct unp_head **head; 2156*f7780c61SKonstantin Belousov struct file *f, **unref; 2157397c19d1SJeff Roberson struct unpcb *unp; 2158*f7780c61SKonstantin Belousov int i, total; 2159df8bae1dSRodney W. Grimes 2160a0ec558aSRobert Watson unp_taskcount++; 21613dab55bcSRobert Watson UNP_LIST_LOCK(); 2162ed5b7817SJulian Elischer /* 2163397c19d1SJeff Roberson * First clear all gc flags from previous runs. 
2164ed5b7817SJulian Elischer */ 2165397c19d1SJeff Roberson for (head = heads; *head != NULL; head++) 2166397c19d1SJeff Roberson LIST_FOREACH(unp, *head, unp_link) 216741e0f66dSJeff Roberson unp->unp_gcflag = 0; 216860a5ef26SRobert Watson 2169397c19d1SJeff Roberson /* 2170397c19d1SJeff Roberson * Scan marking all reachable sockets with UNPGC_REF. Once a socket 2171397c19d1SJeff Roberson * is reachable all of the sockets it references are reachable. 2172397c19d1SJeff Roberson * Stop the scan once we do a complete loop without discovering 2173397c19d1SJeff Roberson * a new reachable socket. 2174397c19d1SJeff Roberson */ 2175df8bae1dSRodney W. Grimes do { 2176397c19d1SJeff Roberson unp_unreachable = 0; 2177397c19d1SJeff Roberson unp_marked = 0; 2178397c19d1SJeff Roberson for (head = heads; *head != NULL; head++) 2179397c19d1SJeff Roberson LIST_FOREACH(unp, *head, unp_link) 2180397c19d1SJeff Roberson unp_gc_process(unp); 2181397c19d1SJeff Roberson } while (unp_marked); 21823dab55bcSRobert Watson UNP_LIST_UNLOCK(); 2183397c19d1SJeff Roberson if (unp_unreachable == 0) 2184397c19d1SJeff Roberson return; 218560a5ef26SRobert Watson 2186ed5b7817SJulian Elischer /* 2187397c19d1SJeff Roberson * Allocate space for a local list of dead unpcbs. 2188ed5b7817SJulian Elischer */ 2189397c19d1SJeff Roberson unref = malloc(unp_unreachable * sizeof(struct file *), 2190397c19d1SJeff Roberson M_TEMP, M_WAITOK); 219160a5ef26SRobert Watson 2192ed5b7817SJulian Elischer /* 2193397c19d1SJeff Roberson * Iterate looking for sockets which have been specifically marked 2194397c19d1SJeff Roberson * as as unreachable and store them locally. 
2195ed5b7817SJulian Elischer */ 2196*f7780c61SKonstantin Belousov UNP_LINK_RLOCK(); 21973dab55bcSRobert Watson UNP_LIST_LOCK(); 2198*f7780c61SKonstantin Belousov for (total = 0, head = heads; *head != NULL; head++) 2199397c19d1SJeff Roberson LIST_FOREACH(unp, *head, unp_link) 2200*f7780c61SKonstantin Belousov if ((unp->unp_gcflag & UNPGC_DEAD) != 0) { 2201*f7780c61SKonstantin Belousov f = unp->unp_file; 2202*f7780c61SKonstantin Belousov if (unp->unp_msgcount == 0 || f == NULL || 2203*f7780c61SKonstantin Belousov f->f_count != unp->unp_msgcount) 2204*f7780c61SKonstantin Belousov continue; 2205*f7780c61SKonstantin Belousov unref[total++] = f; 2206*f7780c61SKonstantin Belousov fhold(f); 2207*f7780c61SKonstantin Belousov KASSERT(total <= unp_unreachable, 2208397c19d1SJeff Roberson ("unp_gc: incorrect unreachable count.")); 2209397c19d1SJeff Roberson } 22103dab55bcSRobert Watson UNP_LIST_UNLOCK(); 2211*f7780c61SKonstantin Belousov UNP_LINK_RUNLOCK(); 221260a5ef26SRobert Watson 2213ed5b7817SJulian Elischer /* 2214397c19d1SJeff Roberson * Now flush all sockets, free'ing rights. This will free the 2215397c19d1SJeff Roberson * struct files associated with these sockets but leave each socket 2216397c19d1SJeff Roberson * with one remaining ref. 2217ed5b7817SJulian Elischer */ 2218*f7780c61SKonstantin Belousov for (i = 0; i < total; i++) 2219397c19d1SJeff Roberson sorflush(unref[i]->f_data); 222060a5ef26SRobert Watson 2221ed5b7817SJulian Elischer /* 2222397c19d1SJeff Roberson * And finally release the sockets so they can be reclaimed. 2223ed5b7817SJulian Elischer */ 2224*f7780c61SKonstantin Belousov for (i = 0; i < total; i++) 2225397c19d1SJeff Roberson fdrop(unref[i], NULL); 2226*f7780c61SKonstantin Belousov unp_recycled += total; 2227397c19d1SJeff Roberson free(unref, M_TEMP); 2228df8bae1dSRodney W. Grimes } 2229df8bae1dSRodney W. Grimes 22300b36cd25SRobert Watson static void 2231892af6b9SRobert Watson unp_dispose(struct mbuf *m) 2232df8bae1dSRodney W. 
Grimes { 2233996c772fSJohn Dyson 2234df8bae1dSRodney W. Grimes if (m) 2235df8bae1dSRodney W. Grimes unp_scan(m, unp_discard); 2236df8bae1dSRodney W. Grimes } 2237df8bae1dSRodney W. Grimes 2238f708ef1bSPoul-Henning Kamp static void 2239892af6b9SRobert Watson unp_scan(struct mbuf *m0, void (*op)(struct file *)) 2240df8bae1dSRodney W. Grimes { 22412bc21ed9SDavid Malone struct mbuf *m; 22422bc21ed9SDavid Malone struct file **rp; 22432bc21ed9SDavid Malone struct cmsghdr *cm; 22442bc21ed9SDavid Malone void *data; 22452bc21ed9SDavid Malone int i; 22462bc21ed9SDavid Malone socklen_t clen, datalen; 2247df8bae1dSRodney W. Grimes int qfds; 2248df8bae1dSRodney W. Grimes 2249fc3fcacfSRobert Watson while (m0 != NULL) { 22502bc21ed9SDavid Malone for (m = m0; m; m = m->m_next) { 225112396bdcSDavid Malone if (m->m_type != MT_CONTROL) 2252df8bae1dSRodney W. Grimes continue; 22532bc21ed9SDavid Malone 22542bc21ed9SDavid Malone cm = mtod(m, struct cmsghdr *); 22552bc21ed9SDavid Malone clen = m->m_len; 22562bc21ed9SDavid Malone 22572bc21ed9SDavid Malone while (cm != NULL) { 22582bc21ed9SDavid Malone if (sizeof(*cm) > clen || cm->cmsg_len > clen) 22592bc21ed9SDavid Malone break; 22602bc21ed9SDavid Malone 22612bc21ed9SDavid Malone data = CMSG_DATA(cm); 22622bc21ed9SDavid Malone datalen = (caddr_t)cm + cm->cmsg_len 22632bc21ed9SDavid Malone - (caddr_t)data; 22642bc21ed9SDavid Malone 22652bc21ed9SDavid Malone if (cm->cmsg_level == SOL_SOCKET && 22662bc21ed9SDavid Malone cm->cmsg_type == SCM_RIGHTS) { 22672bc21ed9SDavid Malone qfds = datalen / sizeof (struct file *); 22682bc21ed9SDavid Malone rp = data; 2269df8bae1dSRodney W. Grimes for (i = 0; i < qfds; i++) 2270df8bae1dSRodney W. 
Grimes (*op)(*rp++); 22712bc21ed9SDavid Malone } 22722bc21ed9SDavid Malone 22732bc21ed9SDavid Malone if (CMSG_SPACE(datalen) < clen) { 22742bc21ed9SDavid Malone clen -= CMSG_SPACE(datalen); 22752bc21ed9SDavid Malone cm = (struct cmsghdr *) 22762bc21ed9SDavid Malone ((caddr_t)cm + CMSG_SPACE(datalen)); 22772bc21ed9SDavid Malone } else { 22782bc21ed9SDavid Malone clen = 0; 22792bc21ed9SDavid Malone cm = NULL; 22802bc21ed9SDavid Malone } 22812bc21ed9SDavid Malone } 2282df8bae1dSRodney W. Grimes } 2283df8bae1dSRodney W. Grimes m0 = m0->m_act; 2284df8bae1dSRodney W. Grimes } 2285df8bae1dSRodney W. Grimes } 2286df8bae1dSRodney W. Grimes 228703c96c31SRobert Watson #ifdef DDB 228803c96c31SRobert Watson static void 228903c96c31SRobert Watson db_print_indent(int indent) 229003c96c31SRobert Watson { 229103c96c31SRobert Watson int i; 229203c96c31SRobert Watson 229303c96c31SRobert Watson for (i = 0; i < indent; i++) 229403c96c31SRobert Watson db_printf(" "); 229503c96c31SRobert Watson } 229603c96c31SRobert Watson 229703c96c31SRobert Watson static void 229803c96c31SRobert Watson db_print_unpflags(int unp_flags) 229903c96c31SRobert Watson { 230003c96c31SRobert Watson int comma; 230103c96c31SRobert Watson 230203c96c31SRobert Watson comma = 0; 230303c96c31SRobert Watson if (unp_flags & UNP_HAVEPC) { 230403c96c31SRobert Watson db_printf("%sUNP_HAVEPC", comma ? ", " : ""); 230503c96c31SRobert Watson comma = 1; 230603c96c31SRobert Watson } 230703c96c31SRobert Watson if (unp_flags & UNP_HAVEPCCACHED) { 230803c96c31SRobert Watson db_printf("%sUNP_HAVEPCCACHED", comma ? ", " : ""); 230903c96c31SRobert Watson comma = 1; 231003c96c31SRobert Watson } 231103c96c31SRobert Watson if (unp_flags & UNP_WANTCRED) { 231203c96c31SRobert Watson db_printf("%sUNP_WANTCRED", comma ? ", " : ""); 231303c96c31SRobert Watson comma = 1; 231403c96c31SRobert Watson } 231503c96c31SRobert Watson if (unp_flags & UNP_CONNWAIT) { 231603c96c31SRobert Watson db_printf("%sUNP_CONNWAIT", comma ? 
", " : ""); 231703c96c31SRobert Watson comma = 1; 231803c96c31SRobert Watson } 231903c96c31SRobert Watson if (unp_flags & UNP_CONNECTING) { 232003c96c31SRobert Watson db_printf("%sUNP_CONNECTING", comma ? ", " : ""); 232103c96c31SRobert Watson comma = 1; 232203c96c31SRobert Watson } 232303c96c31SRobert Watson if (unp_flags & UNP_BINDING) { 232403c96c31SRobert Watson db_printf("%sUNP_BINDING", comma ? ", " : ""); 232503c96c31SRobert Watson comma = 1; 232603c96c31SRobert Watson } 232703c96c31SRobert Watson } 232803c96c31SRobert Watson 232903c96c31SRobert Watson static void 233003c96c31SRobert Watson db_print_xucred(int indent, struct xucred *xu) 233103c96c31SRobert Watson { 233203c96c31SRobert Watson int comma, i; 233303c96c31SRobert Watson 233403c96c31SRobert Watson db_print_indent(indent); 233503c96c31SRobert Watson db_printf("cr_version: %u cr_uid: %u cr_ngroups: %d\n", 233603c96c31SRobert Watson xu->cr_version, xu->cr_uid, xu->cr_ngroups); 233703c96c31SRobert Watson db_print_indent(indent); 233803c96c31SRobert Watson db_printf("cr_groups: "); 233903c96c31SRobert Watson comma = 0; 234003c96c31SRobert Watson for (i = 0; i < xu->cr_ngroups; i++) { 234103c96c31SRobert Watson db_printf("%s%u", comma ? 
", " : "", xu->cr_groups[i]); 234203c96c31SRobert Watson comma = 1; 234303c96c31SRobert Watson } 234403c96c31SRobert Watson db_printf("\n"); 234503c96c31SRobert Watson } 234603c96c31SRobert Watson 234703c96c31SRobert Watson static void 234803c96c31SRobert Watson db_print_unprefs(int indent, struct unp_head *uh) 234903c96c31SRobert Watson { 235003c96c31SRobert Watson struct unpcb *unp; 235103c96c31SRobert Watson int counter; 235203c96c31SRobert Watson 235303c96c31SRobert Watson counter = 0; 235403c96c31SRobert Watson LIST_FOREACH(unp, uh, unp_reflink) { 235503c96c31SRobert Watson if (counter % 4 == 0) 235603c96c31SRobert Watson db_print_indent(indent); 235703c96c31SRobert Watson db_printf("%p ", unp); 235803c96c31SRobert Watson if (counter % 4 == 3) 235903c96c31SRobert Watson db_printf("\n"); 236003c96c31SRobert Watson counter++; 236103c96c31SRobert Watson } 236203c96c31SRobert Watson if (counter != 0 && counter % 4 != 0) 236303c96c31SRobert Watson db_printf("\n"); 236403c96c31SRobert Watson } 236503c96c31SRobert Watson 236603c96c31SRobert Watson DB_SHOW_COMMAND(unpcb, db_show_unpcb) 236703c96c31SRobert Watson { 236803c96c31SRobert Watson struct unpcb *unp; 236903c96c31SRobert Watson 237003c96c31SRobert Watson if (!have_addr) { 237103c96c31SRobert Watson db_printf("usage: show unpcb <addr>\n"); 237203c96c31SRobert Watson return; 237303c96c31SRobert Watson } 237403c96c31SRobert Watson unp = (struct unpcb *)addr; 237503c96c31SRobert Watson 237603c96c31SRobert Watson db_printf("unp_socket: %p unp_vnode: %p\n", unp->unp_socket, 237703c96c31SRobert Watson unp->unp_vnode); 237803c96c31SRobert Watson 237903c96c31SRobert Watson db_printf("unp_ino: %d unp_conn: %p\n", unp->unp_ino, 238003c96c31SRobert Watson unp->unp_conn); 238103c96c31SRobert Watson 238203c96c31SRobert Watson db_printf("unp_refs:\n"); 238303c96c31SRobert Watson db_print_unprefs(2, &unp->unp_refs); 238403c96c31SRobert Watson 238503c96c31SRobert Watson /* XXXRW: Would be nice to print the full address, if 
any. */ 238603c96c31SRobert Watson db_printf("unp_addr: %p\n", unp->unp_addr); 238703c96c31SRobert Watson 238803c96c31SRobert Watson db_printf("unp_cc: %d unp_mbcnt: %d unp_gencnt: %llu\n", 238903c96c31SRobert Watson unp->unp_cc, unp->unp_mbcnt, 239003c96c31SRobert Watson (unsigned long long)unp->unp_gencnt); 239103c96c31SRobert Watson 239203c96c31SRobert Watson db_printf("unp_flags: %x (", unp->unp_flags); 239303c96c31SRobert Watson db_print_unpflags(unp->unp_flags); 239403c96c31SRobert Watson db_printf(")\n"); 239503c96c31SRobert Watson 239603c96c31SRobert Watson db_printf("unp_peercred:\n"); 239703c96c31SRobert Watson db_print_xucred(2, &unp->unp_peercred); 239803c96c31SRobert Watson 239903c96c31SRobert Watson db_printf("unp_refcount: %u\n", unp->unp_refcount); 240003c96c31SRobert Watson } 240103c96c31SRobert Watson #endif 2402