19454b2d8SWarner Losh /*- 28a36da99SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 38a36da99SPedro F. Giffuni * 4413628a7SBjoern A. Zeeb * Copyright (c) 1999 Poul-Henning Kamp. 5413628a7SBjoern A. Zeeb * Copyright (c) 2008 Bjoern A. Zeeb. 6b38ff370SJamie Gritton * Copyright (c) 2009 James Gritton. 7413628a7SBjoern A. Zeeb * All rights reserved. 8b9f0b66cSBjoern A. Zeeb * 9b9f0b66cSBjoern A. Zeeb * Redistribution and use in source and binary forms, with or without 10b9f0b66cSBjoern A. Zeeb * modification, are permitted provided that the following conditions 11b9f0b66cSBjoern A. Zeeb * are met: 12b9f0b66cSBjoern A. Zeeb * 1. Redistributions of source code must retain the above copyright 13b9f0b66cSBjoern A. Zeeb * notice, this list of conditions and the following disclaimer. 14b9f0b66cSBjoern A. Zeeb * 2. Redistributions in binary form must reproduce the above copyright 15b9f0b66cSBjoern A. Zeeb * notice, this list of conditions and the following disclaimer in the 16b9f0b66cSBjoern A. Zeeb * documentation and/or other materials provided with the distribution. 17b9f0b66cSBjoern A. Zeeb * 18b9f0b66cSBjoern A. Zeeb * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 19b9f0b66cSBjoern A. Zeeb * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 20b9f0b66cSBjoern A. Zeeb * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 21b9f0b66cSBjoern A. Zeeb * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 22b9f0b66cSBjoern A. Zeeb * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 23b9f0b66cSBjoern A. Zeeb * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 24b9f0b66cSBjoern A. Zeeb * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 25b9f0b66cSBjoern A. Zeeb * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 26b9f0b66cSBjoern A. 
Zeeb * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 27b9f0b66cSBjoern A. Zeeb * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 28b9f0b66cSBjoern A. Zeeb * SUCH DAMAGE. 2907901f22SPoul-Henning Kamp */ 3075c13541SPoul-Henning Kamp 31677b542eSDavid E. O'Brien #include <sys/cdefs.h> 32677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 33677b542eSDavid E. O'Brien 34413628a7SBjoern A. Zeeb #include "opt_ddb.h" 35413628a7SBjoern A. Zeeb #include "opt_inet.h" 36413628a7SBjoern A. Zeeb #include "opt_inet6.h" 3746e3b1cbSPawel Jakub Dawidek 3875c13541SPoul-Henning Kamp #include <sys/param.h> 3975c13541SPoul-Henning Kamp #include <sys/types.h> 4075c13541SPoul-Henning Kamp #include <sys/kernel.h> 4175c13541SPoul-Henning Kamp #include <sys/systm.h> 4275c13541SPoul-Henning Kamp #include <sys/errno.h> 4375c13541SPoul-Henning Kamp #include <sys/sysproto.h> 4475c13541SPoul-Henning Kamp #include <sys/malloc.h> 450304c731SJamie Gritton #include <sys/osd.h> 46800c9408SRobert Watson #include <sys/priv.h> 4775c13541SPoul-Henning Kamp #include <sys/proc.h> 48b3059e09SRobert Watson #include <sys/taskqueue.h> 4957b4252eSKonstantin Belousov #include <sys/fcntl.h> 5075c13541SPoul-Henning Kamp #include <sys/jail.h> 5101137630SRobert Watson #include <sys/lock.h> 5201137630SRobert Watson #include <sys/mutex.h> 53097055e2SEdward Tomasz Napierala #include <sys/racct.h> 54f87beb93SAndriy Gapon #include <sys/rctl.h> 55a7ad07bfSEdward Tomasz Napierala #include <sys/refcount.h> 56dc68a633SPawel Jakub Dawidek #include <sys/sx.h> 5776ca6f88SJamie Gritton #include <sys/sysent.h> 58fd7a8150SMike Barcroft #include <sys/namei.h> 59820a0de9SPawel Jakub Dawidek #include <sys/mount.h> 60fd7a8150SMike Barcroft #include <sys/queue.h> 6175c13541SPoul-Henning Kamp #include <sys/socket.h> 62fd7a8150SMike Barcroft #include <sys/syscallsubr.h> 6383f1e257SRobert Watson #include <sys/sysctl.h> 64fd7a8150SMike Barcroft #include <sys/vnode.h> 65530c0060SRobert Watson 
6675c13541SPoul-Henning Kamp #include <net/if.h> 67530c0060SRobert Watson #include <net/vnet.h> 68530c0060SRobert Watson 6975c13541SPoul-Henning Kamp #include <netinet/in.h> 70530c0060SRobert Watson 71413628a7SBjoern A. Zeeb #ifdef DDB 72413628a7SBjoern A. Zeeb #include <ddb/ddb.h> 73413628a7SBjoern A. Zeeb #endif /* DDB */ 7475c13541SPoul-Henning Kamp 75aed55708SRobert Watson #include <security/mac/mac_framework.h> 76aed55708SRobert Watson 778986e3a0SJamie Gritton #define DEFAULT_HOSTUUID "00000000-0000-0000-0000-000000000000" 788986e3a0SJamie Gritton 7975c13541SPoul-Henning Kamp MALLOC_DEFINE(M_PRISON, "prison", "Prison structures"); 80d745c852SEd Schouten static MALLOC_DEFINE(M_PRISON_RACCT, "prison_racct", "Prison racct structures"); 8175c13541SPoul-Henning Kamp 82592bcae8SBjoern A. Zeeb /* Keep struct prison prison0 and some code in kern_jail_set() readable. */ 83592bcae8SBjoern A. Zeeb #ifdef INET 84592bcae8SBjoern A. Zeeb #ifdef INET6 85592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL PR_IP4_SADDRSEL|PR_IP6_SADDRSEL 86592bcae8SBjoern A. Zeeb #else 87592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL PR_IP4_SADDRSEL 88592bcae8SBjoern A. Zeeb #endif 89592bcae8SBjoern A. Zeeb #else /* !INET */ 90592bcae8SBjoern A. Zeeb #ifdef INET6 91592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL PR_IP6_SADDRSEL 92592bcae8SBjoern A. Zeeb #else 93592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL 0 94592bcae8SBjoern A. Zeeb #endif 95592bcae8SBjoern A. Zeeb #endif 96592bcae8SBjoern A. Zeeb 970304c731SJamie Gritton /* prison0 describes what is "real" about the system. 
*/ 980304c731SJamie Gritton struct prison prison0 = { 990304c731SJamie Gritton .pr_id = 0, 1000304c731SJamie Gritton .pr_name = "0", 1010304c731SJamie Gritton .pr_ref = 1, 1020304c731SJamie Gritton .pr_uref = 1, 1030304c731SJamie Gritton .pr_path = "/", 1040304c731SJamie Gritton .pr_securelevel = -1, 1050cc207a6SMartin Matuska .pr_devfs_rsnum = 0, 106b97457e2SJamie Gritton .pr_childmax = JAIL_MAX, 1078986e3a0SJamie Gritton .pr_hostuuid = DEFAULT_HOSTUUID, 10813e403fdSAntoine Brodin .pr_children = LIST_HEAD_INITIALIZER(prison0.pr_children), 109eb79e1c7SBjoern A. Zeeb #ifdef VIMAGE 110592bcae8SBjoern A. Zeeb .pr_flags = PR_HOST|PR_VNET|_PR_IP_SADDRSEL, 111eb79e1c7SBjoern A. Zeeb #else 112592bcae8SBjoern A. Zeeb .pr_flags = PR_HOST|_PR_IP_SADDRSEL, 113eb79e1c7SBjoern A. Zeeb #endif 1140e5c6bd4SJamie Gritton .pr_allow = PR_ALLOW_ALL_STATIC, 1150304c731SJamie Gritton }; 1160304c731SJamie Gritton MTX_SYSINIT(prison0, &prison0.pr_mtx, "jail mutex", MTX_DEF); 11783f1e257SRobert Watson 118672756aaSJamie Gritton struct bool_flags { 119672756aaSJamie Gritton const char *name; 120672756aaSJamie Gritton const char *noname; 121672756aaSJamie Gritton unsigned flag; 122672756aaSJamie Gritton }; 123672756aaSJamie Gritton struct jailsys_flags { 124672756aaSJamie Gritton const char *name; 125672756aaSJamie Gritton unsigned disable; 126672756aaSJamie Gritton unsigned new; 127672756aaSJamie Gritton }; 128672756aaSJamie Gritton 129a7ad07bfSEdward Tomasz Napierala /* allprison, allprison_racct and lastprid are protected by allprison_lock. 
*/ 130dc68a633SPawel Jakub Dawidek struct sx allprison_lock; 131b38ff370SJamie Gritton SX_SYSINIT(allprison_lock, &allprison_lock, "allprison"); 132b38ff370SJamie Gritton struct prisonlist allprison = TAILQ_HEAD_INITIALIZER(allprison); 133a7ad07bfSEdward Tomasz Napierala LIST_HEAD(, prison_racct) allprison_racct; 1342110d913SXin LI int lastprid = 0; 135fd7a8150SMike Barcroft 136b38ff370SJamie Gritton static int do_jail_attach(struct thread *td, struct prison *pr); 137b3059e09SRobert Watson static void prison_complete(void *context, int pending); 138b38ff370SJamie Gritton static void prison_deref(struct prison *pr, int flags); 1390304c731SJamie Gritton static char *prison_path(struct prison *pr1, struct prison *pr2); 1400304c731SJamie Gritton static void prison_remove_one(struct prison *pr); 141a7ad07bfSEdward Tomasz Napierala #ifdef RACCT 142a7ad07bfSEdward Tomasz Napierala static void prison_racct_attach(struct prison *pr); 143c34bbd2aSEdward Tomasz Napierala static void prison_racct_modify(struct prison *pr); 144a7ad07bfSEdward Tomasz Napierala static void prison_racct_detach(struct prison *pr); 145a7ad07bfSEdward Tomasz Napierala #endif 146fd7a8150SMike Barcroft 147b38ff370SJamie Gritton /* Flags for prison_deref */ 148b38ff370SJamie Gritton #define PD_DEREF 0x01 149b38ff370SJamie Gritton #define PD_DEUREF 0x02 150b38ff370SJamie Gritton #define PD_LOCKED 0x04 151b38ff370SJamie Gritton #define PD_LIST_SLOCKED 0x08 152b38ff370SJamie Gritton #define PD_LIST_XLOCKED 0x10 153fd7a8150SMike Barcroft 1540304c731SJamie Gritton /* 1555cc70397SBjoern A. Zeeb * Parameter names corresponding to PR_* flag values. Size values are for kvm 1565cc70397SBjoern A. Zeeb * as we cannot figure out the size of a sparse array, or an array without a 1575cc70397SBjoern A. Zeeb * terminating entry. 1580304c731SJamie Gritton */ 159672756aaSJamie Gritton static struct bool_flags pr_flag_bool[] = { 160672756aaSJamie Gritton {"persist", "nopersist", PR_PERSIST}, 161592bcae8SBjoern A. 
Zeeb #ifdef INET 162672756aaSJamie Gritton {"ip4.saddrsel", "ip4.nosaddrsel", PR_IP4_SADDRSEL}, 163592bcae8SBjoern A. Zeeb #endif 164592bcae8SBjoern A. Zeeb #ifdef INET6 165672756aaSJamie Gritton {"ip6.saddrsel", "ip6.nosaddrsel", PR_IP6_SADDRSEL}, 166592bcae8SBjoern A. Zeeb #endif 1670304c731SJamie Gritton }; 168672756aaSJamie Gritton const size_t pr_flag_bool_size = sizeof(pr_flag_bool); 1690304c731SJamie Gritton 170672756aaSJamie Gritton static struct jailsys_flags pr_flag_jailsys[] = { 1717cbf7213SJamie Gritton {"host", 0, PR_HOST}, 1727cbf7213SJamie Gritton #ifdef VIMAGE 1737cbf7213SJamie Gritton {"vnet", 0, PR_VNET}, 1747cbf7213SJamie Gritton #endif 1750304c731SJamie Gritton #ifdef INET 1766a3f2779SJamie Gritton {"ip4", PR_IP4_USER, PR_IP4_USER}, 1770304c731SJamie Gritton #endif 1780304c731SJamie Gritton #ifdef INET6 1796a3f2779SJamie Gritton {"ip6", PR_IP6_USER, PR_IP6_USER}, 180679e1390SJamie Gritton #endif 1810304c731SJamie Gritton }; 1825cc70397SBjoern A. Zeeb const size_t pr_flag_jailsys_size = sizeof(pr_flag_jailsys); 1830304c731SJamie Gritton 1840e5c6bd4SJamie Gritton /* Make this array full-size so dynamic parameters can be added. 
*/ 1850e5c6bd4SJamie Gritton static struct bool_flags pr_flag_allow[NBBY * NBPW] = { 186672756aaSJamie Gritton {"allow.set_hostname", "allow.noset_hostname", PR_ALLOW_SET_HOSTNAME}, 187672756aaSJamie Gritton {"allow.sysvipc", "allow.nosysvipc", PR_ALLOW_SYSVIPC}, 188672756aaSJamie Gritton {"allow.raw_sockets", "allow.noraw_sockets", PR_ALLOW_RAW_SOCKETS}, 189672756aaSJamie Gritton {"allow.chflags", "allow.nochflags", PR_ALLOW_CHFLAGS}, 190672756aaSJamie Gritton {"allow.mount", "allow.nomount", PR_ALLOW_MOUNT}, 191672756aaSJamie Gritton {"allow.quotas", "allow.noquotas", PR_ALLOW_QUOTAS}, 192672756aaSJamie Gritton {"allow.socket_af", "allow.nosocket_af", PR_ALLOW_SOCKET_AF}, 193ccd6ac9fSAntoine Brodin {"allow.mlock", "allow.nomlock", PR_ALLOW_MLOCK}, 194672756aaSJamie Gritton {"allow.reserved_ports", "allow.noreserved_ports", 195672756aaSJamie Gritton PR_ALLOW_RESERVED_PORTS}, 196b19d66fdSJamie Gritton {"allow.read_msgbuf", "allow.noread_msgbuf", PR_ALLOW_READ_MSGBUF}, 197b3079544SJamie Gritton {"allow.unprivileged_proc_debug", "allow.nounprivileged_proc_debug", 198b3079544SJamie Gritton PR_ALLOW_UNPRIV_DEBUG}, 1990304c731SJamie Gritton }; 200672756aaSJamie Gritton const size_t pr_flag_allow_size = sizeof(pr_flag_allow); 2010304c731SJamie Gritton 202b3079544SJamie Gritton #define JAIL_DEFAULT_ALLOW (PR_ALLOW_SET_HOSTNAME | \ 203b3079544SJamie Gritton PR_ALLOW_RESERVED_PORTS | \ 204b3079544SJamie Gritton PR_ALLOW_UNPRIV_DEBUG) 20542bebd82SJamie Gritton #define JAIL_DEFAULT_ENFORCE_STATFS 2 206bf3db8aaSMartin Matuska #define JAIL_DEFAULT_DEVFS_RSNUM 0 2070304c731SJamie Gritton static unsigned jail_default_allow = JAIL_DEFAULT_ALLOW; 20842bebd82SJamie Gritton static int jail_default_enforce_statfs = JAIL_DEFAULT_ENFORCE_STATFS; 2090cc207a6SMartin Matuska static int jail_default_devfs_rsnum = JAIL_DEFAULT_DEVFS_RSNUM; 2100304c731SJamie Gritton #if defined(INET) || defined(INET6) 211e92e0574SJamie Gritton static unsigned jail_max_af_ips = 255; 2120304c731SJamie Gritton 
#endif 2130304c731SJamie Gritton 214b96bd95bSIan Lepore /* 215b96bd95bSIan Lepore * Initialize the parts of prison0 that can't be static-initialized with 216b96bd95bSIan Lepore * constants. This is called from proc0_init() after creating thread0 cpuset. 217b96bd95bSIan Lepore */ 218b96bd95bSIan Lepore void 219b96bd95bSIan Lepore prison0_init(void) 220b96bd95bSIan Lepore { 221b96bd95bSIan Lepore 222b96bd95bSIan Lepore prison0.pr_cpuset = cpuset_ref(thread0.td_cpuset); 223b96bd95bSIan Lepore prison0.pr_osreldate = osreldate; 224b96bd95bSIan Lepore strlcpy(prison0.pr_osrelease, osrelease, sizeof(prison0.pr_osrelease)); 225b96bd95bSIan Lepore } 226b96bd95bSIan Lepore 227116734c4SMatthew Dillon /* 2289ddb7954SMike Barcroft * struct jail_args { 2299ddb7954SMike Barcroft * struct jail *jail; 2309ddb7954SMike Barcroft * }; 231116734c4SMatthew Dillon */ 23275c13541SPoul-Henning Kamp int 233c542c43eSJamie Gritton sys_jail(struct thread *td, struct jail_args *uap) 23475c13541SPoul-Henning Kamp { 235413628a7SBjoern A. Zeeb uint32_t version; 236413628a7SBjoern A. Zeeb int error; 2370304c731SJamie Gritton struct jail j; 238413628a7SBjoern A. Zeeb 239413628a7SBjoern A. Zeeb error = copyin(uap->jail, &version, sizeof(uint32_t)); 240413628a7SBjoern A. Zeeb if (error) 241413628a7SBjoern A. Zeeb return (error); 242413628a7SBjoern A. Zeeb 243413628a7SBjoern A. Zeeb switch (version) { 244413628a7SBjoern A. Zeeb case 0: 245413628a7SBjoern A. Zeeb { 246413628a7SBjoern A. Zeeb struct jail_v0 j0; 247413628a7SBjoern A. Zeeb 2480304c731SJamie Gritton /* FreeBSD single IPv4 jails. */ 2490304c731SJamie Gritton bzero(&j, sizeof(struct jail)); 250413628a7SBjoern A. Zeeb error = copyin(uap->jail, &j0, sizeof(struct jail_v0)); 251413628a7SBjoern A. Zeeb if (error) 252413628a7SBjoern A. 
Zeeb return (error); 2530304c731SJamie Gritton j.version = j0.version; 2540304c731SJamie Gritton j.path = j0.path; 2550304c731SJamie Gritton j.hostname = j0.hostname; 256b5019bc4SPeter Wemm j.ip4s = htonl(j0.ip_number); /* jail_v0 is host order */ 257413628a7SBjoern A. Zeeb break; 258413628a7SBjoern A. Zeeb } 259413628a7SBjoern A. Zeeb 260413628a7SBjoern A. Zeeb case 1: 261413628a7SBjoern A. Zeeb /* 262413628a7SBjoern A. Zeeb * Version 1 was used by multi-IPv4 jail implementations 263413628a7SBjoern A. Zeeb * that never made it into the official kernel. 264413628a7SBjoern A. Zeeb */ 265413628a7SBjoern A. Zeeb return (EINVAL); 266413628a7SBjoern A. Zeeb 267413628a7SBjoern A. Zeeb case 2: /* JAIL_API_VERSION */ 268413628a7SBjoern A. Zeeb /* FreeBSD multi-IPv4/IPv6,noIP jails. */ 269413628a7SBjoern A. Zeeb error = copyin(uap->jail, &j, sizeof(struct jail)); 270413628a7SBjoern A. Zeeb if (error) 271413628a7SBjoern A. Zeeb return (error); 2720304c731SJamie Gritton break; 2730304c731SJamie Gritton 2740304c731SJamie Gritton default: 2750304c731SJamie Gritton /* Sci-Fi jails are not supported, sorry. 
*/ 2760304c731SJamie Gritton return (EINVAL); 2770304c731SJamie Gritton } 278c542c43eSJamie Gritton return (kern_jail(td, &j)); 2790304c731SJamie Gritton } 2800304c731SJamie Gritton 2810304c731SJamie Gritton int 282c542c43eSJamie Gritton kern_jail(struct thread *td, struct jail *j) 2830304c731SJamie Gritton { 284c542c43eSJamie Gritton struct iovec optiov[2 * (4 + nitems(pr_flag_allow) 285e92e0574SJamie Gritton #ifdef INET 286e92e0574SJamie Gritton + 1 287e92e0574SJamie Gritton #endif 288e92e0574SJamie Gritton #ifdef INET6 289e92e0574SJamie Gritton + 1 290e92e0574SJamie Gritton #endif 291e92e0574SJamie Gritton )]; 2920304c731SJamie Gritton struct uio opt; 2930304c731SJamie Gritton char *u_path, *u_hostname, *u_name; 294672756aaSJamie Gritton struct bool_flags *bf; 2950304c731SJamie Gritton #ifdef INET 296e92e0574SJamie Gritton uint32_t ip4s; 2970304c731SJamie Gritton struct in_addr *u_ip4; 2980304c731SJamie Gritton #endif 2990304c731SJamie Gritton #ifdef INET6 3000304c731SJamie Gritton struct in6_addr *u_ip6; 3010304c731SJamie Gritton #endif 3020304c731SJamie Gritton size_t tmplen; 303c542c43eSJamie Gritton int error, enforce_statfs; 3040304c731SJamie Gritton 3050304c731SJamie Gritton bzero(&optiov, sizeof(optiov)); 3060304c731SJamie Gritton opt.uio_iov = optiov; 3070304c731SJamie Gritton opt.uio_iovcnt = 0; 3080304c731SJamie Gritton opt.uio_offset = -1; 3090304c731SJamie Gritton opt.uio_resid = -1; 3100304c731SJamie Gritton opt.uio_segflg = UIO_SYSSPACE; 3110304c731SJamie Gritton opt.uio_rw = UIO_READ; 3120304c731SJamie Gritton opt.uio_td = td; 3130304c731SJamie Gritton 3140304c731SJamie Gritton /* Set permissions for top-level jails from sysctls. 
*/ 3150304c731SJamie Gritton if (!jailed(td->td_ucred)) { 316672756aaSJamie Gritton for (bf = pr_flag_allow; 3170e5c6bd4SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && 3180e5c6bd4SJamie Gritton bf->flag != 0; 319672756aaSJamie Gritton bf++) { 320672756aaSJamie Gritton optiov[opt.uio_iovcnt].iov_base = __DECONST(char *, 321672756aaSJamie Gritton (jail_default_allow & bf->flag) 322672756aaSJamie Gritton ? bf->name : bf->noname); 3230304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = 3240304c731SJamie Gritton strlen(optiov[opt.uio_iovcnt].iov_base) + 1; 3250304c731SJamie Gritton opt.uio_iovcnt += 2; 3260304c731SJamie Gritton } 3270304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "enforce_statfs"; 3280304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("enforce_statfs"); 3290304c731SJamie Gritton opt.uio_iovcnt++; 3300304c731SJamie Gritton enforce_statfs = jail_default_enforce_statfs; 3310304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = &enforce_statfs; 3320304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof(enforce_statfs); 3330304c731SJamie Gritton opt.uio_iovcnt++; 3340304c731SJamie Gritton } 3350304c731SJamie Gritton 336b38ff370SJamie Gritton tmplen = MAXPATHLEN + MAXHOSTNAMELEN + MAXHOSTNAMELEN; 337b38ff370SJamie Gritton #ifdef INET 3380304c731SJamie Gritton ip4s = (j->version == 0) ? 
1 : j->ip4s; 3390304c731SJamie Gritton if (ip4s > jail_max_af_ips) 340b38ff370SJamie Gritton return (EINVAL); 3410304c731SJamie Gritton tmplen += ip4s * sizeof(struct in_addr); 342b38ff370SJamie Gritton #else 3430304c731SJamie Gritton if (j->ip4s > 0) 344b38ff370SJamie Gritton return (EINVAL); 345b38ff370SJamie Gritton #endif 346b38ff370SJamie Gritton #ifdef INET6 3470304c731SJamie Gritton if (j->ip6s > jail_max_af_ips) 348b38ff370SJamie Gritton return (EINVAL); 3490304c731SJamie Gritton tmplen += j->ip6s * sizeof(struct in6_addr); 350b38ff370SJamie Gritton #else 3510304c731SJamie Gritton if (j->ip6s > 0) 352b38ff370SJamie Gritton return (EINVAL); 353b38ff370SJamie Gritton #endif 354b38ff370SJamie Gritton u_path = malloc(tmplen, M_TEMP, M_WAITOK); 355b38ff370SJamie Gritton u_hostname = u_path + MAXPATHLEN; 356b38ff370SJamie Gritton u_name = u_hostname + MAXHOSTNAMELEN; 357b38ff370SJamie Gritton #ifdef INET 358b38ff370SJamie Gritton u_ip4 = (struct in_addr *)(u_name + MAXHOSTNAMELEN); 359b38ff370SJamie Gritton #endif 360b38ff370SJamie Gritton #ifdef INET6 361b38ff370SJamie Gritton #ifdef INET 3620304c731SJamie Gritton u_ip6 = (struct in6_addr *)(u_ip4 + ip4s); 363b38ff370SJamie Gritton #else 364b38ff370SJamie Gritton u_ip6 = (struct in6_addr *)(u_name + MAXHOSTNAMELEN); 365b38ff370SJamie Gritton #endif 366b38ff370SJamie Gritton #endif 3670304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "path"; 3680304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("path"); 3690304c731SJamie Gritton opt.uio_iovcnt++; 3700304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_path; 3710304c731SJamie Gritton error = copyinstr(j->path, u_path, MAXPATHLEN, 3720304c731SJamie Gritton &optiov[opt.uio_iovcnt].iov_len); 373b38ff370SJamie Gritton if (error) { 374b38ff370SJamie Gritton free(u_path, M_TEMP); 375b38ff370SJamie Gritton return (error); 376b38ff370SJamie Gritton } 3770304c731SJamie Gritton opt.uio_iovcnt++; 3780304c731SJamie Gritton 
optiov[opt.uio_iovcnt].iov_base = "host.hostname"; 3790304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("host.hostname"); 3800304c731SJamie Gritton opt.uio_iovcnt++; 3810304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_hostname; 3820304c731SJamie Gritton error = copyinstr(j->hostname, u_hostname, MAXHOSTNAMELEN, 3830304c731SJamie Gritton &optiov[opt.uio_iovcnt].iov_len); 384b38ff370SJamie Gritton if (error) { 385b38ff370SJamie Gritton free(u_path, M_TEMP); 386b38ff370SJamie Gritton return (error); 387b38ff370SJamie Gritton } 3880304c731SJamie Gritton opt.uio_iovcnt++; 3890304c731SJamie Gritton if (j->jailname != NULL) { 390b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "name"; 391b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("name"); 392b38ff370SJamie Gritton opt.uio_iovcnt++; 393b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_name; 3940304c731SJamie Gritton error = copyinstr(j->jailname, u_name, MAXHOSTNAMELEN, 395b38ff370SJamie Gritton &optiov[opt.uio_iovcnt].iov_len); 396b38ff370SJamie Gritton if (error) { 397b38ff370SJamie Gritton free(u_path, M_TEMP); 398b38ff370SJamie Gritton return (error); 399b38ff370SJamie Gritton } 400b38ff370SJamie Gritton opt.uio_iovcnt++; 401b38ff370SJamie Gritton } 402b38ff370SJamie Gritton #ifdef INET 403b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "ip4.addr"; 404b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("ip4.addr"); 405b38ff370SJamie Gritton opt.uio_iovcnt++; 406b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_ip4; 4070304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = ip4s * sizeof(struct in_addr); 4080304c731SJamie Gritton if (j->version == 0) 4090304c731SJamie Gritton u_ip4->s_addr = j->ip4s; 4100304c731SJamie Gritton else { 4110304c731SJamie Gritton error = copyin(j->ip4, u_ip4, optiov[opt.uio_iovcnt].iov_len); 412b38ff370SJamie Gritton if (error) { 413b38ff370SJamie Gritton free(u_path, M_TEMP); 414b38ff370SJamie Gritton 
return (error); 415b38ff370SJamie Gritton } 4160304c731SJamie Gritton } 417b38ff370SJamie Gritton opt.uio_iovcnt++; 418b38ff370SJamie Gritton #endif 419b38ff370SJamie Gritton #ifdef INET6 420b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "ip6.addr"; 421b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("ip6.addr"); 422b38ff370SJamie Gritton opt.uio_iovcnt++; 423b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_ip6; 4240304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = j->ip6s * sizeof(struct in6_addr); 4250304c731SJamie Gritton error = copyin(j->ip6, u_ip6, optiov[opt.uio_iovcnt].iov_len); 426b38ff370SJamie Gritton if (error) { 427b38ff370SJamie Gritton free(u_path, M_TEMP); 428b38ff370SJamie Gritton return (error); 429b38ff370SJamie Gritton } 430b38ff370SJamie Gritton opt.uio_iovcnt++; 431b38ff370SJamie Gritton #endif 43202abd400SPedro F. Giffuni KASSERT(opt.uio_iovcnt <= nitems(optiov), 4330304c731SJamie Gritton ("kern_jail: too many iovecs (%d)", opt.uio_iovcnt)); 434b38ff370SJamie Gritton error = kern_jail_set(td, &opt, JAIL_CREATE | JAIL_ATTACH); 435b38ff370SJamie Gritton free(u_path, M_TEMP); 436b38ff370SJamie Gritton return (error); 437b38ff370SJamie Gritton } 438b38ff370SJamie Gritton 439b38ff370SJamie Gritton /* 440b38ff370SJamie Gritton * struct jail_set_args { 441b38ff370SJamie Gritton * struct iovec *iovp; 442b38ff370SJamie Gritton * unsigned int iovcnt; 443b38ff370SJamie Gritton * int flags; 444b38ff370SJamie Gritton * }; 445b38ff370SJamie Gritton */ 446b38ff370SJamie Gritton int 4478451d0ddSKip Macy sys_jail_set(struct thread *td, struct jail_set_args *uap) 448b38ff370SJamie Gritton { 449b38ff370SJamie Gritton struct uio *auio; 450b38ff370SJamie Gritton int error; 451b38ff370SJamie Gritton 452b38ff370SJamie Gritton /* Check that we have an even number of iovecs. 
*/ 453b38ff370SJamie Gritton if (uap->iovcnt & 1) 454b38ff370SJamie Gritton return (EINVAL); 455b38ff370SJamie Gritton 456b38ff370SJamie Gritton error = copyinuio(uap->iovp, uap->iovcnt, &auio); 457b38ff370SJamie Gritton if (error) 458b38ff370SJamie Gritton return (error); 459b38ff370SJamie Gritton error = kern_jail_set(td, auio, uap->flags); 460b38ff370SJamie Gritton free(auio, M_IOV); 461b38ff370SJamie Gritton return (error); 462413628a7SBjoern A. Zeeb } 463413628a7SBjoern A. Zeeb 464413628a7SBjoern A. Zeeb int 465b38ff370SJamie Gritton kern_jail_set(struct thread *td, struct uio *optuio, int flags) 466413628a7SBjoern A. Zeeb { 467fd7a8150SMike Barcroft struct nameidata nd; 468b38ff370SJamie Gritton #ifdef INET 469b38ff370SJamie Gritton struct in_addr *ip4; 470413628a7SBjoern A. Zeeb #endif 471b38ff370SJamie Gritton #ifdef INET6 472b38ff370SJamie Gritton struct in6_addr *ip6; 473b38ff370SJamie Gritton #endif 474b38ff370SJamie Gritton struct vfsopt *opt; 475b38ff370SJamie Gritton struct vfsoptlist *opts; 47657aea6dfSBjoern A. Zeeb struct prison *pr, *deadpr, *mypr, *ppr, *tpr; 477b38ff370SJamie Gritton struct vnode *root; 478babbbb9cSJamie Gritton char *domain, *errmsg, *host, *name, *namelc, *p, *path, *uuid; 479b96bd95bSIan Lepore char *g_path, *osrelstr; 480672756aaSJamie Gritton struct bool_flags *bf; 481672756aaSJamie Gritton struct jailsys_flags *jsf; 4820304c731SJamie Gritton #if defined(INET) || defined(INET6) 48357aea6dfSBjoern A. 
Zeeb struct prison *tppr; 484b38ff370SJamie Gritton void *op; 4850304c731SJamie Gritton #endif 48676ca6f88SJamie Gritton unsigned long hid; 487b6f47c23SJamie Gritton size_t namelen, onamelen, pnamelen; 488cc5fd8c7SJamie Gritton int born, created, cuflags, descend, enforce; 489cc5fd8c7SJamie Gritton int error, errmsg_len, errmsg_pos; 4900cc207a6SMartin Matuska int gotchildmax, gotenforce, gothid, gotrsnum, gotslevel; 491672756aaSJamie Gritton int jid, jsys, len, level; 492b96bd95bSIan Lepore int childmax, osreldt, rsnum, slevel; 493d465a41dSBjoern A. Zeeb #if defined(INET) || defined(INET6) 4940304c731SJamie Gritton int ii, ij; 495413628a7SBjoern A. Zeeb #endif 496413628a7SBjoern A. Zeeb #ifdef INET 4972b0d6f81SJamie Gritton int ip4s, redo_ip4; 498413628a7SBjoern A. Zeeb #endif 499b38ff370SJamie Gritton #ifdef INET6 5002b0d6f81SJamie Gritton int ip6s, redo_ip6; 501b38ff370SJamie Gritton #endif 5026beb3bb4SKirk McKusick uint64_t pr_allow, ch_allow, pr_flags, ch_flags; 503b3079544SJamie Gritton uint64_t pr_allow_diff; 5046beb3bb4SKirk McKusick unsigned tallow; 505b38ff370SJamie Gritton char numbuf[12]; 506b38ff370SJamie Gritton 507b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_SET); 508b38ff370SJamie Gritton if (!error && (flags & JAIL_ATTACH)) 509b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_ATTACH); 510b38ff370SJamie Gritton if (error) 51175c13541SPoul-Henning Kamp return (error); 512b6f47c23SJamie Gritton mypr = td->td_ucred->cr_prison; 513b97457e2SJamie Gritton if ((flags & JAIL_CREATE) && mypr->pr_childmax == 0) 5140304c731SJamie Gritton return (EPERM); 515b38ff370SJamie Gritton if (flags & ~JAIL_SET_MASK) 516b38ff370SJamie Gritton return (EINVAL); 517b38ff370SJamie Gritton 518b38ff370SJamie Gritton /* 519b38ff370SJamie Gritton * Check all the parameters before committing to anything. Not all 520b38ff370SJamie Gritton * errors can be caught early, but we may as well try. 
Also, this 521b38ff370SJamie Gritton * takes care of some expensive stuff (path lookup) before getting 522b38ff370SJamie Gritton * the allprison lock. 523b38ff370SJamie Gritton * 524b38ff370SJamie Gritton * XXX Jails are not filesystems, and jail parameters are not mount 525b38ff370SJamie Gritton * options. But it makes more sense to re-use the vfsopt code 526b38ff370SJamie Gritton * than duplicate it under a different name. 527b38ff370SJamie Gritton */ 528b38ff370SJamie Gritton error = vfs_buildopts(optuio, &opts); 529b38ff370SJamie Gritton if (error) 530b38ff370SJamie Gritton return (error); 531b38ff370SJamie Gritton #ifdef INET 532b38ff370SJamie Gritton ip4 = NULL; 533b38ff370SJamie Gritton #endif 534b38ff370SJamie Gritton #ifdef INET6 535b38ff370SJamie Gritton ip6 = NULL; 536b38ff370SJamie Gritton #endif 5376dfe0a3dSMartin Matuska g_path = NULL; 538b38ff370SJamie Gritton 539b6f47c23SJamie Gritton cuflags = flags & (JAIL_CREATE | JAIL_UPDATE); 540b6f47c23SJamie Gritton if (!cuflags) { 541b6f47c23SJamie Gritton error = EINVAL; 542b6f47c23SJamie Gritton vfs_opterror(opts, "no valid operation (create or update)"); 543b6f47c23SJamie Gritton goto done_errmsg; 544b6f47c23SJamie Gritton } 545b6f47c23SJamie Gritton 546b38ff370SJamie Gritton error = vfs_copyopt(opts, "jid", &jid, sizeof(jid)); 547b38ff370SJamie Gritton if (error == ENOENT) 548b38ff370SJamie Gritton jid = 0; 549b38ff370SJamie Gritton else if (error != 0) 550b38ff370SJamie Gritton goto done_free; 551b38ff370SJamie Gritton 552b38ff370SJamie Gritton error = vfs_copyopt(opts, "securelevel", &slevel, sizeof(slevel)); 553b38ff370SJamie Gritton if (error == ENOENT) 554b38ff370SJamie Gritton gotslevel = 0; 555b38ff370SJamie Gritton else if (error != 0) 556b38ff370SJamie Gritton goto done_free; 557b38ff370SJamie Gritton else 558b38ff370SJamie Gritton gotslevel = 1; 559b38ff370SJamie Gritton 560b97457e2SJamie Gritton error = 561b97457e2SJamie Gritton vfs_copyopt(opts, "children.max", &childmax, sizeof(childmax)); 
562b97457e2SJamie Gritton if (error == ENOENT) 563b97457e2SJamie Gritton gotchildmax = 0; 564b97457e2SJamie Gritton else if (error != 0) 565b97457e2SJamie Gritton goto done_free; 566b97457e2SJamie Gritton else 567b97457e2SJamie Gritton gotchildmax = 1; 568b97457e2SJamie Gritton 5690304c731SJamie Gritton error = vfs_copyopt(opts, "enforce_statfs", &enforce, sizeof(enforce)); 570f337198dSJamie Gritton if (error == ENOENT) 571f337198dSJamie Gritton gotenforce = 0; 572f337198dSJamie Gritton else if (error != 0) 5730304c731SJamie Gritton goto done_free; 574f337198dSJamie Gritton else if (enforce < 0 || enforce > 2) { 575f337198dSJamie Gritton error = EINVAL; 576f337198dSJamie Gritton goto done_free; 577f337198dSJamie Gritton } else 578f337198dSJamie Gritton gotenforce = 1; 5790304c731SJamie Gritton 5800cc207a6SMartin Matuska error = vfs_copyopt(opts, "devfs_ruleset", &rsnum, sizeof(rsnum)); 5810cc207a6SMartin Matuska if (error == ENOENT) 5820cc207a6SMartin Matuska gotrsnum = 0; 5830cc207a6SMartin Matuska else if (error != 0) 5840cc207a6SMartin Matuska goto done_free; 5850cc207a6SMartin Matuska else 5860cc207a6SMartin Matuska gotrsnum = 1; 5870cc207a6SMartin Matuska 588b38ff370SJamie Gritton pr_flags = ch_flags = 0; 589672756aaSJamie Gritton for (bf = pr_flag_bool; 590672756aaSJamie Gritton bf < pr_flag_bool + nitems(pr_flag_bool); 591672756aaSJamie Gritton bf++) { 592672756aaSJamie Gritton vfs_flagopt(opts, bf->name, &pr_flags, bf->flag); 593672756aaSJamie Gritton vfs_flagopt(opts, bf->noname, &ch_flags, bf->flag); 5940304c731SJamie Gritton } 595b38ff370SJamie Gritton ch_flags |= pr_flags; 596672756aaSJamie Gritton for (jsf = pr_flag_jailsys; 597672756aaSJamie Gritton jsf < pr_flag_jailsys + nitems(pr_flag_jailsys); 598672756aaSJamie Gritton jsf++) { 599672756aaSJamie Gritton error = vfs_copyopt(opts, jsf->name, &jsys, sizeof(jsys)); 6007cbf7213SJamie Gritton if (error == ENOENT) 6017cbf7213SJamie Gritton continue; 6027cbf7213SJamie Gritton if (error != 0) 
6037cbf7213SJamie Gritton goto done_free; 6047cbf7213SJamie Gritton switch (jsys) { 6057cbf7213SJamie Gritton case JAIL_SYS_DISABLE: 606672756aaSJamie Gritton if (!jsf->disable) { 6077cbf7213SJamie Gritton error = EINVAL; 6087cbf7213SJamie Gritton goto done_free; 6097cbf7213SJamie Gritton } 610672756aaSJamie Gritton pr_flags |= jsf->disable; 6117cbf7213SJamie Gritton break; 6127cbf7213SJamie Gritton case JAIL_SYS_NEW: 613672756aaSJamie Gritton pr_flags |= jsf->new; 6147cbf7213SJamie Gritton break; 6157cbf7213SJamie Gritton case JAIL_SYS_INHERIT: 6167cbf7213SJamie Gritton break; 6177cbf7213SJamie Gritton default: 6187cbf7213SJamie Gritton error = EINVAL; 6197cbf7213SJamie Gritton goto done_free; 6207cbf7213SJamie Gritton } 621672756aaSJamie Gritton ch_flags |= jsf->new | jsf->disable; 6227cbf7213SJamie Gritton } 6234affa14cSJamie Gritton if ((flags & (JAIL_CREATE | JAIL_UPDATE | JAIL_ATTACH)) == JAIL_CREATE 6244affa14cSJamie Gritton && !(pr_flags & PR_PERSIST)) { 6254affa14cSJamie Gritton error = EINVAL; 6264affa14cSJamie Gritton vfs_opterror(opts, "new jail must persist or attach"); 6274affa14cSJamie Gritton goto done_errmsg; 6284affa14cSJamie Gritton } 629679e1390SJamie Gritton #ifdef VIMAGE 630679e1390SJamie Gritton if ((flags & JAIL_UPDATE) && (ch_flags & PR_VNET)) { 631679e1390SJamie Gritton error = EINVAL; 632679e1390SJamie Gritton vfs_opterror(opts, "vnet cannot be changed after creation"); 633679e1390SJamie Gritton goto done_errmsg; 634679e1390SJamie Gritton } 635679e1390SJamie Gritton #endif 6362b0d6f81SJamie Gritton #ifdef INET 6372b0d6f81SJamie Gritton if ((flags & JAIL_UPDATE) && (ch_flags & PR_IP4_USER)) { 6382b0d6f81SJamie Gritton error = EINVAL; 6392b0d6f81SJamie Gritton vfs_opterror(opts, "ip4 cannot be changed after creation"); 6402b0d6f81SJamie Gritton goto done_errmsg; 6412b0d6f81SJamie Gritton } 6422b0d6f81SJamie Gritton #endif 6432b0d6f81SJamie Gritton #ifdef INET6 6442b0d6f81SJamie Gritton if ((flags & JAIL_UPDATE) && (ch_flags & PR_IP6_USER)) 
{ 6452b0d6f81SJamie Gritton error = EINVAL; 6462b0d6f81SJamie Gritton vfs_opterror(opts, "ip6 cannot be changed after creation"); 6472b0d6f81SJamie Gritton goto done_errmsg; 6482b0d6f81SJamie Gritton } 6492b0d6f81SJamie Gritton #endif 650b38ff370SJamie Gritton 6510304c731SJamie Gritton pr_allow = ch_allow = 0; 652672756aaSJamie Gritton for (bf = pr_flag_allow; 6530e5c6bd4SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && bf->flag != 0; 654672756aaSJamie Gritton bf++) { 655672756aaSJamie Gritton vfs_flagopt(opts, bf->name, &pr_allow, bf->flag); 656672756aaSJamie Gritton vfs_flagopt(opts, bf->noname, &ch_allow, bf->flag); 6570304c731SJamie Gritton } 6580304c731SJamie Gritton ch_allow |= pr_allow; 6590304c731SJamie Gritton 660b38ff370SJamie Gritton error = vfs_getopt(opts, "name", (void **)&name, &len); 661b38ff370SJamie Gritton if (error == ENOENT) 662b38ff370SJamie Gritton name = NULL; 663b38ff370SJamie Gritton else if (error != 0) 664b38ff370SJamie Gritton goto done_free; 665b38ff370SJamie Gritton else { 666b38ff370SJamie Gritton if (len == 0 || name[len - 1] != '\0') { 667b38ff370SJamie Gritton error = EINVAL; 668b38ff370SJamie Gritton goto done_free; 669b38ff370SJamie Gritton } 670b38ff370SJamie Gritton if (len > MAXHOSTNAMELEN) { 671b38ff370SJamie Gritton error = ENAMETOOLONG; 672b38ff370SJamie Gritton goto done_free; 673b38ff370SJamie Gritton } 674b38ff370SJamie Gritton } 675b38ff370SJamie Gritton 676b38ff370SJamie Gritton error = vfs_getopt(opts, "host.hostname", (void **)&host, &len); 677b38ff370SJamie Gritton if (error == ENOENT) 678b38ff370SJamie Gritton host = NULL; 679b38ff370SJamie Gritton else if (error != 0) 680b38ff370SJamie Gritton goto done_free; 681b38ff370SJamie Gritton else { 68276ca6f88SJamie Gritton ch_flags |= PR_HOST; 68376ca6f88SJamie Gritton pr_flags |= PR_HOST; 684b38ff370SJamie Gritton if (len == 0 || host[len - 1] != '\0') { 685b38ff370SJamie Gritton error = EINVAL; 686b38ff370SJamie Gritton goto done_free; 687b38ff370SJamie 
Gritton } 688b38ff370SJamie Gritton if (len > MAXHOSTNAMELEN) { 689b38ff370SJamie Gritton error = ENAMETOOLONG; 690b38ff370SJamie Gritton goto done_free; 691b38ff370SJamie Gritton } 692b38ff370SJamie Gritton } 693b38ff370SJamie Gritton 69476ca6f88SJamie Gritton error = vfs_getopt(opts, "host.domainname", (void **)&domain, &len); 69576ca6f88SJamie Gritton if (error == ENOENT) 69676ca6f88SJamie Gritton domain = NULL; 69776ca6f88SJamie Gritton else if (error != 0) 69876ca6f88SJamie Gritton goto done_free; 69976ca6f88SJamie Gritton else { 70076ca6f88SJamie Gritton ch_flags |= PR_HOST; 70176ca6f88SJamie Gritton pr_flags |= PR_HOST; 70276ca6f88SJamie Gritton if (len == 0 || domain[len - 1] != '\0') { 70376ca6f88SJamie Gritton error = EINVAL; 70476ca6f88SJamie Gritton goto done_free; 70576ca6f88SJamie Gritton } 70676ca6f88SJamie Gritton if (len > MAXHOSTNAMELEN) { 70776ca6f88SJamie Gritton error = ENAMETOOLONG; 70876ca6f88SJamie Gritton goto done_free; 70976ca6f88SJamie Gritton } 71076ca6f88SJamie Gritton } 71176ca6f88SJamie Gritton 71276ca6f88SJamie Gritton error = vfs_getopt(opts, "host.hostuuid", (void **)&uuid, &len); 71376ca6f88SJamie Gritton if (error == ENOENT) 71476ca6f88SJamie Gritton uuid = NULL; 71576ca6f88SJamie Gritton else if (error != 0) 71676ca6f88SJamie Gritton goto done_free; 71776ca6f88SJamie Gritton else { 71876ca6f88SJamie Gritton ch_flags |= PR_HOST; 71976ca6f88SJamie Gritton pr_flags |= PR_HOST; 72076ca6f88SJamie Gritton if (len == 0 || uuid[len - 1] != '\0') { 72176ca6f88SJamie Gritton error = EINVAL; 72276ca6f88SJamie Gritton goto done_free; 72376ca6f88SJamie Gritton } 72476ca6f88SJamie Gritton if (len > HOSTUUIDLEN) { 72576ca6f88SJamie Gritton error = ENAMETOOLONG; 72676ca6f88SJamie Gritton goto done_free; 72776ca6f88SJamie Gritton } 72876ca6f88SJamie Gritton } 72976ca6f88SJamie Gritton 730841c0c7eSNathan Whitehorn #ifdef COMPAT_FREEBSD32 731a5c1afadSDmitry Chagin if (SV_PROC_FLAG(td->td_proc, SV_ILP32)) { 73276ca6f88SJamie Gritton uint32_t 
hid32; 73376ca6f88SJamie Gritton 73476ca6f88SJamie Gritton error = vfs_copyopt(opts, "host.hostid", &hid32, sizeof(hid32)); 73576ca6f88SJamie Gritton hid = hid32; 73676ca6f88SJamie Gritton } else 73776ca6f88SJamie Gritton #endif 73876ca6f88SJamie Gritton error = vfs_copyopt(opts, "host.hostid", &hid, sizeof(hid)); 73976ca6f88SJamie Gritton if (error == ENOENT) 74076ca6f88SJamie Gritton gothid = 0; 74176ca6f88SJamie Gritton else if (error != 0) 74276ca6f88SJamie Gritton goto done_free; 74376ca6f88SJamie Gritton else { 74476ca6f88SJamie Gritton gothid = 1; 74576ca6f88SJamie Gritton ch_flags |= PR_HOST; 74676ca6f88SJamie Gritton pr_flags |= PR_HOST; 74776ca6f88SJamie Gritton } 74876ca6f88SJamie Gritton 749b38ff370SJamie Gritton #ifdef INET 750b38ff370SJamie Gritton error = vfs_getopt(opts, "ip4.addr", &op, &ip4s); 751b38ff370SJamie Gritton if (error == ENOENT) 7520e5e396eSJamie Gritton ip4s = 0; 753b38ff370SJamie Gritton else if (error != 0) 754b38ff370SJamie Gritton goto done_free; 755b38ff370SJamie Gritton else if (ip4s & (sizeof(*ip4) - 1)) { 756b38ff370SJamie Gritton error = EINVAL; 757b38ff370SJamie Gritton goto done_free; 7580304c731SJamie Gritton } else { 7596a3f2779SJamie Gritton ch_flags |= PR_IP4_USER; 7606a3f2779SJamie Gritton pr_flags |= PR_IP4_USER; 7616a3f2779SJamie Gritton if (ip4s > 0) { 762b38ff370SJamie Gritton ip4s /= sizeof(*ip4); 763b38ff370SJamie Gritton if (ip4s > jail_max_af_ips) { 764b38ff370SJamie Gritton error = EINVAL; 765b38ff370SJamie Gritton vfs_opterror(opts, "too many IPv4 addresses"); 766b38ff370SJamie Gritton goto done_errmsg; 767b38ff370SJamie Gritton } 7682b0d6f81SJamie Gritton ip4 = malloc(ip4s * sizeof(*ip4), M_PRISON, M_WAITOK); 769b38ff370SJamie Gritton bcopy(op, ip4, ip4s * sizeof(*ip4)); 770b38ff370SJamie Gritton /* 7710304c731SJamie Gritton * IP addresses are all sorted but ip[0] to preserve 7720304c731SJamie Gritton * the primary IP address as given from userland. 
7730304c731SJamie Gritton * This special IP is used for unbound outgoing 774bef916f9SBjoern A. Zeeb * connections as well for "loopback" traffic in case 775bef916f9SBjoern A. Zeeb * source address selection cannot find any more fitting 776bef916f9SBjoern A. Zeeb * address to connect from. 777b38ff370SJamie Gritton */ 778b38ff370SJamie Gritton if (ip4s > 1) 7790ce1624dSStephen J. Kiernan qsort(ip4 + 1, ip4s - 1, sizeof(*ip4), 7800ce1624dSStephen J. Kiernan prison_qcmp_v4); 781b38ff370SJamie Gritton /* 7820304c731SJamie Gritton * Check for duplicate addresses and do some simple 7830304c731SJamie Gritton * zero and broadcast checks. If users give other bogus 7840304c731SJamie Gritton * addresses it is their problem. 785b38ff370SJamie Gritton * 7860304c731SJamie Gritton * We do not have to care about byte order for these 7870304c731SJamie Gritton * checks so we will do them in NBO. 788b38ff370SJamie Gritton */ 789b38ff370SJamie Gritton for (ii = 0; ii < ip4s; ii++) { 790b38ff370SJamie Gritton if (ip4[ii].s_addr == INADDR_ANY || 791b38ff370SJamie Gritton ip4[ii].s_addr == INADDR_BROADCAST) { 792b38ff370SJamie Gritton error = EINVAL; 793b38ff370SJamie Gritton goto done_free; 794b38ff370SJamie Gritton } 795b38ff370SJamie Gritton if ((ii+1) < ip4s && 796b38ff370SJamie Gritton (ip4[0].s_addr == ip4[ii+1].s_addr || 797b38ff370SJamie Gritton ip4[ii].s_addr == ip4[ii+1].s_addr)) { 798b38ff370SJamie Gritton error = EINVAL; 799b38ff370SJamie Gritton goto done_free; 800b38ff370SJamie Gritton } 801b38ff370SJamie Gritton } 802b38ff370SJamie Gritton } 8030304c731SJamie Gritton } 804b38ff370SJamie Gritton #endif 805b38ff370SJamie Gritton 806b38ff370SJamie Gritton #ifdef INET6 807b38ff370SJamie Gritton error = vfs_getopt(opts, "ip6.addr", &op, &ip6s); 808b38ff370SJamie Gritton if (error == ENOENT) 8090e5e396eSJamie Gritton ip6s = 0; 810b38ff370SJamie Gritton else if (error != 0) 811b38ff370SJamie Gritton goto done_free; 812b38ff370SJamie Gritton else if (ip6s & (sizeof(*ip6) - 1)) { 
813b38ff370SJamie Gritton error = EINVAL; 814b38ff370SJamie Gritton goto done_free; 8150304c731SJamie Gritton } else { 8166a3f2779SJamie Gritton ch_flags |= PR_IP6_USER; 8176a3f2779SJamie Gritton pr_flags |= PR_IP6_USER; 8186a3f2779SJamie Gritton if (ip6s > 0) { 819b38ff370SJamie Gritton ip6s /= sizeof(*ip6); 820b38ff370SJamie Gritton if (ip6s > jail_max_af_ips) { 821b38ff370SJamie Gritton error = EINVAL; 822b38ff370SJamie Gritton vfs_opterror(opts, "too many IPv6 addresses"); 823b38ff370SJamie Gritton goto done_errmsg; 824b38ff370SJamie Gritton } 8252b0d6f81SJamie Gritton ip6 = malloc(ip6s * sizeof(*ip6), M_PRISON, M_WAITOK); 826b38ff370SJamie Gritton bcopy(op, ip6, ip6s * sizeof(*ip6)); 827b38ff370SJamie Gritton if (ip6s > 1) 8280ce1624dSStephen J. Kiernan qsort(ip6 + 1, ip6s - 1, sizeof(*ip6), 8290ce1624dSStephen J. Kiernan prison_qcmp_v6); 830b38ff370SJamie Gritton for (ii = 0; ii < ip6s; ii++) { 8310304c731SJamie Gritton if (IN6_IS_ADDR_UNSPECIFIED(&ip6[ii])) { 832b38ff370SJamie Gritton error = EINVAL; 833b38ff370SJamie Gritton goto done_free; 834b38ff370SJamie Gritton } 835b38ff370SJamie Gritton if ((ii+1) < ip6s && 836b38ff370SJamie Gritton (IN6_ARE_ADDR_EQUAL(&ip6[0], &ip6[ii+1]) || 837b38ff370SJamie Gritton IN6_ARE_ADDR_EQUAL(&ip6[ii], &ip6[ii+1]))) 838b38ff370SJamie Gritton { 839b38ff370SJamie Gritton error = EINVAL; 840b38ff370SJamie Gritton goto done_free; 841b38ff370SJamie Gritton } 842b38ff370SJamie Gritton } 843b38ff370SJamie Gritton } 8440304c731SJamie Gritton } 845b38ff370SJamie Gritton #endif 846b38ff370SJamie Gritton 847bdfc8cc4SJamie Gritton #if defined(VIMAGE) && (defined(INET) || defined(INET6)) 848bdfc8cc4SJamie Gritton if ((ch_flags & PR_VNET) && (ch_flags & (PR_IP4_USER | PR_IP6_USER))) { 849bdfc8cc4SJamie Gritton error = EINVAL; 850bdfc8cc4SJamie Gritton vfs_opterror(opts, 851bdfc8cc4SJamie Gritton "vnet jails cannot have IP address restrictions"); 852bdfc8cc4SJamie Gritton goto done_errmsg; 853bdfc8cc4SJamie Gritton } 854bdfc8cc4SJamie 
Gritton #endif 855bdfc8cc4SJamie Gritton 856cf0313c6SJamie Gritton error = vfs_getopt(opts, "osrelease", (void **)&osrelstr, &len); 857cf0313c6SJamie Gritton if (error == ENOENT) 858cf0313c6SJamie Gritton osrelstr = NULL; 859cf0313c6SJamie Gritton else if (error != 0) 860cf0313c6SJamie Gritton goto done_free; 861cf0313c6SJamie Gritton else { 862cf0313c6SJamie Gritton if (flags & JAIL_UPDATE) { 863cf0313c6SJamie Gritton error = EINVAL; 864cf0313c6SJamie Gritton vfs_opterror(opts, 865cf0313c6SJamie Gritton "osrelease cannot be changed after creation"); 866cf0313c6SJamie Gritton goto done_errmsg; 867cf0313c6SJamie Gritton } 868*1b786d01SBjoern A. Zeeb if (len == 0 || osrelstr[len - 1] != '\0') { 869cf0313c6SJamie Gritton error = EINVAL; 870*1b786d01SBjoern A. Zeeb goto done_free; 871*1b786d01SBjoern A. Zeeb } 872*1b786d01SBjoern A. Zeeb if (len >= OSRELEASELEN) { 873*1b786d01SBjoern A. Zeeb error = ENAMETOOLONG; 874cf0313c6SJamie Gritton vfs_opterror(opts, 875cf0313c6SJamie Gritton "osrelease string must be 1-%d bytes long", 876cf0313c6SJamie Gritton OSRELEASELEN - 1); 877cf0313c6SJamie Gritton goto done_errmsg; 878cf0313c6SJamie Gritton } 879cf0313c6SJamie Gritton } 880cf0313c6SJamie Gritton 881cf0313c6SJamie Gritton error = vfs_copyopt(opts, "osreldate", &osreldt, sizeof(osreldt)); 882cf0313c6SJamie Gritton if (error == ENOENT) 883cf0313c6SJamie Gritton osreldt = 0; 884cf0313c6SJamie Gritton else if (error != 0) 885cf0313c6SJamie Gritton goto done_free; 886cf0313c6SJamie Gritton else { 887cf0313c6SJamie Gritton if (flags & JAIL_UPDATE) { 888cf0313c6SJamie Gritton error = EINVAL; 889cf0313c6SJamie Gritton vfs_opterror(opts, 890cf0313c6SJamie Gritton "osreldate cannot be changed after creation"); 891cf0313c6SJamie Gritton goto done_errmsg; 892cf0313c6SJamie Gritton } 893cf0313c6SJamie Gritton if (osreldt == 0) { 894cf0313c6SJamie Gritton error = EINVAL; 895cf0313c6SJamie Gritton vfs_opterror(opts, "osreldate cannot be 0"); 896cf0313c6SJamie Gritton goto done_errmsg; 
897cf0313c6SJamie Gritton } 898cf0313c6SJamie Gritton } 899cf0313c6SJamie Gritton 900b38ff370SJamie Gritton root = NULL; 901b38ff370SJamie Gritton error = vfs_getopt(opts, "path", (void **)&path, &len); 902b38ff370SJamie Gritton if (error == ENOENT) 903b38ff370SJamie Gritton path = NULL; 904b38ff370SJamie Gritton else if (error != 0) 905b38ff370SJamie Gritton goto done_free; 906b38ff370SJamie Gritton else { 907b38ff370SJamie Gritton if (flags & JAIL_UPDATE) { 908b38ff370SJamie Gritton error = EINVAL; 909b38ff370SJamie Gritton vfs_opterror(opts, 910b38ff370SJamie Gritton "path cannot be changed after creation"); 911b38ff370SJamie Gritton goto done_errmsg; 912b38ff370SJamie Gritton } 913b38ff370SJamie Gritton if (len == 0 || path[len - 1] != '\0') { 914b38ff370SJamie Gritton error = EINVAL; 915b38ff370SJamie Gritton goto done_free; 916b38ff370SJamie Gritton } 9175050aa86SKonstantin Belousov NDINIT(&nd, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, 918b38ff370SJamie Gritton path, td); 919b38ff370SJamie Gritton error = namei(&nd); 920b38ff370SJamie Gritton if (error) 921b38ff370SJamie Gritton goto done_free; 922b38ff370SJamie Gritton root = nd.ni_vp; 923b38ff370SJamie Gritton NDFREE(&nd, NDF_ONLY_PNBUF); 9246dfe0a3dSMartin Matuska g_path = malloc(MAXPATHLEN, M_TEMP, M_WAITOK); 9256dfe0a3dSMartin Matuska strlcpy(g_path, path, MAXPATHLEN); 9266dfe0a3dSMartin Matuska error = vn_path_to_global_path(td, root, g_path, MAXPATHLEN); 9273eb6b656SMateusz Guzik if (error == 0) { 9286dfe0a3dSMartin Matuska path = g_path; 9296dfe0a3dSMartin Matuska } else { 930f6e633a9SMartin Matuska /* exit on other errors */ 931b38ff370SJamie Gritton goto done_free; 932b38ff370SJamie Gritton } 933f6e633a9SMartin Matuska if (root->v_type != VDIR) { 934f6e633a9SMartin Matuska error = ENOTDIR; 935f6e633a9SMartin Matuska vput(root); 936f6e633a9SMartin Matuska goto done_free; 937f6e633a9SMartin Matuska } 938b249ce48SMateusz Guzik VOP_UNLOCK(root); 939b38ff370SJamie Gritton } 940b38ff370SJamie Gritton 
941b38ff370SJamie Gritton /* 942b6f47c23SJamie Gritton * Find the specified jail, or at least its parent. 943b38ff370SJamie Gritton * This abuses the file error codes ENOENT and EEXIST. 944b38ff370SJamie Gritton */ 945b38ff370SJamie Gritton pr = NULL; 946b6f47c23SJamie Gritton ppr = mypr; 947babbbb9cSJamie Gritton if (cuflags == JAIL_CREATE && jid == 0 && name != NULL) { 948babbbb9cSJamie Gritton namelc = strrchr(name, '.'); 949babbbb9cSJamie Gritton jid = strtoul(namelc != NULL ? namelc + 1 : name, &p, 10); 950babbbb9cSJamie Gritton if (*p != '\0') 951babbbb9cSJamie Gritton jid = 0; 952babbbb9cSJamie Gritton } 953b6f47c23SJamie Gritton sx_xlock(&allprison_lock); 954b38ff370SJamie Gritton if (jid != 0) { 9550304c731SJamie Gritton /* 9560304c731SJamie Gritton * See if a requested jid already exists. There is an 9570304c731SJamie Gritton * information leak here if the jid exists but is not within 9580304c731SJamie Gritton * the caller's jail hierarchy. Jail creators will get EEXIST 9590304c731SJamie Gritton * even though they cannot see the jail, and CREATE | UPDATE 9600304c731SJamie Gritton * will return ENOENT which is not normally a valid error. 9610304c731SJamie Gritton */ 962b38ff370SJamie Gritton if (jid < 0) { 963b38ff370SJamie Gritton error = EINVAL; 964b38ff370SJamie Gritton vfs_opterror(opts, "negative jid"); 965b38ff370SJamie Gritton goto done_unlock_list; 966b38ff370SJamie Gritton } 967b38ff370SJamie Gritton pr = prison_find(jid); 968b38ff370SJamie Gritton if (pr != NULL) { 9690304c731SJamie Gritton ppr = pr->pr_parent; 970b38ff370SJamie Gritton /* Create: jid must not exist. 
*/ 971b38ff370SJamie Gritton if (cuflags == JAIL_CREATE) { 972b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 973b38ff370SJamie Gritton error = EEXIST; 974b38ff370SJamie Gritton vfs_opterror(opts, "jail %d already exists", 975b38ff370SJamie Gritton jid); 976b38ff370SJamie Gritton goto done_unlock_list; 977b38ff370SJamie Gritton } 9780304c731SJamie Gritton if (!prison_ischild(mypr, pr)) { 9790304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 9800304c731SJamie Gritton pr = NULL; 9810304c731SJamie Gritton } else if (pr->pr_uref == 0) { 982b38ff370SJamie Gritton if (!(flags & JAIL_DYING)) { 983b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 984b38ff370SJamie Gritton error = ENOENT; 985b38ff370SJamie Gritton vfs_opterror(opts, "jail %d is dying", 986b38ff370SJamie Gritton jid); 987b38ff370SJamie Gritton goto done_unlock_list; 988b38ff370SJamie Gritton } else if ((flags & JAIL_ATTACH) || 989b38ff370SJamie Gritton (pr_flags & PR_PERSIST)) { 990b38ff370SJamie Gritton /* 991b38ff370SJamie Gritton * A dying jail might be resurrected 992b38ff370SJamie Gritton * (via attach or persist), but first 993b38ff370SJamie Gritton * it must determine if another jail 994b38ff370SJamie Gritton * has claimed its name. Accomplish 995b38ff370SJamie Gritton * this by implicitly re-setting the 996b38ff370SJamie Gritton * name. 997b38ff370SJamie Gritton */ 998b38ff370SJamie Gritton if (name == NULL) 9990304c731SJamie Gritton name = prison_name(mypr, pr); 1000b38ff370SJamie Gritton } 1001b38ff370SJamie Gritton } 1002b38ff370SJamie Gritton } 1003b38ff370SJamie Gritton if (pr == NULL) { 1004b38ff370SJamie Gritton /* Update: jid must exist. 
*/ 1005b38ff370SJamie Gritton if (cuflags == JAIL_UPDATE) { 1006b38ff370SJamie Gritton error = ENOENT; 1007b38ff370SJamie Gritton vfs_opterror(opts, "jail %d not found", jid); 1008b38ff370SJamie Gritton goto done_unlock_list; 1009b38ff370SJamie Gritton } 1010b38ff370SJamie Gritton } 1011b38ff370SJamie Gritton } 1012b38ff370SJamie Gritton /* 1013b38ff370SJamie Gritton * If the caller provided a name, look for a jail by that name. 1014b38ff370SJamie Gritton * This has different semantics for creates and updates keyed by jid 1015b38ff370SJamie Gritton * (where the name must not already exist in a different jail), 1016b38ff370SJamie Gritton * and updates keyed by the name itself (where the name must exist 1017b38ff370SJamie Gritton * because that is the jail being updated). 1018b38ff370SJamie Gritton */ 1019b6f47c23SJamie Gritton namelc = NULL; 1020b38ff370SJamie Gritton if (name != NULL) { 1021babbbb9cSJamie Gritton namelc = strrchr(name, '.'); 1022babbbb9cSJamie Gritton if (namelc == NULL) 1023babbbb9cSJamie Gritton namelc = name; 1024babbbb9cSJamie Gritton else { 10250304c731SJamie Gritton /* 10260304c731SJamie Gritton * This is a hierarchical name. Split it into the 10270304c731SJamie Gritton * parent and child names, and make sure the parent 10280304c731SJamie Gritton * exists or matches an already found jail. 
10290304c731SJamie Gritton */ 10300304c731SJamie Gritton if (pr != NULL) { 1031babbbb9cSJamie Gritton if (strncmp(name, ppr->pr_name, namelc - name) 1032babbbb9cSJamie Gritton || ppr->pr_name[namelc - name] != '\0') { 10330304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 10340304c731SJamie Gritton error = EINVAL; 10350304c731SJamie Gritton vfs_opterror(opts, 10360304c731SJamie Gritton "cannot change jail's parent"); 10370304c731SJamie Gritton goto done_unlock_list; 10380304c731SJamie Gritton } 10390304c731SJamie Gritton } else { 1040b6f47c23SJamie Gritton *namelc = '\0'; 10410304c731SJamie Gritton ppr = prison_find_name(mypr, name); 10420304c731SJamie Gritton if (ppr == NULL) { 10430304c731SJamie Gritton error = ENOENT; 10440304c731SJamie Gritton vfs_opterror(opts, 10450304c731SJamie Gritton "jail \"%s\" not found", name); 10460304c731SJamie Gritton goto done_unlock_list; 10470304c731SJamie Gritton } 10480304c731SJamie Gritton mtx_unlock(&ppr->pr_mtx); 1049b6f47c23SJamie Gritton *namelc = '.'; 10500304c731SJamie Gritton } 1051b6f47c23SJamie Gritton namelc++; 10520304c731SJamie Gritton } 1053b6f47c23SJamie Gritton if (namelc[0] != '\0') { 1054b6f47c23SJamie Gritton pnamelen = 10550304c731SJamie Gritton (ppr == &prison0) ? 0 : strlen(ppr->pr_name) + 1; 1056b38ff370SJamie Gritton name_again: 10570304c731SJamie Gritton deadpr = NULL; 10580304c731SJamie Gritton FOREACH_PRISON_CHILD(ppr, tpr) { 1059b38ff370SJamie Gritton if (tpr != pr && tpr->pr_ref > 0 && 1060b6f47c23SJamie Gritton !strcmp(tpr->pr_name + pnamelen, namelc)) { 1061b38ff370SJamie Gritton if (pr == NULL && 1062b38ff370SJamie Gritton cuflags != JAIL_CREATE) { 1063b38ff370SJamie Gritton mtx_lock(&tpr->pr_mtx); 1064b38ff370SJamie Gritton if (tpr->pr_ref > 0) { 1065b38ff370SJamie Gritton /* 1066b38ff370SJamie Gritton * Use this jail 1067b38ff370SJamie Gritton * for updates. 
1068b38ff370SJamie Gritton */ 1069b38ff370SJamie Gritton if (tpr->pr_uref > 0) { 1070b38ff370SJamie Gritton pr = tpr; 1071b38ff370SJamie Gritton break; 1072b38ff370SJamie Gritton } 1073b38ff370SJamie Gritton deadpr = tpr; 1074b38ff370SJamie Gritton } 1075b38ff370SJamie Gritton mtx_unlock(&tpr->pr_mtx); 1076b38ff370SJamie Gritton } else if (tpr->pr_uref > 0) { 1077b38ff370SJamie Gritton /* 1078b38ff370SJamie Gritton * Create, or update(jid): 1079b38ff370SJamie Gritton * name must not exist in an 10800304c731SJamie Gritton * active sibling jail. 1081b38ff370SJamie Gritton */ 1082b38ff370SJamie Gritton error = EEXIST; 1083b38ff370SJamie Gritton if (pr != NULL) 1084b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 1085b38ff370SJamie Gritton vfs_opterror(opts, 1086b38ff370SJamie Gritton "jail \"%s\" already exists", 1087b38ff370SJamie Gritton name); 1088b38ff370SJamie Gritton goto done_unlock_list; 1089b38ff370SJamie Gritton } 1090b38ff370SJamie Gritton } 1091b38ff370SJamie Gritton } 1092b38ff370SJamie Gritton /* If no active jail is found, use a dying one. */ 1093b38ff370SJamie Gritton if (deadpr != NULL && pr == NULL) { 1094b38ff370SJamie Gritton if (flags & JAIL_DYING) { 1095b38ff370SJamie Gritton mtx_lock(&deadpr->pr_mtx); 1096b38ff370SJamie Gritton if (deadpr->pr_ref == 0) { 1097b38ff370SJamie Gritton mtx_unlock(&deadpr->pr_mtx); 1098b38ff370SJamie Gritton goto name_again; 1099b38ff370SJamie Gritton } 1100b38ff370SJamie Gritton pr = deadpr; 1101b38ff370SJamie Gritton } else if (cuflags == JAIL_UPDATE) { 1102b38ff370SJamie Gritton error = ENOENT; 1103b38ff370SJamie Gritton vfs_opterror(opts, 1104b38ff370SJamie Gritton "jail \"%s\" is dying", name); 1105b38ff370SJamie Gritton goto done_unlock_list; 1106b38ff370SJamie Gritton } 1107b38ff370SJamie Gritton } 1108b38ff370SJamie Gritton /* Update: name must exist if no jid. 
*/ 1109b38ff370SJamie Gritton else if (cuflags == JAIL_UPDATE && pr == NULL) { 1110b38ff370SJamie Gritton error = ENOENT; 1111b38ff370SJamie Gritton vfs_opterror(opts, "jail \"%s\" not found", 1112b38ff370SJamie Gritton name); 1113b38ff370SJamie Gritton goto done_unlock_list; 1114b38ff370SJamie Gritton } 1115b38ff370SJamie Gritton } 1116b38ff370SJamie Gritton } 1117b38ff370SJamie Gritton /* Update: must provide a jid or name. */ 1118b38ff370SJamie Gritton else if (cuflags == JAIL_UPDATE && pr == NULL) { 1119b38ff370SJamie Gritton error = ENOENT; 1120b38ff370SJamie Gritton vfs_opterror(opts, "update specified no jail"); 1121b38ff370SJamie Gritton goto done_unlock_list; 1122b38ff370SJamie Gritton } 1123b38ff370SJamie Gritton 1124b38ff370SJamie Gritton /* If there's no prison to update, create a new one and link it in. */ 1125b38ff370SJamie Gritton if (pr == NULL) { 1126b97457e2SJamie Gritton for (tpr = mypr; tpr != NULL; tpr = tpr->pr_parent) 1127b97457e2SJamie Gritton if (tpr->pr_childcount >= tpr->pr_childmax) { 1128b97457e2SJamie Gritton error = EPERM; 1129b97457e2SJamie Gritton vfs_opterror(opts, "prison limit exceeded"); 1130b97457e2SJamie Gritton goto done_unlock_list; 1131b97457e2SJamie Gritton } 1132b38ff370SJamie Gritton created = 1; 11330304c731SJamie Gritton mtx_lock(&ppr->pr_mtx); 11342a549507SJamie Gritton if (ppr->pr_ref == 0) { 11350304c731SJamie Gritton mtx_unlock(&ppr->pr_mtx); 11360304c731SJamie Gritton error = ENOENT; 1137b6f47c23SJamie Gritton vfs_opterror(opts, "jail \"%s\" not found", 1138b6f47c23SJamie Gritton prison_name(mypr, ppr)); 11390304c731SJamie Gritton goto done_unlock_list; 11400304c731SJamie Gritton } 11410304c731SJamie Gritton ppr->pr_ref++; 11420304c731SJamie Gritton ppr->pr_uref++; 11430304c731SJamie Gritton mtx_unlock(&ppr->pr_mtx); 1144b38ff370SJamie Gritton pr = malloc(sizeof(*pr), M_PRISON, M_WAITOK | M_ZERO); 1145b38ff370SJamie Gritton if (jid == 0) { 1146b38ff370SJamie Gritton /* Find the next free jid. 
*/ 1147b38ff370SJamie Gritton jid = lastprid + 1; 1148b38ff370SJamie Gritton findnext: 1149b38ff370SJamie Gritton if (jid == JAIL_MAX) 1150b38ff370SJamie Gritton jid = 1; 1151b38ff370SJamie Gritton TAILQ_FOREACH(tpr, &allprison, pr_list) { 1152b38ff370SJamie Gritton if (tpr->pr_id < jid) 1153b38ff370SJamie Gritton continue; 1154b38ff370SJamie Gritton if (tpr->pr_id > jid || tpr->pr_ref == 0) { 1155b38ff370SJamie Gritton TAILQ_INSERT_BEFORE(tpr, pr, pr_list); 1156b38ff370SJamie Gritton break; 1157b38ff370SJamie Gritton } 1158b38ff370SJamie Gritton if (jid == lastprid) { 1159b38ff370SJamie Gritton error = EAGAIN; 1160b38ff370SJamie Gritton vfs_opterror(opts, 1161b38ff370SJamie Gritton "no available jail IDs"); 1162b38ff370SJamie Gritton free(pr, M_PRISON); 11630304c731SJamie Gritton prison_deref(ppr, PD_DEREF | 11640304c731SJamie Gritton PD_DEUREF | PD_LIST_XLOCKED); 11650304c731SJamie Gritton goto done_releroot; 1166b38ff370SJamie Gritton } 1167b38ff370SJamie Gritton jid++; 1168b38ff370SJamie Gritton goto findnext; 1169b38ff370SJamie Gritton } 1170b38ff370SJamie Gritton lastprid = jid; 1171b38ff370SJamie Gritton } else { 1172b38ff370SJamie Gritton /* 1173b38ff370SJamie Gritton * The jail already has a jid (that did not yet exist), 1174b38ff370SJamie Gritton * so just find where to insert it. 
1175b38ff370SJamie Gritton */ 1176b38ff370SJamie Gritton TAILQ_FOREACH(tpr, &allprison, pr_list) 1177b38ff370SJamie Gritton if (tpr->pr_id >= jid) { 1178b38ff370SJamie Gritton TAILQ_INSERT_BEFORE(tpr, pr, pr_list); 1179b38ff370SJamie Gritton break; 1180b38ff370SJamie Gritton } 1181b38ff370SJamie Gritton } 1182b38ff370SJamie Gritton if (tpr == NULL) 1183b38ff370SJamie Gritton TAILQ_INSERT_TAIL(&allprison, pr, pr_list); 11840304c731SJamie Gritton LIST_INSERT_HEAD(&ppr->pr_children, pr, pr_sibling); 11850304c731SJamie Gritton for (tpr = ppr; tpr != NULL; tpr = tpr->pr_parent) 1186b97457e2SJamie Gritton tpr->pr_childcount++; 1187b38ff370SJamie Gritton 11880304c731SJamie Gritton pr->pr_parent = ppr; 1189b38ff370SJamie Gritton pr->pr_id = jid; 11900304c731SJamie Gritton 11910304c731SJamie Gritton /* Set some default values, and inherit some from the parent. */ 1192b6f47c23SJamie Gritton if (namelc == NULL) 1193b6f47c23SJamie Gritton namelc = ""; 1194b38ff370SJamie Gritton if (path == NULL) { 1195b38ff370SJamie Gritton path = "/"; 11960304c731SJamie Gritton root = mypr->pr_root; 1197b38ff370SJamie Gritton vref(root); 1198b38ff370SJamie Gritton } 11998986e3a0SJamie Gritton strlcpy(pr->pr_hostuuid, DEFAULT_HOSTUUID, HOSTUUIDLEN); 12008986e3a0SJamie Gritton pr->pr_flags |= PR_HOST; 1201bdfc8cc4SJamie Gritton #if defined(INET) || defined(INET6) 1202bdfc8cc4SJamie Gritton #ifdef VIMAGE 1203bdfc8cc4SJamie Gritton if (!(pr_flags & PR_VNET)) 1204bdfc8cc4SJamie Gritton #endif 1205bdfc8cc4SJamie Gritton { 12060304c731SJamie Gritton #ifdef INET 12072b0d6f81SJamie Gritton if (!(ch_flags & PR_IP4_USER)) 12086a3f2779SJamie Gritton pr->pr_flags |= PR_IP4 | PR_IP4_USER; 12092b0d6f81SJamie Gritton else if (!(pr_flags & PR_IP4_USER)) { 12102b0d6f81SJamie Gritton pr->pr_flags |= ppr->pr_flags & PR_IP4; 12112b0d6f81SJamie Gritton if (ppr->pr_ip4 != NULL) { 12122b0d6f81SJamie Gritton pr->pr_ip4s = ppr->pr_ip4s; 12132b0d6f81SJamie Gritton pr->pr_ip4 = malloc(pr->pr_ip4s * 12142b0d6f81SJamie 
Gritton sizeof(struct in_addr), M_PRISON, 12152b0d6f81SJamie Gritton M_WAITOK); 12162b0d6f81SJamie Gritton bcopy(ppr->pr_ip4, pr->pr_ip4, 12172b0d6f81SJamie Gritton pr->pr_ip4s * sizeof(*pr->pr_ip4)); 12182b0d6f81SJamie Gritton } 12192b0d6f81SJamie Gritton } 12200304c731SJamie Gritton #endif 12210304c731SJamie Gritton #ifdef INET6 12222b0d6f81SJamie Gritton if (!(ch_flags & PR_IP6_USER)) 12236a3f2779SJamie Gritton pr->pr_flags |= PR_IP6 | PR_IP6_USER; 12242b0d6f81SJamie Gritton else if (!(pr_flags & PR_IP6_USER)) { 12252b0d6f81SJamie Gritton pr->pr_flags |= ppr->pr_flags & PR_IP6; 12262b0d6f81SJamie Gritton if (ppr->pr_ip6 != NULL) { 12272b0d6f81SJamie Gritton pr->pr_ip6s = ppr->pr_ip6s; 12282b0d6f81SJamie Gritton pr->pr_ip6 = malloc(pr->pr_ip6s * 12292b0d6f81SJamie Gritton sizeof(struct in6_addr), M_PRISON, 12302b0d6f81SJamie Gritton M_WAITOK); 12312b0d6f81SJamie Gritton bcopy(ppr->pr_ip6, pr->pr_ip6, 12322b0d6f81SJamie Gritton pr->pr_ip6s * sizeof(*pr->pr_ip6)); 12332b0d6f81SJamie Gritton } 12342b0d6f81SJamie Gritton } 12350304c731SJamie Gritton #endif 1236bdfc8cc4SJamie Gritton } 1237bdfc8cc4SJamie Gritton #endif 1238592bcae8SBjoern A. Zeeb /* Source address selection is always on by default. */ 1239592bcae8SBjoern A. Zeeb pr->pr_flags |= _PR_IP_SADDRSEL; 1240592bcae8SBjoern A. Zeeb 12410304c731SJamie Gritton pr->pr_securelevel = ppr->pr_securelevel; 12420304c731SJamie Gritton pr->pr_allow = JAIL_DEFAULT_ALLOW & ppr->pr_allow; 1243af10bf05SBjoern A. Zeeb pr->pr_enforce_statfs = jail_default_enforce_statfs; 1244bf3db8aaSMartin Matuska pr->pr_devfs_rsnum = ppr->pr_devfs_rsnum; 1245b38ff370SJamie Gritton 1246b96bd95bSIan Lepore pr->pr_osreldate = osreldt ? osreldt : ppr->pr_osreldate; 1247b96bd95bSIan Lepore if (osrelstr == NULL) 1248*1b786d01SBjoern A. Zeeb strlcpy(pr->pr_osrelease, ppr->pr_osrelease, 1249*1b786d01SBjoern A. Zeeb sizeof(pr->pr_osrelease)); 1250b96bd95bSIan Lepore else 1251*1b786d01SBjoern A. 
Zeeb strlcpy(pr->pr_osrelease, osrelstr, 1252*1b786d01SBjoern A. Zeeb sizeof(pr->pr_osrelease)); 1253b96bd95bSIan Lepore 12540304c731SJamie Gritton LIST_INIT(&pr->pr_children); 12550304c731SJamie Gritton mtx_init(&pr->pr_mtx, "jail mutex", NULL, MTX_DEF | MTX_DUPOK); 125673d9e52dSJamie Gritton TASK_INIT(&pr->pr_task, 0, prison_complete, pr); 1257b38ff370SJamie Gritton 1258679e1390SJamie Gritton #ifdef VIMAGE 1259679e1390SJamie Gritton /* Allocate a new vnet if specified. */ 1260679e1390SJamie Gritton pr->pr_vnet = (pr_flags & PR_VNET) 1261679e1390SJamie Gritton ? vnet_alloc() : ppr->pr_vnet; 1262679e1390SJamie Gritton #endif 1263b38ff370SJamie Gritton /* 1264b38ff370SJamie Gritton * Allocate a dedicated cpuset for each jail. 1265b38ff370SJamie Gritton * Unlike other initial settings, this may return an erorr. 1266b38ff370SJamie Gritton */ 12670304c731SJamie Gritton error = cpuset_create_root(ppr, &pr->pr_cpuset); 1268b38ff370SJamie Gritton if (error) { 1269b38ff370SJamie Gritton prison_deref(pr, PD_LIST_XLOCKED); 1270b38ff370SJamie Gritton goto done_releroot; 1271b38ff370SJamie Gritton } 1272b38ff370SJamie Gritton 1273b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 1274b38ff370SJamie Gritton /* 1275b38ff370SJamie Gritton * New prisons do not yet have a reference, because we do not 1276b6f47c23SJamie Gritton * want others to see the incomplete prison once the 1277b38ff370SJamie Gritton * allprison_lock is downgraded. 1278b38ff370SJamie Gritton */ 1279b38ff370SJamie Gritton } else { 1280b38ff370SJamie Gritton created = 0; 12812b0d6f81SJamie Gritton /* 12822b0d6f81SJamie Gritton * Grab a reference for existing prisons, to ensure they 12832b0d6f81SJamie Gritton * continue to exist for the duration of the call. 
12842b0d6f81SJamie Gritton */ 12852b0d6f81SJamie Gritton pr->pr_ref++; 1286bdfc8cc4SJamie Gritton #if defined(VIMAGE) && (defined(INET) || defined(INET6)) 1287bdfc8cc4SJamie Gritton if ((pr->pr_flags & PR_VNET) && 1288bdfc8cc4SJamie Gritton (ch_flags & (PR_IP4_USER | PR_IP6_USER))) { 1289bdfc8cc4SJamie Gritton error = EINVAL; 1290bdfc8cc4SJamie Gritton vfs_opterror(opts, 1291bdfc8cc4SJamie Gritton "vnet jails cannot have IP address restrictions"); 1292bdfc8cc4SJamie Gritton goto done_deref_locked; 1293bdfc8cc4SJamie Gritton } 1294bdfc8cc4SJamie Gritton #endif 12952b0d6f81SJamie Gritton #ifdef INET 12962b0d6f81SJamie Gritton if (PR_IP4_USER & ch_flags & (pr_flags ^ pr->pr_flags)) { 12972b0d6f81SJamie Gritton error = EINVAL; 12982b0d6f81SJamie Gritton vfs_opterror(opts, 12992b0d6f81SJamie Gritton "ip4 cannot be changed after creation"); 13002b0d6f81SJamie Gritton goto done_deref_locked; 13012b0d6f81SJamie Gritton } 13022b0d6f81SJamie Gritton #endif 13032b0d6f81SJamie Gritton #ifdef INET6 13042b0d6f81SJamie Gritton if (PR_IP6_USER & ch_flags & (pr_flags ^ pr->pr_flags)) { 13052b0d6f81SJamie Gritton error = EINVAL; 13062b0d6f81SJamie Gritton vfs_opterror(opts, 13072b0d6f81SJamie Gritton "ip6 cannot be changed after creation"); 13082b0d6f81SJamie Gritton goto done_deref_locked; 13092b0d6f81SJamie Gritton } 13102b0d6f81SJamie Gritton #endif 1311b38ff370SJamie Gritton } 1312b38ff370SJamie Gritton 1313b38ff370SJamie Gritton /* Do final error checking before setting anything. 
*/ 13140304c731SJamie Gritton if (gotslevel) { 13150304c731SJamie Gritton if (slevel < ppr->pr_securelevel) { 13160304c731SJamie Gritton error = EPERM; 13170304c731SJamie Gritton goto done_deref_locked; 13180304c731SJamie Gritton } 13190304c731SJamie Gritton } 1320b97457e2SJamie Gritton if (gotchildmax) { 1321b97457e2SJamie Gritton if (childmax >= ppr->pr_childmax) { 1322b97457e2SJamie Gritton error = EPERM; 1323b97457e2SJamie Gritton goto done_deref_locked; 1324b97457e2SJamie Gritton } 1325b97457e2SJamie Gritton } 13260304c731SJamie Gritton if (gotenforce) { 13270304c731SJamie Gritton if (enforce < ppr->pr_enforce_statfs) { 13280304c731SJamie Gritton error = EPERM; 13290304c731SJamie Gritton goto done_deref_locked; 13300304c731SJamie Gritton } 13310304c731SJamie Gritton } 13320cc207a6SMartin Matuska if (gotrsnum) { 13330cc207a6SMartin Matuska /* 13340cc207a6SMartin Matuska * devfs_rsnum is a uint16_t 13350cc207a6SMartin Matuska */ 1336bf3db8aaSMartin Matuska if (rsnum < 0 || rsnum > 65535) { 13370cc207a6SMartin Matuska error = EINVAL; 13380cc207a6SMartin Matuska goto done_deref_locked; 13390cc207a6SMartin Matuska } 13400cc207a6SMartin Matuska /* 1341bf3db8aaSMartin Matuska * Nested jails always inherit parent's devfs ruleset 13420cc207a6SMartin Matuska */ 13430cc207a6SMartin Matuska if (jailed(td->td_ucred)) { 13440cc207a6SMartin Matuska if (rsnum > 0 && rsnum != ppr->pr_devfs_rsnum) { 13450cc207a6SMartin Matuska error = EPERM; 13460cc207a6SMartin Matuska goto done_deref_locked; 1347bf3db8aaSMartin Matuska } else 13480cc207a6SMartin Matuska rsnum = ppr->pr_devfs_rsnum; 13490cc207a6SMartin Matuska } 13500cc207a6SMartin Matuska } 1351b38ff370SJamie Gritton #ifdef INET 13522b0d6f81SJamie Gritton if (ip4s > 0) { 13530304c731SJamie Gritton if (ppr->pr_flags & PR_IP4) { 13540304c731SJamie Gritton /* 13550304c731SJamie Gritton * Make sure the new set of IP addresses is a 13560304c731SJamie Gritton * subset of the parent's list. 
Don't worry 13570304c731SJamie Gritton * about the parent being unlocked, as any 13580304c731SJamie Gritton * setting is done with allprison_lock held. 13590304c731SJamie Gritton */ 13600304c731SJamie Gritton for (ij = 0; ij < ppr->pr_ip4s; ij++) 13612b0d6f81SJamie Gritton if (ip4[0].s_addr == ppr->pr_ip4[ij].s_addr) 13620304c731SJamie Gritton break; 13630304c731SJamie Gritton if (ij == ppr->pr_ip4s) { 13640304c731SJamie Gritton error = EPERM; 13650304c731SJamie Gritton goto done_deref_locked; 13660304c731SJamie Gritton } 13670304c731SJamie Gritton if (ip4s > 1) { 13680304c731SJamie Gritton for (ii = ij = 1; ii < ip4s; ii++) { 13690304c731SJamie Gritton if (ip4[ii].s_addr == 13700304c731SJamie Gritton ppr->pr_ip4[0].s_addr) 1371b38ff370SJamie Gritton continue; 13720304c731SJamie Gritton for (; ij < ppr->pr_ip4s; ij++) 13730304c731SJamie Gritton if (ip4[ii].s_addr == 13740304c731SJamie Gritton ppr->pr_ip4[ij].s_addr) 13750304c731SJamie Gritton break; 13760304c731SJamie Gritton if (ij == ppr->pr_ip4s) 13770304c731SJamie Gritton break; 13780304c731SJamie Gritton } 13790304c731SJamie Gritton if (ij == ppr->pr_ip4s) { 13800304c731SJamie Gritton error = EPERM; 13810304c731SJamie Gritton goto done_deref_locked; 13820304c731SJamie Gritton } 13830304c731SJamie Gritton } 13840304c731SJamie Gritton } 13850304c731SJamie Gritton /* 13860304c731SJamie Gritton * Check for conflicting IP addresses. We permit them 13870304c731SJamie Gritton * if there is no more than one IP on each jail. If 13880304c731SJamie Gritton * there is a duplicate on a jail with more than one 13890304c731SJamie Gritton * IP stop checking and return error. 
13900304c731SJamie Gritton */ 1391bdfc8cc4SJamie Gritton #ifdef VIMAGE 139208b43333SJamie Gritton for (tppr = ppr; tppr != &prison0; tppr = tppr->pr_parent) 1393bdfc8cc4SJamie Gritton if (tppr->pr_flags & PR_VNET) 1394bdfc8cc4SJamie Gritton break; 139508b43333SJamie Gritton #else 139608b43333SJamie Gritton tppr = &prison0; 1397bdfc8cc4SJamie Gritton #endif 1398bdfc8cc4SJamie Gritton FOREACH_PRISON_DESCENDANT(tppr, tpr, descend) { 1399bdfc8cc4SJamie Gritton if (tpr == pr || 1400bdfc8cc4SJamie Gritton #ifdef VIMAGE 14012b0d6f81SJamie Gritton (tpr != tppr && (tpr->pr_flags & PR_VNET)) || 1402bdfc8cc4SJamie Gritton #endif 1403bdfc8cc4SJamie Gritton tpr->pr_uref == 0) { 14040304c731SJamie Gritton descend = 0; 14050304c731SJamie Gritton continue; 14060304c731SJamie Gritton } 14070304c731SJamie Gritton if (!(tpr->pr_flags & PR_IP4_USER)) 14080304c731SJamie Gritton continue; 14090304c731SJamie Gritton descend = 0; 14100304c731SJamie Gritton if (tpr->pr_ip4 == NULL || 14110304c731SJamie Gritton (ip4s == 1 && tpr->pr_ip4s == 1)) 14120304c731SJamie Gritton continue; 14130304c731SJamie Gritton for (ii = 0; ii < ip4s; ii++) { 14140ce1624dSStephen J. Kiernan if (prison_check_ip4_locked(tpr, &ip4[ii]) == 14150ce1624dSStephen J. Kiernan 0) { 14160304c731SJamie Gritton error = EADDRINUSE; 1417b38ff370SJamie Gritton vfs_opterror(opts, 1418b38ff370SJamie Gritton "IPv4 addresses clash"); 1419b38ff370SJamie Gritton goto done_deref_locked; 1420b38ff370SJamie Gritton } 14210304c731SJamie Gritton } 14220304c731SJamie Gritton } 14230304c731SJamie Gritton } 1424b38ff370SJamie Gritton #endif 1425b38ff370SJamie Gritton #ifdef INET6 14262b0d6f81SJamie Gritton if (ip6s > 0) { 14270304c731SJamie Gritton if (ppr->pr_flags & PR_IP6) { 14280304c731SJamie Gritton /* 14290304c731SJamie Gritton * Make sure the new set of IP addresses is a 14300304c731SJamie Gritton * subset of the parent's list. 
14310304c731SJamie Gritton */ 14320304c731SJamie Gritton for (ij = 0; ij < ppr->pr_ip6s; ij++) 14330304c731SJamie Gritton if (IN6_ARE_ADDR_EQUAL(&ip6[0], 14340304c731SJamie Gritton &ppr->pr_ip6[ij])) 14350304c731SJamie Gritton break; 14360304c731SJamie Gritton if (ij == ppr->pr_ip6s) { 14370304c731SJamie Gritton error = EPERM; 14380304c731SJamie Gritton goto done_deref_locked; 14390304c731SJamie Gritton } 14400304c731SJamie Gritton if (ip6s > 1) { 14410304c731SJamie Gritton for (ii = ij = 1; ii < ip6s; ii++) { 14420304c731SJamie Gritton if (IN6_ARE_ADDR_EQUAL(&ip6[ii], 14430304c731SJamie Gritton &ppr->pr_ip6[0])) 14440304c731SJamie Gritton continue; 14450304c731SJamie Gritton for (; ij < ppr->pr_ip6s; ij++) 14460304c731SJamie Gritton if (IN6_ARE_ADDR_EQUAL( 14472b0d6f81SJamie Gritton &ip6[ii], &ppr->pr_ip6[ij])) 14480304c731SJamie Gritton break; 14490304c731SJamie Gritton if (ij == ppr->pr_ip6s) 14500304c731SJamie Gritton break; 14510304c731SJamie Gritton } 14520304c731SJamie Gritton if (ij == ppr->pr_ip6s) { 14530304c731SJamie Gritton error = EPERM; 14540304c731SJamie Gritton goto done_deref_locked; 14550304c731SJamie Gritton } 14560304c731SJamie Gritton } 14570304c731SJamie Gritton } 14580304c731SJamie Gritton /* Check for conflicting IP addresses. 
*/ 1459bdfc8cc4SJamie Gritton #ifdef VIMAGE 146008b43333SJamie Gritton for (tppr = ppr; tppr != &prison0; tppr = tppr->pr_parent) 1461bdfc8cc4SJamie Gritton if (tppr->pr_flags & PR_VNET) 1462bdfc8cc4SJamie Gritton break; 146308b43333SJamie Gritton #else 146408b43333SJamie Gritton tppr = &prison0; 1465bdfc8cc4SJamie Gritton #endif 1466bdfc8cc4SJamie Gritton FOREACH_PRISON_DESCENDANT(tppr, tpr, descend) { 1467bdfc8cc4SJamie Gritton if (tpr == pr || 1468bdfc8cc4SJamie Gritton #ifdef VIMAGE 14692b0d6f81SJamie Gritton (tpr != tppr && (tpr->pr_flags & PR_VNET)) || 1470bdfc8cc4SJamie Gritton #endif 1471bdfc8cc4SJamie Gritton tpr->pr_uref == 0) { 14720304c731SJamie Gritton descend = 0; 14730304c731SJamie Gritton continue; 14740304c731SJamie Gritton } 14750304c731SJamie Gritton if (!(tpr->pr_flags & PR_IP6_USER)) 14760304c731SJamie Gritton continue; 14770304c731SJamie Gritton descend = 0; 14780304c731SJamie Gritton if (tpr->pr_ip6 == NULL || 14790304c731SJamie Gritton (ip6s == 1 && tpr->pr_ip6s == 1)) 14800304c731SJamie Gritton continue; 14810304c731SJamie Gritton for (ii = 0; ii < ip6s; ii++) { 14820ce1624dSStephen J. Kiernan if (prison_check_ip6_locked(tpr, &ip6[ii]) == 14830ce1624dSStephen J. Kiernan 0) { 14840304c731SJamie Gritton error = EADDRINUSE; 1485b38ff370SJamie Gritton vfs_opterror(opts, 1486b38ff370SJamie Gritton "IPv6 addresses clash"); 1487b38ff370SJamie Gritton goto done_deref_locked; 1488b38ff370SJamie Gritton } 14890304c731SJamie Gritton } 14900304c731SJamie Gritton } 14910304c731SJamie Gritton } 1492b38ff370SJamie Gritton #endif 14930304c731SJamie Gritton onamelen = namelen = 0; 1494b6f47c23SJamie Gritton if (namelc != NULL) { 14956ab6058eSJamie Gritton /* Give a default name of the jid. Also allow the name to be 14966ab6058eSJamie Gritton * explicitly the jid - but not any other number, and only in 14976ab6058eSJamie Gritton * normal form (no leading zero/etc). 
14986ab6058eSJamie Gritton */ 1499b6f47c23SJamie Gritton if (namelc[0] == '\0') 1500b6f47c23SJamie Gritton snprintf(namelc = numbuf, sizeof(numbuf), "%d", jid); 15016ab6058eSJamie Gritton else if ((strtoul(namelc, &p, 10) != jid || 15026ab6058eSJamie Gritton namelc[0] < '1' || namelc[0] > '9') && *p == '\0') { 1503b38ff370SJamie Gritton error = EINVAL; 1504babbbb9cSJamie Gritton vfs_opterror(opts, 1505babbbb9cSJamie Gritton "name cannot be numeric (unless it is the jid)"); 15060304c731SJamie Gritton goto done_deref_locked; 1507b38ff370SJamie Gritton } 1508b38ff370SJamie Gritton /* 15090304c731SJamie Gritton * Make sure the name isn't too long for the prison or its 15100304c731SJamie Gritton * children. 1511b38ff370SJamie Gritton */ 1512b6f47c23SJamie Gritton pnamelen = (ppr == &prison0) ? 0 : strlen(ppr->pr_name) + 1; 1513b6f47c23SJamie Gritton onamelen = strlen(pr->pr_name + pnamelen); 1514b6f47c23SJamie Gritton namelen = strlen(namelc); 1515b6f47c23SJamie Gritton if (pnamelen + namelen + 1 > sizeof(pr->pr_name)) { 15160304c731SJamie Gritton error = ENAMETOOLONG; 15170304c731SJamie Gritton goto done_deref_locked; 15180304c731SJamie Gritton } 15190304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(pr, tpr, descend) { 15200304c731SJamie Gritton if (strlen(tpr->pr_name) + (namelen - onamelen) >= 15210304c731SJamie Gritton sizeof(pr->pr_name)) { 15220304c731SJamie Gritton error = ENAMETOOLONG; 15230304c731SJamie Gritton goto done_deref_locked; 15240304c731SJamie Gritton } 15250304c731SJamie Gritton } 15260304c731SJamie Gritton } 1527b3079544SJamie Gritton pr_allow_diff = pr_allow & ~ppr->pr_allow; 1528b3079544SJamie Gritton if (pr_allow_diff & ~PR_ALLOW_DIFFERENCES) { 15290304c731SJamie Gritton error = EPERM; 15300304c731SJamie Gritton goto done_deref_locked; 1531b38ff370SJamie Gritton } 1532b38ff370SJamie Gritton 1533b6f47c23SJamie Gritton /* 1534b6f47c23SJamie Gritton * Let modules check their parameters. 
This requires unlocking and 1535b6f47c23SJamie Gritton * then re-locking the prison, but this is still a valid state as long 1536b6f47c23SJamie Gritton * as allprison_lock remains xlocked. 1537b6f47c23SJamie Gritton */ 1538b6f47c23SJamie Gritton mtx_unlock(&pr->pr_mtx); 1539b6f47c23SJamie Gritton error = osd_jail_call(pr, PR_METHOD_CHECK, opts); 1540b6f47c23SJamie Gritton if (error != 0) { 1541b6f47c23SJamie Gritton prison_deref(pr, created 1542b6f47c23SJamie Gritton ? PD_LIST_XLOCKED 1543b6f47c23SJamie Gritton : PD_DEREF | PD_LIST_XLOCKED); 1544b6f47c23SJamie Gritton goto done_releroot; 1545b6f47c23SJamie Gritton } 1546b6f47c23SJamie Gritton mtx_lock(&pr->pr_mtx); 1547b6f47c23SJamie Gritton 1548b6f47c23SJamie Gritton /* At this point, all valid parameters should have been noted. */ 1549b6f47c23SJamie Gritton TAILQ_FOREACH(opt, opts, link) { 1550b6f47c23SJamie Gritton if (!opt->seen && strcmp(opt->name, "errmsg")) { 1551b6f47c23SJamie Gritton error = EINVAL; 1552b6f47c23SJamie Gritton vfs_opterror(opts, "unknown parameter: %s", opt->name); 1553b6f47c23SJamie Gritton goto done_deref_locked; 1554b6f47c23SJamie Gritton } 1555b6f47c23SJamie Gritton } 1556b6f47c23SJamie Gritton 1557b38ff370SJamie Gritton /* Set the parameters of the prison. 
*/ 1558b38ff370SJamie Gritton #ifdef INET 15590304c731SJamie Gritton redo_ip4 = 0; 15600304c731SJamie Gritton if (pr_flags & PR_IP4_USER) { 15610304c731SJamie Gritton pr->pr_flags |= PR_IP4; 1562b38ff370SJamie Gritton free(pr->pr_ip4, M_PRISON); 15630304c731SJamie Gritton pr->pr_ip4s = ip4s; 1564b38ff370SJamie Gritton pr->pr_ip4 = ip4; 1565b38ff370SJamie Gritton ip4 = NULL; 15660304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1567bdfc8cc4SJamie Gritton #ifdef VIMAGE 1568bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1569bdfc8cc4SJamie Gritton descend = 0; 1570bdfc8cc4SJamie Gritton continue; 1571bdfc8cc4SJamie Gritton } 1572bdfc8cc4SJamie Gritton #endif 15730304c731SJamie Gritton if (prison_restrict_ip4(tpr, NULL)) { 15740304c731SJamie Gritton redo_ip4 = 1; 15750304c731SJamie Gritton descend = 0; 15760304c731SJamie Gritton } 15770304c731SJamie Gritton } 15780304c731SJamie Gritton } 1579b38ff370SJamie Gritton #endif 1580b38ff370SJamie Gritton #ifdef INET6 15810304c731SJamie Gritton redo_ip6 = 0; 15820304c731SJamie Gritton if (pr_flags & PR_IP6_USER) { 15830304c731SJamie Gritton pr->pr_flags |= PR_IP6; 1584b38ff370SJamie Gritton free(pr->pr_ip6, M_PRISON); 15850304c731SJamie Gritton pr->pr_ip6s = ip6s; 1586b38ff370SJamie Gritton pr->pr_ip6 = ip6; 1587b38ff370SJamie Gritton ip6 = NULL; 15880304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1589bdfc8cc4SJamie Gritton #ifdef VIMAGE 1590bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1591bdfc8cc4SJamie Gritton descend = 0; 1592bdfc8cc4SJamie Gritton continue; 1593bdfc8cc4SJamie Gritton } 1594bdfc8cc4SJamie Gritton #endif 15950304c731SJamie Gritton if (prison_restrict_ip6(tpr, NULL)) { 15960304c731SJamie Gritton redo_ip6 = 1; 15970304c731SJamie Gritton descend = 0; 15980304c731SJamie Gritton } 15990304c731SJamie Gritton } 16000304c731SJamie Gritton } 1601b38ff370SJamie Gritton #endif 16020304c731SJamie Gritton if (gotslevel) { 1603b38ff370SJamie Gritton 
pr->pr_securelevel = slevel; 16040304c731SJamie Gritton /* Set all child jails to be at least this level. */ 16050304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16060304c731SJamie Gritton if (tpr->pr_securelevel < slevel) 16070304c731SJamie Gritton tpr->pr_securelevel = slevel; 16080304c731SJamie Gritton } 1609b97457e2SJamie Gritton if (gotchildmax) { 1610b97457e2SJamie Gritton pr->pr_childmax = childmax; 1611b97457e2SJamie Gritton /* Set all child jails to under this limit. */ 1612b97457e2SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED_LEVEL(pr, tpr, descend, level) 1613b97457e2SJamie Gritton if (tpr->pr_childmax > childmax - level) 1614b97457e2SJamie Gritton tpr->pr_childmax = childmax > level 1615b97457e2SJamie Gritton ? childmax - level : 0; 1616b97457e2SJamie Gritton } 16170304c731SJamie Gritton if (gotenforce) { 16180304c731SJamie Gritton pr->pr_enforce_statfs = enforce; 16190304c731SJamie Gritton /* Pass this restriction on to the children. */ 16200304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16210304c731SJamie Gritton if (tpr->pr_enforce_statfs < enforce) 16220304c731SJamie Gritton tpr->pr_enforce_statfs = enforce; 16230304c731SJamie Gritton } 16240cc207a6SMartin Matuska if (gotrsnum) { 16250cc207a6SMartin Matuska pr->pr_devfs_rsnum = rsnum; 16260cc207a6SMartin Matuska /* Pass this restriction on to the children. */ 16270cc207a6SMartin Matuska FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16280cc207a6SMartin Matuska tpr->pr_devfs_rsnum = rsnum; 16290cc207a6SMartin Matuska } 1630b6f47c23SJamie Gritton if (namelc != NULL) { 16310304c731SJamie Gritton if (ppr == &prison0) 1632b6f47c23SJamie Gritton strlcpy(pr->pr_name, namelc, sizeof(pr->pr_name)); 16330304c731SJamie Gritton else 16340304c731SJamie Gritton snprintf(pr->pr_name, sizeof(pr->pr_name), "%s.%s", 1635b6f47c23SJamie Gritton ppr->pr_name, namelc); 16360304c731SJamie Gritton /* Change this component of child names. 
*/ 16370304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 16380304c731SJamie Gritton bcopy(tpr->pr_name + onamelen, tpr->pr_name + namelen, 16390304c731SJamie Gritton strlen(tpr->pr_name + onamelen) + 1); 16400304c731SJamie Gritton bcopy(pr->pr_name, tpr->pr_name, namelen); 16410304c731SJamie Gritton } 16420304c731SJamie Gritton } 1643b38ff370SJamie Gritton if (path != NULL) { 16440304c731SJamie Gritton /* Try to keep a real-rooted full pathname. */ 1645b38ff370SJamie Gritton strlcpy(pr->pr_path, path, sizeof(pr->pr_path)); 1646b38ff370SJamie Gritton pr->pr_root = root; 1647b38ff370SJamie Gritton } 164876ca6f88SJamie Gritton if (PR_HOST & ch_flags & ~pr_flags) { 164976ca6f88SJamie Gritton if (pr->pr_flags & PR_HOST) { 165076ca6f88SJamie Gritton /* 165176ca6f88SJamie Gritton * Copy the parent's host info. As with pr_ip4 above, 165276ca6f88SJamie Gritton * the lack of a lock on the parent is not a problem; 165376ca6f88SJamie Gritton * it is always set with allprison_lock at least 165476ca6f88SJamie Gritton * shared, and is held exclusively here. 165576ca6f88SJamie Gritton */ 1656c1f19219SJamie Gritton strlcpy(pr->pr_hostname, pr->pr_parent->pr_hostname, 1657c1f19219SJamie Gritton sizeof(pr->pr_hostname)); 1658c1f19219SJamie Gritton strlcpy(pr->pr_domainname, pr->pr_parent->pr_domainname, 1659c1f19219SJamie Gritton sizeof(pr->pr_domainname)); 1660c1f19219SJamie Gritton strlcpy(pr->pr_hostuuid, pr->pr_parent->pr_hostuuid, 1661c1f19219SJamie Gritton sizeof(pr->pr_hostuuid)); 166276ca6f88SJamie Gritton pr->pr_hostid = pr->pr_parent->pr_hostid; 166376ca6f88SJamie Gritton } 166476ca6f88SJamie Gritton } else if (host != NULL || domain != NULL || uuid != NULL || gothid) { 166576ca6f88SJamie Gritton /* Set this prison, and any descendants without PR_HOST. 
*/ 1666b38ff370SJamie Gritton if (host != NULL) 1667c1f19219SJamie Gritton strlcpy(pr->pr_hostname, host, sizeof(pr->pr_hostname)); 166876ca6f88SJamie Gritton if (domain != NULL) 1669c1f19219SJamie Gritton strlcpy(pr->pr_domainname, domain, 1670c1f19219SJamie Gritton sizeof(pr->pr_domainname)); 167176ca6f88SJamie Gritton if (uuid != NULL) 1672c1f19219SJamie Gritton strlcpy(pr->pr_hostuuid, uuid, sizeof(pr->pr_hostuuid)); 167376ca6f88SJamie Gritton if (gothid) 167476ca6f88SJamie Gritton pr->pr_hostid = hid; 167576ca6f88SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 167676ca6f88SJamie Gritton if (tpr->pr_flags & PR_HOST) 167776ca6f88SJamie Gritton descend = 0; 167876ca6f88SJamie Gritton else { 167976ca6f88SJamie Gritton if (host != NULL) 1680c1f19219SJamie Gritton strlcpy(tpr->pr_hostname, 1681c1f19219SJamie Gritton pr->pr_hostname, 1682c1f19219SJamie Gritton sizeof(tpr->pr_hostname)); 168376ca6f88SJamie Gritton if (domain != NULL) 1684c1f19219SJamie Gritton strlcpy(tpr->pr_domainname, 1685c1f19219SJamie Gritton pr->pr_domainname, 1686c1f19219SJamie Gritton sizeof(tpr->pr_domainname)); 168776ca6f88SJamie Gritton if (uuid != NULL) 1688c1f19219SJamie Gritton strlcpy(tpr->pr_hostuuid, 1689c1f19219SJamie Gritton pr->pr_hostuuid, 1690c1f19219SJamie Gritton sizeof(tpr->pr_hostuuid)); 169176ca6f88SJamie Gritton if (gothid) 169276ca6f88SJamie Gritton tpr->pr_hostid = hid; 169376ca6f88SJamie Gritton } 169476ca6f88SJamie Gritton } 169576ca6f88SJamie Gritton } 16960304c731SJamie Gritton if ((tallow = ch_allow & ~pr_allow)) { 16970304c731SJamie Gritton /* Clear allow bits in all children. 
*/ 16980304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16990304c731SJamie Gritton tpr->pr_allow &= ~tallow; 17000304c731SJamie Gritton } 17010304c731SJamie Gritton pr->pr_allow = (pr->pr_allow & ~ch_allow) | pr_allow; 1702b38ff370SJamie Gritton /* 1703b38ff370SJamie Gritton * Persistent prisons get an extra reference, and prisons losing their 1704b38ff370SJamie Gritton * persist flag lose that reference. Only do this for existing prisons 1705b38ff370SJamie Gritton * for now, so new ones will remain unseen until after the module 1706b38ff370SJamie Gritton * handlers have completed. 1707b38ff370SJamie Gritton */ 1708cc5fd8c7SJamie Gritton born = pr->pr_uref == 0; 1709b38ff370SJamie Gritton if (!created && (ch_flags & PR_PERSIST & (pr_flags ^ pr->pr_flags))) { 1710b38ff370SJamie Gritton if (pr_flags & PR_PERSIST) { 1711b38ff370SJamie Gritton pr->pr_ref++; 1712b38ff370SJamie Gritton pr->pr_uref++; 1713b38ff370SJamie Gritton } else { 1714b38ff370SJamie Gritton pr->pr_ref--; 1715b38ff370SJamie Gritton pr->pr_uref--; 1716b38ff370SJamie Gritton } 1717b38ff370SJamie Gritton } 1718b38ff370SJamie Gritton pr->pr_flags = (pr->pr_flags & ~ch_flags) | pr_flags; 1719b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 1720b38ff370SJamie Gritton 1721a7ad07bfSEdward Tomasz Napierala #ifdef RACCT 17224b5c9cf6SEdward Tomasz Napierala if (racct_enable && created) 1723a7ad07bfSEdward Tomasz Napierala prison_racct_attach(pr); 1724a7ad07bfSEdward Tomasz Napierala #endif 1725a7ad07bfSEdward Tomasz Napierala 17260304c731SJamie Gritton /* Locks may have prevented a complete restriction of child IP 17270304c731SJamie Gritton * addresses. If so, allocate some more memory and try again. 
17280304c731SJamie Gritton */ 17290304c731SJamie Gritton #ifdef INET 17300304c731SJamie Gritton while (redo_ip4) { 17310304c731SJamie Gritton ip4s = pr->pr_ip4s; 17320304c731SJamie Gritton ip4 = malloc(ip4s * sizeof(*ip4), M_PRISON, M_WAITOK); 17330304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 17340304c731SJamie Gritton redo_ip4 = 0; 17350304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1736bdfc8cc4SJamie Gritton #ifdef VIMAGE 1737bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1738bdfc8cc4SJamie Gritton descend = 0; 1739bdfc8cc4SJamie Gritton continue; 1740bdfc8cc4SJamie Gritton } 1741bdfc8cc4SJamie Gritton #endif 17420304c731SJamie Gritton if (prison_restrict_ip4(tpr, ip4)) { 17430304c731SJamie Gritton if (ip4 != NULL) 17440304c731SJamie Gritton ip4 = NULL; 17450304c731SJamie Gritton else 17460304c731SJamie Gritton redo_ip4 = 1; 17470304c731SJamie Gritton } 17480304c731SJamie Gritton } 17490304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 17500304c731SJamie Gritton } 17510304c731SJamie Gritton #endif 17520304c731SJamie Gritton #ifdef INET6 17530304c731SJamie Gritton while (redo_ip6) { 17540304c731SJamie Gritton ip6s = pr->pr_ip6s; 17550304c731SJamie Gritton ip6 = malloc(ip6s * sizeof(*ip6), M_PRISON, M_WAITOK); 17560304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 17570304c731SJamie Gritton redo_ip6 = 0; 17580304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1759bdfc8cc4SJamie Gritton #ifdef VIMAGE 1760bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1761bdfc8cc4SJamie Gritton descend = 0; 1762bdfc8cc4SJamie Gritton continue; 1763bdfc8cc4SJamie Gritton } 1764bdfc8cc4SJamie Gritton #endif 17650304c731SJamie Gritton if (prison_restrict_ip6(tpr, ip6)) { 17660304c731SJamie Gritton if (ip6 != NULL) 17670304c731SJamie Gritton ip6 = NULL; 17680304c731SJamie Gritton else 17690304c731SJamie Gritton redo_ip6 = 1; 17700304c731SJamie Gritton } 17710304c731SJamie Gritton } 17720304c731SJamie Gritton 
mtx_unlock(&pr->pr_mtx); 17730304c731SJamie Gritton } 17740304c731SJamie Gritton #endif 17750304c731SJamie Gritton 1776b38ff370SJamie Gritton /* Let the modules do their work. */ 1777b38ff370SJamie Gritton sx_downgrade(&allprison_lock); 1778cc5fd8c7SJamie Gritton if (born) { 1779b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_CREATE, opts); 1780b38ff370SJamie Gritton if (error) { 1781cc5fd8c7SJamie Gritton (void)osd_jail_call(pr, PR_METHOD_REMOVE, NULL); 1782cc5fd8c7SJamie Gritton prison_deref(pr, created 1783cc5fd8c7SJamie Gritton ? PD_LIST_SLOCKED 1784cc5fd8c7SJamie Gritton : PD_DEREF | PD_LIST_SLOCKED); 1785b38ff370SJamie Gritton goto done_errmsg; 1786b38ff370SJamie Gritton } 1787b38ff370SJamie Gritton } 1788b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_SET, opts); 1789b38ff370SJamie Gritton if (error) { 1790cc5fd8c7SJamie Gritton if (born) 1791cc5fd8c7SJamie Gritton (void)osd_jail_call(pr, PR_METHOD_REMOVE, NULL); 1792b38ff370SJamie Gritton prison_deref(pr, created 1793b38ff370SJamie Gritton ? PD_LIST_SLOCKED 1794b38ff370SJamie Gritton : PD_DEREF | PD_LIST_SLOCKED); 1795b38ff370SJamie Gritton goto done_errmsg; 1796b38ff370SJamie Gritton } 1797b38ff370SJamie Gritton 1798b38ff370SJamie Gritton /* Attach this process to the prison if requested. 
*/ 1799b38ff370SJamie Gritton if (flags & JAIL_ATTACH) { 1800b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 1801b38ff370SJamie Gritton error = do_jail_attach(td, pr); 1802b38ff370SJamie Gritton if (error) { 1803b38ff370SJamie Gritton vfs_opterror(opts, "attach failed"); 1804b38ff370SJamie Gritton if (!created) 1805b38ff370SJamie Gritton prison_deref(pr, PD_DEREF); 1806b38ff370SJamie Gritton goto done_errmsg; 1807b38ff370SJamie Gritton } 1808b38ff370SJamie Gritton } 1809b38ff370SJamie Gritton 18101fb24974SEdward Tomasz Napierala #ifdef RACCT 18114b5c9cf6SEdward Tomasz Napierala if (racct_enable && !created) { 1812f514b97bSEdward Tomasz Napierala if (!(flags & JAIL_ATTACH)) 18131fb24974SEdward Tomasz Napierala sx_sunlock(&allprison_lock); 18141fb24974SEdward Tomasz Napierala prison_racct_modify(pr); 1815f514b97bSEdward Tomasz Napierala if (!(flags & JAIL_ATTACH)) 18161fb24974SEdward Tomasz Napierala sx_slock(&allprison_lock); 18171fb24974SEdward Tomasz Napierala } 18181fb24974SEdward Tomasz Napierala #endif 18191fb24974SEdward Tomasz Napierala 18201fb24974SEdward Tomasz Napierala td->td_retval[0] = pr->pr_id; 18211fb24974SEdward Tomasz Napierala 1822b38ff370SJamie Gritton /* 1823b38ff370SJamie Gritton * Now that it is all there, drop the temporary reference from existing 1824b38ff370SJamie Gritton * prisons. Or add a reference to newly created persistent prisons 1825b38ff370SJamie Gritton * (which was not done earlier so that the prison would not be publicly 1826b38ff370SJamie Gritton * visible). 1827b38ff370SJamie Gritton */ 1828b38ff370SJamie Gritton if (!created) { 1829b38ff370SJamie Gritton prison_deref(pr, (flags & JAIL_ATTACH) 1830b38ff370SJamie Gritton ? 
PD_DEREF 1831b38ff370SJamie Gritton : PD_DEREF | PD_LIST_SLOCKED); 1832b38ff370SJamie Gritton } else { 1833b38ff370SJamie Gritton if (pr_flags & PR_PERSIST) { 1834b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 1835b38ff370SJamie Gritton pr->pr_ref++; 1836b38ff370SJamie Gritton pr->pr_uref++; 1837b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 1838b38ff370SJamie Gritton } 1839b38ff370SJamie Gritton if (!(flags & JAIL_ATTACH)) 1840b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 1841b38ff370SJamie Gritton } 1842c34bbd2aSEdward Tomasz Napierala 1843cc5fd8c7SJamie Gritton goto done_free; 1844b38ff370SJamie Gritton 18450304c731SJamie Gritton done_deref_locked: 18460304c731SJamie Gritton prison_deref(pr, created 18470304c731SJamie Gritton ? PD_LOCKED | PD_LIST_XLOCKED 18480304c731SJamie Gritton : PD_DEREF | PD_LOCKED | PD_LIST_XLOCKED); 18490304c731SJamie Gritton goto done_releroot; 1850b38ff370SJamie Gritton done_unlock_list: 1851b38ff370SJamie Gritton sx_xunlock(&allprison_lock); 1852b38ff370SJamie Gritton done_releroot: 18535050aa86SKonstantin Belousov if (root != NULL) 1854b38ff370SJamie Gritton vrele(root); 1855b38ff370SJamie Gritton done_errmsg: 1856b38ff370SJamie Gritton if (error) { 1857176ff3a0SJamie Gritton if (vfs_getopt(opts, "errmsg", (void **)&errmsg, 1858176ff3a0SJamie Gritton &errmsg_len) == 0 && errmsg_len > 0) { 1859b38ff370SJamie Gritton errmsg_pos = 2 * vfs_getopt_pos(opts, "errmsg") + 1; 1860b38ff370SJamie Gritton if (optuio->uio_segflg == UIO_SYSSPACE) 1861b38ff370SJamie Gritton bcopy(errmsg, 1862b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 1863b38ff370SJamie Gritton errmsg_len); 1864b38ff370SJamie Gritton else 1865b38ff370SJamie Gritton copyout(errmsg, 1866b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 1867b38ff370SJamie Gritton errmsg_len); 1868b38ff370SJamie Gritton } 1869b38ff370SJamie Gritton } 1870b38ff370SJamie Gritton done_free: 1871b38ff370SJamie Gritton #ifdef INET 1872b38ff370SJamie Gritton free(ip4, 
M_PRISON); 1873b38ff370SJamie Gritton #endif 1874b38ff370SJamie Gritton #ifdef INET6 1875b38ff370SJamie Gritton free(ip6, M_PRISON); 1876b38ff370SJamie Gritton #endif 18776dfe0a3dSMartin Matuska if (g_path != NULL) 18786dfe0a3dSMartin Matuska free(g_path, M_TEMP); 1879b38ff370SJamie Gritton vfs_freeopts(opts); 1880b38ff370SJamie Gritton return (error); 1881b38ff370SJamie Gritton } 1882b38ff370SJamie Gritton 1883b38ff370SJamie Gritton /* 1884b38ff370SJamie Gritton * struct jail_get_args { 1885b38ff370SJamie Gritton * struct iovec *iovp; 1886b38ff370SJamie Gritton * unsigned int iovcnt; 1887b38ff370SJamie Gritton * int flags; 1888b38ff370SJamie Gritton * }; 1889b38ff370SJamie Gritton */ 1890b38ff370SJamie Gritton int 18918451d0ddSKip Macy sys_jail_get(struct thread *td, struct jail_get_args *uap) 1892b38ff370SJamie Gritton { 1893b38ff370SJamie Gritton struct uio *auio; 1894b38ff370SJamie Gritton int error; 1895b38ff370SJamie Gritton 1896b38ff370SJamie Gritton /* Check that we have an even number of iovecs. 
*/ 1897b38ff370SJamie Gritton if (uap->iovcnt & 1) 1898b38ff370SJamie Gritton return (EINVAL); 1899b38ff370SJamie Gritton 1900b38ff370SJamie Gritton error = copyinuio(uap->iovp, uap->iovcnt, &auio); 1901b38ff370SJamie Gritton if (error) 1902b38ff370SJamie Gritton return (error); 1903b38ff370SJamie Gritton error = kern_jail_get(td, auio, uap->flags); 1904b38ff370SJamie Gritton if (error == 0) 1905b38ff370SJamie Gritton error = copyout(auio->uio_iov, uap->iovp, 1906b38ff370SJamie Gritton uap->iovcnt * sizeof (struct iovec)); 1907b38ff370SJamie Gritton free(auio, M_IOV); 1908b38ff370SJamie Gritton return (error); 1909b38ff370SJamie Gritton } 1910b38ff370SJamie Gritton 1911b38ff370SJamie Gritton int 1912b38ff370SJamie Gritton kern_jail_get(struct thread *td, struct uio *optuio, int flags) 1913b38ff370SJamie Gritton { 1914672756aaSJamie Gritton struct bool_flags *bf; 1915672756aaSJamie Gritton struct jailsys_flags *jsf; 19160304c731SJamie Gritton struct prison *pr, *mypr; 1917b38ff370SJamie Gritton struct vfsopt *opt; 1918b38ff370SJamie Gritton struct vfsoptlist *opts; 1919b38ff370SJamie Gritton char *errmsg, *name; 1920672756aaSJamie Gritton int error, errmsg_len, errmsg_pos, i, jid, len, locked, pos; 1921672756aaSJamie Gritton unsigned f; 1922b38ff370SJamie Gritton 1923b38ff370SJamie Gritton if (flags & ~JAIL_GET_MASK) 1924b38ff370SJamie Gritton return (EINVAL); 1925b38ff370SJamie Gritton 1926b38ff370SJamie Gritton /* Get the parameter list. */ 1927b38ff370SJamie Gritton error = vfs_buildopts(optuio, &opts); 1928b38ff370SJamie Gritton if (error) 1929b38ff370SJamie Gritton return (error); 1930b38ff370SJamie Gritton errmsg_pos = vfs_getopt_pos(opts, "errmsg"); 19310304c731SJamie Gritton mypr = td->td_ucred->cr_prison; 19321e2a13e6SJamie Gritton 1933b38ff370SJamie Gritton /* 1934b38ff370SJamie Gritton * Find the prison specified by one of: lastjid, jid, name. 
1935b38ff370SJamie Gritton */ 1936b38ff370SJamie Gritton sx_slock(&allprison_lock); 1937b38ff370SJamie Gritton error = vfs_copyopt(opts, "lastjid", &jid, sizeof(jid)); 1938b38ff370SJamie Gritton if (error == 0) { 1939b38ff370SJamie Gritton TAILQ_FOREACH(pr, &allprison, pr_list) { 19400304c731SJamie Gritton if (pr->pr_id > jid && prison_ischild(mypr, pr)) { 1941b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 1942b38ff370SJamie Gritton if (pr->pr_ref > 0 && 1943b38ff370SJamie Gritton (pr->pr_uref > 0 || (flags & JAIL_DYING))) 1944b38ff370SJamie Gritton break; 1945b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 1946b38ff370SJamie Gritton } 1947b38ff370SJamie Gritton } 1948b38ff370SJamie Gritton if (pr != NULL) 1949b38ff370SJamie Gritton goto found_prison; 1950b38ff370SJamie Gritton error = ENOENT; 1951b38ff370SJamie Gritton vfs_opterror(opts, "no jail after %d", jid); 1952b38ff370SJamie Gritton goto done_unlock_list; 1953b38ff370SJamie Gritton } else if (error != ENOENT) 1954b38ff370SJamie Gritton goto done_unlock_list; 1955b38ff370SJamie Gritton 1956b38ff370SJamie Gritton error = vfs_copyopt(opts, "jid", &jid, sizeof(jid)); 1957b38ff370SJamie Gritton if (error == 0) { 1958b38ff370SJamie Gritton if (jid != 0) { 19590304c731SJamie Gritton pr = prison_find_child(mypr, jid); 1960b38ff370SJamie Gritton if (pr != NULL) { 1961b38ff370SJamie Gritton if (pr->pr_uref == 0 && !(flags & JAIL_DYING)) { 1962b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 1963b38ff370SJamie Gritton error = ENOENT; 1964b38ff370SJamie Gritton vfs_opterror(opts, "jail %d is dying", 1965b38ff370SJamie Gritton jid); 1966b38ff370SJamie Gritton goto done_unlock_list; 1967b38ff370SJamie Gritton } 1968b38ff370SJamie Gritton goto found_prison; 1969b38ff370SJamie Gritton } 1970b38ff370SJamie Gritton error = ENOENT; 1971b38ff370SJamie Gritton vfs_opterror(opts, "jail %d not found", jid); 1972b38ff370SJamie Gritton goto done_unlock_list; 1973b38ff370SJamie Gritton } 1974b38ff370SJamie Gritton } else if (error != 
ENOENT) 1975b38ff370SJamie Gritton goto done_unlock_list; 1976b38ff370SJamie Gritton 1977b38ff370SJamie Gritton error = vfs_getopt(opts, "name", (void **)&name, &len); 1978b38ff370SJamie Gritton if (error == 0) { 1979b38ff370SJamie Gritton if (len == 0 || name[len - 1] != '\0') { 1980b38ff370SJamie Gritton error = EINVAL; 1981b38ff370SJamie Gritton goto done_unlock_list; 1982b38ff370SJamie Gritton } 19830304c731SJamie Gritton pr = prison_find_name(mypr, name); 1984b38ff370SJamie Gritton if (pr != NULL) { 1985b38ff370SJamie Gritton if (pr->pr_uref == 0 && !(flags & JAIL_DYING)) { 1986b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 1987b38ff370SJamie Gritton error = ENOENT; 1988b38ff370SJamie Gritton vfs_opterror(opts, "jail \"%s\" is dying", 1989b38ff370SJamie Gritton name); 1990b38ff370SJamie Gritton goto done_unlock_list; 1991b38ff370SJamie Gritton } 1992b38ff370SJamie Gritton goto found_prison; 1993b38ff370SJamie Gritton } 1994b38ff370SJamie Gritton error = ENOENT; 1995b38ff370SJamie Gritton vfs_opterror(opts, "jail \"%s\" not found", name); 1996b38ff370SJamie Gritton goto done_unlock_list; 1997b38ff370SJamie Gritton } else if (error != ENOENT) 1998b38ff370SJamie Gritton goto done_unlock_list; 1999b38ff370SJamie Gritton 2000b38ff370SJamie Gritton vfs_opterror(opts, "no jail specified"); 2001b38ff370SJamie Gritton error = ENOENT; 2002b38ff370SJamie Gritton goto done_unlock_list; 2003b38ff370SJamie Gritton 2004b38ff370SJamie Gritton found_prison: 2005b38ff370SJamie Gritton /* Get the parameters of the prison. */ 2006b38ff370SJamie Gritton pr->pr_ref++; 2007b38ff370SJamie Gritton locked = PD_LOCKED; 2008b38ff370SJamie Gritton td->td_retval[0] = pr->pr_id; 2009b38ff370SJamie Gritton error = vfs_setopt(opts, "jid", &pr->pr_id, sizeof(pr->pr_id)); 2010b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2011b38ff370SJamie Gritton goto done_deref; 20120304c731SJamie Gritton i = (pr->pr_parent == mypr) ? 
0 : pr->pr_parent->pr_id; 20130304c731SJamie Gritton error = vfs_setopt(opts, "parent", &i, sizeof(i)); 2014b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2015b38ff370SJamie Gritton goto done_deref; 20160304c731SJamie Gritton error = vfs_setopts(opts, "name", prison_name(mypr, pr)); 20170304c731SJamie Gritton if (error != 0 && error != ENOENT) 20180304c731SJamie Gritton goto done_deref; 20190304c731SJamie Gritton error = vfs_setopt(opts, "cpuset.id", &pr->pr_cpuset->cs_id, 2020b38ff370SJamie Gritton sizeof(pr->pr_cpuset->cs_id)); 2021b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2022b38ff370SJamie Gritton goto done_deref; 20230304c731SJamie Gritton error = vfs_setopts(opts, "path", prison_path(mypr, pr)); 2024b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2025b38ff370SJamie Gritton goto done_deref; 2026b38ff370SJamie Gritton #ifdef INET 2027b38ff370SJamie Gritton error = vfs_setopt_part(opts, "ip4.addr", pr->pr_ip4, 2028b38ff370SJamie Gritton pr->pr_ip4s * sizeof(*pr->pr_ip4)); 2029b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2030b38ff370SJamie Gritton goto done_deref; 2031b38ff370SJamie Gritton #endif 2032b38ff370SJamie Gritton #ifdef INET6 2033b38ff370SJamie Gritton error = vfs_setopt_part(opts, "ip6.addr", pr->pr_ip6, 2034b38ff370SJamie Gritton pr->pr_ip6s * sizeof(*pr->pr_ip6)); 2035b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2036b38ff370SJamie Gritton goto done_deref; 2037b38ff370SJamie Gritton #endif 2038b38ff370SJamie Gritton error = vfs_setopt(opts, "securelevel", &pr->pr_securelevel, 2039b38ff370SJamie Gritton sizeof(pr->pr_securelevel)); 2040b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2041b38ff370SJamie Gritton goto done_deref; 2042b97457e2SJamie Gritton error = vfs_setopt(opts, "children.cur", &pr->pr_childcount, 2043b97457e2SJamie Gritton sizeof(pr->pr_childcount)); 2044b97457e2SJamie Gritton if (error != 0 && error != ENOENT) 2045b97457e2SJamie Gritton goto done_deref; 
2046b97457e2SJamie Gritton error = vfs_setopt(opts, "children.max", &pr->pr_childmax, 2047b97457e2SJamie Gritton sizeof(pr->pr_childmax)); 2048b97457e2SJamie Gritton if (error != 0 && error != ENOENT) 2049b97457e2SJamie Gritton goto done_deref; 2050c1f19219SJamie Gritton error = vfs_setopts(opts, "host.hostname", pr->pr_hostname); 2051b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2052b38ff370SJamie Gritton goto done_deref; 2053c1f19219SJamie Gritton error = vfs_setopts(opts, "host.domainname", pr->pr_domainname); 205476ca6f88SJamie Gritton if (error != 0 && error != ENOENT) 205576ca6f88SJamie Gritton goto done_deref; 2056c1f19219SJamie Gritton error = vfs_setopts(opts, "host.hostuuid", pr->pr_hostuuid); 205776ca6f88SJamie Gritton if (error != 0 && error != ENOENT) 205876ca6f88SJamie Gritton goto done_deref; 2059841c0c7eSNathan Whitehorn #ifdef COMPAT_FREEBSD32 2060a5c1afadSDmitry Chagin if (SV_PROC_FLAG(td->td_proc, SV_ILP32)) { 206176ca6f88SJamie Gritton uint32_t hid32 = pr->pr_hostid; 206276ca6f88SJamie Gritton 206376ca6f88SJamie Gritton error = vfs_setopt(opts, "host.hostid", &hid32, sizeof(hid32)); 206476ca6f88SJamie Gritton } else 206576ca6f88SJamie Gritton #endif 206676ca6f88SJamie Gritton error = vfs_setopt(opts, "host.hostid", &pr->pr_hostid, 206776ca6f88SJamie Gritton sizeof(pr->pr_hostid)); 206876ca6f88SJamie Gritton if (error != 0 && error != ENOENT) 206976ca6f88SJamie Gritton goto done_deref; 20700304c731SJamie Gritton error = vfs_setopt(opts, "enforce_statfs", &pr->pr_enforce_statfs, 20710304c731SJamie Gritton sizeof(pr->pr_enforce_statfs)); 20720304c731SJamie Gritton if (error != 0 && error != ENOENT) 20730304c731SJamie Gritton goto done_deref; 20740cc207a6SMartin Matuska error = vfs_setopt(opts, "devfs_ruleset", &pr->pr_devfs_rsnum, 20750cc207a6SMartin Matuska sizeof(pr->pr_devfs_rsnum)); 20760cc207a6SMartin Matuska if (error != 0 && error != ENOENT) 20770cc207a6SMartin Matuska goto done_deref; 2078672756aaSJamie Gritton for (bf = 
pr_flag_bool; 2079672756aaSJamie Gritton bf < pr_flag_bool + nitems(pr_flag_bool); 2080672756aaSJamie Gritton bf++) { 2081672756aaSJamie Gritton i = (pr->pr_flags & bf->flag) ? 1 : 0; 2082672756aaSJamie Gritton error = vfs_setopt(opts, bf->name, &i, sizeof(i)); 2083b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2084b38ff370SJamie Gritton goto done_deref; 2085b38ff370SJamie Gritton i = !i; 2086672756aaSJamie Gritton error = vfs_setopt(opts, bf->noname, &i, sizeof(i)); 2087b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2088b38ff370SJamie Gritton goto done_deref; 20890304c731SJamie Gritton } 2090672756aaSJamie Gritton for (jsf = pr_flag_jailsys; 2091672756aaSJamie Gritton jsf < pr_flag_jailsys + nitems(pr_flag_jailsys); 2092672756aaSJamie Gritton jsf++) { 2093672756aaSJamie Gritton f = pr->pr_flags & (jsf->disable | jsf->new); 2094672756aaSJamie Gritton i = (f != 0 && f == jsf->disable) ? JAIL_SYS_DISABLE 2095672756aaSJamie Gritton : (f == jsf->new) ? JAIL_SYS_NEW 20967cbf7213SJamie Gritton : JAIL_SYS_INHERIT; 2097672756aaSJamie Gritton error = vfs_setopt(opts, jsf->name, &i, sizeof(i)); 20987cbf7213SJamie Gritton if (error != 0 && error != ENOENT) 20997cbf7213SJamie Gritton goto done_deref; 21007cbf7213SJamie Gritton } 2101672756aaSJamie Gritton for (bf = pr_flag_allow; 21020e5c6bd4SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && bf->flag != 0; 2103672756aaSJamie Gritton bf++) { 2104672756aaSJamie Gritton i = (pr->pr_allow & bf->flag) ? 
1 : 0; 2105672756aaSJamie Gritton error = vfs_setopt(opts, bf->name, &i, sizeof(i)); 21060304c731SJamie Gritton if (error != 0 && error != ENOENT) 21070304c731SJamie Gritton goto done_deref; 21080304c731SJamie Gritton i = !i; 2109672756aaSJamie Gritton error = vfs_setopt(opts, bf->noname, &i, sizeof(i)); 21100304c731SJamie Gritton if (error != 0 && error != ENOENT) 21110304c731SJamie Gritton goto done_deref; 21120304c731SJamie Gritton } 2113b38ff370SJamie Gritton i = (pr->pr_uref == 0); 2114b38ff370SJamie Gritton error = vfs_setopt(opts, "dying", &i, sizeof(i)); 2115b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2116b38ff370SJamie Gritton goto done_deref; 2117b38ff370SJamie Gritton i = !i; 2118b38ff370SJamie Gritton error = vfs_setopt(opts, "nodying", &i, sizeof(i)); 2119b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 2120b38ff370SJamie Gritton goto done_deref; 2121bd96bd15SIan Lepore error = vfs_setopt(opts, "osreldate", &pr->pr_osreldate, 2122bd96bd15SIan Lepore sizeof(pr->pr_osreldate)); 2123a1a4c1b0SIan Lepore if (error != 0 && error != ENOENT) 2124a1a4c1b0SIan Lepore goto done_deref; 2125a1a4c1b0SIan Lepore error = vfs_setopts(opts, "osrelease", pr->pr_osrelease); 2126a1a4c1b0SIan Lepore if (error != 0 && error != ENOENT) 2127a1a4c1b0SIan Lepore goto done_deref; 2128b38ff370SJamie Gritton 2129b38ff370SJamie Gritton /* Get the module parameters. */ 2130b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 2131b38ff370SJamie Gritton locked = 0; 2132b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_GET, opts); 2133b38ff370SJamie Gritton if (error) 2134b38ff370SJamie Gritton goto done_deref; 2135b38ff370SJamie Gritton prison_deref(pr, PD_DEREF | PD_LIST_SLOCKED); 2136b38ff370SJamie Gritton 2137b38ff370SJamie Gritton /* By now, all parameters should have been noted. 
*/ 2138b38ff370SJamie Gritton TAILQ_FOREACH(opt, opts, link) { 2139b38ff370SJamie Gritton if (!opt->seen && strcmp(opt->name, "errmsg")) { 2140b38ff370SJamie Gritton error = EINVAL; 2141b38ff370SJamie Gritton vfs_opterror(opts, "unknown parameter: %s", opt->name); 2142b38ff370SJamie Gritton goto done_errmsg; 2143b38ff370SJamie Gritton } 2144b38ff370SJamie Gritton } 2145b38ff370SJamie Gritton 2146b38ff370SJamie Gritton /* Write the fetched parameters back to userspace. */ 2147b38ff370SJamie Gritton error = 0; 2148b38ff370SJamie Gritton TAILQ_FOREACH(opt, opts, link) { 2149b38ff370SJamie Gritton if (opt->pos >= 0 && opt->pos != errmsg_pos) { 2150b38ff370SJamie Gritton pos = 2 * opt->pos + 1; 2151b38ff370SJamie Gritton optuio->uio_iov[pos].iov_len = opt->len; 2152b38ff370SJamie Gritton if (opt->value != NULL) { 2153b38ff370SJamie Gritton if (optuio->uio_segflg == UIO_SYSSPACE) { 2154b38ff370SJamie Gritton bcopy(opt->value, 2155b38ff370SJamie Gritton optuio->uio_iov[pos].iov_base, 2156b38ff370SJamie Gritton opt->len); 2157b38ff370SJamie Gritton } else { 2158b38ff370SJamie Gritton error = copyout(opt->value, 2159b38ff370SJamie Gritton optuio->uio_iov[pos].iov_base, 2160b38ff370SJamie Gritton opt->len); 2161b38ff370SJamie Gritton if (error) 2162b38ff370SJamie Gritton break; 2163b38ff370SJamie Gritton } 2164b38ff370SJamie Gritton } 2165b38ff370SJamie Gritton } 2166b38ff370SJamie Gritton } 2167b38ff370SJamie Gritton goto done_errmsg; 2168b38ff370SJamie Gritton 2169b38ff370SJamie Gritton done_deref: 2170b38ff370SJamie Gritton prison_deref(pr, locked | PD_DEREF | PD_LIST_SLOCKED); 2171b38ff370SJamie Gritton goto done_errmsg; 2172b38ff370SJamie Gritton 2173b38ff370SJamie Gritton done_unlock_list: 2174b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 2175b38ff370SJamie Gritton done_errmsg: 2176b38ff370SJamie Gritton if (error && errmsg_pos >= 0) { 2177b38ff370SJamie Gritton vfs_getopt(opts, "errmsg", (void **)&errmsg, &errmsg_len); 2178b38ff370SJamie Gritton errmsg_pos = 2 * 
errmsg_pos + 1; 2179b38ff370SJamie Gritton if (errmsg_len > 0) { 2180b38ff370SJamie Gritton if (optuio->uio_segflg == UIO_SYSSPACE) 2181b38ff370SJamie Gritton bcopy(errmsg, 2182b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 2183b38ff370SJamie Gritton errmsg_len); 2184b38ff370SJamie Gritton else 2185b38ff370SJamie Gritton copyout(errmsg, 2186b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 2187b38ff370SJamie Gritton errmsg_len); 2188b38ff370SJamie Gritton } 2189b38ff370SJamie Gritton } 2190b38ff370SJamie Gritton vfs_freeopts(opts); 2191b38ff370SJamie Gritton return (error); 2192b38ff370SJamie Gritton } 2193b38ff370SJamie Gritton 2194b38ff370SJamie Gritton /* 2195b38ff370SJamie Gritton * struct jail_remove_args { 2196b38ff370SJamie Gritton * int jid; 2197b38ff370SJamie Gritton * }; 2198b38ff370SJamie Gritton */ 2199b38ff370SJamie Gritton int 22008451d0ddSKip Macy sys_jail_remove(struct thread *td, struct jail_remove_args *uap) 2201b38ff370SJamie Gritton { 22020304c731SJamie Gritton struct prison *pr, *cpr, *lpr, *tpr; 22030304c731SJamie Gritton int descend, error; 2204b38ff370SJamie Gritton 2205b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_REMOVE); 2206b38ff370SJamie Gritton if (error) 2207b38ff370SJamie Gritton return (error); 2208b38ff370SJamie Gritton 2209b38ff370SJamie Gritton sx_xlock(&allprison_lock); 22100304c731SJamie Gritton pr = prison_find_child(td->td_ucred->cr_prison, uap->jid); 2211b38ff370SJamie Gritton if (pr == NULL) { 2212b38ff370SJamie Gritton sx_xunlock(&allprison_lock); 2213b38ff370SJamie Gritton return (EINVAL); 2214b38ff370SJamie Gritton } 2215b38ff370SJamie Gritton 22160304c731SJamie Gritton /* Remove all descendants of this prison, then remove this prison. 
*/ 22170304c731SJamie Gritton pr->pr_ref++; 22180304c731SJamie Gritton if (!LIST_EMPTY(&pr->pr_children)) { 22190304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 22200304c731SJamie Gritton lpr = NULL; 22210304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(pr, cpr, descend) { 22220304c731SJamie Gritton mtx_lock(&cpr->pr_mtx); 22230304c731SJamie Gritton if (cpr->pr_ref > 0) { 22240304c731SJamie Gritton tpr = cpr; 22250304c731SJamie Gritton cpr->pr_ref++; 22260304c731SJamie Gritton } else { 22270304c731SJamie Gritton /* Already removed - do not do it again. */ 22280304c731SJamie Gritton tpr = NULL; 22290304c731SJamie Gritton } 22300304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 22310304c731SJamie Gritton if (lpr != NULL) { 22320304c731SJamie Gritton mtx_lock(&lpr->pr_mtx); 22330304c731SJamie Gritton prison_remove_one(lpr); 22340304c731SJamie Gritton sx_xlock(&allprison_lock); 22350304c731SJamie Gritton } 22360304c731SJamie Gritton lpr = tpr; 22370304c731SJamie Gritton } 22380304c731SJamie Gritton if (lpr != NULL) { 22390304c731SJamie Gritton mtx_lock(&lpr->pr_mtx); 22400304c731SJamie Gritton prison_remove_one(lpr); 22410304c731SJamie Gritton sx_xlock(&allprison_lock); 22420304c731SJamie Gritton } 22430304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 22440304c731SJamie Gritton } 22450304c731SJamie Gritton prison_remove_one(pr); 22460304c731SJamie Gritton return (0); 22470304c731SJamie Gritton } 22480304c731SJamie Gritton 22490304c731SJamie Gritton static void 22500304c731SJamie Gritton prison_remove_one(struct prison *pr) 22510304c731SJamie Gritton { 22520304c731SJamie Gritton struct proc *p; 22530304c731SJamie Gritton int deuref; 22540304c731SJamie Gritton 2255b38ff370SJamie Gritton /* If the prison was persistent, it is not anymore. 
*/ 2256b38ff370SJamie Gritton deuref = 0; 2257b38ff370SJamie Gritton if (pr->pr_flags & PR_PERSIST) { 2258b38ff370SJamie Gritton pr->pr_ref--; 2259b38ff370SJamie Gritton deuref = PD_DEUREF; 2260b38ff370SJamie Gritton pr->pr_flags &= ~PR_PERSIST; 2261b38ff370SJamie Gritton } 2262b38ff370SJamie Gritton 22630304c731SJamie Gritton /* 22640304c731SJamie Gritton * jail_remove added a reference. If that's the only one, remove 22650304c731SJamie Gritton * the prison now. 22660304c731SJamie Gritton */ 22670304c731SJamie Gritton KASSERT(pr->pr_ref > 0, 22680304c731SJamie Gritton ("prison_remove_one removing a dead prison (jid=%d)", pr->pr_id)); 22690304c731SJamie Gritton if (pr->pr_ref == 1) { 2270b38ff370SJamie Gritton prison_deref(pr, 2271b38ff370SJamie Gritton deuref | PD_DEREF | PD_LOCKED | PD_LIST_XLOCKED); 22720304c731SJamie Gritton return; 2273b38ff370SJamie Gritton } 2274b38ff370SJamie Gritton 2275b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 2276b38ff370SJamie Gritton sx_xunlock(&allprison_lock); 2277b38ff370SJamie Gritton /* 2278b38ff370SJamie Gritton * Kill all processes unfortunate enough to be attached to this prison. 2279b38ff370SJamie Gritton */ 2280b38ff370SJamie Gritton sx_slock(&allproc_lock); 22817938a442SBjoern A. Zeeb FOREACH_PROC_IN_SYSTEM(p) { 2282b38ff370SJamie Gritton PROC_LOCK(p); 2283b38ff370SJamie Gritton if (p->p_state != PRS_NEW && p->p_ucred && 2284b38ff370SJamie Gritton p->p_ucred->cr_prison == pr) 22858451d0ddSKip Macy kern_psignal(p, SIGKILL); 2286b38ff370SJamie Gritton PROC_UNLOCK(p); 2287b38ff370SJamie Gritton } 2288b38ff370SJamie Gritton sx_sunlock(&allproc_lock); 22890304c731SJamie Gritton /* Remove the temporary reference added by jail_remove. 
*/ 2290b38ff370SJamie Gritton prison_deref(pr, deuref | PD_DEREF); 229175c13541SPoul-Henning Kamp } 229275c13541SPoul-Henning Kamp 2293fd7a8150SMike Barcroft /* 22949ddb7954SMike Barcroft * struct jail_attach_args { 22959ddb7954SMike Barcroft * int jid; 22969ddb7954SMike Barcroft * }; 2297fd7a8150SMike Barcroft */ 2298fd7a8150SMike Barcroft int 22998451d0ddSKip Macy sys_jail_attach(struct thread *td, struct jail_attach_args *uap) 2300fd7a8150SMike Barcroft { 2301b38ff370SJamie Gritton struct prison *pr; 2302b38ff370SJamie Gritton int error; 2303b38ff370SJamie Gritton 2304b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_ATTACH); 2305b38ff370SJamie Gritton if (error) 2306b38ff370SJamie Gritton return (error); 2307b38ff370SJamie Gritton 2308ef0ddea3SJamie Gritton /* 2309ef0ddea3SJamie Gritton * Start with exclusive hold on allprison_lock to ensure that a possible 2310ef0ddea3SJamie Gritton * PR_METHOD_REMOVE call isn't concurrent with jail_set or jail_remove. 2311ef0ddea3SJamie Gritton * But then immediately downgrade it since we don't need to stop 2312ef0ddea3SJamie Gritton * readers. 2313ef0ddea3SJamie Gritton */ 2314ef0ddea3SJamie Gritton sx_xlock(&allprison_lock); 2315ef0ddea3SJamie Gritton sx_downgrade(&allprison_lock); 23160304c731SJamie Gritton pr = prison_find_child(td->td_ucred->cr_prison, uap->jid); 2317b38ff370SJamie Gritton if (pr == NULL) { 2318b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 2319b38ff370SJamie Gritton return (EINVAL); 2320b38ff370SJamie Gritton } 2321b38ff370SJamie Gritton 2322b38ff370SJamie Gritton /* 2323b38ff370SJamie Gritton * Do not allow a process to attach to a prison that is not 2324b38ff370SJamie Gritton * considered to be "alive". 
2325b38ff370SJamie Gritton */ 2326b38ff370SJamie Gritton if (pr->pr_uref == 0) { 2327b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 2328b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 2329b38ff370SJamie Gritton return (EINVAL); 2330b38ff370SJamie Gritton } 2331b38ff370SJamie Gritton 2332b38ff370SJamie Gritton return (do_jail_attach(td, pr)); 2333b38ff370SJamie Gritton } 2334b38ff370SJamie Gritton 2335b38ff370SJamie Gritton static int 2336b38ff370SJamie Gritton do_jail_attach(struct thread *td, struct prison *pr) 2337b38ff370SJamie Gritton { 2338fd7a8150SMike Barcroft struct proc *p; 2339fd7a8150SMike Barcroft struct ucred *newcred, *oldcred; 23405050aa86SKonstantin Belousov int error; 2341fd7a8150SMike Barcroft 234257f22bd4SJacques Vidrine /* 234357f22bd4SJacques Vidrine * XXX: Note that there is a slight race here if two threads 234457f22bd4SJacques Vidrine * in the same privileged process attempt to attach to two 234557f22bd4SJacques Vidrine * different jails at the same time. It is important for 234657f22bd4SJacques Vidrine * user processes not to do this, or they might end up with 234757f22bd4SJacques Vidrine * a process root from one prison, but attached to the jail 234857f22bd4SJacques Vidrine * of another. 234957f22bd4SJacques Vidrine */ 2350fd7a8150SMike Barcroft pr->pr_ref++; 2351b38ff370SJamie Gritton pr->pr_uref++; 2352fd7a8150SMike Barcroft mtx_unlock(&pr->pr_mtx); 2353b38ff370SJamie Gritton 2354b38ff370SJamie Gritton /* Let modules do whatever they need to prepare for attaching. */ 2355b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_ATTACH, td); 2356b38ff370SJamie Gritton if (error) { 2357b38ff370SJamie Gritton prison_deref(pr, PD_DEREF | PD_DEUREF | PD_LIST_SLOCKED); 2358b38ff370SJamie Gritton return (error); 2359b38ff370SJamie Gritton } 2360dc68a633SPawel Jakub Dawidek sx_sunlock(&allprison_lock); 2361fd7a8150SMike Barcroft 2362413628a7SBjoern A. Zeeb /* 2363413628a7SBjoern A. Zeeb * Reparent the newly attached process to this jail. 
2364413628a7SBjoern A. Zeeb */ 2365b38ff370SJamie Gritton p = td->td_proc; 2366413628a7SBjoern A. Zeeb error = cpuset_setproc_update_set(p, pr->pr_cpuset); 2367413628a7SBjoern A. Zeeb if (error) 2368b38ff370SJamie Gritton goto e_revert_osd; 2369413628a7SBjoern A. Zeeb 2370cb05b60aSAttilio Rao vn_lock(pr->pr_root, LK_EXCLUSIVE | LK_RETRY); 2371fd7a8150SMike Barcroft if ((error = change_dir(pr->pr_root, td)) != 0) 2372fd7a8150SMike Barcroft goto e_unlock; 2373fd7a8150SMike Barcroft #ifdef MAC 237430d239bcSRobert Watson if ((error = mac_vnode_check_chroot(td->td_ucred, pr->pr_root))) 2375fd7a8150SMike Barcroft goto e_unlock; 2376fd7a8150SMike Barcroft #endif 2377b249ce48SMateusz Guzik VOP_UNLOCK(pr->pr_root); 2378f0725a8eSMateusz Guzik if ((error = pwd_chroot(td, pr->pr_root))) 23795050aa86SKonstantin Belousov goto e_revert_osd; 2380fd7a8150SMike Barcroft 2381fd7a8150SMike Barcroft newcred = crget(); 2382fd7a8150SMike Barcroft PROC_LOCK(p); 23831fb6767dSJamie Gritton oldcred = crcopysafe(p, newcred); 238469c4ee54SJohn Baldwin newcred->cr_prison = pr; 2385daf63fd2SMateusz Guzik proc_set_cred(p, newcred); 23861fb6767dSJamie Gritton setsugid(p); 2387097055e2SEdward Tomasz Napierala #ifdef RACCT 2388097055e2SEdward Tomasz Napierala racct_proc_ucred_changed(p, oldcred, newcred); 2389f87beb93SAndriy Gapon crhold(newcred); 2390f87beb93SAndriy Gapon #endif 2391f87beb93SAndriy Gapon PROC_UNLOCK(p); 2392f87beb93SAndriy Gapon #ifdef RCTL 2393f87beb93SAndriy Gapon rctl_proc_ucred_changed(p, newcred); 2394f87beb93SAndriy Gapon crfree(newcred); 2395097055e2SEdward Tomasz Napierala #endif 23961fb6767dSJamie Gritton prison_deref(oldcred->cr_prison, PD_DEREF | PD_DEUREF); 2397fd7a8150SMike Barcroft crfree(oldcred); 2398fd7a8150SMike Barcroft return (0); 23991fb6767dSJamie Gritton 2400fd7a8150SMike Barcroft e_unlock: 2401b249ce48SMateusz Guzik VOP_UNLOCK(pr->pr_root); 2402b38ff370SJamie Gritton e_revert_osd: 2403b38ff370SJamie Gritton /* Tell modules this thread is still in its old 
jail after all. */ 24041fb6767dSJamie Gritton (void)osd_jail_call(td->td_ucred->cr_prison, PR_METHOD_ATTACH, td); 2405b38ff370SJamie Gritton prison_deref(pr, PD_DEREF | PD_DEUREF); 2406fd7a8150SMike Barcroft return (error); 2407fd7a8150SMike Barcroft } 2408fd7a8150SMike Barcroft 2409fd7a8150SMike Barcroft /* 2410fd7a8150SMike Barcroft * Returns a locked prison instance, or NULL on failure. 2411fd7a8150SMike Barcroft */ 241254b369c1SPawel Jakub Dawidek struct prison * 2413fd7a8150SMike Barcroft prison_find(int prid) 2414fd7a8150SMike Barcroft { 2415fd7a8150SMike Barcroft struct prison *pr; 2416fd7a8150SMike Barcroft 2417dc68a633SPawel Jakub Dawidek sx_assert(&allprison_lock, SX_LOCKED); 2418b38ff370SJamie Gritton TAILQ_FOREACH(pr, &allprison, pr_list) { 2419fd7a8150SMike Barcroft if (pr->pr_id == prid) { 2420fd7a8150SMike Barcroft mtx_lock(&pr->pr_mtx); 2421b38ff370SJamie Gritton if (pr->pr_ref > 0) 2422fd7a8150SMike Barcroft return (pr); 2423b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 2424fd7a8150SMike Barcroft } 2425fd7a8150SMike Barcroft } 2426fd7a8150SMike Barcroft return (NULL); 2427fd7a8150SMike Barcroft } 2428fd7a8150SMike Barcroft 2429b38ff370SJamie Gritton /* 24300304c731SJamie Gritton * Find a prison that is a descendant of mypr. Returns a locked prison or NULL. 
2431b38ff370SJamie Gritton */ 2432b38ff370SJamie Gritton struct prison * 24330304c731SJamie Gritton prison_find_child(struct prison *mypr, int prid) 2434b38ff370SJamie Gritton { 24350304c731SJamie Gritton struct prison *pr; 24360304c731SJamie Gritton int descend; 2437b38ff370SJamie Gritton 2438b38ff370SJamie Gritton sx_assert(&allprison_lock, SX_LOCKED); 24390304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(mypr, pr, descend) { 24400304c731SJamie Gritton if (pr->pr_id == prid) { 24410304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 24420304c731SJamie Gritton if (pr->pr_ref > 0) 24430304c731SJamie Gritton return (pr); 24440304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 24450304c731SJamie Gritton } 24460304c731SJamie Gritton } 24470304c731SJamie Gritton return (NULL); 24480304c731SJamie Gritton } 24490304c731SJamie Gritton 24500304c731SJamie Gritton /* 24510304c731SJamie Gritton * Look for the name relative to mypr. Returns a locked prison or NULL. 24520304c731SJamie Gritton */ 24530304c731SJamie Gritton struct prison * 24540304c731SJamie Gritton prison_find_name(struct prison *mypr, const char *name) 24550304c731SJamie Gritton { 24560304c731SJamie Gritton struct prison *pr, *deadpr; 24570304c731SJamie Gritton size_t mylen; 24580304c731SJamie Gritton int descend; 24590304c731SJamie Gritton 24600304c731SJamie Gritton sx_assert(&allprison_lock, SX_LOCKED); 24610304c731SJamie Gritton mylen = (mypr == &prison0) ? 
0 : strlen(mypr->pr_name) + 1; 2462b38ff370SJamie Gritton again: 2463b38ff370SJamie Gritton deadpr = NULL; 24640304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(mypr, pr, descend) { 24650304c731SJamie Gritton if (!strcmp(pr->pr_name + mylen, name)) { 2466b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 2467b38ff370SJamie Gritton if (pr->pr_ref > 0) { 2468b38ff370SJamie Gritton if (pr->pr_uref > 0) 2469b38ff370SJamie Gritton return (pr); 2470b38ff370SJamie Gritton deadpr = pr; 2471b38ff370SJamie Gritton } 2472b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 2473b38ff370SJamie Gritton } 2474b38ff370SJamie Gritton } 24750304c731SJamie Gritton /* There was no valid prison - perhaps there was a dying one. */ 2476b38ff370SJamie Gritton if (deadpr != NULL) { 2477b38ff370SJamie Gritton mtx_lock(&deadpr->pr_mtx); 2478b38ff370SJamie Gritton if (deadpr->pr_ref == 0) { 2479b38ff370SJamie Gritton mtx_unlock(&deadpr->pr_mtx); 2480b38ff370SJamie Gritton goto again; 2481b38ff370SJamie Gritton } 2482b38ff370SJamie Gritton } 2483b38ff370SJamie Gritton return (deadpr); 2484b38ff370SJamie Gritton } 2485b38ff370SJamie Gritton 2486b38ff370SJamie Gritton /* 24870304c731SJamie Gritton * See if a prison has the specific flag set. 24880304c731SJamie Gritton */ 24890304c731SJamie Gritton int 24900304c731SJamie Gritton prison_flag(struct ucred *cred, unsigned flag) 24910304c731SJamie Gritton { 24920304c731SJamie Gritton 24930304c731SJamie Gritton /* This is an atomic read, so no locking is necessary. */ 24940304c731SJamie Gritton return (cred->cr_prison->pr_flags & flag); 24950304c731SJamie Gritton } 24960304c731SJamie Gritton 24970304c731SJamie Gritton int 24980304c731SJamie Gritton prison_allow(struct ucred *cred, unsigned flag) 24990304c731SJamie Gritton { 25000304c731SJamie Gritton 25010304c731SJamie Gritton /* This is an atomic read, so no locking is necessary. 
*/ 25020304c731SJamie Gritton return (cred->cr_prison->pr_allow & flag); 25030304c731SJamie Gritton } 25040304c731SJamie Gritton 25050304c731SJamie Gritton /* 2506b38ff370SJamie Gritton * Remove a prison reference. If that was the last reference, remove the 2507b38ff370SJamie Gritton * prison itself - but not in this context in case there are locks held. 2508b38ff370SJamie Gritton */ 250991421ba2SRobert Watson void 25101ba4a712SPawel Jakub Dawidek prison_free_locked(struct prison *pr) 251191421ba2SRobert Watson { 251273d9e52dSJamie Gritton int ref; 251391421ba2SRobert Watson 25141ba4a712SPawel Jakub Dawidek mtx_assert(&pr->pr_mtx, MA_OWNED); 251573d9e52dSJamie Gritton ref = --pr->pr_ref; 251601137630SRobert Watson mtx_unlock(&pr->pr_mtx); 251773d9e52dSJamie Gritton if (ref == 0) 2518c2cda609SPawel Jakub Dawidek taskqueue_enqueue(taskqueue_thread, &pr->pr_task); 2519c2cda609SPawel Jakub Dawidek } 2520c2cda609SPawel Jakub Dawidek 25211ba4a712SPawel Jakub Dawidek void 25221ba4a712SPawel Jakub Dawidek prison_free(struct prison *pr) 25231ba4a712SPawel Jakub Dawidek { 25241ba4a712SPawel Jakub Dawidek 25251ba4a712SPawel Jakub Dawidek mtx_lock(&pr->pr_mtx); 25261ba4a712SPawel Jakub Dawidek prison_free_locked(pr); 25271ba4a712SPawel Jakub Dawidek } 25281ba4a712SPawel Jakub Dawidek 252973d9e52dSJamie Gritton /* 253073d9e52dSJamie Gritton * Complete a call to either prison_free or prison_proc_free. 253173d9e52dSJamie Gritton */ 2532c2cda609SPawel Jakub Dawidek static void 2533c2cda609SPawel Jakub Dawidek prison_complete(void *context, int pending) 2534c2cda609SPawel Jakub Dawidek { 253573d9e52dSJamie Gritton struct prison *pr = context; 2536b38ff370SJamie Gritton 2537ef0ddea3SJamie Gritton sx_xlock(&allprison_lock); 253873d9e52dSJamie Gritton mtx_lock(&pr->pr_mtx); 253973d9e52dSJamie Gritton prison_deref(pr, pr->pr_uref 2540ef0ddea3SJamie Gritton ? 
/*
 * Remove a prison reference (usually).  This internal version assumes no
 * mutexes are held, except perhaps the prison itself.  If there are no more
 * references, release and delist the prison.  On completion, the prison lock
 * and the allprison lock are both unlocked.
 *
 * The flags describe both the work to do and the locks held on entry:
 *	PD_DEREF	drop one reference (pr_ref)
 *	PD_DEUREF	drop one user reference (pr_uref)
 *	PD_LOCKED	the caller already holds pr's mutex
 *	PD_LIST_SLOCKED	the caller holds allprison_lock shared
 *	PD_LIST_XLOCKED	the caller holds allprison_lock exclusively
 *
 * When a prison is freed the loop repeats on its parent, dropping the
 * reference and user reference the parent was carrying for it.
 */
static void
prison_deref(struct prison *pr, int flags)
{
	struct prison *ppr, *tpr;
	int ref, lasturef;

	if (!(flags & PD_LOCKED))
		mtx_lock(&pr->pr_mtx);
	for (;;) {
		if (flags & PD_DEUREF) {
			KASSERT(pr->pr_uref > 0,
			    ("prison_deref PD_DEUREF on a dead prison (jid=%d)",
			     pr->pr_id));
			pr->pr_uref--;
			lasturef = pr->pr_uref == 0;
			/*
			 * Take a temporary reference for the duration of the
			 * PR_METHOD_REMOVE call below, which runs with the
			 * prison mutex dropped; it is released right after
			 * that call.
			 */
			if (lasturef)
				pr->pr_ref++;
			KASSERT(prison0.pr_uref != 0, ("prison0 pr_uref=0"));
		} else
			lasturef = 0;
		if (flags & PD_DEREF) {
			KASSERT(pr->pr_ref > 0,
			    ("prison_deref PD_DEREF on a dead prison (jid=%d)",
			     pr->pr_id));
			pr->pr_ref--;
		}
		/* Sample the count while the mutex is still held. */
		ref = pr->pr_ref;
		mtx_unlock(&pr->pr_mtx);

		/*
		 * Tell the modules if the last user reference was removed
		 * (even if it sticks around in dying state).
		 */
		if (lasturef) {
			/*
			 * The callbacks are made with allprison_lock held;
			 * take it exclusively if the caller passed in
			 * neither list-lock flag.
			 */
			if (!(flags & (PD_LIST_SLOCKED | PD_LIST_XLOCKED))) {
				sx_xlock(&allprison_lock);
				flags |= PD_LIST_XLOCKED;
			}
			(void)osd_jail_call(pr, PR_METHOD_REMOVE, NULL);
			/* Drop the temporary reference taken above. */
			mtx_lock(&pr->pr_mtx);
			ref = --pr->pr_ref;
			mtx_unlock(&pr->pr_mtx);
		}

		/* If the prison still has references, nothing else to do. */
		if (ref > 0) {
			if (flags & PD_LIST_SLOCKED)
				sx_sunlock(&allprison_lock);
			else if (flags & PD_LIST_XLOCKED)
				sx_xunlock(&allprison_lock);
			return;
		}

		/*
		 * Delisting needs allprison_lock exclusively.  Upgrade a
		 * shared hold if possible; if the upgrade fails, drop the
		 * shared lock and acquire it exclusively instead.
		 */
		if (flags & PD_LIST_SLOCKED) {
			if (!sx_try_upgrade(&allprison_lock)) {
				sx_sunlock(&allprison_lock);
				sx_xlock(&allprison_lock);
			}
		} else if (!(flags & PD_LIST_XLOCKED))
			sx_xlock(&allprison_lock);

		/*
		 * Unlink the prison from the global list and from its
		 * parent's children, and take it out of the child count of
		 * every ancestor.
		 */
		TAILQ_REMOVE(&allprison, pr, pr_list);
		LIST_REMOVE(pr, pr_sibling);
		ppr = pr->pr_parent;
		for (tpr = ppr; tpr != NULL; tpr = tpr->pr_parent)
			tpr->pr_childcount--;
		sx_xunlock(&allprison_lock);

		/* Release everything the prison owned, then the prison. */
#ifdef VIMAGE
		/* Destroy the vnet only if it is not the parent's. */
		if (pr->pr_vnet != ppr->pr_vnet)
			vnet_destroy(pr->pr_vnet);
#endif
		if (pr->pr_root != NULL)
			vrele(pr->pr_root);
		mtx_destroy(&pr->pr_mtx);
#ifdef INET
		free(pr->pr_ip4, M_PRISON);
#endif
#ifdef INET6
		free(pr->pr_ip6, M_PRISON);
#endif
		if (pr->pr_cpuset != NULL)
			cpuset_rel(pr->pr_cpuset);
		osd_jail_exit(pr);
#ifdef RACCT
		if (racct_enable)
			prison_racct_detach(pr);
#endif
		free(pr, M_PRISON);

		/* Removing a prison frees a reference on its parent. */
		pr = ppr;
		mtx_lock(&pr->pr_mtx);
		/* No list lock is held any more, so only the deref bits. */
		flags = PD_DEREF | PD_DEUREF;
	}
}
Zeeb ("Trying to hold dead prison %p (jid=%d).", pr, pr->pr_id)); 26541ba4a712SPawel Jakub Dawidek pr->pr_ref++; 26551ba4a712SPawel Jakub Dawidek } 26561ba4a712SPawel Jakub Dawidek 26571ba4a712SPawel Jakub Dawidek void 265891421ba2SRobert Watson prison_hold(struct prison *pr) 265991421ba2SRobert Watson { 266091421ba2SRobert Watson 266101137630SRobert Watson mtx_lock(&pr->pr_mtx); 26621ba4a712SPawel Jakub Dawidek prison_hold_locked(pr); 266301137630SRobert Watson mtx_unlock(&pr->pr_mtx); 266401137630SRobert Watson } 266501137630SRobert Watson 2666413628a7SBjoern A. Zeeb void 2667413628a7SBjoern A. Zeeb prison_proc_hold(struct prison *pr) 266801137630SRobert Watson { 266901137630SRobert Watson 2670413628a7SBjoern A. Zeeb mtx_lock(&pr->pr_mtx); 2671b38ff370SJamie Gritton KASSERT(pr->pr_uref > 0, 2672b38ff370SJamie Gritton ("Cannot add a process to a non-alive prison (jid=%d)", pr->pr_id)); 2673b38ff370SJamie Gritton pr->pr_uref++; 2674413628a7SBjoern A. Zeeb mtx_unlock(&pr->pr_mtx); 267575c13541SPoul-Henning Kamp } 267675c13541SPoul-Henning Kamp 267775c13541SPoul-Henning Kamp void 2678413628a7SBjoern A. Zeeb prison_proc_free(struct prison *pr) 267975c13541SPoul-Henning Kamp { 2680413628a7SBjoern A. Zeeb 2681413628a7SBjoern A. Zeeb mtx_lock(&pr->pr_mtx); 2682b38ff370SJamie Gritton KASSERT(pr->pr_uref > 0, 2683b38ff370SJamie Gritton ("Trying to kill a process in a dead prison (jid=%d)", pr->pr_id)); 268473d9e52dSJamie Gritton if (pr->pr_uref > 1) 268573d9e52dSJamie Gritton pr->pr_uref--; 268673d9e52dSJamie Gritton else { 268773d9e52dSJamie Gritton /* 268873d9e52dSJamie Gritton * Don't remove the last user reference in this context, which 268973d9e52dSJamie Gritton * is expected to be a process that is not only locked, but 269073d9e52dSJamie Gritton * also half dead. 
269173d9e52dSJamie Gritton */ 269273d9e52dSJamie Gritton pr->pr_ref++; 269373d9e52dSJamie Gritton mtx_unlock(&pr->pr_mtx); 269473d9e52dSJamie Gritton taskqueue_enqueue(taskqueue_thread, &pr->pr_task); 269573d9e52dSJamie Gritton return; 269673d9e52dSJamie Gritton } 269773d9e52dSJamie Gritton mtx_unlock(&pr->pr_mtx); 2698413628a7SBjoern A. Zeeb } 2699413628a7SBjoern A. Zeeb 2700413628a7SBjoern A. Zeeb /* 2701ca04ba64SJamie Gritton * Check if a jail supports the given address family. 2702ca04ba64SJamie Gritton * 2703ca04ba64SJamie Gritton * Returns 0 if not jailed or the address family is supported, EAFNOSUPPORT 2704ca04ba64SJamie Gritton * if not. 2705ca04ba64SJamie Gritton */ 2706ca04ba64SJamie Gritton int 2707ca04ba64SJamie Gritton prison_check_af(struct ucred *cred, int af) 2708ca04ba64SJamie Gritton { 27090304c731SJamie Gritton struct prison *pr; 2710ca04ba64SJamie Gritton int error; 2711ca04ba64SJamie Gritton 2712ca04ba64SJamie Gritton KASSERT(cred != NULL, ("%s: cred is NULL", __func__)); 2713ca04ba64SJamie Gritton 27140304c731SJamie Gritton pr = cred->cr_prison; 2715499650a0SJamie Gritton #ifdef VIMAGE 27166bb79563SJamie Gritton /* Prisons with their own network stack are not limited. */ 2717de0bd6f7SBjoern A. 
Zeeb if (prison_owns_vnet(cred)) 27186bb79563SJamie Gritton return (0); 2719499650a0SJamie Gritton #endif 27206bb79563SJamie Gritton 2721ca04ba64SJamie Gritton error = 0; 2722ca04ba64SJamie Gritton switch (af) 2723ca04ba64SJamie Gritton { 2724ca04ba64SJamie Gritton #ifdef INET 2725ca04ba64SJamie Gritton case AF_INET: 27260304c731SJamie Gritton if (pr->pr_flags & PR_IP4) 27270304c731SJamie Gritton { 27280304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 27290304c731SJamie Gritton if ((pr->pr_flags & PR_IP4) && pr->pr_ip4 == NULL) 2730ca04ba64SJamie Gritton error = EAFNOSUPPORT; 27310304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 27320304c731SJamie Gritton } 2733ca04ba64SJamie Gritton break; 2734ca04ba64SJamie Gritton #endif 2735ca04ba64SJamie Gritton #ifdef INET6 2736ca04ba64SJamie Gritton case AF_INET6: 27370304c731SJamie Gritton if (pr->pr_flags & PR_IP6) 27380304c731SJamie Gritton { 27390304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 27400304c731SJamie Gritton if ((pr->pr_flags & PR_IP6) && pr->pr_ip6 == NULL) 2741ca04ba64SJamie Gritton error = EAFNOSUPPORT; 27420304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 27430304c731SJamie Gritton } 2744ca04ba64SJamie Gritton break; 2745ca04ba64SJamie Gritton #endif 2746ca04ba64SJamie Gritton case AF_LOCAL: 2747ca04ba64SJamie Gritton case AF_ROUTE: 2748ca04ba64SJamie Gritton break; 2749ca04ba64SJamie Gritton default: 27500304c731SJamie Gritton if (!(pr->pr_allow & PR_ALLOW_SOCKET_AF)) 2751ca04ba64SJamie Gritton error = EAFNOSUPPORT; 2752ca04ba64SJamie Gritton } 2753ca04ba64SJamie Gritton return (error); 2754ca04ba64SJamie Gritton } 2755ca04ba64SJamie Gritton 2756ca04ba64SJamie Gritton /* 2757413628a7SBjoern A. Zeeb * Check if given address belongs to the jail referenced by cred (wrapper to 2758413628a7SBjoern A. Zeeb * prison_check_ip[46]). 2759413628a7SBjoern A. 
Zeeb * 27600304c731SJamie Gritton * Returns 0 if jail doesn't restrict the address family or if address belongs 27610304c731SJamie Gritton * to jail, EADDRNOTAVAIL if the address doesn't belong, or EAFNOSUPPORT if 27620304c731SJamie Gritton * the jail doesn't allow the address family. IPv4 Address passed in in NBO. 2763413628a7SBjoern A. Zeeb */ 2764413628a7SBjoern A. Zeeb int 2765c83dda36SAlexander V. Chernikov prison_if(struct ucred *cred, const struct sockaddr *sa) 276675c13541SPoul-Henning Kamp { 2767413628a7SBjoern A. Zeeb #ifdef INET 2768c83dda36SAlexander V. Chernikov const struct sockaddr_in *sai; 2769413628a7SBjoern A. Zeeb #endif 2770413628a7SBjoern A. Zeeb #ifdef INET6 2771c83dda36SAlexander V. Chernikov const struct sockaddr_in6 *sai6; 2772413628a7SBjoern A. Zeeb #endif 2773b89e82ddSJamie Gritton int error; 277475c13541SPoul-Henning Kamp 2775413628a7SBjoern A. Zeeb KASSERT(cred != NULL, ("%s: cred is NULL", __func__)); 2776413628a7SBjoern A. Zeeb KASSERT(sa != NULL, ("%s: sa is NULL", __func__)); 2777413628a7SBjoern A. Zeeb 2778de0bd6f7SBjoern A. Zeeb #ifdef VIMAGE 2779de0bd6f7SBjoern A. Zeeb if (prison_owns_vnet(cred)) 2780de0bd6f7SBjoern A. Zeeb return (0); 2781de0bd6f7SBjoern A. Zeeb #endif 2782de0bd6f7SBjoern A. Zeeb 2783b89e82ddSJamie Gritton error = 0; 2784413628a7SBjoern A. Zeeb switch (sa->sa_family) 2785413628a7SBjoern A. Zeeb { 2786413628a7SBjoern A. Zeeb #ifdef INET 2787413628a7SBjoern A. Zeeb case AF_INET: 2788c83dda36SAlexander V. Chernikov sai = (const struct sockaddr_in *)sa; 2789b89e82ddSJamie Gritton error = prison_check_ip4(cred, &sai->sin_addr); 2790413628a7SBjoern A. Zeeb break; 2791413628a7SBjoern A. Zeeb #endif 2792413628a7SBjoern A. Zeeb #ifdef INET6 2793413628a7SBjoern A. Zeeb case AF_INET6: 2794c83dda36SAlexander V. Chernikov sai6 = (const struct sockaddr_in6 *)sa; 2795b89e82ddSJamie Gritton error = prison_check_ip6(cred, &sai6->sin6_addr); 2796413628a7SBjoern A. Zeeb break; 2797413628a7SBjoern A. 
Zeeb #endif 2798413628a7SBjoern A. Zeeb default: 27990304c731SJamie Gritton if (!(cred->cr_prison->pr_allow & PR_ALLOW_SOCKET_AF)) 2800b89e82ddSJamie Gritton error = EAFNOSUPPORT; 2801413628a7SBjoern A. Zeeb } 2802b89e82ddSJamie Gritton return (error); 280375c13541SPoul-Henning Kamp } 280491421ba2SRobert Watson 280591421ba2SRobert Watson /* 280691421ba2SRobert Watson * Return 0 if jails permit p1 to frob p2, otherwise ESRCH. 280791421ba2SRobert Watson */ 280891421ba2SRobert Watson int 28099ddb7954SMike Barcroft prison_check(struct ucred *cred1, struct ucred *cred2) 281091421ba2SRobert Watson { 281191421ba2SRobert Watson 28120304c731SJamie Gritton return ((cred1->cr_prison == cred2->cr_prison || 28130304c731SJamie Gritton prison_ischild(cred1->cr_prison, cred2->cr_prison)) ? 0 : ESRCH); 28140304c731SJamie Gritton } 281591421ba2SRobert Watson 28160304c731SJamie Gritton /* 28170304c731SJamie Gritton * Return 1 if p2 is a child of p1, otherwise 0. 28180304c731SJamie Gritton */ 28190304c731SJamie Gritton int 28200304c731SJamie Gritton prison_ischild(struct prison *pr1, struct prison *pr2) 28210304c731SJamie Gritton { 28220304c731SJamie Gritton 28230304c731SJamie Gritton for (pr2 = pr2->pr_parent; pr2 != NULL; pr2 = pr2->pr_parent) 28240304c731SJamie Gritton if (pr1 == pr2) 28250304c731SJamie Gritton return (1); 282691421ba2SRobert Watson return (0); 282791421ba2SRobert Watson } 282891421ba2SRobert Watson 282991421ba2SRobert Watson /* 2830de0bd6f7SBjoern A. Zeeb * Return 1 if the passed credential is in a jail and that jail does not 2831de0bd6f7SBjoern A. Zeeb * have its own virtual network stack, otherwise 0. 2832de0bd6f7SBjoern A. Zeeb */ 2833de0bd6f7SBjoern A. Zeeb int 2834de0bd6f7SBjoern A. Zeeb jailed_without_vnet(struct ucred *cred) 2835de0bd6f7SBjoern A. Zeeb { 2836de0bd6f7SBjoern A. Zeeb 2837de0bd6f7SBjoern A. Zeeb if (!jailed(cred)) 2838de0bd6f7SBjoern A. Zeeb return (0); 2839de0bd6f7SBjoern A. Zeeb #ifdef VIMAGE 2840de0bd6f7SBjoern A. 
Zeeb if (prison_owns_vnet(cred)) 2841de0bd6f7SBjoern A. Zeeb return (0); 2842de0bd6f7SBjoern A. Zeeb #endif 2843de0bd6f7SBjoern A. Zeeb 2844de0bd6f7SBjoern A. Zeeb return (1); 2845de0bd6f7SBjoern A. Zeeb } 2846de0bd6f7SBjoern A. Zeeb 2847de0bd6f7SBjoern A. Zeeb /* 28487455b100SJamie Gritton * Return the correct hostname (domainname, et al) for the passed credential. 28499484d0c0SRobert Drehmel */ 2850ad1ff099SRobert Drehmel void 28519ddb7954SMike Barcroft getcredhostname(struct ucred *cred, char *buf, size_t size) 28529484d0c0SRobert Drehmel { 285376ca6f88SJamie Gritton struct prison *pr; 28549484d0c0SRobert Drehmel 28557455b100SJamie Gritton /* 28567455b100SJamie Gritton * A NULL credential can be used to shortcut to the physical 28577455b100SJamie Gritton * system's hostname. 28587455b100SJamie Gritton */ 285976ca6f88SJamie Gritton pr = (cred != NULL) ? cred->cr_prison : &prison0; 286076ca6f88SJamie Gritton mtx_lock(&pr->pr_mtx); 2861c1f19219SJamie Gritton strlcpy(buf, pr->pr_hostname, size); 286276ca6f88SJamie Gritton mtx_unlock(&pr->pr_mtx); 28639484d0c0SRobert Drehmel } 2864fd7a8150SMike Barcroft 28657455b100SJamie Gritton void 28667455b100SJamie Gritton getcreddomainname(struct ucred *cred, char *buf, size_t size) 28677455b100SJamie Gritton { 28687455b100SJamie Gritton 28697455b100SJamie Gritton mtx_lock(&cred->cr_prison->pr_mtx); 2870c1f19219SJamie Gritton strlcpy(buf, cred->cr_prison->pr_domainname, size); 28717455b100SJamie Gritton mtx_unlock(&cred->cr_prison->pr_mtx); 28727455b100SJamie Gritton } 28737455b100SJamie Gritton 28747455b100SJamie Gritton void 28757455b100SJamie Gritton getcredhostuuid(struct ucred *cred, char *buf, size_t size) 28767455b100SJamie Gritton { 28777455b100SJamie Gritton 28787455b100SJamie Gritton mtx_lock(&cred->cr_prison->pr_mtx); 2879c1f19219SJamie Gritton strlcpy(buf, cred->cr_prison->pr_hostuuid, size); 28807455b100SJamie Gritton mtx_unlock(&cred->cr_prison->pr_mtx); 28817455b100SJamie Gritton } 28827455b100SJamie Gritton 
28837455b100SJamie Gritton void 28847455b100SJamie Gritton getcredhostid(struct ucred *cred, unsigned long *hostid) 28857455b100SJamie Gritton { 28867455b100SJamie Gritton 28877455b100SJamie Gritton mtx_lock(&cred->cr_prison->pr_mtx); 28887455b100SJamie Gritton *hostid = cred->cr_prison->pr_hostid; 28897455b100SJamie Gritton mtx_unlock(&cred->cr_prison->pr_mtx); 28907455b100SJamie Gritton } 28917455b100SJamie Gritton 2892eb79e1c7SBjoern A. Zeeb #ifdef VIMAGE 2893eb79e1c7SBjoern A. Zeeb /* 2894eb79e1c7SBjoern A. Zeeb * Determine whether the prison represented by cred owns 2895eb79e1c7SBjoern A. Zeeb * its vnet rather than having it inherited. 2896eb79e1c7SBjoern A. Zeeb * 2897eb79e1c7SBjoern A. Zeeb * Returns 1 in case the prison owns the vnet, 0 otherwise. 2898eb79e1c7SBjoern A. Zeeb */ 2899eb79e1c7SBjoern A. Zeeb int 2900eb79e1c7SBjoern A. Zeeb prison_owns_vnet(struct ucred *cred) 2901eb79e1c7SBjoern A. Zeeb { 2902eb79e1c7SBjoern A. Zeeb 2903eb79e1c7SBjoern A. Zeeb /* 2904eb79e1c7SBjoern A. Zeeb * vnets cannot be added/removed after jail creation, 2905eb79e1c7SBjoern A. Zeeb * so no need to lock here. 2906eb79e1c7SBjoern A. Zeeb */ 2907eb79e1c7SBjoern A. Zeeb return (cred->cr_prison->pr_flags & PR_VNET ? 1 : 0); 2908eb79e1c7SBjoern A. Zeeb } 2909eb79e1c7SBjoern A. Zeeb #endif 2910eb79e1c7SBjoern A. Zeeb 2911f08df373SRobert Watson /* 2912820a0de9SPawel Jakub Dawidek * Determine whether the subject represented by cred can "see" 2913820a0de9SPawel Jakub Dawidek * status of a mount point. 2914820a0de9SPawel Jakub Dawidek * Returns: 0 for permitted, ENOENT otherwise. 2915820a0de9SPawel Jakub Dawidek * XXX: This function should be called cr_canseemount() and should be 2916820a0de9SPawel Jakub Dawidek * placed in kern_prot.c. 
2917f08df373SRobert Watson */ 2918f08df373SRobert Watson int 2919820a0de9SPawel Jakub Dawidek prison_canseemount(struct ucred *cred, struct mount *mp) 2920f08df373SRobert Watson { 2921820a0de9SPawel Jakub Dawidek struct prison *pr; 2922820a0de9SPawel Jakub Dawidek struct statfs *sp; 2923820a0de9SPawel Jakub Dawidek size_t len; 2924f08df373SRobert Watson 2925820a0de9SPawel Jakub Dawidek pr = cred->cr_prison; 29260304c731SJamie Gritton if (pr->pr_enforce_statfs == 0) 29270304c731SJamie Gritton return (0); 2928820a0de9SPawel Jakub Dawidek if (pr->pr_root->v_mount == mp) 2929820a0de9SPawel Jakub Dawidek return (0); 29300304c731SJamie Gritton if (pr->pr_enforce_statfs == 2) 2931820a0de9SPawel Jakub Dawidek return (ENOENT); 2932820a0de9SPawel Jakub Dawidek /* 2933820a0de9SPawel Jakub Dawidek * If jail's chroot directory is set to "/" we should be able to see 2934820a0de9SPawel Jakub Dawidek * all mount-points from inside a jail. 2935820a0de9SPawel Jakub Dawidek * This is ugly check, but this is the only situation when jail's 2936820a0de9SPawel Jakub Dawidek * directory ends with '/'. 2937820a0de9SPawel Jakub Dawidek */ 2938820a0de9SPawel Jakub Dawidek if (strcmp(pr->pr_path, "/") == 0) 2939820a0de9SPawel Jakub Dawidek return (0); 2940820a0de9SPawel Jakub Dawidek len = strlen(pr->pr_path); 2941820a0de9SPawel Jakub Dawidek sp = &mp->mnt_stat; 2942820a0de9SPawel Jakub Dawidek if (strncmp(pr->pr_path, sp->f_mntonname, len) != 0) 2943820a0de9SPawel Jakub Dawidek return (ENOENT); 2944820a0de9SPawel Jakub Dawidek /* 2945820a0de9SPawel Jakub Dawidek * Be sure that we don't have situation where jail's root directory 2946820a0de9SPawel Jakub Dawidek * is "/some/path" and mount point is "/some/pathpath". 
2947820a0de9SPawel Jakub Dawidek */ 2948820a0de9SPawel Jakub Dawidek if (sp->f_mntonname[len] != '\0' && sp->f_mntonname[len] != '/') 2949820a0de9SPawel Jakub Dawidek return (ENOENT); 2950f08df373SRobert Watson return (0); 2951f08df373SRobert Watson } 2952820a0de9SPawel Jakub Dawidek 2953820a0de9SPawel Jakub Dawidek void 2954820a0de9SPawel Jakub Dawidek prison_enforce_statfs(struct ucred *cred, struct mount *mp, struct statfs *sp) 2955820a0de9SPawel Jakub Dawidek { 2956820a0de9SPawel Jakub Dawidek char jpath[MAXPATHLEN]; 2957820a0de9SPawel Jakub Dawidek struct prison *pr; 2958820a0de9SPawel Jakub Dawidek size_t len; 2959820a0de9SPawel Jakub Dawidek 2960820a0de9SPawel Jakub Dawidek pr = cred->cr_prison; 29610304c731SJamie Gritton if (pr->pr_enforce_statfs == 0) 29620304c731SJamie Gritton return; 2963820a0de9SPawel Jakub Dawidek if (prison_canseemount(cred, mp) != 0) { 2964820a0de9SPawel Jakub Dawidek bzero(sp->f_mntonname, sizeof(sp->f_mntonname)); 2965820a0de9SPawel Jakub Dawidek strlcpy(sp->f_mntonname, "[restricted]", 2966820a0de9SPawel Jakub Dawidek sizeof(sp->f_mntonname)); 2967820a0de9SPawel Jakub Dawidek return; 2968820a0de9SPawel Jakub Dawidek } 2969820a0de9SPawel Jakub Dawidek if (pr->pr_root->v_mount == mp) { 2970820a0de9SPawel Jakub Dawidek /* 2971820a0de9SPawel Jakub Dawidek * Clear current buffer data, so we are sure nothing from 2972820a0de9SPawel Jakub Dawidek * the valid path left there. 2973820a0de9SPawel Jakub Dawidek */ 2974820a0de9SPawel Jakub Dawidek bzero(sp->f_mntonname, sizeof(sp->f_mntonname)); 2975820a0de9SPawel Jakub Dawidek *sp->f_mntonname = '/'; 2976820a0de9SPawel Jakub Dawidek return; 2977820a0de9SPawel Jakub Dawidek } 2978820a0de9SPawel Jakub Dawidek /* 2979820a0de9SPawel Jakub Dawidek * If jail's chroot directory is set to "/" we should be able to see 2980820a0de9SPawel Jakub Dawidek * all mount-points from inside a jail. 
2981820a0de9SPawel Jakub Dawidek */ 2982820a0de9SPawel Jakub Dawidek if (strcmp(pr->pr_path, "/") == 0) 2983820a0de9SPawel Jakub Dawidek return; 2984820a0de9SPawel Jakub Dawidek len = strlen(pr->pr_path); 2985820a0de9SPawel Jakub Dawidek strlcpy(jpath, sp->f_mntonname + len, sizeof(jpath)); 2986820a0de9SPawel Jakub Dawidek /* 2987820a0de9SPawel Jakub Dawidek * Clear current buffer data, so we are sure nothing from 2988820a0de9SPawel Jakub Dawidek * the valid path left there. 2989820a0de9SPawel Jakub Dawidek */ 2990820a0de9SPawel Jakub Dawidek bzero(sp->f_mntonname, sizeof(sp->f_mntonname)); 2991820a0de9SPawel Jakub Dawidek if (*jpath == '\0') { 2992820a0de9SPawel Jakub Dawidek /* Should never happen. */ 2993820a0de9SPawel Jakub Dawidek *sp->f_mntonname = '/'; 2994820a0de9SPawel Jakub Dawidek } else { 2995820a0de9SPawel Jakub Dawidek strlcpy(sp->f_mntonname, jpath, sizeof(sp->f_mntonname)); 2996820a0de9SPawel Jakub Dawidek } 2997f08df373SRobert Watson } 2998f08df373SRobert Watson 2999800c9408SRobert Watson /* 3000800c9408SRobert Watson * Check with permission for a specific privilege is granted within jail. We 3001800c9408SRobert Watson * have a specific list of accepted privileges; the rest are denied. 3002800c9408SRobert Watson */ 3003800c9408SRobert Watson int 3004800c9408SRobert Watson prison_priv_check(struct ucred *cred, int priv) 3005800c9408SRobert Watson { 3006800c9408SRobert Watson 30077b2ff0dcSMateusz Guzik /* 30087b2ff0dcSMateusz Guzik * Some policies have custom handlers. This routine should not be 30097b2ff0dcSMateusz Guzik * called for them. See priv_check_cred(). 
30107b2ff0dcSMateusz Guzik */ 30117b2ff0dcSMateusz Guzik switch (priv) { 30127b2ff0dcSMateusz Guzik case PRIV_VFS_GENERATION: 30137b2ff0dcSMateusz Guzik KASSERT(0, ("prison_priv_check instead of a custom handler " 30147b2ff0dcSMateusz Guzik "called for %d\n", priv)); 30157b2ff0dcSMateusz Guzik } 30167b2ff0dcSMateusz Guzik 3017800c9408SRobert Watson if (!jailed(cred)) 3018800c9408SRobert Watson return (0); 3019800c9408SRobert Watson 30206bb79563SJamie Gritton #ifdef VIMAGE 30216bb79563SJamie Gritton /* 30226bb79563SJamie Gritton * Privileges specific to prisons with a virtual network stack. 30236bb79563SJamie Gritton * There might be a duplicate entry here in case the privilege 30246bb79563SJamie Gritton * is only granted conditionally in the legacy jail case. 30256bb79563SJamie Gritton */ 30266bb79563SJamie Gritton switch (priv) { 30276bb79563SJamie Gritton #ifdef notyet 30286bb79563SJamie Gritton /* 30296bb79563SJamie Gritton * NFS-specific privileges. 30306bb79563SJamie Gritton */ 30316bb79563SJamie Gritton case PRIV_NFS_DAEMON: 30326bb79563SJamie Gritton case PRIV_NFS_LOCKD: 30336bb79563SJamie Gritton #endif 30346bb79563SJamie Gritton /* 30356bb79563SJamie Gritton * Network stack privileges. 30366bb79563SJamie Gritton */ 30376bb79563SJamie Gritton case PRIV_NET_BRIDGE: 30386bb79563SJamie Gritton case PRIV_NET_GRE: 30396bb79563SJamie Gritton case PRIV_NET_BPF: 30406bb79563SJamie Gritton case PRIV_NET_RAW: /* Dup, cond. in legacy jail case. 
*/ 30416bb79563SJamie Gritton case PRIV_NET_ROUTE: 30426bb79563SJamie Gritton case PRIV_NET_TAP: 30436bb79563SJamie Gritton case PRIV_NET_SETIFMTU: 30446bb79563SJamie Gritton case PRIV_NET_SETIFFLAGS: 30456bb79563SJamie Gritton case PRIV_NET_SETIFCAP: 3046215940b3SXin LI case PRIV_NET_SETIFDESCR: 30476bb79563SJamie Gritton case PRIV_NET_SETIFNAME : 30486bb79563SJamie Gritton case PRIV_NET_SETIFMETRIC: 30496bb79563SJamie Gritton case PRIV_NET_SETIFPHYS: 30506bb79563SJamie Gritton case PRIV_NET_SETIFMAC: 3051389474c1SKonstantin Belousov case PRIV_NET_SETLANPCP: 30526bb79563SJamie Gritton case PRIV_NET_ADDMULTI: 30536bb79563SJamie Gritton case PRIV_NET_DELMULTI: 30546bb79563SJamie Gritton case PRIV_NET_HWIOCTL: 30556bb79563SJamie Gritton case PRIV_NET_SETLLADDR: 30566bb79563SJamie Gritton case PRIV_NET_ADDIFGROUP: 30576bb79563SJamie Gritton case PRIV_NET_DELIFGROUP: 30586bb79563SJamie Gritton case PRIV_NET_IFCREATE: 30596bb79563SJamie Gritton case PRIV_NET_IFDESTROY: 30606bb79563SJamie Gritton case PRIV_NET_ADDIFADDR: 30616bb79563SJamie Gritton case PRIV_NET_DELIFADDR: 30626bb79563SJamie Gritton case PRIV_NET_LAGG: 30636bb79563SJamie Gritton case PRIV_NET_GIF: 30646bb79563SJamie Gritton case PRIV_NET_SETIFVNET: 306535fd7bc0SBjoern A. Zeeb case PRIV_NET_SETIFFIB: 30666bb79563SJamie Gritton 30676bb79563SJamie Gritton /* 30686bb79563SJamie Gritton * 802.11-related privileges. 30696bb79563SJamie Gritton */ 30706bb79563SJamie Gritton case PRIV_NET80211_GETKEY: 30716bb79563SJamie Gritton #ifdef notyet 30726bb79563SJamie Gritton case PRIV_NET80211_MANAGE: /* XXX-BZ discuss with sam@ */ 30736bb79563SJamie Gritton #endif 30746bb79563SJamie Gritton 30756bb79563SJamie Gritton #ifdef notyet 30766bb79563SJamie Gritton /* 30776bb79563SJamie Gritton * ATM privileges. 
30786bb79563SJamie Gritton */ 30796bb79563SJamie Gritton case PRIV_NETATM_CFG: 30806bb79563SJamie Gritton case PRIV_NETATM_ADD: 30816bb79563SJamie Gritton case PRIV_NETATM_DEL: 30826bb79563SJamie Gritton case PRIV_NETATM_SET: 30836bb79563SJamie Gritton 30846bb79563SJamie Gritton /* 30856bb79563SJamie Gritton * Bluetooth privileges. 30866bb79563SJamie Gritton */ 30876bb79563SJamie Gritton case PRIV_NETBLUETOOTH_RAW: 30886bb79563SJamie Gritton #endif 30896bb79563SJamie Gritton 30906bb79563SJamie Gritton /* 30916bb79563SJamie Gritton * Netgraph and netgraph module privileges. 30926bb79563SJamie Gritton */ 30936bb79563SJamie Gritton case PRIV_NETGRAPH_CONTROL: 30946bb79563SJamie Gritton #ifdef notyet 30956bb79563SJamie Gritton case PRIV_NETGRAPH_TTY: 30966bb79563SJamie Gritton #endif 30976bb79563SJamie Gritton 30986bb79563SJamie Gritton /* 30996bb79563SJamie Gritton * IPv4 and IPv6 privileges. 31006bb79563SJamie Gritton */ 31016bb79563SJamie Gritton case PRIV_NETINET_IPFW: 31026bb79563SJamie Gritton case PRIV_NETINET_DIVERT: 31036bb79563SJamie Gritton case PRIV_NETINET_PF: 31046bb79563SJamie Gritton case PRIV_NETINET_DUMMYNET: 31056bb79563SJamie Gritton case PRIV_NETINET_CARP: 31066bb79563SJamie Gritton case PRIV_NETINET_MROUTE: 31076bb79563SJamie Gritton case PRIV_NETINET_RAW: 31086bb79563SJamie Gritton case PRIV_NETINET_ADDRCTRL6: 31096bb79563SJamie Gritton case PRIV_NETINET_ND6: 31106bb79563SJamie Gritton case PRIV_NETINET_SCOPE6: 31116bb79563SJamie Gritton case PRIV_NETINET_ALIFETIME6: 31126bb79563SJamie Gritton case PRIV_NETINET_IPSEC: 31136bb79563SJamie Gritton case PRIV_NETINET_BINDANY: 31146bb79563SJamie Gritton 31156bb79563SJamie Gritton #ifdef notyet 31166bb79563SJamie Gritton /* 31176bb79563SJamie Gritton * NCP privileges. 31186bb79563SJamie Gritton */ 31196bb79563SJamie Gritton case PRIV_NETNCP: 31206bb79563SJamie Gritton 31216bb79563SJamie Gritton /* 31226bb79563SJamie Gritton * SMB privileges. 
31236bb79563SJamie Gritton */ 31246bb79563SJamie Gritton case PRIV_NETSMB: 31256bb79563SJamie Gritton #endif 31266bb79563SJamie Gritton 31276bb79563SJamie Gritton /* 31286bb79563SJamie Gritton * No default: or deny here. 31296bb79563SJamie Gritton * In case of no permit fall through to next switch(). 31306bb79563SJamie Gritton */ 31316bb79563SJamie Gritton if (cred->cr_prison->pr_flags & PR_VNET) 31326bb79563SJamie Gritton return (0); 31336bb79563SJamie Gritton } 31346bb79563SJamie Gritton #endif /* VIMAGE */ 31356bb79563SJamie Gritton 3136800c9408SRobert Watson switch (priv) { 3137800c9408SRobert Watson 3138800c9408SRobert Watson /* 3139800c9408SRobert Watson * Allow ktrace privileges for root in jail. 3140800c9408SRobert Watson */ 3141800c9408SRobert Watson case PRIV_KTRACE: 3142800c9408SRobert Watson 3143c3c1b5e6SRobert Watson #if 0 3144800c9408SRobert Watson /* 3145800c9408SRobert Watson * Allow jailed processes to configure audit identity and 3146800c9408SRobert Watson * submit audit records (login, etc). In the future we may 3147800c9408SRobert Watson * want to further refine the relationship between audit and 3148800c9408SRobert Watson * jail. 3149800c9408SRobert Watson */ 3150800c9408SRobert Watson case PRIV_AUDIT_GETAUDIT: 3151800c9408SRobert Watson case PRIV_AUDIT_SETAUDIT: 3152800c9408SRobert Watson case PRIV_AUDIT_SUBMIT: 3153c3c1b5e6SRobert Watson #endif 3154800c9408SRobert Watson 3155800c9408SRobert Watson /* 3156800c9408SRobert Watson * Allow jailed processes to manipulate process UNIX 3157800c9408SRobert Watson * credentials in any way they see fit. 
3158800c9408SRobert Watson */ 3159800c9408SRobert Watson case PRIV_CRED_SETUID: 3160800c9408SRobert Watson case PRIV_CRED_SETEUID: 3161800c9408SRobert Watson case PRIV_CRED_SETGID: 3162800c9408SRobert Watson case PRIV_CRED_SETEGID: 3163800c9408SRobert Watson case PRIV_CRED_SETGROUPS: 3164800c9408SRobert Watson case PRIV_CRED_SETREUID: 3165800c9408SRobert Watson case PRIV_CRED_SETREGID: 3166800c9408SRobert Watson case PRIV_CRED_SETRESUID: 3167800c9408SRobert Watson case PRIV_CRED_SETRESGID: 3168800c9408SRobert Watson 3169800c9408SRobert Watson /* 3170800c9408SRobert Watson * Jail implements visibility constraints already, so allow 3171800c9408SRobert Watson * jailed root to override uid/gid-based constraints. 3172800c9408SRobert Watson */ 3173800c9408SRobert Watson case PRIV_SEEOTHERGIDS: 3174800c9408SRobert Watson case PRIV_SEEOTHERUIDS: 3175800c9408SRobert Watson 3176800c9408SRobert Watson /* 3177800c9408SRobert Watson * Jail implements inter-process debugging limits already, so 3178800c9408SRobert Watson * allow jailed root various debugging privileges. 3179800c9408SRobert Watson */ 3180800c9408SRobert Watson case PRIV_DEBUG_DIFFCRED: 3181800c9408SRobert Watson case PRIV_DEBUG_SUGID: 3182800c9408SRobert Watson case PRIV_DEBUG_UNPRIV: 3183800c9408SRobert Watson 3184800c9408SRobert Watson /* 3185800c9408SRobert Watson * Allow jail to set various resource limits and login 3186800c9408SRobert Watson * properties, and for now, exceed process resource limits. 3187800c9408SRobert Watson */ 3188800c9408SRobert Watson case PRIV_PROC_LIMIT: 3189800c9408SRobert Watson case PRIV_PROC_SETLOGIN: 3190800c9408SRobert Watson case PRIV_PROC_SETRLIMIT: 3191800c9408SRobert Watson 3192800c9408SRobert Watson /* 3193800c9408SRobert Watson * System V and POSIX IPC privileges are granted in jail. 
3194800c9408SRobert Watson */ 3195800c9408SRobert Watson case PRIV_IPC_READ: 3196800c9408SRobert Watson case PRIV_IPC_WRITE: 3197800c9408SRobert Watson case PRIV_IPC_ADMIN: 3198800c9408SRobert Watson case PRIV_IPC_MSGSIZE: 3199800c9408SRobert Watson case PRIV_MQ_ADMIN: 3200800c9408SRobert Watson 3201800c9408SRobert Watson /* 32020304c731SJamie Gritton * Jail operations within a jail work on child jails. 32030304c731SJamie Gritton */ 32040304c731SJamie Gritton case PRIV_JAIL_ATTACH: 32050304c731SJamie Gritton case PRIV_JAIL_SET: 32060304c731SJamie Gritton case PRIV_JAIL_REMOVE: 32070304c731SJamie Gritton 32080304c731SJamie Gritton /* 3209800c9408SRobert Watson * Jail implements its own inter-process limits, so allow 3210800c9408SRobert Watson * root processes in jail to change scheduling on other 3211800c9408SRobert Watson * processes in the same jail. Likewise for signalling. 3212800c9408SRobert Watson */ 3213800c9408SRobert Watson case PRIV_SCHED_DIFFCRED: 3214413628a7SBjoern A. Zeeb case PRIV_SCHED_CPUSET: 3215800c9408SRobert Watson case PRIV_SIGNAL_DIFFCRED: 3216800c9408SRobert Watson case PRIV_SIGNAL_SUGID: 3217800c9408SRobert Watson 3218800c9408SRobert Watson /* 3219800c9408SRobert Watson * Allow jailed processes to write to sysctls marked as jail 3220800c9408SRobert Watson * writable. 3221800c9408SRobert Watson */ 3222800c9408SRobert Watson case PRIV_SYSCTL_WRITEJAIL: 3223800c9408SRobert Watson 3224800c9408SRobert Watson /* 3225800c9408SRobert Watson * Allow root in jail to manage a variety of quota 3226e82d0201SRobert Watson * properties. These should likely be conditional on a 3227e82d0201SRobert Watson * configuration option. 
3228800c9408SRobert Watson */ 322995b091d2SRobert Watson case PRIV_VFS_GETQUOTA: 323095b091d2SRobert Watson case PRIV_VFS_SETQUOTA: 3231800c9408SRobert Watson 3232800c9408SRobert Watson /* 3233800c9408SRobert Watson * Since Jail relies on chroot() to implement file system 3234800c9408SRobert Watson * protections, grant many VFS privileges to root in jail. 3235800c9408SRobert Watson * Be careful to exclude mount-related and NFS-related 3236800c9408SRobert Watson * privileges. 3237800c9408SRobert Watson */ 3238800c9408SRobert Watson case PRIV_VFS_READ: 3239800c9408SRobert Watson case PRIV_VFS_WRITE: 3240800c9408SRobert Watson case PRIV_VFS_ADMIN: 3241800c9408SRobert Watson case PRIV_VFS_EXEC: 3242800c9408SRobert Watson case PRIV_VFS_LOOKUP: 3243800c9408SRobert Watson case PRIV_VFS_BLOCKRESERVE: /* XXXRW: Slightly surprising. */ 3244800c9408SRobert Watson case PRIV_VFS_CHFLAGS_DEV: 3245800c9408SRobert Watson case PRIV_VFS_CHOWN: 3246800c9408SRobert Watson case PRIV_VFS_CHROOT: 3247bb531912SPawel Jakub Dawidek case PRIV_VFS_RETAINSUGID: 3248800c9408SRobert Watson case PRIV_VFS_FCHROOT: 3249800c9408SRobert Watson case PRIV_VFS_LINK: 3250800c9408SRobert Watson case PRIV_VFS_SETGID: 3251e41966dcSRobert Watson case PRIV_VFS_STAT: 3252800c9408SRobert Watson case PRIV_VFS_STICKYFILE: 3253bb56d716SJamie Gritton 3254bb56d716SJamie Gritton /* 3255bb56d716SJamie Gritton * As in the non-jail case, non-root users are expected to be 3256bb56d716SJamie Gritton * able to read kernel/phyiscal memory (provided /dev/[k]mem 3257bb56d716SJamie Gritton * exists in the jail and they have permission to access it). 3258bb56d716SJamie Gritton */ 3259bb56d716SJamie Gritton case PRIV_KMEM_READ: 3260800c9408SRobert Watson return (0); 3261800c9408SRobert Watson 3262800c9408SRobert Watson /* 3263800c9408SRobert Watson * Depending on the global setting, allow privilege of 3264800c9408SRobert Watson * setting system flags. 
3265800c9408SRobert Watson */ 3266800c9408SRobert Watson case PRIV_VFS_SYSFLAGS: 32670304c731SJamie Gritton if (cred->cr_prison->pr_allow & PR_ALLOW_CHFLAGS) 3268800c9408SRobert Watson return (0); 3269800c9408SRobert Watson else 3270800c9408SRobert Watson return (EPERM); 3271800c9408SRobert Watson 3272800c9408SRobert Watson /* 3273f3a8d2f9SPawel Jakub Dawidek * Depending on the global setting, allow privilege of 3274f3a8d2f9SPawel Jakub Dawidek * mounting/unmounting file systems. 3275f3a8d2f9SPawel Jakub Dawidek */ 3276f3a8d2f9SPawel Jakub Dawidek case PRIV_VFS_MOUNT: 3277f3a8d2f9SPawel Jakub Dawidek case PRIV_VFS_UNMOUNT: 3278f3a8d2f9SPawel Jakub Dawidek case PRIV_VFS_MOUNT_NONUSER: 327924b0502eSPawel Jakub Dawidek case PRIV_VFS_MOUNT_OWNER: 3280435d4667SMartin Matuska if (cred->cr_prison->pr_allow & PR_ALLOW_MOUNT && 3281435d4667SMartin Matuska cred->cr_prison->pr_enforce_statfs < 2) 3282f3a8d2f9SPawel Jakub Dawidek return (0); 3283f3a8d2f9SPawel Jakub Dawidek else 3284f3a8d2f9SPawel Jakub Dawidek return (EPERM); 3285f3a8d2f9SPawel Jakub Dawidek 3286f3a8d2f9SPawel Jakub Dawidek /* 3287ccd6ac9fSAntoine Brodin * Conditionnaly allow locking (unlocking) physical pages 3288ccd6ac9fSAntoine Brodin * in memory. 3289ccd6ac9fSAntoine Brodin */ 3290ccd6ac9fSAntoine Brodin case PRIV_VM_MLOCK: 3291ccd6ac9fSAntoine Brodin case PRIV_VM_MUNLOCK: 3292ccd6ac9fSAntoine Brodin if (cred->cr_prison->pr_allow & PR_ALLOW_MLOCK) 3293ccd6ac9fSAntoine Brodin return (0); 3294ccd6ac9fSAntoine Brodin else 3295ccd6ac9fSAntoine Brodin return (EPERM); 3296ccd6ac9fSAntoine Brodin 3297ccd6ac9fSAntoine Brodin /* 3298e28f9b7dSAllan Jude * Conditionally allow jailed root to bind reserved ports. 
3299800c9408SRobert Watson */ 3300800c9408SRobert Watson case PRIV_NETINET_RESERVEDPORT: 3301e28f9b7dSAllan Jude if (cred->cr_prison->pr_allow & PR_ALLOW_RESERVED_PORTS) 3302e28f9b7dSAllan Jude return (0); 3303e28f9b7dSAllan Jude else 3304e28f9b7dSAllan Jude return (EPERM); 3305e28f9b7dSAllan Jude 3306e28f9b7dSAllan Jude /* 3307e28f9b7dSAllan Jude * Allow jailed root to reuse in-use ports. 3308e28f9b7dSAllan Jude */ 33094b084056SRobert Watson case PRIV_NETINET_REUSEPORT: 3310800c9408SRobert Watson return (0); 3311800c9408SRobert Watson 3312800c9408SRobert Watson /* 3313e3043798SPedro F. Giffuni * Allow jailed root to set certain IPv4/6 (option) headers. 331479ba3952SBjoern A. Zeeb */ 331579ba3952SBjoern A. Zeeb case PRIV_NETINET_SETHDROPTS: 331679ba3952SBjoern A. Zeeb return (0); 331779ba3952SBjoern A. Zeeb 331879ba3952SBjoern A. Zeeb /* 3319800c9408SRobert Watson * Conditionally allow creating raw sockets in jail. 3320800c9408SRobert Watson */ 3321800c9408SRobert Watson case PRIV_NETINET_RAW: 33220304c731SJamie Gritton if (cred->cr_prison->pr_allow & PR_ALLOW_RAW_SOCKETS) 3323800c9408SRobert Watson return (0); 3324800c9408SRobert Watson else 3325800c9408SRobert Watson return (EPERM); 3326800c9408SRobert Watson 3327800c9408SRobert Watson /* 3328800c9408SRobert Watson * Since jail implements its own visibility limits on netstat 3329800c9408SRobert Watson * sysctls, allow getcred. This allows identd to work in 3330800c9408SRobert Watson * jail. 3331800c9408SRobert Watson */ 3332800c9408SRobert Watson case PRIV_NETINET_GETCRED: 3333800c9408SRobert Watson return (0); 3334800c9408SRobert Watson 33352bfc50bcSEdward Tomasz Napierala /* 33362bfc50bcSEdward Tomasz Napierala * Allow jailed root to set loginclass. 
33372bfc50bcSEdward Tomasz Napierala */ 33382bfc50bcSEdward Tomasz Napierala case PRIV_PROC_SETLOGINCLASS: 33392bfc50bcSEdward Tomasz Napierala return (0); 33402bfc50bcSEdward Tomasz Napierala 3341b19d66fdSJamie Gritton /* 33424520f617SJamie Gritton * Do not allow a process inside a jail to read the kernel 3343b19d66fdSJamie Gritton * message buffer unless explicitly permitted. 3344b19d66fdSJamie Gritton */ 3345b19d66fdSJamie Gritton case PRIV_MSGBUF: 3346b19d66fdSJamie Gritton if (cred->cr_prison->pr_allow & PR_ALLOW_READ_MSGBUF) 3347b19d66fdSJamie Gritton return (0); 3348b19d66fdSJamie Gritton return (EPERM); 3349b19d66fdSJamie Gritton 3350800c9408SRobert Watson default: 3351800c9408SRobert Watson /* 3352800c9408SRobert Watson * In all remaining cases, deny the privilege request. This 3353800c9408SRobert Watson * includes almost all network privileges, many system 3354800c9408SRobert Watson * configuration privileges. 3355800c9408SRobert Watson */ 3356800c9408SRobert Watson return (EPERM); 3357800c9408SRobert Watson } 3358800c9408SRobert Watson } 3359800c9408SRobert Watson 33600304c731SJamie Gritton /* 33610304c731SJamie Gritton * Return the part of pr2's name that is relative to pr1, or the whole name 33620304c731SJamie Gritton * if it does not directly follow. 33630304c731SJamie Gritton */ 33640304c731SJamie Gritton 33650304c731SJamie Gritton char * 33660304c731SJamie Gritton prison_name(struct prison *pr1, struct prison *pr2) 33670304c731SJamie Gritton { 33680304c731SJamie Gritton char *name; 33690304c731SJamie Gritton 33700304c731SJamie Gritton /* Jails see themselves as "0" (if they see themselves at all). 
*/ 33710304c731SJamie Gritton if (pr1 == pr2) 33720304c731SJamie Gritton return "0"; 33730304c731SJamie Gritton name = pr2->pr_name; 33740304c731SJamie Gritton if (prison_ischild(pr1, pr2)) { 33750304c731SJamie Gritton /* 33760304c731SJamie Gritton * pr1 isn't locked (and allprison_lock may not be either) 33770304c731SJamie Gritton * so its length can't be counted on. But the number of dots 33780304c731SJamie Gritton * can be counted on - and counted. 33790304c731SJamie Gritton */ 33800304c731SJamie Gritton for (; pr1 != &prison0; pr1 = pr1->pr_parent) 33810304c731SJamie Gritton name = strchr(name, '.') + 1; 33820304c731SJamie Gritton } 33830304c731SJamie Gritton return (name); 33840304c731SJamie Gritton } 33850304c731SJamie Gritton 33860304c731SJamie Gritton /* 33870304c731SJamie Gritton * Return the part of pr2's path that is relative to pr1, or the whole path 33880304c731SJamie Gritton * if it does not directly follow. 33890304c731SJamie Gritton */ 33900304c731SJamie Gritton static char * 33910304c731SJamie Gritton prison_path(struct prison *pr1, struct prison *pr2) 33920304c731SJamie Gritton { 33930304c731SJamie Gritton char *path1, *path2; 33940304c731SJamie Gritton int len1; 33950304c731SJamie Gritton 33960304c731SJamie Gritton path1 = pr1->pr_path; 33970304c731SJamie Gritton path2 = pr2->pr_path; 33980304c731SJamie Gritton if (!strcmp(path1, "/")) 33990304c731SJamie Gritton return (path2); 34000304c731SJamie Gritton len1 = strlen(path1); 34010304c731SJamie Gritton if (strncmp(path1, path2, len1)) 34020304c731SJamie Gritton return (path2); 34030304c731SJamie Gritton if (path2[len1] == '\0') 34040304c731SJamie Gritton return "/"; 34050304c731SJamie Gritton if (path2[len1] == '/') 34060304c731SJamie Gritton return (path2 + len1); 34070304c731SJamie Gritton return (path2); 34080304c731SJamie Gritton } 34090304c731SJamie Gritton 34100304c731SJamie Gritton /* 34110304c731SJamie Gritton * Jail-related sysctls. 
34120304c731SJamie Gritton */ 34137029da5cSPawel Biernacki static SYSCTL_NODE(_security, OID_AUTO, jail, CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 34140304c731SJamie Gritton "Jails"); 34150304c731SJamie Gritton 3416fd7a8150SMike Barcroft static int 3417fd7a8150SMike Barcroft sysctl_jail_list(SYSCTL_HANDLER_ARGS) 3418fd7a8150SMike Barcroft { 3419b38ff370SJamie Gritton struct xprison *xp; 34200304c731SJamie Gritton struct prison *pr, *cpr; 3421b38ff370SJamie Gritton #ifdef INET 3422b38ff370SJamie Gritton struct in_addr *ip4 = NULL; 3423b38ff370SJamie Gritton int ip4s = 0; 3424b38ff370SJamie Gritton #endif 3425b38ff370SJamie Gritton #ifdef INET6 34263beefaedSColin Percival struct in6_addr *ip6 = NULL; 3427b38ff370SJamie Gritton int ip6s = 0; 3428b38ff370SJamie Gritton #endif 34290304c731SJamie Gritton int descend, error; 3430fd7a8150SMike Barcroft 3431b38ff370SJamie Gritton xp = malloc(sizeof(*xp), M_TEMP, M_WAITOK); 34320304c731SJamie Gritton pr = req->td->td_ucred->cr_prison; 3433b38ff370SJamie Gritton error = 0; 3434dc68a633SPawel Jakub Dawidek sx_slock(&allprison_lock); 34350304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(pr, cpr, descend) { 34360304c731SJamie Gritton #if defined(INET) || defined(INET6) 3437b38ff370SJamie Gritton again: 34380304c731SJamie Gritton #endif 34390304c731SJamie Gritton mtx_lock(&cpr->pr_mtx); 3440413628a7SBjoern A. Zeeb #ifdef INET 34410304c731SJamie Gritton if (cpr->pr_ip4s > 0) { 34420304c731SJamie Gritton if (ip4s < cpr->pr_ip4s) { 34430304c731SJamie Gritton ip4s = cpr->pr_ip4s; 34440304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3445b38ff370SJamie Gritton ip4 = realloc(ip4, ip4s * 3446b38ff370SJamie Gritton sizeof(struct in_addr), M_TEMP, M_WAITOK); 3447b38ff370SJamie Gritton goto again; 3448b38ff370SJamie Gritton } 34490304c731SJamie Gritton bcopy(cpr->pr_ip4, ip4, 34500304c731SJamie Gritton cpr->pr_ip4s * sizeof(struct in_addr)); 3451b38ff370SJamie Gritton } 3452413628a7SBjoern A. Zeeb #endif 3453413628a7SBjoern A. 
Zeeb #ifdef INET6 34540304c731SJamie Gritton if (cpr->pr_ip6s > 0) { 34550304c731SJamie Gritton if (ip6s < cpr->pr_ip6s) { 34560304c731SJamie Gritton ip6s = cpr->pr_ip6s; 34570304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3458b38ff370SJamie Gritton ip6 = realloc(ip6, ip6s * 3459b38ff370SJamie Gritton sizeof(struct in6_addr), M_TEMP, M_WAITOK); 3460b38ff370SJamie Gritton goto again; 3461413628a7SBjoern A. Zeeb } 34620304c731SJamie Gritton bcopy(cpr->pr_ip6, ip6, 34630304c731SJamie Gritton cpr->pr_ip6s * sizeof(struct in6_addr)); 3464b38ff370SJamie Gritton } 3465b38ff370SJamie Gritton #endif 34660304c731SJamie Gritton if (cpr->pr_ref == 0) { 34670304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3468b38ff370SJamie Gritton continue; 3469b38ff370SJamie Gritton } 3470b38ff370SJamie Gritton bzero(xp, sizeof(*xp)); 3471fd7a8150SMike Barcroft xp->pr_version = XPRISON_VERSION; 34720304c731SJamie Gritton xp->pr_id = cpr->pr_id; 34730304c731SJamie Gritton xp->pr_state = cpr->pr_uref > 0 3474b38ff370SJamie Gritton ? PRISON_STATE_ALIVE : PRISON_STATE_DYING; 34750304c731SJamie Gritton strlcpy(xp->pr_path, prison_path(pr, cpr), sizeof(xp->pr_path)); 3476c1f19219SJamie Gritton strlcpy(xp->pr_host, cpr->pr_hostname, sizeof(xp->pr_host)); 34770304c731SJamie Gritton strlcpy(xp->pr_name, prison_name(pr, cpr), sizeof(xp->pr_name)); 3478413628a7SBjoern A. Zeeb #ifdef INET 34790304c731SJamie Gritton xp->pr_ip4s = cpr->pr_ip4s; 3480413628a7SBjoern A. Zeeb #endif 3481413628a7SBjoern A. Zeeb #ifdef INET6 34820304c731SJamie Gritton xp->pr_ip6s = cpr->pr_ip6s; 3483413628a7SBjoern A. Zeeb #endif 34840304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3485b38ff370SJamie Gritton error = SYSCTL_OUT(req, xp, sizeof(*xp)); 3486b38ff370SJamie Gritton if (error) 3487b38ff370SJamie Gritton break; 3488413628a7SBjoern A. 
Zeeb #ifdef INET 3489b38ff370SJamie Gritton if (xp->pr_ip4s > 0) { 3490b38ff370SJamie Gritton error = SYSCTL_OUT(req, ip4, 3491b38ff370SJamie Gritton xp->pr_ip4s * sizeof(struct in_addr)); 3492b38ff370SJamie Gritton if (error) 3493b38ff370SJamie Gritton break; 3494413628a7SBjoern A. Zeeb } 3495413628a7SBjoern A. Zeeb #endif 3496413628a7SBjoern A. Zeeb #ifdef INET6 3497b38ff370SJamie Gritton if (xp->pr_ip6s > 0) { 3498b38ff370SJamie Gritton error = SYSCTL_OUT(req, ip6, 3499b38ff370SJamie Gritton xp->pr_ip6s * sizeof(struct in6_addr)); 3500b38ff370SJamie Gritton if (error) 3501b38ff370SJamie Gritton break; 3502413628a7SBjoern A. Zeeb } 3503413628a7SBjoern A. Zeeb #endif 3504fd7a8150SMike Barcroft } 3505dc68a633SPawel Jakub Dawidek sx_sunlock(&allprison_lock); 3506b38ff370SJamie Gritton free(xp, M_TEMP); 3507b38ff370SJamie Gritton #ifdef INET 3508b38ff370SJamie Gritton free(ip4, M_TEMP); 3509b38ff370SJamie Gritton #endif 3510b38ff370SJamie Gritton #ifdef INET6 3511b38ff370SJamie Gritton free(ip6, M_TEMP); 3512b38ff370SJamie Gritton #endif 3513fd7a8150SMike Barcroft return (error); 3514fd7a8150SMike Barcroft } 3515fd7a8150SMike Barcroft 3516f3b86a5fSEd Schouten SYSCTL_OID(_security_jail, OID_AUTO, list, 3517f3b86a5fSEd Schouten CTLTYPE_STRUCT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0, 3518f3b86a5fSEd Schouten sysctl_jail_list, "S", "List of active jails"); 3519461167c2SPawel Jakub Dawidek 3520461167c2SPawel Jakub Dawidek static int 3521461167c2SPawel Jakub Dawidek sysctl_jail_jailed(SYSCTL_HANDLER_ARGS) 3522461167c2SPawel Jakub Dawidek { 3523461167c2SPawel Jakub Dawidek int error, injail; 3524461167c2SPawel Jakub Dawidek 3525461167c2SPawel Jakub Dawidek injail = jailed(req->td->td_ucred); 3526461167c2SPawel Jakub Dawidek error = SYSCTL_OUT(req, &injail, sizeof(injail)); 3527461167c2SPawel Jakub Dawidek 3528461167c2SPawel Jakub Dawidek return (error); 3529461167c2SPawel Jakub Dawidek } 35300304c731SJamie Gritton 3531f3b86a5fSEd Schouten SYSCTL_PROC(_security_jail, 
OID_AUTO, jailed, 3532f3b86a5fSEd Schouten CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0, 3533f3b86a5fSEd Schouten sysctl_jail_jailed, "I", "Process in jail?"); 3534413628a7SBjoern A. Zeeb 3535761d2bb5SJamie Gritton static int 3536761d2bb5SJamie Gritton sysctl_jail_vnet(SYSCTL_HANDLER_ARGS) 3537761d2bb5SJamie Gritton { 3538761d2bb5SJamie Gritton int error, havevnet; 3539761d2bb5SJamie Gritton #ifdef VIMAGE 3540761d2bb5SJamie Gritton struct ucred *cred = req->td->td_ucred; 3541761d2bb5SJamie Gritton 3542761d2bb5SJamie Gritton havevnet = jailed(cred) && prison_owns_vnet(cred); 3543761d2bb5SJamie Gritton #else 3544761d2bb5SJamie Gritton havevnet = 0; 3545761d2bb5SJamie Gritton #endif 3546761d2bb5SJamie Gritton error = SYSCTL_OUT(req, &havevnet, sizeof(havevnet)); 3547761d2bb5SJamie Gritton 3548761d2bb5SJamie Gritton return (error); 3549761d2bb5SJamie Gritton } 3550761d2bb5SJamie Gritton 3551761d2bb5SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, vnet, 3552761d2bb5SJamie Gritton CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0, 3553bb8f1623SBjoern A. Zeeb sysctl_jail_vnet, "I", "Jail owns vnet?"); 3554761d2bb5SJamie Gritton 35550304c731SJamie Gritton #if defined(INET) || defined(INET6) 3556e92e0574SJamie Gritton SYSCTL_UINT(_security_jail, OID_AUTO, jail_max_af_ips, CTLFLAG_RW, 35570304c731SJamie Gritton &jail_max_af_ips, 0, 3558c542c43eSJamie Gritton "Number of IP addresses a jail may have at most per address family (deprecated)"); 35590304c731SJamie Gritton #endif 35600304c731SJamie Gritton 35610304c731SJamie Gritton /* 3562c542c43eSJamie Gritton * Default parameters for jail(2) compatibility. For historical reasons, 3563c542c43eSJamie Gritton * the sysctl names have varying similarity to the parameter names. Prisons 3564c542c43eSJamie Gritton * just see their own parameters, and can't change them. 
35650304c731SJamie Gritton */ 35660304c731SJamie Gritton static int 35670304c731SJamie Gritton sysctl_jail_default_allow(SYSCTL_HANDLER_ARGS) 35680304c731SJamie Gritton { 35690304c731SJamie Gritton struct prison *pr; 35700304c731SJamie Gritton int allow, error, i; 35710304c731SJamie Gritton 35720304c731SJamie Gritton pr = req->td->td_ucred->cr_prison; 35730304c731SJamie Gritton allow = (pr == &prison0) ? jail_default_allow : pr->pr_allow; 35740304c731SJamie Gritton 35750304c731SJamie Gritton /* Get the current flag value, and convert it to a boolean. */ 35760304c731SJamie Gritton i = (allow & arg2) ? 1 : 0; 35770304c731SJamie Gritton if (arg1 != NULL) 35780304c731SJamie Gritton i = !i; 35790304c731SJamie Gritton error = sysctl_handle_int(oidp, &i, 0, req); 3580c542c43eSJamie Gritton if (error || !req->newptr) 35810304c731SJamie Gritton return (error); 35820304c731SJamie Gritton i = i ? arg2 : 0; 35830304c731SJamie Gritton if (arg1 != NULL) 35840304c731SJamie Gritton i ^= arg2; 35850304c731SJamie Gritton /* 35860304c731SJamie Gritton * The sysctls don't have CTLFLAGS_PRISON, so assume prison0 35870304c731SJamie Gritton * for writing. 
35880304c731SJamie Gritton */ 35890304c731SJamie Gritton mtx_lock(&prison0.pr_mtx); 35900304c731SJamie Gritton jail_default_allow = (jail_default_allow & ~arg2) | i; 35910304c731SJamie Gritton mtx_unlock(&prison0.pr_mtx); 35920304c731SJamie Gritton return (0); 35930304c731SJamie Gritton } 35940304c731SJamie Gritton 35950304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, set_hostname_allowed, 3596c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 35970304c731SJamie Gritton NULL, PR_ALLOW_SET_HOSTNAME, sysctl_jail_default_allow, "I", 3598c542c43eSJamie Gritton "Processes in jail can set their hostnames (deprecated)"); 35990304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, socket_unixiproute_only, 3600c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 36010304c731SJamie Gritton (void *)1, PR_ALLOW_SOCKET_AF, sysctl_jail_default_allow, "I", 3602c542c43eSJamie Gritton "Processes in jail are limited to creating UNIX/IP/route sockets only (deprecated)"); 36030304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, sysvipc_allowed, 3604c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 36050304c731SJamie Gritton NULL, PR_ALLOW_SYSVIPC, sysctl_jail_default_allow, "I", 3606c542c43eSJamie Gritton "Processes in jail can use System V IPC primitives (deprecated)"); 36070304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, allow_raw_sockets, 3608c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 36090304c731SJamie Gritton NULL, PR_ALLOW_RAW_SOCKETS, sysctl_jail_default_allow, "I", 3610c542c43eSJamie Gritton "Prison root can create raw sockets (deprecated)"); 36110304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, chflags_allowed, 3612c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 36130304c731SJamie Gritton NULL, PR_ALLOW_CHFLAGS, sysctl_jail_default_allow, "I", 3614c542c43eSJamie Gritton "Processes in jail can alter system file flags (deprecated)"); 
36150304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, mount_allowed, 3616c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 36170304c731SJamie Gritton NULL, PR_ALLOW_MOUNT, sysctl_jail_default_allow, "I", 3618c542c43eSJamie Gritton "Processes in jail can mount/unmount jail-friendly file systems (deprecated)"); 36190304c731SJamie Gritton 36200304c731SJamie Gritton static int 36210304c731SJamie Gritton sysctl_jail_default_level(SYSCTL_HANDLER_ARGS) 36220304c731SJamie Gritton { 36230304c731SJamie Gritton struct prison *pr; 36240304c731SJamie Gritton int level, error; 36250304c731SJamie Gritton 36260304c731SJamie Gritton pr = req->td->td_ucred->cr_prison; 36270304c731SJamie Gritton level = (pr == &prison0) ? *(int *)arg1 : *(int *)((char *)pr + arg2); 36280304c731SJamie Gritton error = sysctl_handle_int(oidp, &level, 0, req); 3629c542c43eSJamie Gritton if (error || !req->newptr) 36300304c731SJamie Gritton return (error); 36310304c731SJamie Gritton *(int *)arg1 = level; 36320304c731SJamie Gritton return (0); 36330304c731SJamie Gritton } 36340304c731SJamie Gritton 36350304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, enforce_statfs, 3636c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 3637c542c43eSJamie Gritton &jail_default_enforce_statfs, offsetof(struct prison, pr_enforce_statfs), 36380304c731SJamie Gritton sysctl_jail_default_level, "I", 3639c542c43eSJamie Gritton "Processes in jail cannot see all mounted file systems (deprecated)"); 3640c542c43eSJamie Gritton 36410cc207a6SMartin Matuska SYSCTL_PROC(_security_jail, OID_AUTO, devfs_ruleset, 3642c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, 3643c542c43eSJamie Gritton &jail_default_devfs_rsnum, offsetof(struct prison, pr_devfs_rsnum), 36440cc207a6SMartin Matuska sysctl_jail_default_level, "I", 3645c542c43eSJamie Gritton "Ruleset for the devfs filesystem in jail (deprecated)"); 36460cc207a6SMartin Matuska 36470304c731SJamie Gritton /* 
36480304c731SJamie Gritton * Nodes to describe jail parameters. Maximum length of string parameters 36490304c731SJamie Gritton * is returned in the string itself, and the other parameters exist merely 36500304c731SJamie Gritton * to make themselves and their types known. 36510304c731SJamie Gritton */ 36527029da5cSPawel Biernacki SYSCTL_NODE(_security_jail, OID_AUTO, param, CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 36530304c731SJamie Gritton "Jail parameters"); 36540304c731SJamie Gritton 36550304c731SJamie Gritton int 36560304c731SJamie Gritton sysctl_jail_param(SYSCTL_HANDLER_ARGS) 36570304c731SJamie Gritton { 36580304c731SJamie Gritton int i; 36590304c731SJamie Gritton long l; 36600304c731SJamie Gritton size_t s; 36610304c731SJamie Gritton char numbuf[12]; 36620304c731SJamie Gritton 36630304c731SJamie Gritton switch (oidp->oid_kind & CTLTYPE) 36640304c731SJamie Gritton { 36650304c731SJamie Gritton case CTLTYPE_LONG: 36660304c731SJamie Gritton case CTLTYPE_ULONG: 36670304c731SJamie Gritton l = 0; 36680304c731SJamie Gritton #ifdef SCTL_MASK32 36690304c731SJamie Gritton if (!(req->flags & SCTL_MASK32)) 36700304c731SJamie Gritton #endif 36710304c731SJamie Gritton return (SYSCTL_OUT(req, &l, sizeof(l))); 36720304c731SJamie Gritton case CTLTYPE_INT: 36730304c731SJamie Gritton case CTLTYPE_UINT: 36740304c731SJamie Gritton i = 0; 36750304c731SJamie Gritton return (SYSCTL_OUT(req, &i, sizeof(i))); 36760304c731SJamie Gritton case CTLTYPE_STRING: 3677e4cd31ddSJeff Roberson snprintf(numbuf, sizeof(numbuf), "%jd", (intmax_t)arg2); 36780304c731SJamie Gritton return 36790304c731SJamie Gritton (sysctl_handle_string(oidp, numbuf, sizeof(numbuf), req)); 36800304c731SJamie Gritton case CTLTYPE_STRUCT: 36810304c731SJamie Gritton s = (size_t)arg2; 36820304c731SJamie Gritton return (SYSCTL_OUT(req, &s, sizeof(s))); 36830304c731SJamie Gritton } 36840304c731SJamie Gritton return (0); 36850304c731SJamie Gritton } 36860304c731SJamie Gritton 3687b96bd95bSIan Lepore /* 3688b96bd95bSIan Lepore * 
CTLFLAG_RDTUN in the following indicates jail parameters that can be set at 3689b96bd95bSIan Lepore * jail creation time but cannot be changed in an existing jail. 3690b96bd95bSIan Lepore */ 36910304c731SJamie Gritton SYSCTL_JAIL_PARAM(, jid, CTLTYPE_INT | CTLFLAG_RDTUN, "I", "Jail ID"); 36920304c731SJamie Gritton SYSCTL_JAIL_PARAM(, parent, CTLTYPE_INT | CTLFLAG_RD, "I", "Jail parent ID"); 36930304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRING(, name, CTLFLAG_RW, MAXHOSTNAMELEN, "Jail name"); 36940304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRING(, path, CTLFLAG_RDTUN, MAXPATHLEN, "Jail root path"); 36950304c731SJamie Gritton SYSCTL_JAIL_PARAM(, securelevel, CTLTYPE_INT | CTLFLAG_RW, 36960304c731SJamie Gritton "I", "Jail secure level"); 3697b96bd95bSIan Lepore SYSCTL_JAIL_PARAM(, osreldate, CTLTYPE_INT | CTLFLAG_RDTUN, "I", 3698b96bd95bSIan Lepore "Jail value for kern.osreldate and uname -K"); 3699b96bd95bSIan Lepore SYSCTL_JAIL_PARAM_STRING(, osrelease, CTLFLAG_RDTUN, OSRELEASELEN, 3700b96bd95bSIan Lepore "Jail value for kern.osrelease and uname -r"); 37010304c731SJamie Gritton SYSCTL_JAIL_PARAM(, enforce_statfs, CTLTYPE_INT | CTLFLAG_RW, 37020304c731SJamie Gritton "I", "Jail cannot see all mounted file systems"); 37030cc207a6SMartin Matuska SYSCTL_JAIL_PARAM(, devfs_ruleset, CTLTYPE_INT | CTLFLAG_RW, 37040cc207a6SMartin Matuska "I", "Ruleset for in-jail devfs mounts"); 37050304c731SJamie Gritton SYSCTL_JAIL_PARAM(, persist, CTLTYPE_INT | CTLFLAG_RW, 37060304c731SJamie Gritton "B", "Jail persistence"); 3707679e1390SJamie Gritton #ifdef VIMAGE 3708679e1390SJamie Gritton SYSCTL_JAIL_PARAM(, vnet, CTLTYPE_INT | CTLFLAG_RDTUN, 37097cbf7213SJamie Gritton "E,jailsys", "Virtual network stack"); 3710679e1390SJamie Gritton #endif 37110304c731SJamie Gritton SYSCTL_JAIL_PARAM(, dying, CTLTYPE_INT | CTLFLAG_RD, 37120304c731SJamie Gritton "B", "Jail is in the process of shutting down"); 37130304c731SJamie Gritton 3714b97457e2SJamie Gritton SYSCTL_JAIL_PARAM_NODE(children, "Number 
of child jails"); 3715b97457e2SJamie Gritton SYSCTL_JAIL_PARAM(_children, cur, CTLTYPE_INT | CTLFLAG_RD, 3716b97457e2SJamie Gritton "I", "Current number of child jails"); 3717b97457e2SJamie Gritton SYSCTL_JAIL_PARAM(_children, max, CTLTYPE_INT | CTLFLAG_RW, 3718b97457e2SJamie Gritton "I", "Maximum number of child jails"); 3719b97457e2SJamie Gritton 37207cbf7213SJamie Gritton SYSCTL_JAIL_PARAM_SYS_NODE(host, CTLFLAG_RW, "Jail host info"); 37210304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRING(_host, hostname, CTLFLAG_RW, MAXHOSTNAMELEN, 37220304c731SJamie Gritton "Jail hostname"); 372376ca6f88SJamie Gritton SYSCTL_JAIL_PARAM_STRING(_host, domainname, CTLFLAG_RW, MAXHOSTNAMELEN, 372476ca6f88SJamie Gritton "Jail NIS domainname"); 372576ca6f88SJamie Gritton SYSCTL_JAIL_PARAM_STRING(_host, hostuuid, CTLFLAG_RW, HOSTUUIDLEN, 372676ca6f88SJamie Gritton "Jail host UUID"); 372776ca6f88SJamie Gritton SYSCTL_JAIL_PARAM(_host, hostid, CTLTYPE_ULONG | CTLFLAG_RW, 372876ca6f88SJamie Gritton "LU", "Jail host ID"); 37290304c731SJamie Gritton 37300304c731SJamie Gritton SYSCTL_JAIL_PARAM_NODE(cpuset, "Jail cpuset"); 37310304c731SJamie Gritton SYSCTL_JAIL_PARAM(_cpuset, id, CTLTYPE_INT | CTLFLAG_RD, "I", "Jail cpuset ID"); 37320304c731SJamie Gritton 37330304c731SJamie Gritton #ifdef INET 37342b0d6f81SJamie Gritton SYSCTL_JAIL_PARAM_SYS_NODE(ip4, CTLFLAG_RDTUN, 37352b0d6f81SJamie Gritton "Jail IPv4 address virtualization"); 37360304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRUCT(_ip4, addr, CTLFLAG_RW, sizeof(struct in_addr), 37370304c731SJamie Gritton "S,in_addr,a", "Jail IPv4 addresses"); 3738592bcae8SBjoern A. Zeeb SYSCTL_JAIL_PARAM(_ip4, saddrsel, CTLTYPE_INT | CTLFLAG_RW, 3739592bcae8SBjoern A. Zeeb "B", "Do (not) use IPv4 source address selection rather than the " 3740592bcae8SBjoern A. 
Zeeb "primary jail IPv4 address."); 37410304c731SJamie Gritton #endif 37420304c731SJamie Gritton #ifdef INET6 37432b0d6f81SJamie Gritton SYSCTL_JAIL_PARAM_SYS_NODE(ip6, CTLFLAG_RDTUN, 37442b0d6f81SJamie Gritton "Jail IPv6 address virtualization"); 37450304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRUCT(_ip6, addr, CTLFLAG_RW, sizeof(struct in6_addr), 37460304c731SJamie Gritton "S,in6_addr,a", "Jail IPv6 addresses"); 3747592bcae8SBjoern A. Zeeb SYSCTL_JAIL_PARAM(_ip6, saddrsel, CTLTYPE_INT | CTLFLAG_RW, 3748592bcae8SBjoern A. Zeeb "B", "Do (not) use IPv6 source address selection rather than the " 3749592bcae8SBjoern A. Zeeb "primary jail IPv6 address."); 37500304c731SJamie Gritton #endif 37510304c731SJamie Gritton 37520304c731SJamie Gritton SYSCTL_JAIL_PARAM_NODE(allow, "Jail permission flags"); 37530304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, set_hostname, CTLTYPE_INT | CTLFLAG_RW, 37540304c731SJamie Gritton "B", "Jail may set hostname"); 37550304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, sysvipc, CTLTYPE_INT | CTLFLAG_RW, 37560304c731SJamie Gritton "B", "Jail may use SYSV IPC"); 37570304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, raw_sockets, CTLTYPE_INT | CTLFLAG_RW, 37580304c731SJamie Gritton "B", "Jail may create raw sockets"); 37590304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, chflags, CTLTYPE_INT | CTLFLAG_RW, 37600304c731SJamie Gritton "B", "Jail may alter system file flags"); 37610304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, quotas, CTLTYPE_INT | CTLFLAG_RW, 37620304c731SJamie Gritton "B", "Jail may set file quotas"); 37630304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, socket_af, CTLTYPE_INT | CTLFLAG_RW, 37640304c731SJamie Gritton "B", "Jail may create sockets other than just UNIX/IPv4/IPv6/route"); 3765ccd6ac9fSAntoine Brodin SYSCTL_JAIL_PARAM(_allow, mlock, CTLTYPE_INT | CTLFLAG_RW, 3766ccd6ac9fSAntoine Brodin "B", "Jail may lock (unlock) physical pages in memory"); 3767e28f9b7dSAllan Jude SYSCTL_JAIL_PARAM(_allow, reserved_ports, CTLTYPE_INT | 
CTLFLAG_RW, 3768e28f9b7dSAllan Jude "B", "Jail may bind sockets to reserved ports"); 3769b19d66fdSJamie Gritton SYSCTL_JAIL_PARAM(_allow, read_msgbuf, CTLTYPE_INT | CTLFLAG_RW, 3770b19d66fdSJamie Gritton "B", "Jail may read the kernel message buffer"); 3771b3079544SJamie Gritton SYSCTL_JAIL_PARAM(_allow, unprivileged_proc_debug, CTLTYPE_INT | CTLFLAG_RW, 3772b3079544SJamie Gritton "B", "Unprivileged processes may use process debugging facilities"); 37730304c731SJamie Gritton 3774bf3db8aaSMartin Matuska SYSCTL_JAIL_PARAM_SUBNODE(allow, mount, "Jail mount/unmount permission flags"); 3775bf3db8aaSMartin Matuska SYSCTL_JAIL_PARAM(_allow_mount, , CTLTYPE_INT | CTLFLAG_RW, 3776bf3db8aaSMartin Matuska "B", "Jail may mount/unmount jail-friendly file systems in general"); 37770e5c6bd4SJamie Gritton 37780e5c6bd4SJamie Gritton /* 37790a172404SJamie Gritton * Add a dynamic parameter allow.<name>, or allow.<prefix>.<name>. Return 37800a172404SJamie Gritton * its associated bit in the pr_allow bitmask, or zero if the parameter was 37810a172404SJamie Gritton * not created. 37820e5c6bd4SJamie Gritton */ 37830a172404SJamie Gritton unsigned 37840a172404SJamie Gritton prison_add_allow(const char *prefix, const char *name, const char *prefix_descr, 37850a172404SJamie Gritton const char *descr) 37860e5c6bd4SJamie Gritton { 37870e5c6bd4SJamie Gritton struct bool_flags *bf; 37880a172404SJamie Gritton struct sysctl_oid *parent; 37890a172404SJamie Gritton char *allow_name, *allow_noname, *allowed; 3790c542c43eSJamie Gritton #ifndef NO_SYSCTL_DESCR 3791c542c43eSJamie Gritton char *descr_deprecated; 3792c542c43eSJamie Gritton #endif 37930e5c6bd4SJamie Gritton unsigned allow_flag; 37940e5c6bd4SJamie Gritton 37950a172404SJamie Gritton if (prefix 37960a172404SJamie Gritton ? 
asprintf(&allow_name, M_PRISON, "allow.%s.%s", prefix, name) 37970a172404SJamie Gritton < 0 || 37980a172404SJamie Gritton asprintf(&allow_noname, M_PRISON, "allow.%s.no%s", prefix, name) 37990a172404SJamie Gritton < 0 38000a172404SJamie Gritton : asprintf(&allow_name, M_PRISON, "allow.%s", name) < 0 || 38010a172404SJamie Gritton asprintf(&allow_noname, M_PRISON, "allow.no%s", name) < 0) { 38020e5c6bd4SJamie Gritton free(allow_name, M_PRISON); 38030a172404SJamie Gritton return 0; 38040e5c6bd4SJamie Gritton } 38050e5c6bd4SJamie Gritton 38060e5c6bd4SJamie Gritton /* 38070a172404SJamie Gritton * See if this parameter has already beed added, i.e. a module was 38080a172404SJamie Gritton * previously loaded/unloaded. 38090e5c6bd4SJamie Gritton */ 38100e5c6bd4SJamie Gritton mtx_lock(&prison0.pr_mtx); 38110e5c6bd4SJamie Gritton for (bf = pr_flag_allow; 38120e5c6bd4SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && bf->flag != 0; 38130e5c6bd4SJamie Gritton bf++) { 38140e5c6bd4SJamie Gritton if (strcmp(bf->name, allow_name) == 0) { 38150a172404SJamie Gritton allow_flag = bf->flag; 38160e5c6bd4SJamie Gritton goto no_add; 38170e5c6bd4SJamie Gritton } 38180e5c6bd4SJamie Gritton } 38190e5c6bd4SJamie Gritton 38200e5c6bd4SJamie Gritton /* 38210e5c6bd4SJamie Gritton * Find a free bit in prison0's pr_allow, failing if there are none 38220e5c6bd4SJamie Gritton * (which shouldn't happen as long as we keep track of how many 38230a172404SJamie Gritton * potential dynamic flags exist). 3824b3079544SJamie Gritton * 3825b3079544SJamie Gritton * Due to per-jail unprivileged process debugging support 3826b3079544SJamie Gritton * using pr_allow, also verify against PR_ALLOW_ALL_STATIC. 3827b3079544SJamie Gritton * prison0 may have unprivileged process debugging unset. 
38280e5c6bd4SJamie Gritton */ 38290e5c6bd4SJamie Gritton for (allow_flag = 1;; allow_flag <<= 1) { 38300e5c6bd4SJamie Gritton if (allow_flag == 0) 38310e5c6bd4SJamie Gritton goto no_add; 3832b3079544SJamie Gritton if (allow_flag & PR_ALLOW_ALL_STATIC) 3833b3079544SJamie Gritton continue; 38340e5c6bd4SJamie Gritton if ((prison0.pr_allow & allow_flag) == 0) 38350e5c6bd4SJamie Gritton break; 38360e5c6bd4SJamie Gritton } 38370e5c6bd4SJamie Gritton 38380e5c6bd4SJamie Gritton /* 38390e5c6bd4SJamie Gritton * Note the parameter in the next open slot in pr_flag_allow. 38400e5c6bd4SJamie Gritton * Set the flag last so code that checks pr_flag_allow can do so 38410e5c6bd4SJamie Gritton * without locking. 38420e5c6bd4SJamie Gritton */ 38430e5c6bd4SJamie Gritton for (bf = pr_flag_allow; bf->flag != 0; bf++) 38440e5c6bd4SJamie Gritton if (bf == pr_flag_allow + nitems(pr_flag_allow)) { 38450e5c6bd4SJamie Gritton /* This should never happen, but is not fatal. */ 38460a172404SJamie Gritton allow_flag = 0; 38470e5c6bd4SJamie Gritton goto no_add; 38480e5c6bd4SJamie Gritton } 38490e5c6bd4SJamie Gritton prison0.pr_allow |= allow_flag; 38500e5c6bd4SJamie Gritton bf->name = allow_name; 38510e5c6bd4SJamie Gritton bf->noname = allow_noname; 38520e5c6bd4SJamie Gritton bf->flag = allow_flag; 38530e5c6bd4SJamie Gritton mtx_unlock(&prison0.pr_mtx); 38540e5c6bd4SJamie Gritton 3855c542c43eSJamie Gritton /* 3856c542c43eSJamie Gritton * Create sysctls for the paramter, and the back-compat global 3857c542c43eSJamie Gritton * permission. 3858c542c43eSJamie Gritton */ 38590a172404SJamie Gritton parent = prefix 38600a172404SJamie Gritton ? 
SYSCTL_ADD_NODE(NULL, 38610a172404SJamie Gritton SYSCTL_CHILDREN(&sysctl___security_jail_param_allow), 38627029da5cSPawel Biernacki OID_AUTO, prefix, CTLFLAG_MPSAFE, 0, prefix_descr) 38630a172404SJamie Gritton : &sysctl___security_jail_param_allow; 38640a172404SJamie Gritton (void)SYSCTL_ADD_PROC(NULL, SYSCTL_CHILDREN(parent), OID_AUTO, 38650a172404SJamie Gritton name, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 38660e5c6bd4SJamie Gritton NULL, 0, sysctl_jail_param, "B", descr); 38670a172404SJamie Gritton if ((prefix 38680a172404SJamie Gritton ? asprintf(&allowed, M_TEMP, "%s_%s_allowed", prefix, name) 38690a172404SJamie Gritton : asprintf(&allowed, M_TEMP, "%s_allowed", name)) >= 0) { 3870c542c43eSJamie Gritton #ifndef NO_SYSCTL_DESCR 3871c542c43eSJamie Gritton (void)asprintf(&descr_deprecated, M_TEMP, "%s (deprecated)", 3872c542c43eSJamie Gritton descr); 3873c542c43eSJamie Gritton #endif 38740e5c6bd4SJamie Gritton (void)SYSCTL_ADD_PROC(NULL, 38750a172404SJamie Gritton SYSCTL_CHILDREN(&sysctl___security_jail), OID_AUTO, allowed, 3876c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, NULL, allow_flag, 3877c542c43eSJamie Gritton sysctl_jail_default_allow, "I", descr_deprecated); 3878c542c43eSJamie Gritton #ifndef NO_SYSCTL_DESCR 3879c542c43eSJamie Gritton free(descr_deprecated, M_TEMP); 3880c542c43eSJamie Gritton #endif 38810a172404SJamie Gritton free(allowed, M_TEMP); 38820e5c6bd4SJamie Gritton } 38830a172404SJamie Gritton return allow_flag; 38840e5c6bd4SJamie Gritton 38850e5c6bd4SJamie Gritton no_add: 38860e5c6bd4SJamie Gritton mtx_unlock(&prison0.pr_mtx); 38870e5c6bd4SJamie Gritton free(allow_name, M_PRISON); 38880e5c6bd4SJamie Gritton free(allow_noname, M_PRISON); 38890a172404SJamie Gritton return allow_flag; 38900a172404SJamie Gritton } 38910a172404SJamie Gritton 38920a172404SJamie Gritton /* 38930a172404SJamie Gritton * The VFS system will register jail-aware filesystems here. 
They each get 38940a172404SJamie Gritton * a parameter allow.mount.xxxfs and a flag to check when a jailed user 38950a172404SJamie Gritton * attempts to mount. 38960a172404SJamie Gritton */ 38970a172404SJamie Gritton void 38980a172404SJamie Gritton prison_add_vfs(struct vfsconf *vfsp) 38990a172404SJamie Gritton { 39000a172404SJamie Gritton #ifdef NO_SYSCTL_DESCR 39010a172404SJamie Gritton 39020a172404SJamie Gritton vfsp->vfc_prison_flag = prison_add_allow("mount", vfsp->vfc_name, 39030a172404SJamie Gritton NULL, NULL); 39040a172404SJamie Gritton #else 39050a172404SJamie Gritton char *descr; 39060a172404SJamie Gritton 39070a172404SJamie Gritton (void)asprintf(&descr, M_TEMP, "Jail may mount the %s file system", 39080a172404SJamie Gritton vfsp->vfc_name); 39090a172404SJamie Gritton vfsp->vfc_prison_flag = prison_add_allow("mount", vfsp->vfc_name, 39100a172404SJamie Gritton NULL, descr); 39110a172404SJamie Gritton free(descr, M_TEMP); 39120a172404SJamie Gritton #endif 39130e5c6bd4SJamie Gritton } 3914bf3db8aaSMartin Matuska 39154b5c9cf6SEdward Tomasz Napierala #ifdef RACCT 3916097055e2SEdward Tomasz Napierala void 3917097055e2SEdward Tomasz Napierala prison_racct_foreach(void (*callback)(struct racct *racct, 391815db3c07SEdward Tomasz Napierala void *arg2, void *arg3), void (*pre)(void), void (*post)(void), 391915db3c07SEdward Tomasz Napierala void *arg2, void *arg3) 3920097055e2SEdward Tomasz Napierala { 3921a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 3922097055e2SEdward Tomasz Napierala 39234b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 39244b5c9cf6SEdward Tomasz Napierala 3925097055e2SEdward Tomasz Napierala sx_slock(&allprison_lock); 392615db3c07SEdward Tomasz Napierala if (pre != NULL) 392715db3c07SEdward Tomasz Napierala (pre)(); 3928a7ad07bfSEdward Tomasz Napierala LIST_FOREACH(prr, &allprison_racct, prr_next) 3929a7ad07bfSEdward Tomasz Napierala (callback)(prr->prr_racct, arg2, arg3); 393015db3c07SEdward Tomasz Napierala if (post != 
NULL) 393115db3c07SEdward Tomasz Napierala (post)(); 3932097055e2SEdward Tomasz Napierala sx_sunlock(&allprison_lock); 3933097055e2SEdward Tomasz Napierala } 39340304c731SJamie Gritton 3935a7ad07bfSEdward Tomasz Napierala static struct prison_racct * 3936a7ad07bfSEdward Tomasz Napierala prison_racct_find_locked(const char *name) 3937a7ad07bfSEdward Tomasz Napierala { 3938a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 3939a7ad07bfSEdward Tomasz Napierala 39404b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 3941a7ad07bfSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_XLOCKED); 3942a7ad07bfSEdward Tomasz Napierala 3943a7ad07bfSEdward Tomasz Napierala if (name[0] == '\0' || strlen(name) >= MAXHOSTNAMELEN) 3944a7ad07bfSEdward Tomasz Napierala return (NULL); 3945a7ad07bfSEdward Tomasz Napierala 3946a7ad07bfSEdward Tomasz Napierala LIST_FOREACH(prr, &allprison_racct, prr_next) { 3947a7ad07bfSEdward Tomasz Napierala if (strcmp(name, prr->prr_name) != 0) 3948a7ad07bfSEdward Tomasz Napierala continue; 3949a7ad07bfSEdward Tomasz Napierala 3950a7ad07bfSEdward Tomasz Napierala /* Found prison_racct with a matching name? */ 3951a7ad07bfSEdward Tomasz Napierala prison_racct_hold(prr); 3952a7ad07bfSEdward Tomasz Napierala return (prr); 3953a7ad07bfSEdward Tomasz Napierala } 3954a7ad07bfSEdward Tomasz Napierala 3955a7ad07bfSEdward Tomasz Napierala /* Add new prison_racct. 
*/ 3956a7ad07bfSEdward Tomasz Napierala prr = malloc(sizeof(*prr), M_PRISON_RACCT, M_ZERO | M_WAITOK); 3957a7ad07bfSEdward Tomasz Napierala racct_create(&prr->prr_racct); 3958a7ad07bfSEdward Tomasz Napierala 3959a7ad07bfSEdward Tomasz Napierala strcpy(prr->prr_name, name); 3960a7ad07bfSEdward Tomasz Napierala refcount_init(&prr->prr_refcount, 1); 3961a7ad07bfSEdward Tomasz Napierala LIST_INSERT_HEAD(&allprison_racct, prr, prr_next); 3962a7ad07bfSEdward Tomasz Napierala 3963a7ad07bfSEdward Tomasz Napierala return (prr); 3964a7ad07bfSEdward Tomasz Napierala } 3965a7ad07bfSEdward Tomasz Napierala 3966a7ad07bfSEdward Tomasz Napierala struct prison_racct * 3967a7ad07bfSEdward Tomasz Napierala prison_racct_find(const char *name) 3968a7ad07bfSEdward Tomasz Napierala { 3969a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 3970a7ad07bfSEdward Tomasz Napierala 39714b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 39724b5c9cf6SEdward Tomasz Napierala 3973a7ad07bfSEdward Tomasz Napierala sx_xlock(&allprison_lock); 3974a7ad07bfSEdward Tomasz Napierala prr = prison_racct_find_locked(name); 3975a7ad07bfSEdward Tomasz Napierala sx_xunlock(&allprison_lock); 3976a7ad07bfSEdward Tomasz Napierala return (prr); 3977a7ad07bfSEdward Tomasz Napierala } 3978a7ad07bfSEdward Tomasz Napierala 3979a7ad07bfSEdward Tomasz Napierala void 3980a7ad07bfSEdward Tomasz Napierala prison_racct_hold(struct prison_racct *prr) 3981a7ad07bfSEdward Tomasz Napierala { 3982a7ad07bfSEdward Tomasz Napierala 39834b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 39844b5c9cf6SEdward Tomasz Napierala 3985a7ad07bfSEdward Tomasz Napierala refcount_acquire(&prr->prr_refcount); 3986a7ad07bfSEdward Tomasz Napierala } 3987a7ad07bfSEdward Tomasz Napierala 3988c34bbd2aSEdward Tomasz Napierala static void 3989c34bbd2aSEdward Tomasz Napierala prison_racct_free_locked(struct prison_racct *prr) 3990c34bbd2aSEdward Tomasz Napierala { 3991c34bbd2aSEdward Tomasz Napierala 39924b5c9cf6SEdward Tomasz Napierala 
ASSERT_RACCT_ENABLED(); 3993c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_XLOCKED); 3994c34bbd2aSEdward Tomasz Napierala 3995c34bbd2aSEdward Tomasz Napierala if (refcount_release(&prr->prr_refcount)) { 3996c34bbd2aSEdward Tomasz Napierala racct_destroy(&prr->prr_racct); 3997c34bbd2aSEdward Tomasz Napierala LIST_REMOVE(prr, prr_next); 3998c34bbd2aSEdward Tomasz Napierala free(prr, M_PRISON_RACCT); 3999c34bbd2aSEdward Tomasz Napierala } 4000c34bbd2aSEdward Tomasz Napierala } 4001c34bbd2aSEdward Tomasz Napierala 4002a7ad07bfSEdward Tomasz Napierala void 4003a7ad07bfSEdward Tomasz Napierala prison_racct_free(struct prison_racct *prr) 4004a7ad07bfSEdward Tomasz Napierala { 4005a7ad07bfSEdward Tomasz Napierala 40064b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4007c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_UNLOCKED); 4008c34bbd2aSEdward Tomasz Napierala 40096ff4688bSMateusz Guzik if (refcount_release_if_not_last(&prr->prr_refcount)) 4010a7ad07bfSEdward Tomasz Napierala return; 4011a7ad07bfSEdward Tomasz Napierala 4012a7ad07bfSEdward Tomasz Napierala sx_xlock(&allprison_lock); 4013c34bbd2aSEdward Tomasz Napierala prison_racct_free_locked(prr); 4014a7ad07bfSEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4015a7ad07bfSEdward Tomasz Napierala } 4016a7ad07bfSEdward Tomasz Napierala 4017a7ad07bfSEdward Tomasz Napierala static void 4018a7ad07bfSEdward Tomasz Napierala prison_racct_attach(struct prison *pr) 4019a7ad07bfSEdward Tomasz Napierala { 4020a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 4021a7ad07bfSEdward Tomasz Napierala 40224b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4023c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_XLOCKED); 4024c34bbd2aSEdward Tomasz Napierala 4025a7ad07bfSEdward Tomasz Napierala prr = prison_racct_find_locked(pr->pr_name); 4026a7ad07bfSEdward Tomasz Napierala KASSERT(prr != NULL, ("cannot find prison_racct")); 4027a7ad07bfSEdward Tomasz Napierala 
4028a7ad07bfSEdward Tomasz Napierala pr->pr_prison_racct = prr; 4029a7ad07bfSEdward Tomasz Napierala } 4030a7ad07bfSEdward Tomasz Napierala 4031c34bbd2aSEdward Tomasz Napierala /* 4032c34bbd2aSEdward Tomasz Napierala * Handle jail renaming. From the racct point of view, renaming means 4033c34bbd2aSEdward Tomasz Napierala * moving from one prison_racct to another. 4034c34bbd2aSEdward Tomasz Napierala */ 4035c34bbd2aSEdward Tomasz Napierala static void 4036c34bbd2aSEdward Tomasz Napierala prison_racct_modify(struct prison *pr) 4037c34bbd2aSEdward Tomasz Napierala { 4038dbadb015SKonstantin Belousov #ifdef RCTL 4039c34bbd2aSEdward Tomasz Napierala struct proc *p; 4040c34bbd2aSEdward Tomasz Napierala struct ucred *cred; 4041dbadb015SKonstantin Belousov #endif 4042c34bbd2aSEdward Tomasz Napierala struct prison_racct *oldprr; 4043c34bbd2aSEdward Tomasz Napierala 40444b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 40454b5c9cf6SEdward Tomasz Napierala 4046c34bbd2aSEdward Tomasz Napierala sx_slock(&allproc_lock); 4047c34bbd2aSEdward Tomasz Napierala sx_xlock(&allprison_lock); 4048c34bbd2aSEdward Tomasz Napierala 4049e30345e7SEdward Tomasz Napierala if (strcmp(pr->pr_name, pr->pr_prison_racct->prr_name) == 0) { 4050e30345e7SEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4051e30345e7SEdward Tomasz Napierala sx_sunlock(&allproc_lock); 4052c34bbd2aSEdward Tomasz Napierala return; 4053e30345e7SEdward Tomasz Napierala } 4054c34bbd2aSEdward Tomasz Napierala 4055c34bbd2aSEdward Tomasz Napierala oldprr = pr->pr_prison_racct; 4056c34bbd2aSEdward Tomasz Napierala pr->pr_prison_racct = NULL; 4057c34bbd2aSEdward Tomasz Napierala 4058c34bbd2aSEdward Tomasz Napierala prison_racct_attach(pr); 4059c34bbd2aSEdward Tomasz Napierala 4060c34bbd2aSEdward Tomasz Napierala /* 4061c34bbd2aSEdward Tomasz Napierala * Move resource utilisation records. 
4062c34bbd2aSEdward Tomasz Napierala */ 4063c34bbd2aSEdward Tomasz Napierala racct_move(pr->pr_prison_racct->prr_racct, oldprr->prr_racct); 4064c34bbd2aSEdward Tomasz Napierala 4065f87beb93SAndriy Gapon #ifdef RCTL 4066c34bbd2aSEdward Tomasz Napierala /* 4067c34bbd2aSEdward Tomasz Napierala * Force rctl to reattach rules to processes. 4068c34bbd2aSEdward Tomasz Napierala */ 4069c34bbd2aSEdward Tomasz Napierala FOREACH_PROC_IN_SYSTEM(p) { 4070c34bbd2aSEdward Tomasz Napierala PROC_LOCK(p); 4071c34bbd2aSEdward Tomasz Napierala cred = crhold(p->p_ucred); 4072c34bbd2aSEdward Tomasz Napierala PROC_UNLOCK(p); 4073f87beb93SAndriy Gapon rctl_proc_ucred_changed(p, cred); 4074c34bbd2aSEdward Tomasz Napierala crfree(cred); 4075c34bbd2aSEdward Tomasz Napierala } 4076f87beb93SAndriy Gapon #endif 4077c34bbd2aSEdward Tomasz Napierala 4078c34bbd2aSEdward Tomasz Napierala sx_sunlock(&allproc_lock); 4079c34bbd2aSEdward Tomasz Napierala prison_racct_free_locked(oldprr); 4080c34bbd2aSEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4081c34bbd2aSEdward Tomasz Napierala } 4082c34bbd2aSEdward Tomasz Napierala 4083a7ad07bfSEdward Tomasz Napierala static void 4084a7ad07bfSEdward Tomasz Napierala prison_racct_detach(struct prison *pr) 4085a7ad07bfSEdward Tomasz Napierala { 4086c34bbd2aSEdward Tomasz Napierala 40874b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4088c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_UNLOCKED); 4089c34bbd2aSEdward Tomasz Napierala 4090af3c786cSMateusz Guzik if (pr->pr_prison_racct == NULL) 4091af3c786cSMateusz Guzik return; 4092a7ad07bfSEdward Tomasz Napierala prison_racct_free(pr->pr_prison_racct); 4093a7ad07bfSEdward Tomasz Napierala pr->pr_prison_racct = NULL; 4094a7ad07bfSEdward Tomasz Napierala } 4095a7ad07bfSEdward Tomasz Napierala #endif /* RACCT */ 4096a7ad07bfSEdward Tomasz Napierala 4097413628a7SBjoern A. 
#ifdef DDB

/*
 * Print the fields of one prison to the debugger console: identity,
 * reference counts, path, cpuset, limits, tree links, flags, allow bits,
 * host information and (when compiled in) IPv4/IPv6 addresses.
 */
static void
db_show_prison(struct prison *pr)
{
	struct bool_flags *bf;
	struct jailsys_flags *jsf;
#if defined(INET) || defined(INET6)
	int ii;
#endif
	unsigned f;
#ifdef INET
	char ip4buf[INET_ADDRSTRLEN];
#endif
#ifdef INET6
	char ip6buf[INET6_ADDRSTRLEN];
#endif

	db_printf("prison %p:\n", pr);
	db_printf(" jid = %d\n", pr->pr_id);
	db_printf(" name = %s\n", pr->pr_name);
	db_printf(" parent = %p\n", pr->pr_parent);
	db_printf(" ref = %d\n", pr->pr_ref);
	db_printf(" uref = %d\n", pr->pr_uref);
	db_printf(" path = %s\n", pr->pr_path);
	/* A prison without a cpuset is reported as -1. */
	db_printf(" cpuset = %d\n", pr->pr_cpuset
	    ? pr->pr_cpuset->cs_id : -1);
#ifdef VIMAGE
	db_printf(" vnet = %p\n", pr->pr_vnet);
#endif
	db_printf(" root = %p\n", pr->pr_root);
	db_printf(" securelevel = %d\n", pr->pr_securelevel);
	db_printf(" devfs_rsnum = %d\n", pr->pr_devfs_rsnum);
	db_printf(" children.max = %d\n", pr->pr_childmax);
	db_printf(" children.cur = %d\n", pr->pr_childcount);
	db_printf(" child = %p\n", LIST_FIRST(&pr->pr_children));
	db_printf(" sibling = %p\n", LIST_NEXT(pr, pr_sibling));

	/* Raw flag word followed by the names of the boolean flags set. */
	db_printf(" flags = 0x%x", pr->pr_flags);
	for (bf = pr_flag_bool; bf < pr_flag_bool + nitems(pr_flag_bool); bf++)
		if (pr->pr_flags & bf->flag)
			db_printf(" %s", bf->name);
	/*
	 * Terminate the flags line, as is done for the allow line below, so
	 * that every jailsys setting starts on a line of its own instead of
	 * the first one being appended to the flags line.
	 */
	db_printf("\n");

	/* One line per jailsys parameter: disable, new or inherit. */
	for (jsf = pr_flag_jailsys;
	    jsf < pr_flag_jailsys + nitems(pr_flag_jailsys);
	    jsf++) {
		f = pr->pr_flags & (jsf->disable | jsf->new);
		db_printf(" %-16s= %s\n", jsf->name,
		    (f != 0 && f == jsf->disable) ? "disable"
		    : (f == jsf->new) ? "new"
		    : "inherit");
	}

	/*
	 * Raw allow word followed by the names of the bits set.  The walk
	 * stops at the first unused slot (flag == 0) of pr_flag_allow.
	 */
	db_printf(" allow = 0x%x", pr->pr_allow);
	for (bf = pr_flag_allow;
	    bf < pr_flag_allow + nitems(pr_flag_allow) && bf->flag != 0;
	    bf++)
		if (pr->pr_allow & bf->flag)
			db_printf(" %s", bf->name);
	db_printf("\n");

	db_printf(" enforce_statfs = %d\n", pr->pr_enforce_statfs);
	db_printf(" host.hostname = %s\n", pr->pr_hostname);
	db_printf(" host.domainname = %s\n", pr->pr_domainname);
	db_printf(" host.hostuuid = %s\n", pr->pr_hostuuid);
	db_printf(" host.hostid = %lu\n", pr->pr_hostid);
#ifdef INET
	/* Only the first address line carries the "ip4.addr =" label. */
	db_printf(" ip4s = %d\n", pr->pr_ip4s);
	for (ii = 0; ii < pr->pr_ip4s; ii++)
		db_printf(" %s %s\n",
		    ii == 0 ? "ip4.addr =" : " ",
		    inet_ntoa_r(pr->pr_ip4[ii], ip4buf));
#endif
#ifdef INET6
	/* Only the first address line carries the "ip6.addr =" label. */
	db_printf(" ip6s = %d\n", pr->pr_ip6s);
	for (ii = 0; ii < pr->pr_ip6s; ii++)
		db_printf(" %s %s\n",
		    ii == 0 ? "ip6.addr =" : " ",
		    ip6_sprintf(ip6buf, &pr->pr_ip6[ii]));
#endif
}

/*
 * "show prison [addr]" debugger command.
 *
 * Without an address, every prison is shown: prison0 first, then each
 * entry of allprison, stopping early if the pager was quit.  With an
 * address, 0 selects prison0; any other value is first tried as a jail ID
 * (preferring a prison that still has references) and, failing that, is
 * used directly as a pointer to a struct prison.
 */
DB_SHOW_COMMAND(prison, db_show_prison_command)
{
	struct prison *pr;

	if (!have_addr) {
		/*
		 * Show all prisons in the list, and prison0 which is not
		 * listed.
		 */
		db_show_prison(&prison0);
		if (!db_pager_quit) {
			TAILQ_FOREACH(pr, &allprison, pr_list) {
				db_show_prison(pr);
				if (db_pager_quit)
					break;
			}
		}
		return;
	}

	if (addr == 0)
		pr = &prison0;
	else {
		/* Look for a prison with the ID and with references. */
		TAILQ_FOREACH(pr, &allprison, pr_list)
			if (pr->pr_id == addr && pr->pr_ref > 0)
				break;
		if (pr == NULL)
			/* Look again, without requiring a reference. */
			TAILQ_FOREACH(pr, &allprison, pr_list)
				if (pr->pr_id == addr)
					break;
		if (pr == NULL)
			/* Assume address points to a valid prison. */
			pr = (struct prison *)addr;
	}
	db_show_prison(pr);
}

#endif /* DDB */