19454b2d8SWarner Losh /*- 28a36da99SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 38a36da99SPedro F. Giffuni * 4413628a7SBjoern A. Zeeb * Copyright (c) 1999 Poul-Henning Kamp. 5413628a7SBjoern A. Zeeb * Copyright (c) 2008 Bjoern A. Zeeb. 6b38ff370SJamie Gritton * Copyright (c) 2009 James Gritton. 7413628a7SBjoern A. Zeeb * All rights reserved. 8b9f0b66cSBjoern A. Zeeb * 9b9f0b66cSBjoern A. Zeeb * Redistribution and use in source and binary forms, with or without 10b9f0b66cSBjoern A. Zeeb * modification, are permitted provided that the following conditions 11b9f0b66cSBjoern A. Zeeb * are met: 12b9f0b66cSBjoern A. Zeeb * 1. Redistributions of source code must retain the above copyright 13b9f0b66cSBjoern A. Zeeb * notice, this list of conditions and the following disclaimer. 14b9f0b66cSBjoern A. Zeeb * 2. Redistributions in binary form must reproduce the above copyright 15b9f0b66cSBjoern A. Zeeb * notice, this list of conditions and the following disclaimer in the 16b9f0b66cSBjoern A. Zeeb * documentation and/or other materials provided with the distribution. 17b9f0b66cSBjoern A. Zeeb * 18b9f0b66cSBjoern A. Zeeb * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 19b9f0b66cSBjoern A. Zeeb * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 20b9f0b66cSBjoern A. Zeeb * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 21b9f0b66cSBjoern A. Zeeb * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 22b9f0b66cSBjoern A. Zeeb * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 23b9f0b66cSBjoern A. Zeeb * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 24b9f0b66cSBjoern A. Zeeb * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 25b9f0b66cSBjoern A. Zeeb * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 26b9f0b66cSBjoern A. 
Zeeb * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 27b9f0b66cSBjoern A. Zeeb * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 28b9f0b66cSBjoern A. Zeeb * SUCH DAMAGE. 2907901f22SPoul-Henning Kamp */ 3075c13541SPoul-Henning Kamp 31677b542eSDavid E. O'Brien #include <sys/cdefs.h> 32677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 33677b542eSDavid E. O'Brien 34413628a7SBjoern A. Zeeb #include "opt_ddb.h" 35413628a7SBjoern A. Zeeb #include "opt_inet.h" 36413628a7SBjoern A. Zeeb #include "opt_inet6.h" 3746e3b1cbSPawel Jakub Dawidek 3875c13541SPoul-Henning Kamp #include <sys/param.h> 3975c13541SPoul-Henning Kamp #include <sys/types.h> 4075c13541SPoul-Henning Kamp #include <sys/kernel.h> 4175c13541SPoul-Henning Kamp #include <sys/systm.h> 4275c13541SPoul-Henning Kamp #include <sys/errno.h> 4375c13541SPoul-Henning Kamp #include <sys/sysproto.h> 4475c13541SPoul-Henning Kamp #include <sys/malloc.h> 450304c731SJamie Gritton #include <sys/osd.h> 46800c9408SRobert Watson #include <sys/priv.h> 4775c13541SPoul-Henning Kamp #include <sys/proc.h> 48b3059e09SRobert Watson #include <sys/taskqueue.h> 4957b4252eSKonstantin Belousov #include <sys/fcntl.h> 5075c13541SPoul-Henning Kamp #include <sys/jail.h> 51c3188289SKyle Evans #include <sys/linker.h> 5201137630SRobert Watson #include <sys/lock.h> 5301137630SRobert Watson #include <sys/mutex.h> 54097055e2SEdward Tomasz Napierala #include <sys/racct.h> 55f87beb93SAndriy Gapon #include <sys/rctl.h> 56a7ad07bfSEdward Tomasz Napierala #include <sys/refcount.h> 57dc68a633SPawel Jakub Dawidek #include <sys/sx.h> 5876ca6f88SJamie Gritton #include <sys/sysent.h> 59fd7a8150SMike Barcroft #include <sys/namei.h> 60820a0de9SPawel Jakub Dawidek #include <sys/mount.h> 61fd7a8150SMike Barcroft #include <sys/queue.h> 6275c13541SPoul-Henning Kamp #include <sys/socket.h> 63fd7a8150SMike Barcroft #include <sys/syscallsubr.h> 6483f1e257SRobert Watson #include <sys/sysctl.h> 65c3188289SKyle Evans #include 
<sys/uuid.h> 66fd7a8150SMike Barcroft #include <sys/vnode.h> 67530c0060SRobert Watson 6875c13541SPoul-Henning Kamp #include <net/if.h> 69530c0060SRobert Watson #include <net/vnet.h> 70530c0060SRobert Watson 7175c13541SPoul-Henning Kamp #include <netinet/in.h> 72530c0060SRobert Watson 73413628a7SBjoern A. Zeeb #ifdef DDB 74413628a7SBjoern A. Zeeb #include <ddb/ddb.h> 75413628a7SBjoern A. Zeeb #endif /* DDB */ 7675c13541SPoul-Henning Kamp 77aed55708SRobert Watson #include <security/mac/mac_framework.h> 78aed55708SRobert Watson 79c3188289SKyle Evans #define PRISON0_HOSTUUID_MODULE "hostuuid" 808986e3a0SJamie Gritton 8175c13541SPoul-Henning Kamp MALLOC_DEFINE(M_PRISON, "prison", "Prison structures"); 82d745c852SEd Schouten static MALLOC_DEFINE(M_PRISON_RACCT, "prison_racct", "Prison racct structures"); 8375c13541SPoul-Henning Kamp 84592bcae8SBjoern A. Zeeb /* Keep struct prison prison0 and some code in kern_jail_set() readable. */ 85592bcae8SBjoern A. Zeeb #ifdef INET 86592bcae8SBjoern A. Zeeb #ifdef INET6 87592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL PR_IP4_SADDRSEL|PR_IP6_SADDRSEL 88592bcae8SBjoern A. Zeeb #else 89592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL PR_IP4_SADDRSEL 90592bcae8SBjoern A. Zeeb #endif 91592bcae8SBjoern A. Zeeb #else /* !INET */ 92592bcae8SBjoern A. Zeeb #ifdef INET6 93592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL PR_IP6_SADDRSEL 94592bcae8SBjoern A. Zeeb #else 95592bcae8SBjoern A. Zeeb #define _PR_IP_SADDRSEL 0 96592bcae8SBjoern A. Zeeb #endif 97592bcae8SBjoern A. Zeeb #endif 98592bcae8SBjoern A. Zeeb 990304c731SJamie Gritton /* prison0 describes what is "real" about the system. 
*/ 1000304c731SJamie Gritton struct prison prison0 = { 1010304c731SJamie Gritton .pr_id = 0, 1020304c731SJamie Gritton .pr_name = "0", 1030304c731SJamie Gritton .pr_ref = 1, 1040304c731SJamie Gritton .pr_uref = 1, 1050304c731SJamie Gritton .pr_path = "/", 1060304c731SJamie Gritton .pr_securelevel = -1, 1070cc207a6SMartin Matuska .pr_devfs_rsnum = 0, 1081158508aSJamie Gritton .pr_state = PRISON_STATE_ALIVE, 109b97457e2SJamie Gritton .pr_childmax = JAIL_MAX, 1108986e3a0SJamie Gritton .pr_hostuuid = DEFAULT_HOSTUUID, 11113e403fdSAntoine Brodin .pr_children = LIST_HEAD_INITIALIZER(prison0.pr_children), 112eb79e1c7SBjoern A. Zeeb #ifdef VIMAGE 113592bcae8SBjoern A. Zeeb .pr_flags = PR_HOST|PR_VNET|_PR_IP_SADDRSEL, 114eb79e1c7SBjoern A. Zeeb #else 115592bcae8SBjoern A. Zeeb .pr_flags = PR_HOST|_PR_IP_SADDRSEL, 116eb79e1c7SBjoern A. Zeeb #endif 1170e5c6bd4SJamie Gritton .pr_allow = PR_ALLOW_ALL_STATIC, 1180304c731SJamie Gritton }; 1190304c731SJamie Gritton MTX_SYSINIT(prison0, &prison0.pr_mtx, "jail mutex", MTX_DEF); 12083f1e257SRobert Watson 121672756aaSJamie Gritton struct bool_flags { 122672756aaSJamie Gritton const char *name; 123672756aaSJamie Gritton const char *noname; 1245d58f959SJamie Gritton volatile u_int flag; 125672756aaSJamie Gritton }; 126672756aaSJamie Gritton struct jailsys_flags { 127672756aaSJamie Gritton const char *name; 128672756aaSJamie Gritton unsigned disable; 129672756aaSJamie Gritton unsigned new; 130672756aaSJamie Gritton }; 131672756aaSJamie Gritton 132a7ad07bfSEdward Tomasz Napierala /* allprison, allprison_racct and lastprid are protected by allprison_lock. 
*/ 133dc68a633SPawel Jakub Dawidek struct sx allprison_lock; 134b38ff370SJamie Gritton SX_SYSINIT(allprison_lock, &allprison_lock, "allprison"); 135b38ff370SJamie Gritton struct prisonlist allprison = TAILQ_HEAD_INITIALIZER(allprison); 136a7ad07bfSEdward Tomasz Napierala LIST_HEAD(, prison_racct) allprison_racct; 1372110d913SXin LI int lastprid = 0; 138fd7a8150SMike Barcroft 1397de883c8SJamie Gritton static int get_next_prid(struct prison **insprp); 140f7496dcaSJamie Gritton static int do_jail_attach(struct thread *td, struct prison *pr, int drflags); 141b3059e09SRobert Watson static void prison_complete(void *context, int pending); 142b38ff370SJamie Gritton static void prison_deref(struct prison *pr, int flags); 143c861373bSJamie Gritton static void prison_deref_kill(struct prison *pr, struct prisonlist *freeprison); 144f7496dcaSJamie Gritton static int prison_lock_xlock(struct prison *pr, int flags); 145f7496dcaSJamie Gritton static void prison_free_not_last(struct prison *pr); 146c861373bSJamie Gritton static void prison_proc_free_not_last(struct prison *pr); 1470fe74ae6SJamie Gritton static void prison_set_allow_locked(struct prison *pr, unsigned flag, 1480fe74ae6SJamie Gritton int enable); 1490304c731SJamie Gritton static char *prison_path(struct prison *pr1, struct prison *pr2); 150a7ad07bfSEdward Tomasz Napierala #ifdef RACCT 151a7ad07bfSEdward Tomasz Napierala static void prison_racct_attach(struct prison *pr); 152c34bbd2aSEdward Tomasz Napierala static void prison_racct_modify(struct prison *pr); 153a7ad07bfSEdward Tomasz Napierala static void prison_racct_detach(struct prison *pr); 154a7ad07bfSEdward Tomasz Napierala #endif 155fd7a8150SMike Barcroft 156b38ff370SJamie Gritton /* Flags for prison_deref */ 1572a4b2251SJamie Gritton #define PD_DEREF 0x01 /* Decrement pr_ref */ 1582a4b2251SJamie Gritton #define PD_DEUREF 0x02 /* Decrement pr_uref */ 159c861373bSJamie Gritton #define PD_KILL 0x04 /* Remove jail, kill processes, etc */ 160c861373bSJamie Gritton 
#define PD_LOCKED 0x10 /* pr_mtx is held */ 161c861373bSJamie Gritton #define PD_LIST_SLOCKED 0x20 /* allprison_lock is held shared */ 162c861373bSJamie Gritton #define PD_LIST_XLOCKED 0x40 /* allprison_lock is held exclusive */ 163589e4c1dSJamie Gritton #define PD_OP_FLAGS 0x07 /* Operation flags */ 164589e4c1dSJamie Gritton #define PD_LOCK_FLAGS 0x70 /* Lock status flags */ 165fd7a8150SMike Barcroft 1660304c731SJamie Gritton /* 1675cc70397SBjoern A. Zeeb * Parameter names corresponding to PR_* flag values. Size values are for kvm 1685cc70397SBjoern A. Zeeb * as we cannot figure out the size of a sparse array, or an array without a 1695cc70397SBjoern A. Zeeb * terminating entry. 1700304c731SJamie Gritton */ 171672756aaSJamie Gritton static struct bool_flags pr_flag_bool[] = { 172672756aaSJamie Gritton {"persist", "nopersist", PR_PERSIST}, 173592bcae8SBjoern A. Zeeb #ifdef INET 174672756aaSJamie Gritton {"ip4.saddrsel", "ip4.nosaddrsel", PR_IP4_SADDRSEL}, 175592bcae8SBjoern A. Zeeb #endif 176592bcae8SBjoern A. Zeeb #ifdef INET6 177672756aaSJamie Gritton {"ip6.saddrsel", "ip6.nosaddrsel", PR_IP6_SADDRSEL}, 178592bcae8SBjoern A. Zeeb #endif 1790304c731SJamie Gritton }; 180672756aaSJamie Gritton const size_t pr_flag_bool_size = sizeof(pr_flag_bool); 1810304c731SJamie Gritton 182672756aaSJamie Gritton static struct jailsys_flags pr_flag_jailsys[] = { 1837cbf7213SJamie Gritton {"host", 0, PR_HOST}, 1847cbf7213SJamie Gritton #ifdef VIMAGE 1857cbf7213SJamie Gritton {"vnet", 0, PR_VNET}, 1867cbf7213SJamie Gritton #endif 1870304c731SJamie Gritton #ifdef INET 1886a3f2779SJamie Gritton {"ip4", PR_IP4_USER, PR_IP4_USER}, 1890304c731SJamie Gritton #endif 1900304c731SJamie Gritton #ifdef INET6 1916a3f2779SJamie Gritton {"ip6", PR_IP6_USER, PR_IP6_USER}, 192679e1390SJamie Gritton #endif 1930304c731SJamie Gritton }; 1945cc70397SBjoern A. 
Zeeb const size_t pr_flag_jailsys_size = sizeof(pr_flag_jailsys); 1950304c731SJamie Gritton 1965d58f959SJamie Gritton /* 1975d58f959SJamie Gritton * Make this array full-size so dynamic parameters can be added. 1985d58f959SJamie Gritton * It is protected by prison0.mtx, but lockless reading is allowed 1995d58f959SJamie Gritton * with an atomic check of the flag values. 2005d58f959SJamie Gritton */ 2010e5c6bd4SJamie Gritton static struct bool_flags pr_flag_allow[NBBY * NBPW] = { 202672756aaSJamie Gritton {"allow.set_hostname", "allow.noset_hostname", PR_ALLOW_SET_HOSTNAME}, 203672756aaSJamie Gritton {"allow.sysvipc", "allow.nosysvipc", PR_ALLOW_SYSVIPC}, 204672756aaSJamie Gritton {"allow.raw_sockets", "allow.noraw_sockets", PR_ALLOW_RAW_SOCKETS}, 205672756aaSJamie Gritton {"allow.chflags", "allow.nochflags", PR_ALLOW_CHFLAGS}, 206672756aaSJamie Gritton {"allow.mount", "allow.nomount", PR_ALLOW_MOUNT}, 207672756aaSJamie Gritton {"allow.quotas", "allow.noquotas", PR_ALLOW_QUOTAS}, 208672756aaSJamie Gritton {"allow.socket_af", "allow.nosocket_af", PR_ALLOW_SOCKET_AF}, 209ccd6ac9fSAntoine Brodin {"allow.mlock", "allow.nomlock", PR_ALLOW_MLOCK}, 210672756aaSJamie Gritton {"allow.reserved_ports", "allow.noreserved_ports", 211672756aaSJamie Gritton PR_ALLOW_RESERVED_PORTS}, 212b19d66fdSJamie Gritton {"allow.read_msgbuf", "allow.noread_msgbuf", PR_ALLOW_READ_MSGBUF}, 213b3079544SJamie Gritton {"allow.unprivileged_proc_debug", "allow.nounprivileged_proc_debug", 214b3079544SJamie Gritton PR_ALLOW_UNPRIV_DEBUG}, 21505e1e482SMariusz Zaborski {"allow.suser", "allow.nosuser", PR_ALLOW_SUSER}, 2160304c731SJamie Gritton }; 2175d58f959SJamie Gritton static unsigned pr_allow_all = PR_ALLOW_ALL_STATIC; 218672756aaSJamie Gritton const size_t pr_flag_allow_size = sizeof(pr_flag_allow); 2190304c731SJamie Gritton 220b3079544SJamie Gritton #define JAIL_DEFAULT_ALLOW (PR_ALLOW_SET_HOSTNAME | \ 221b3079544SJamie Gritton PR_ALLOW_RESERVED_PORTS | \ 22205e1e482SMariusz Zaborski 
PR_ALLOW_UNPRIV_DEBUG | \ 22305e1e482SMariusz Zaborski PR_ALLOW_SUSER) 22442bebd82SJamie Gritton #define JAIL_DEFAULT_ENFORCE_STATFS 2 225bf3db8aaSMartin Matuska #define JAIL_DEFAULT_DEVFS_RSNUM 0 2260304c731SJamie Gritton static unsigned jail_default_allow = JAIL_DEFAULT_ALLOW; 22742bebd82SJamie Gritton static int jail_default_enforce_statfs = JAIL_DEFAULT_ENFORCE_STATFS; 2280cc207a6SMartin Matuska static int jail_default_devfs_rsnum = JAIL_DEFAULT_DEVFS_RSNUM; 2290304c731SJamie Gritton #if defined(INET) || defined(INET6) 230e92e0574SJamie Gritton static unsigned jail_max_af_ips = 255; 2310304c731SJamie Gritton #endif 2320304c731SJamie Gritton 233b96bd95bSIan Lepore /* 234b96bd95bSIan Lepore * Initialize the parts of prison0 that can't be static-initialized with 235b96bd95bSIan Lepore * constants. This is called from proc0_init() after creating thread0 cpuset. 236b96bd95bSIan Lepore */ 237b96bd95bSIan Lepore void 238b96bd95bSIan Lepore prison0_init(void) 239b96bd95bSIan Lepore { 240c3188289SKyle Evans uint8_t *file, *data; 241c3188289SKyle Evans size_t size; 242b96bd95bSIan Lepore 243b96bd95bSIan Lepore prison0.pr_cpuset = cpuset_ref(thread0.td_cpuset); 244b96bd95bSIan Lepore prison0.pr_osreldate = osreldate; 245b96bd95bSIan Lepore strlcpy(prison0.pr_osrelease, osrelease, sizeof(prison0.pr_osrelease)); 246c3188289SKyle Evans 247c3188289SKyle Evans /* If we have a preloaded hostuuid, use it. */ 248c3188289SKyle Evans file = preload_search_by_type(PRISON0_HOSTUUID_MODULE); 249c3188289SKyle Evans if (file != NULL) { 250c3188289SKyle Evans data = preload_fetch_addr(file); 251c3188289SKyle Evans size = preload_fetch_size(file); 252c3188289SKyle Evans if (data != NULL) { 253c3188289SKyle Evans /* 254c3188289SKyle Evans * The preloaded data may include trailing whitespace, almost 255c3188289SKyle Evans * certainly a newline; skip over any whitespace or 256c3188289SKyle Evans * non-printable characters to be safe. 
257c3188289SKyle Evans */ 258c3188289SKyle Evans while (size > 0 && data[size - 1] <= 0x20) { 259b6be9566SColin Percival size--; 260c3188289SKyle Evans } 261c3188289SKyle Evans if (validate_uuid(data, size, NULL, 0) == 0) { 262c3188289SKyle Evans (void)strlcpy(prison0.pr_hostuuid, data, 263c3188289SKyle Evans size + 1); 264c3188289SKyle Evans } else if (bootverbose) { 265330f110bSColin Percival printf("hostuuid: preload data malformed: '%.*s'\n", 266330f110bSColin Percival (int)size, data); 267c3188289SKyle Evans } 268c3188289SKyle Evans } 269c3188289SKyle Evans } 270c3188289SKyle Evans if (bootverbose) 271c3188289SKyle Evans printf("hostuuid: using %s\n", prison0.pr_hostuuid); 272b96bd95bSIan Lepore } 273b96bd95bSIan Lepore 274116734c4SMatthew Dillon /* 2759ddb7954SMike Barcroft * struct jail_args { 2769ddb7954SMike Barcroft * struct jail *jail; 2779ddb7954SMike Barcroft * }; 278116734c4SMatthew Dillon */ 27975c13541SPoul-Henning Kamp int 280c542c43eSJamie Gritton sys_jail(struct thread *td, struct jail_args *uap) 28175c13541SPoul-Henning Kamp { 282413628a7SBjoern A. Zeeb uint32_t version; 283413628a7SBjoern A. Zeeb int error; 2840304c731SJamie Gritton struct jail j; 285413628a7SBjoern A. Zeeb 286413628a7SBjoern A. Zeeb error = copyin(uap->jail, &version, sizeof(uint32_t)); 287413628a7SBjoern A. Zeeb if (error) 288413628a7SBjoern A. Zeeb return (error); 289413628a7SBjoern A. Zeeb 290413628a7SBjoern A. Zeeb switch (version) { 291413628a7SBjoern A. Zeeb case 0: 292413628a7SBjoern A. Zeeb { 293413628a7SBjoern A. Zeeb struct jail_v0 j0; 294413628a7SBjoern A. Zeeb 2950304c731SJamie Gritton /* FreeBSD single IPv4 jails. */ 2960304c731SJamie Gritton bzero(&j, sizeof(struct jail)); 297413628a7SBjoern A. Zeeb error = copyin(uap->jail, &j0, sizeof(struct jail_v0)); 298413628a7SBjoern A. Zeeb if (error) 299413628a7SBjoern A. 
Zeeb return (error); 3000304c731SJamie Gritton j.version = j0.version; 3010304c731SJamie Gritton j.path = j0.path; 3020304c731SJamie Gritton j.hostname = j0.hostname; 303b5019bc4SPeter Wemm j.ip4s = htonl(j0.ip_number); /* jail_v0 is host order */ 304413628a7SBjoern A. Zeeb break; 305413628a7SBjoern A. Zeeb } 306413628a7SBjoern A. Zeeb 307413628a7SBjoern A. Zeeb case 1: 308413628a7SBjoern A. Zeeb /* 309413628a7SBjoern A. Zeeb * Version 1 was used by multi-IPv4 jail implementations 310413628a7SBjoern A. Zeeb * that never made it into the official kernel. 311413628a7SBjoern A. Zeeb */ 312413628a7SBjoern A. Zeeb return (EINVAL); 313413628a7SBjoern A. Zeeb 314413628a7SBjoern A. Zeeb case 2: /* JAIL_API_VERSION */ 315413628a7SBjoern A. Zeeb /* FreeBSD multi-IPv4/IPv6,noIP jails. */ 316413628a7SBjoern A. Zeeb error = copyin(uap->jail, &j, sizeof(struct jail)); 317413628a7SBjoern A. Zeeb if (error) 318413628a7SBjoern A. Zeeb return (error); 3190304c731SJamie Gritton break; 3200304c731SJamie Gritton 3210304c731SJamie Gritton default: 3220304c731SJamie Gritton /* Sci-Fi jails are not supported, sorry. 
*/ 3230304c731SJamie Gritton return (EINVAL); 3240304c731SJamie Gritton } 325c542c43eSJamie Gritton return (kern_jail(td, &j)); 3260304c731SJamie Gritton } 3270304c731SJamie Gritton 3280304c731SJamie Gritton int 329c542c43eSJamie Gritton kern_jail(struct thread *td, struct jail *j) 3300304c731SJamie Gritton { 331c542c43eSJamie Gritton struct iovec optiov[2 * (4 + nitems(pr_flag_allow) 332e92e0574SJamie Gritton #ifdef INET 333e92e0574SJamie Gritton + 1 334e92e0574SJamie Gritton #endif 335e92e0574SJamie Gritton #ifdef INET6 336e92e0574SJamie Gritton + 1 337e92e0574SJamie Gritton #endif 338e92e0574SJamie Gritton )]; 3390304c731SJamie Gritton struct uio opt; 3400304c731SJamie Gritton char *u_path, *u_hostname, *u_name; 341672756aaSJamie Gritton struct bool_flags *bf; 3420304c731SJamie Gritton #ifdef INET 343e92e0574SJamie Gritton uint32_t ip4s; 3440304c731SJamie Gritton struct in_addr *u_ip4; 3450304c731SJamie Gritton #endif 3460304c731SJamie Gritton #ifdef INET6 3470304c731SJamie Gritton struct in6_addr *u_ip6; 3480304c731SJamie Gritton #endif 3490304c731SJamie Gritton size_t tmplen; 350c542c43eSJamie Gritton int error, enforce_statfs; 3510304c731SJamie Gritton 3520304c731SJamie Gritton bzero(&optiov, sizeof(optiov)); 3530304c731SJamie Gritton opt.uio_iov = optiov; 3540304c731SJamie Gritton opt.uio_iovcnt = 0; 3550304c731SJamie Gritton opt.uio_offset = -1; 3560304c731SJamie Gritton opt.uio_resid = -1; 3570304c731SJamie Gritton opt.uio_segflg = UIO_SYSSPACE; 3580304c731SJamie Gritton opt.uio_rw = UIO_READ; 3590304c731SJamie Gritton opt.uio_td = td; 3600304c731SJamie Gritton 3610304c731SJamie Gritton /* Set permissions for top-level jails from sysctls. 
*/ 3620304c731SJamie Gritton if (!jailed(td->td_ucred)) { 363672756aaSJamie Gritton for (bf = pr_flag_allow; 3640e5c6bd4SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && 3655d58f959SJamie Gritton atomic_load_int(&bf->flag) != 0; 366672756aaSJamie Gritton bf++) { 367672756aaSJamie Gritton optiov[opt.uio_iovcnt].iov_base = __DECONST(char *, 368672756aaSJamie Gritton (jail_default_allow & bf->flag) 369672756aaSJamie Gritton ? bf->name : bf->noname); 3700304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = 3710304c731SJamie Gritton strlen(optiov[opt.uio_iovcnt].iov_base) + 1; 3720304c731SJamie Gritton opt.uio_iovcnt += 2; 3730304c731SJamie Gritton } 3740304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "enforce_statfs"; 3750304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("enforce_statfs"); 3760304c731SJamie Gritton opt.uio_iovcnt++; 3770304c731SJamie Gritton enforce_statfs = jail_default_enforce_statfs; 3780304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = &enforce_statfs; 3790304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof(enforce_statfs); 3800304c731SJamie Gritton opt.uio_iovcnt++; 3810304c731SJamie Gritton } 3820304c731SJamie Gritton 383b38ff370SJamie Gritton tmplen = MAXPATHLEN + MAXHOSTNAMELEN + MAXHOSTNAMELEN; 384b38ff370SJamie Gritton #ifdef INET 3850304c731SJamie Gritton ip4s = (j->version == 0) ? 
1 : j->ip4s; 3860304c731SJamie Gritton if (ip4s > jail_max_af_ips) 387b38ff370SJamie Gritton return (EINVAL); 3880304c731SJamie Gritton tmplen += ip4s * sizeof(struct in_addr); 389b38ff370SJamie Gritton #else 3900304c731SJamie Gritton if (j->ip4s > 0) 391b38ff370SJamie Gritton return (EINVAL); 392b38ff370SJamie Gritton #endif 393b38ff370SJamie Gritton #ifdef INET6 3940304c731SJamie Gritton if (j->ip6s > jail_max_af_ips) 395b38ff370SJamie Gritton return (EINVAL); 3960304c731SJamie Gritton tmplen += j->ip6s * sizeof(struct in6_addr); 397b38ff370SJamie Gritton #else 3980304c731SJamie Gritton if (j->ip6s > 0) 399b38ff370SJamie Gritton return (EINVAL); 400b38ff370SJamie Gritton #endif 401b38ff370SJamie Gritton u_path = malloc(tmplen, M_TEMP, M_WAITOK); 402b38ff370SJamie Gritton u_hostname = u_path + MAXPATHLEN; 403b38ff370SJamie Gritton u_name = u_hostname + MAXHOSTNAMELEN; 404b38ff370SJamie Gritton #ifdef INET 405b38ff370SJamie Gritton u_ip4 = (struct in_addr *)(u_name + MAXHOSTNAMELEN); 406b38ff370SJamie Gritton #endif 407b38ff370SJamie Gritton #ifdef INET6 408b38ff370SJamie Gritton #ifdef INET 4090304c731SJamie Gritton u_ip6 = (struct in6_addr *)(u_ip4 + ip4s); 410b38ff370SJamie Gritton #else 411b38ff370SJamie Gritton u_ip6 = (struct in6_addr *)(u_name + MAXHOSTNAMELEN); 412b38ff370SJamie Gritton #endif 413b38ff370SJamie Gritton #endif 4140304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "path"; 4150304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("path"); 4160304c731SJamie Gritton opt.uio_iovcnt++; 4170304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_path; 4180304c731SJamie Gritton error = copyinstr(j->path, u_path, MAXPATHLEN, 4190304c731SJamie Gritton &optiov[opt.uio_iovcnt].iov_len); 420b38ff370SJamie Gritton if (error) { 421b38ff370SJamie Gritton free(u_path, M_TEMP); 422b38ff370SJamie Gritton return (error); 423b38ff370SJamie Gritton } 4240304c731SJamie Gritton opt.uio_iovcnt++; 4250304c731SJamie Gritton 
optiov[opt.uio_iovcnt].iov_base = "host.hostname"; 4260304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("host.hostname"); 4270304c731SJamie Gritton opt.uio_iovcnt++; 4280304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_hostname; 4290304c731SJamie Gritton error = copyinstr(j->hostname, u_hostname, MAXHOSTNAMELEN, 4300304c731SJamie Gritton &optiov[opt.uio_iovcnt].iov_len); 431b38ff370SJamie Gritton if (error) { 432b38ff370SJamie Gritton free(u_path, M_TEMP); 433b38ff370SJamie Gritton return (error); 434b38ff370SJamie Gritton } 4350304c731SJamie Gritton opt.uio_iovcnt++; 4360304c731SJamie Gritton if (j->jailname != NULL) { 437b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "name"; 438b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("name"); 439b38ff370SJamie Gritton opt.uio_iovcnt++; 440b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_name; 4410304c731SJamie Gritton error = copyinstr(j->jailname, u_name, MAXHOSTNAMELEN, 442b38ff370SJamie Gritton &optiov[opt.uio_iovcnt].iov_len); 443b38ff370SJamie Gritton if (error) { 444b38ff370SJamie Gritton free(u_path, M_TEMP); 445b38ff370SJamie Gritton return (error); 446b38ff370SJamie Gritton } 447b38ff370SJamie Gritton opt.uio_iovcnt++; 448b38ff370SJamie Gritton } 449b38ff370SJamie Gritton #ifdef INET 450b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "ip4.addr"; 451b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("ip4.addr"); 452b38ff370SJamie Gritton opt.uio_iovcnt++; 453b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_ip4; 4540304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = ip4s * sizeof(struct in_addr); 4550304c731SJamie Gritton if (j->version == 0) 4560304c731SJamie Gritton u_ip4->s_addr = j->ip4s; 4570304c731SJamie Gritton else { 4580304c731SJamie Gritton error = copyin(j->ip4, u_ip4, optiov[opt.uio_iovcnt].iov_len); 459b38ff370SJamie Gritton if (error) { 460b38ff370SJamie Gritton free(u_path, M_TEMP); 461b38ff370SJamie Gritton 
return (error); 462b38ff370SJamie Gritton } 4630304c731SJamie Gritton } 464b38ff370SJamie Gritton opt.uio_iovcnt++; 465b38ff370SJamie Gritton #endif 466b38ff370SJamie Gritton #ifdef INET6 467b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = "ip6.addr"; 468b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_len = sizeof("ip6.addr"); 469b38ff370SJamie Gritton opt.uio_iovcnt++; 470b38ff370SJamie Gritton optiov[opt.uio_iovcnt].iov_base = u_ip6; 4710304c731SJamie Gritton optiov[opt.uio_iovcnt].iov_len = j->ip6s * sizeof(struct in6_addr); 4720304c731SJamie Gritton error = copyin(j->ip6, u_ip6, optiov[opt.uio_iovcnt].iov_len); 473b38ff370SJamie Gritton if (error) { 474b38ff370SJamie Gritton free(u_path, M_TEMP); 475b38ff370SJamie Gritton return (error); 476b38ff370SJamie Gritton } 477b38ff370SJamie Gritton opt.uio_iovcnt++; 478b38ff370SJamie Gritton #endif 47902abd400SPedro F. Giffuni KASSERT(opt.uio_iovcnt <= nitems(optiov), 4800304c731SJamie Gritton ("kern_jail: too many iovecs (%d)", opt.uio_iovcnt)); 481b38ff370SJamie Gritton error = kern_jail_set(td, &opt, JAIL_CREATE | JAIL_ATTACH); 482b38ff370SJamie Gritton free(u_path, M_TEMP); 483b38ff370SJamie Gritton return (error); 484b38ff370SJamie Gritton } 485b38ff370SJamie Gritton 486b38ff370SJamie Gritton /* 487b38ff370SJamie Gritton * struct jail_set_args { 488b38ff370SJamie Gritton * struct iovec *iovp; 489b38ff370SJamie Gritton * unsigned int iovcnt; 490b38ff370SJamie Gritton * int flags; 491b38ff370SJamie Gritton * }; 492b38ff370SJamie Gritton */ 493b38ff370SJamie Gritton int 4948451d0ddSKip Macy sys_jail_set(struct thread *td, struct jail_set_args *uap) 495b38ff370SJamie Gritton { 496b38ff370SJamie Gritton struct uio *auio; 497b38ff370SJamie Gritton int error; 498b38ff370SJamie Gritton 499b38ff370SJamie Gritton /* Check that we have an even number of iovecs. 
*/ 500b38ff370SJamie Gritton if (uap->iovcnt & 1) 501b38ff370SJamie Gritton return (EINVAL); 502b38ff370SJamie Gritton 503b38ff370SJamie Gritton error = copyinuio(uap->iovp, uap->iovcnt, &auio); 504b38ff370SJamie Gritton if (error) 505b38ff370SJamie Gritton return (error); 506b38ff370SJamie Gritton error = kern_jail_set(td, auio, uap->flags); 507b38ff370SJamie Gritton free(auio, M_IOV); 508b38ff370SJamie Gritton return (error); 509413628a7SBjoern A. Zeeb } 510413628a7SBjoern A. Zeeb 511413628a7SBjoern A. Zeeb int 512b38ff370SJamie Gritton kern_jail_set(struct thread *td, struct uio *optuio, int flags) 513413628a7SBjoern A. Zeeb { 514fd7a8150SMike Barcroft struct nameidata nd; 515b38ff370SJamie Gritton #ifdef INET 516b38ff370SJamie Gritton struct in_addr *ip4; 517413628a7SBjoern A. Zeeb #endif 518b38ff370SJamie Gritton #ifdef INET6 519b38ff370SJamie Gritton struct in6_addr *ip6; 520b38ff370SJamie Gritton #endif 521b38ff370SJamie Gritton struct vfsopt *opt; 522b38ff370SJamie Gritton struct vfsoptlist *opts; 5237de883c8SJamie Gritton struct prison *pr, *deadpr, *inspr, *mypr, *ppr, *tpr; 524b38ff370SJamie Gritton struct vnode *root; 525babbbb9cSJamie Gritton char *domain, *errmsg, *host, *name, *namelc, *p, *path, *uuid; 526b96bd95bSIan Lepore char *g_path, *osrelstr; 527672756aaSJamie Gritton struct bool_flags *bf; 528672756aaSJamie Gritton struct jailsys_flags *jsf; 5290304c731SJamie Gritton #if defined(INET) || defined(INET6) 53057aea6dfSBjoern A. 
Zeeb struct prison *tppr; 531b38ff370SJamie Gritton void *op; 5320304c731SJamie Gritton #endif 53376ca6f88SJamie Gritton unsigned long hid; 534b6f47c23SJamie Gritton size_t namelen, onamelen, pnamelen; 5352a4b2251SJamie Gritton int born, created, cuflags, descend, drflags, enforce; 536cc5fd8c7SJamie Gritton int error, errmsg_len, errmsg_pos; 5370cc207a6SMartin Matuska int gotchildmax, gotenforce, gothid, gotrsnum, gotslevel; 538672756aaSJamie Gritton int jid, jsys, len, level; 539b96bd95bSIan Lepore int childmax, osreldt, rsnum, slevel; 540d465a41dSBjoern A. Zeeb #if defined(INET) || defined(INET6) 5410304c731SJamie Gritton int ii, ij; 542413628a7SBjoern A. Zeeb #endif 543413628a7SBjoern A. Zeeb #ifdef INET 5442b0d6f81SJamie Gritton int ip4s, redo_ip4; 545413628a7SBjoern A. Zeeb #endif 546b38ff370SJamie Gritton #ifdef INET6 5472b0d6f81SJamie Gritton int ip6s, redo_ip6; 548b38ff370SJamie Gritton #endif 5496beb3bb4SKirk McKusick uint64_t pr_allow, ch_allow, pr_flags, ch_flags; 550b3079544SJamie Gritton uint64_t pr_allow_diff; 5516beb3bb4SKirk McKusick unsigned tallow; 552b38ff370SJamie Gritton char numbuf[12]; 553b38ff370SJamie Gritton 554b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_SET); 555b38ff370SJamie Gritton if (!error && (flags & JAIL_ATTACH)) 556b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_ATTACH); 557b38ff370SJamie Gritton if (error) 55875c13541SPoul-Henning Kamp return (error); 559b6f47c23SJamie Gritton mypr = td->td_ucred->cr_prison; 560b97457e2SJamie Gritton if ((flags & JAIL_CREATE) && mypr->pr_childmax == 0) 5610304c731SJamie Gritton return (EPERM); 562b38ff370SJamie Gritton if (flags & ~JAIL_SET_MASK) 563b38ff370SJamie Gritton return (EINVAL); 564b38ff370SJamie Gritton 565b38ff370SJamie Gritton /* 566b38ff370SJamie Gritton * Check all the parameters before committing to anything. Not all 567b38ff370SJamie Gritton * errors can be caught early, but we may as well try. 
Also, this 568b38ff370SJamie Gritton * takes care of some expensive stuff (path lookup) before getting 569b38ff370SJamie Gritton * the allprison lock. 570b38ff370SJamie Gritton * 571b38ff370SJamie Gritton * XXX Jails are not filesystems, and jail parameters are not mount 572b38ff370SJamie Gritton * options. But it makes more sense to re-use the vfsopt code 573b38ff370SJamie Gritton * than duplicate it under a different name. 574b38ff370SJamie Gritton */ 575b38ff370SJamie Gritton error = vfs_buildopts(optuio, &opts); 576b38ff370SJamie Gritton if (error) 577b38ff370SJamie Gritton return (error); 578b38ff370SJamie Gritton #ifdef INET 579b38ff370SJamie Gritton ip4 = NULL; 580b38ff370SJamie Gritton #endif 581b38ff370SJamie Gritton #ifdef INET6 582b38ff370SJamie Gritton ip6 = NULL; 583b38ff370SJamie Gritton #endif 5846dfe0a3dSMartin Matuska g_path = NULL; 585b38ff370SJamie Gritton 586b6f47c23SJamie Gritton cuflags = flags & (JAIL_CREATE | JAIL_UPDATE); 587b6f47c23SJamie Gritton if (!cuflags) { 588b6f47c23SJamie Gritton error = EINVAL; 589b6f47c23SJamie Gritton vfs_opterror(opts, "no valid operation (create or update)"); 590b6f47c23SJamie Gritton goto done_errmsg; 591b6f47c23SJamie Gritton } 592b6f47c23SJamie Gritton 593b38ff370SJamie Gritton error = vfs_copyopt(opts, "jid", &jid, sizeof(jid)); 594b38ff370SJamie Gritton if (error == ENOENT) 595b38ff370SJamie Gritton jid = 0; 596b38ff370SJamie Gritton else if (error != 0) 597b38ff370SJamie Gritton goto done_free; 598b38ff370SJamie Gritton 599b38ff370SJamie Gritton error = vfs_copyopt(opts, "securelevel", &slevel, sizeof(slevel)); 600b38ff370SJamie Gritton if (error == ENOENT) 601b38ff370SJamie Gritton gotslevel = 0; 602b38ff370SJamie Gritton else if (error != 0) 603b38ff370SJamie Gritton goto done_free; 604b38ff370SJamie Gritton else 605b38ff370SJamie Gritton gotslevel = 1; 606b38ff370SJamie Gritton 607b97457e2SJamie Gritton error = 608b97457e2SJamie Gritton vfs_copyopt(opts, "children.max", &childmax, sizeof(childmax)); 
609b97457e2SJamie Gritton if (error == ENOENT) 610b97457e2SJamie Gritton gotchildmax = 0; 611b97457e2SJamie Gritton else if (error != 0) 612b97457e2SJamie Gritton goto done_free; 613b97457e2SJamie Gritton else 614b97457e2SJamie Gritton gotchildmax = 1; 615b97457e2SJamie Gritton 6160304c731SJamie Gritton error = vfs_copyopt(opts, "enforce_statfs", &enforce, sizeof(enforce)); 617f337198dSJamie Gritton if (error == ENOENT) 618f337198dSJamie Gritton gotenforce = 0; 619f337198dSJamie Gritton else if (error != 0) 6200304c731SJamie Gritton goto done_free; 621f337198dSJamie Gritton else if (enforce < 0 || enforce > 2) { 622f337198dSJamie Gritton error = EINVAL; 623f337198dSJamie Gritton goto done_free; 624f337198dSJamie Gritton } else 625f337198dSJamie Gritton gotenforce = 1; 6260304c731SJamie Gritton 6270cc207a6SMartin Matuska error = vfs_copyopt(opts, "devfs_ruleset", &rsnum, sizeof(rsnum)); 6280cc207a6SMartin Matuska if (error == ENOENT) 6290cc207a6SMartin Matuska gotrsnum = 0; 6300cc207a6SMartin Matuska else if (error != 0) 6310cc207a6SMartin Matuska goto done_free; 6320cc207a6SMartin Matuska else 6330cc207a6SMartin Matuska gotrsnum = 1; 6340cc207a6SMartin Matuska 635b38ff370SJamie Gritton pr_flags = ch_flags = 0; 636672756aaSJamie Gritton for (bf = pr_flag_bool; 637672756aaSJamie Gritton bf < pr_flag_bool + nitems(pr_flag_bool); 638672756aaSJamie Gritton bf++) { 639672756aaSJamie Gritton vfs_flagopt(opts, bf->name, &pr_flags, bf->flag); 640672756aaSJamie Gritton vfs_flagopt(opts, bf->noname, &ch_flags, bf->flag); 6410304c731SJamie Gritton } 642b38ff370SJamie Gritton ch_flags |= pr_flags; 643672756aaSJamie Gritton for (jsf = pr_flag_jailsys; 644672756aaSJamie Gritton jsf < pr_flag_jailsys + nitems(pr_flag_jailsys); 645672756aaSJamie Gritton jsf++) { 646672756aaSJamie Gritton error = vfs_copyopt(opts, jsf->name, &jsys, sizeof(jsys)); 6477cbf7213SJamie Gritton if (error == ENOENT) 6487cbf7213SJamie Gritton continue; 6497cbf7213SJamie Gritton if (error != 0) 
6507cbf7213SJamie Gritton goto done_free; 6517cbf7213SJamie Gritton switch (jsys) { 6527cbf7213SJamie Gritton case JAIL_SYS_DISABLE: 653672756aaSJamie Gritton if (!jsf->disable) { 6547cbf7213SJamie Gritton error = EINVAL; 6557cbf7213SJamie Gritton goto done_free; 6567cbf7213SJamie Gritton } 657672756aaSJamie Gritton pr_flags |= jsf->disable; 6587cbf7213SJamie Gritton break; 6597cbf7213SJamie Gritton case JAIL_SYS_NEW: 660672756aaSJamie Gritton pr_flags |= jsf->new; 6617cbf7213SJamie Gritton break; 6627cbf7213SJamie Gritton case JAIL_SYS_INHERIT: 6637cbf7213SJamie Gritton break; 6647cbf7213SJamie Gritton default: 6657cbf7213SJamie Gritton error = EINVAL; 6667cbf7213SJamie Gritton goto done_free; 6677cbf7213SJamie Gritton } 668672756aaSJamie Gritton ch_flags |= jsf->new | jsf->disable; 6697cbf7213SJamie Gritton } 6701158508aSJamie Gritton if ((flags & (JAIL_CREATE | JAIL_ATTACH)) == JAIL_CREATE 6714affa14cSJamie Gritton && !(pr_flags & PR_PERSIST)) { 6724affa14cSJamie Gritton error = EINVAL; 6734affa14cSJamie Gritton vfs_opterror(opts, "new jail must persist or attach"); 6744affa14cSJamie Gritton goto done_errmsg; 6754affa14cSJamie Gritton } 676679e1390SJamie Gritton #ifdef VIMAGE 677679e1390SJamie Gritton if ((flags & JAIL_UPDATE) && (ch_flags & PR_VNET)) { 678679e1390SJamie Gritton error = EINVAL; 679679e1390SJamie Gritton vfs_opterror(opts, "vnet cannot be changed after creation"); 680679e1390SJamie Gritton goto done_errmsg; 681679e1390SJamie Gritton } 682679e1390SJamie Gritton #endif 6832b0d6f81SJamie Gritton #ifdef INET 6842b0d6f81SJamie Gritton if ((flags & JAIL_UPDATE) && (ch_flags & PR_IP4_USER)) { 6852b0d6f81SJamie Gritton error = EINVAL; 6862b0d6f81SJamie Gritton vfs_opterror(opts, "ip4 cannot be changed after creation"); 6872b0d6f81SJamie Gritton goto done_errmsg; 6882b0d6f81SJamie Gritton } 6892b0d6f81SJamie Gritton #endif 6902b0d6f81SJamie Gritton #ifdef INET6 6912b0d6f81SJamie Gritton if ((flags & JAIL_UPDATE) && (ch_flags & PR_IP6_USER)) { 
6922b0d6f81SJamie Gritton error = EINVAL; 6932b0d6f81SJamie Gritton vfs_opterror(opts, "ip6 cannot be changed after creation"); 6942b0d6f81SJamie Gritton goto done_errmsg; 6952b0d6f81SJamie Gritton } 6962b0d6f81SJamie Gritton #endif 697b38ff370SJamie Gritton 6980304c731SJamie Gritton pr_allow = ch_allow = 0; 699672756aaSJamie Gritton for (bf = pr_flag_allow; 7005d58f959SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && 7015d58f959SJamie Gritton atomic_load_int(&bf->flag) != 0; 702672756aaSJamie Gritton bf++) { 703672756aaSJamie Gritton vfs_flagopt(opts, bf->name, &pr_allow, bf->flag); 704672756aaSJamie Gritton vfs_flagopt(opts, bf->noname, &ch_allow, bf->flag); 7050304c731SJamie Gritton } 7060304c731SJamie Gritton ch_allow |= pr_allow; 7070304c731SJamie Gritton 708b38ff370SJamie Gritton error = vfs_getopt(opts, "name", (void **)&name, &len); 709b38ff370SJamie Gritton if (error == ENOENT) 710b38ff370SJamie Gritton name = NULL; 711b38ff370SJamie Gritton else if (error != 0) 712b38ff370SJamie Gritton goto done_free; 713b38ff370SJamie Gritton else { 714b38ff370SJamie Gritton if (len == 0 || name[len - 1] != '\0') { 715b38ff370SJamie Gritton error = EINVAL; 716b38ff370SJamie Gritton goto done_free; 717b38ff370SJamie Gritton } 718b38ff370SJamie Gritton if (len > MAXHOSTNAMELEN) { 719b38ff370SJamie Gritton error = ENAMETOOLONG; 720b38ff370SJamie Gritton goto done_free; 721b38ff370SJamie Gritton } 722b38ff370SJamie Gritton } 723b38ff370SJamie Gritton 724b38ff370SJamie Gritton error = vfs_getopt(opts, "host.hostname", (void **)&host, &len); 725b38ff370SJamie Gritton if (error == ENOENT) 726b38ff370SJamie Gritton host = NULL; 727b38ff370SJamie Gritton else if (error != 0) 728b38ff370SJamie Gritton goto done_free; 729b38ff370SJamie Gritton else { 73076ca6f88SJamie Gritton ch_flags |= PR_HOST; 73176ca6f88SJamie Gritton pr_flags |= PR_HOST; 732b38ff370SJamie Gritton if (len == 0 || host[len - 1] != '\0') { 733b38ff370SJamie Gritton error = EINVAL; 734b38ff370SJamie 
Gritton goto done_free; 735b38ff370SJamie Gritton } 736b38ff370SJamie Gritton if (len > MAXHOSTNAMELEN) { 737b38ff370SJamie Gritton error = ENAMETOOLONG; 738b38ff370SJamie Gritton goto done_free; 739b38ff370SJamie Gritton } 740b38ff370SJamie Gritton } 741b38ff370SJamie Gritton 74276ca6f88SJamie Gritton error = vfs_getopt(opts, "host.domainname", (void **)&domain, &len); 74376ca6f88SJamie Gritton if (error == ENOENT) 74476ca6f88SJamie Gritton domain = NULL; 74576ca6f88SJamie Gritton else if (error != 0) 74676ca6f88SJamie Gritton goto done_free; 74776ca6f88SJamie Gritton else { 74876ca6f88SJamie Gritton ch_flags |= PR_HOST; 74976ca6f88SJamie Gritton pr_flags |= PR_HOST; 75076ca6f88SJamie Gritton if (len == 0 || domain[len - 1] != '\0') { 75176ca6f88SJamie Gritton error = EINVAL; 75276ca6f88SJamie Gritton goto done_free; 75376ca6f88SJamie Gritton } 75476ca6f88SJamie Gritton if (len > MAXHOSTNAMELEN) { 75576ca6f88SJamie Gritton error = ENAMETOOLONG; 75676ca6f88SJamie Gritton goto done_free; 75776ca6f88SJamie Gritton } 75876ca6f88SJamie Gritton } 75976ca6f88SJamie Gritton 76076ca6f88SJamie Gritton error = vfs_getopt(opts, "host.hostuuid", (void **)&uuid, &len); 76176ca6f88SJamie Gritton if (error == ENOENT) 76276ca6f88SJamie Gritton uuid = NULL; 76376ca6f88SJamie Gritton else if (error != 0) 76476ca6f88SJamie Gritton goto done_free; 76576ca6f88SJamie Gritton else { 76676ca6f88SJamie Gritton ch_flags |= PR_HOST; 76776ca6f88SJamie Gritton pr_flags |= PR_HOST; 76876ca6f88SJamie Gritton if (len == 0 || uuid[len - 1] != '\0') { 76976ca6f88SJamie Gritton error = EINVAL; 77076ca6f88SJamie Gritton goto done_free; 77176ca6f88SJamie Gritton } 77276ca6f88SJamie Gritton if (len > HOSTUUIDLEN) { 77376ca6f88SJamie Gritton error = ENAMETOOLONG; 77476ca6f88SJamie Gritton goto done_free; 77576ca6f88SJamie Gritton } 77676ca6f88SJamie Gritton } 77776ca6f88SJamie Gritton 778841c0c7eSNathan Whitehorn #ifdef COMPAT_FREEBSD32 779a5c1afadSDmitry Chagin if (SV_PROC_FLAG(td->td_proc, SV_ILP32)) 
{ 78076ca6f88SJamie Gritton uint32_t hid32; 78176ca6f88SJamie Gritton 78276ca6f88SJamie Gritton error = vfs_copyopt(opts, "host.hostid", &hid32, sizeof(hid32)); 78376ca6f88SJamie Gritton hid = hid32; 78476ca6f88SJamie Gritton } else 78576ca6f88SJamie Gritton #endif 78676ca6f88SJamie Gritton error = vfs_copyopt(opts, "host.hostid", &hid, sizeof(hid)); 78776ca6f88SJamie Gritton if (error == ENOENT) 78876ca6f88SJamie Gritton gothid = 0; 78976ca6f88SJamie Gritton else if (error != 0) 79076ca6f88SJamie Gritton goto done_free; 79176ca6f88SJamie Gritton else { 79276ca6f88SJamie Gritton gothid = 1; 79376ca6f88SJamie Gritton ch_flags |= PR_HOST; 79476ca6f88SJamie Gritton pr_flags |= PR_HOST; 79576ca6f88SJamie Gritton } 79676ca6f88SJamie Gritton 797b38ff370SJamie Gritton #ifdef INET 798b38ff370SJamie Gritton error = vfs_getopt(opts, "ip4.addr", &op, &ip4s); 799b38ff370SJamie Gritton if (error == ENOENT) 8000e5e396eSJamie Gritton ip4s = 0; 801b38ff370SJamie Gritton else if (error != 0) 802b38ff370SJamie Gritton goto done_free; 803b38ff370SJamie Gritton else if (ip4s & (sizeof(*ip4) - 1)) { 804b38ff370SJamie Gritton error = EINVAL; 805b38ff370SJamie Gritton goto done_free; 8060304c731SJamie Gritton } else { 8076a3f2779SJamie Gritton ch_flags |= PR_IP4_USER; 8086a3f2779SJamie Gritton pr_flags |= PR_IP4_USER; 8096a3f2779SJamie Gritton if (ip4s > 0) { 810b38ff370SJamie Gritton ip4s /= sizeof(*ip4); 811b38ff370SJamie Gritton if (ip4s > jail_max_af_ips) { 812b38ff370SJamie Gritton error = EINVAL; 813b38ff370SJamie Gritton vfs_opterror(opts, "too many IPv4 addresses"); 814b38ff370SJamie Gritton goto done_errmsg; 815b38ff370SJamie Gritton } 8162b0d6f81SJamie Gritton ip4 = malloc(ip4s * sizeof(*ip4), M_PRISON, M_WAITOK); 817b38ff370SJamie Gritton bcopy(op, ip4, ip4s * sizeof(*ip4)); 818b38ff370SJamie Gritton /* 8190304c731SJamie Gritton * IP addresses are all sorted but ip[0] to preserve 8200304c731SJamie Gritton * the primary IP address as given from userland. 
8210304c731SJamie Gritton * This special IP is used for unbound outgoing 822bef916f9SBjoern A. Zeeb * connections as well for "loopback" traffic in case 823bef916f9SBjoern A. Zeeb * source address selection cannot find any more fitting 824bef916f9SBjoern A. Zeeb * address to connect from. 825b38ff370SJamie Gritton */ 826b38ff370SJamie Gritton if (ip4s > 1) 8270ce1624dSStephen J. Kiernan qsort(ip4 + 1, ip4s - 1, sizeof(*ip4), 8280ce1624dSStephen J. Kiernan prison_qcmp_v4); 829b38ff370SJamie Gritton /* 8300304c731SJamie Gritton * Check for duplicate addresses and do some simple 8310304c731SJamie Gritton * zero and broadcast checks. If users give other bogus 8320304c731SJamie Gritton * addresses it is their problem. 833b38ff370SJamie Gritton * 8340304c731SJamie Gritton * We do not have to care about byte order for these 8350304c731SJamie Gritton * checks so we will do them in NBO. 836b38ff370SJamie Gritton */ 837b38ff370SJamie Gritton for (ii = 0; ii < ip4s; ii++) { 838b38ff370SJamie Gritton if (ip4[ii].s_addr == INADDR_ANY || 839b38ff370SJamie Gritton ip4[ii].s_addr == INADDR_BROADCAST) { 840b38ff370SJamie Gritton error = EINVAL; 841b38ff370SJamie Gritton goto done_free; 842b38ff370SJamie Gritton } 843b38ff370SJamie Gritton if ((ii+1) < ip4s && 844b38ff370SJamie Gritton (ip4[0].s_addr == ip4[ii+1].s_addr || 845b38ff370SJamie Gritton ip4[ii].s_addr == ip4[ii+1].s_addr)) { 846b38ff370SJamie Gritton error = EINVAL; 847b38ff370SJamie Gritton goto done_free; 848b38ff370SJamie Gritton } 849b38ff370SJamie Gritton } 850b38ff370SJamie Gritton } 8510304c731SJamie Gritton } 852b38ff370SJamie Gritton #endif 853b38ff370SJamie Gritton 854b38ff370SJamie Gritton #ifdef INET6 855b38ff370SJamie Gritton error = vfs_getopt(opts, "ip6.addr", &op, &ip6s); 856b38ff370SJamie Gritton if (error == ENOENT) 8570e5e396eSJamie Gritton ip6s = 0; 858b38ff370SJamie Gritton else if (error != 0) 859b38ff370SJamie Gritton goto done_free; 860b38ff370SJamie Gritton else if (ip6s & (sizeof(*ip6) - 1)) { 
861b38ff370SJamie Gritton error = EINVAL; 862b38ff370SJamie Gritton goto done_free; 8630304c731SJamie Gritton } else { 8646a3f2779SJamie Gritton ch_flags |= PR_IP6_USER; 8656a3f2779SJamie Gritton pr_flags |= PR_IP6_USER; 8666a3f2779SJamie Gritton if (ip6s > 0) { 867b38ff370SJamie Gritton ip6s /= sizeof(*ip6); 868b38ff370SJamie Gritton if (ip6s > jail_max_af_ips) { 869b38ff370SJamie Gritton error = EINVAL; 870b38ff370SJamie Gritton vfs_opterror(opts, "too many IPv6 addresses"); 871b38ff370SJamie Gritton goto done_errmsg; 872b38ff370SJamie Gritton } 8732b0d6f81SJamie Gritton ip6 = malloc(ip6s * sizeof(*ip6), M_PRISON, M_WAITOK); 874b38ff370SJamie Gritton bcopy(op, ip6, ip6s * sizeof(*ip6)); 875b38ff370SJamie Gritton if (ip6s > 1) 8760ce1624dSStephen J. Kiernan qsort(ip6 + 1, ip6s - 1, sizeof(*ip6), 8770ce1624dSStephen J. Kiernan prison_qcmp_v6); 878b38ff370SJamie Gritton for (ii = 0; ii < ip6s; ii++) { 8790304c731SJamie Gritton if (IN6_IS_ADDR_UNSPECIFIED(&ip6[ii])) { 880b38ff370SJamie Gritton error = EINVAL; 881b38ff370SJamie Gritton goto done_free; 882b38ff370SJamie Gritton } 883b38ff370SJamie Gritton if ((ii+1) < ip6s && 884b38ff370SJamie Gritton (IN6_ARE_ADDR_EQUAL(&ip6[0], &ip6[ii+1]) || 885b38ff370SJamie Gritton IN6_ARE_ADDR_EQUAL(&ip6[ii], &ip6[ii+1]))) 886b38ff370SJamie Gritton { 887b38ff370SJamie Gritton error = EINVAL; 888b38ff370SJamie Gritton goto done_free; 889b38ff370SJamie Gritton } 890b38ff370SJamie Gritton } 891b38ff370SJamie Gritton } 8920304c731SJamie Gritton } 893b38ff370SJamie Gritton #endif 894b38ff370SJamie Gritton 895bdfc8cc4SJamie Gritton #if defined(VIMAGE) && (defined(INET) || defined(INET6)) 896bdfc8cc4SJamie Gritton if ((ch_flags & PR_VNET) && (ch_flags & (PR_IP4_USER | PR_IP6_USER))) { 897bdfc8cc4SJamie Gritton error = EINVAL; 898bdfc8cc4SJamie Gritton vfs_opterror(opts, 899bdfc8cc4SJamie Gritton "vnet jails cannot have IP address restrictions"); 900bdfc8cc4SJamie Gritton goto done_errmsg; 901bdfc8cc4SJamie Gritton } 902bdfc8cc4SJamie 
Gritton #endif 903bdfc8cc4SJamie Gritton 904cf0313c6SJamie Gritton error = vfs_getopt(opts, "osrelease", (void **)&osrelstr, &len); 905cf0313c6SJamie Gritton if (error == ENOENT) 906cf0313c6SJamie Gritton osrelstr = NULL; 907cf0313c6SJamie Gritton else if (error != 0) 908cf0313c6SJamie Gritton goto done_free; 909cf0313c6SJamie Gritton else { 910cf0313c6SJamie Gritton if (flags & JAIL_UPDATE) { 911cf0313c6SJamie Gritton error = EINVAL; 912cf0313c6SJamie Gritton vfs_opterror(opts, 913cf0313c6SJamie Gritton "osrelease cannot be changed after creation"); 914cf0313c6SJamie Gritton goto done_errmsg; 915cf0313c6SJamie Gritton } 9161b786d01SBjoern A. Zeeb if (len == 0 || osrelstr[len - 1] != '\0') { 917cf0313c6SJamie Gritton error = EINVAL; 9181b786d01SBjoern A. Zeeb goto done_free; 9191b786d01SBjoern A. Zeeb } 9201b786d01SBjoern A. Zeeb if (len >= OSRELEASELEN) { 9211b786d01SBjoern A. Zeeb error = ENAMETOOLONG; 922cf0313c6SJamie Gritton vfs_opterror(opts, 923cf0313c6SJamie Gritton "osrelease string must be 1-%d bytes long", 924cf0313c6SJamie Gritton OSRELEASELEN - 1); 925cf0313c6SJamie Gritton goto done_errmsg; 926cf0313c6SJamie Gritton } 927cf0313c6SJamie Gritton } 928cf0313c6SJamie Gritton 929cf0313c6SJamie Gritton error = vfs_copyopt(opts, "osreldate", &osreldt, sizeof(osreldt)); 930cf0313c6SJamie Gritton if (error == ENOENT) 931cf0313c6SJamie Gritton osreldt = 0; 932cf0313c6SJamie Gritton else if (error != 0) 933cf0313c6SJamie Gritton goto done_free; 934cf0313c6SJamie Gritton else { 935cf0313c6SJamie Gritton if (flags & JAIL_UPDATE) { 936cf0313c6SJamie Gritton error = EINVAL; 937cf0313c6SJamie Gritton vfs_opterror(opts, 938cf0313c6SJamie Gritton "osreldate cannot be changed after creation"); 939cf0313c6SJamie Gritton goto done_errmsg; 940cf0313c6SJamie Gritton } 941cf0313c6SJamie Gritton if (osreldt == 0) { 942cf0313c6SJamie Gritton error = EINVAL; 943cf0313c6SJamie Gritton vfs_opterror(opts, "osreldate cannot be 0"); 944cf0313c6SJamie Gritton goto done_errmsg; 
945cf0313c6SJamie Gritton } 946cf0313c6SJamie Gritton } 947cf0313c6SJamie Gritton 948b38ff370SJamie Gritton root = NULL; 949b38ff370SJamie Gritton error = vfs_getopt(opts, "path", (void **)&path, &len); 950b38ff370SJamie Gritton if (error == ENOENT) 951b38ff370SJamie Gritton path = NULL; 952b38ff370SJamie Gritton else if (error != 0) 953b38ff370SJamie Gritton goto done_free; 954b38ff370SJamie Gritton else { 955b38ff370SJamie Gritton if (flags & JAIL_UPDATE) { 956b38ff370SJamie Gritton error = EINVAL; 957b38ff370SJamie Gritton vfs_opterror(opts, 958b38ff370SJamie Gritton "path cannot be changed after creation"); 959b38ff370SJamie Gritton goto done_errmsg; 960b38ff370SJamie Gritton } 961b38ff370SJamie Gritton if (len == 0 || path[len - 1] != '\0') { 962b38ff370SJamie Gritton error = EINVAL; 963b38ff370SJamie Gritton goto done_free; 964b38ff370SJamie Gritton } 965*7e1d3eefSMateusz Guzik NDINIT(&nd, LOOKUP, FOLLOW | LOCKLEAF, UIO_SYSSPACE, path); 966b38ff370SJamie Gritton error = namei(&nd); 967b38ff370SJamie Gritton if (error) 968b38ff370SJamie Gritton goto done_free; 969b38ff370SJamie Gritton root = nd.ni_vp; 970b38ff370SJamie Gritton NDFREE(&nd, NDF_ONLY_PNBUF); 9716dfe0a3dSMartin Matuska g_path = malloc(MAXPATHLEN, M_TEMP, M_WAITOK); 9726dfe0a3dSMartin Matuska strlcpy(g_path, path, MAXPATHLEN); 9736dfe0a3dSMartin Matuska error = vn_path_to_global_path(td, root, g_path, MAXPATHLEN); 9743eb6b656SMateusz Guzik if (error == 0) { 9756dfe0a3dSMartin Matuska path = g_path; 9766dfe0a3dSMartin Matuska } else { 977f6e633a9SMartin Matuska /* exit on other errors */ 978b38ff370SJamie Gritton goto done_free; 979b38ff370SJamie Gritton } 980f6e633a9SMartin Matuska if (root->v_type != VDIR) { 981f6e633a9SMartin Matuska error = ENOTDIR; 982f6e633a9SMartin Matuska vput(root); 983f6e633a9SMartin Matuska goto done_free; 984f6e633a9SMartin Matuska } 985b249ce48SMateusz Guzik VOP_UNLOCK(root); 986b38ff370SJamie Gritton } 987b38ff370SJamie Gritton 988b38ff370SJamie Gritton /* 
989b6f47c23SJamie Gritton * Find the specified jail, or at least its parent. 990b38ff370SJamie Gritton * This abuses the file error codes ENOENT and EEXIST. 991b38ff370SJamie Gritton */ 992b38ff370SJamie Gritton pr = NULL; 9937de883c8SJamie Gritton inspr = NULL; 994babbbb9cSJamie Gritton if (cuflags == JAIL_CREATE && jid == 0 && name != NULL) { 995babbbb9cSJamie Gritton namelc = strrchr(name, '.'); 996babbbb9cSJamie Gritton jid = strtoul(namelc != NULL ? namelc + 1 : name, &p, 10); 997babbbb9cSJamie Gritton if (*p != '\0') 998babbbb9cSJamie Gritton jid = 0; 999babbbb9cSJamie Gritton } 1000b6f47c23SJamie Gritton sx_xlock(&allprison_lock); 1001108a9384SJamie Gritton drflags = PD_LIST_XLOCKED; 10020a2a96f3SJamie Gritton ppr = mypr; 10030a2a96f3SJamie Gritton if (!prison_isalive(ppr)) { 10040a2a96f3SJamie Gritton /* This jail is dying. This process will surely follow. */ 10050a2a96f3SJamie Gritton error = EAGAIN; 10060a2a96f3SJamie Gritton goto done_deref; 10070a2a96f3SJamie Gritton } 1008b38ff370SJamie Gritton if (jid != 0) { 1009b38ff370SJamie Gritton if (jid < 0) { 1010b38ff370SJamie Gritton error = EINVAL; 1011b38ff370SJamie Gritton vfs_opterror(opts, "negative jid"); 10122a4b2251SJamie Gritton goto done_deref; 1013b38ff370SJamie Gritton } 10147de883c8SJamie Gritton /* 10157de883c8SJamie Gritton * See if a requested jid already exists. Keep track of 10167de883c8SJamie Gritton * where it can be inserted later. 
10177de883c8SJamie Gritton */ 10187de883c8SJamie Gritton TAILQ_FOREACH(inspr, &allprison, pr_list) { 1019f7496dcaSJamie Gritton if (inspr->pr_id < jid) 1020f7496dcaSJamie Gritton continue; 1021f7496dcaSJamie Gritton if (inspr->pr_id > jid) 1022f7496dcaSJamie Gritton break; 10237de883c8SJamie Gritton pr = inspr; 1024f7496dcaSJamie Gritton mtx_lock(&pr->pr_mtx); 10252a4b2251SJamie Gritton drflags |= PD_LOCKED; 10267de883c8SJamie Gritton inspr = NULL; 10277de883c8SJamie Gritton break; 10287de883c8SJamie Gritton } 1029b38ff370SJamie Gritton if (pr != NULL) { 1030b38ff370SJamie Gritton /* Create: jid must not exist. */ 1031b38ff370SJamie Gritton if (cuflags == JAIL_CREATE) { 10327de883c8SJamie Gritton /* 10337de883c8SJamie Gritton * Even creators that cannot see the jail will 10347de883c8SJamie Gritton * get EEXIST. 10357de883c8SJamie Gritton */ 1036b38ff370SJamie Gritton error = EEXIST; 1037b38ff370SJamie Gritton vfs_opterror(opts, "jail %d already exists", 1038b38ff370SJamie Gritton jid); 10392a4b2251SJamie Gritton goto done_deref; 1040b38ff370SJamie Gritton } 10410304c731SJamie Gritton if (!prison_ischild(mypr, pr)) { 10427de883c8SJamie Gritton /* 10437de883c8SJamie Gritton * Updaters get ENOENT if they cannot see the 10447de883c8SJamie Gritton * jail. This is true even for CREATE | UPDATE, 10457de883c8SJamie Gritton * which normally cannot give this error. 
10467de883c8SJamie Gritton */ 10472a4b2251SJamie Gritton error = ENOENT; 10482a4b2251SJamie Gritton vfs_opterror(opts, "jail %d not found", jid); 10492a4b2251SJamie Gritton goto done_deref; 1050f7496dcaSJamie Gritton } 10510a2a96f3SJamie Gritton ppr = pr->pr_parent; 10520a2a96f3SJamie Gritton if (!prison_isalive(ppr)) { 10530a2a96f3SJamie Gritton error = ENOENT; 10540a2a96f3SJamie Gritton vfs_opterror(opts, "jail %d is dying", 10550a2a96f3SJamie Gritton ppr->pr_id); 10560a2a96f3SJamie Gritton goto done_deref; 10570a2a96f3SJamie Gritton } 1058f7496dcaSJamie Gritton if (!prison_isalive(pr)) { 1059b38ff370SJamie Gritton if (!(flags & JAIL_DYING)) { 1060b38ff370SJamie Gritton error = ENOENT; 1061b38ff370SJamie Gritton vfs_opterror(opts, "jail %d is dying", 1062b38ff370SJamie Gritton jid); 10632a4b2251SJamie Gritton goto done_deref; 1064f7496dcaSJamie Gritton } 1065f7496dcaSJamie Gritton if ((flags & JAIL_ATTACH) || 1066b38ff370SJamie Gritton (pr_flags & PR_PERSIST)) { 1067b38ff370SJamie Gritton /* 1068b38ff370SJamie Gritton * A dying jail might be resurrected 1069b38ff370SJamie Gritton * (via attach or persist), but first 1070b38ff370SJamie Gritton * it must determine if another jail 1071b38ff370SJamie Gritton * has claimed its name. Accomplish 1072b38ff370SJamie Gritton * this by implicitly re-setting the 1073b38ff370SJamie Gritton * name. 1074b38ff370SJamie Gritton */ 1075b38ff370SJamie Gritton if (name == NULL) 10760304c731SJamie Gritton name = prison_name(mypr, pr); 1077b38ff370SJamie Gritton } 1078b38ff370SJamie Gritton } 10792a4b2251SJamie Gritton } else { 1080b38ff370SJamie Gritton /* Update: jid must exist. 
*/ 1081b38ff370SJamie Gritton if (cuflags == JAIL_UPDATE) { 1082b38ff370SJamie Gritton error = ENOENT; 1083b38ff370SJamie Gritton vfs_opterror(opts, "jail %d not found", jid); 10842a4b2251SJamie Gritton goto done_deref; 1085b38ff370SJamie Gritton } 1086b38ff370SJamie Gritton } 1087b38ff370SJamie Gritton } 1088b38ff370SJamie Gritton /* 1089b38ff370SJamie Gritton * If the caller provided a name, look for a jail by that name. 1090b38ff370SJamie Gritton * This has different semantics for creates and updates keyed by jid 1091b38ff370SJamie Gritton * (where the name must not already exist in a different jail), 1092b38ff370SJamie Gritton * and updates keyed by the name itself (where the name must exist 1093b38ff370SJamie Gritton * because that is the jail being updated). 1094b38ff370SJamie Gritton */ 1095b6f47c23SJamie Gritton namelc = NULL; 1096b38ff370SJamie Gritton if (name != NULL) { 1097babbbb9cSJamie Gritton namelc = strrchr(name, '.'); 1098babbbb9cSJamie Gritton if (namelc == NULL) 1099babbbb9cSJamie Gritton namelc = name; 1100babbbb9cSJamie Gritton else { 11010304c731SJamie Gritton /* 11020304c731SJamie Gritton * This is a hierarchical name. Split it into the 11030304c731SJamie Gritton * parent and child names, and make sure the parent 11040304c731SJamie Gritton * exists or matches an already found jail. 
11050304c731SJamie Gritton */ 11060304c731SJamie Gritton if (pr != NULL) { 1107babbbb9cSJamie Gritton if (strncmp(name, ppr->pr_name, namelc - name) 1108babbbb9cSJamie Gritton || ppr->pr_name[namelc - name] != '\0') { 11090304c731SJamie Gritton error = EINVAL; 11100304c731SJamie Gritton vfs_opterror(opts, 11110304c731SJamie Gritton "cannot change jail's parent"); 11122a4b2251SJamie Gritton goto done_deref; 11130304c731SJamie Gritton } 11140304c731SJamie Gritton } else { 1115b6f47c23SJamie Gritton *namelc = '\0'; 11160304c731SJamie Gritton ppr = prison_find_name(mypr, name); 11170304c731SJamie Gritton if (ppr == NULL) { 11180304c731SJamie Gritton error = ENOENT; 11190304c731SJamie Gritton vfs_opterror(opts, 11200304c731SJamie Gritton "jail \"%s\" not found", name); 11212a4b2251SJamie Gritton goto done_deref; 11220304c731SJamie Gritton } 1123c050ea80SJamie Gritton mtx_unlock(&ppr->pr_mtx); 11240a2a96f3SJamie Gritton if (!prison_isalive(ppr)) { 1125c050ea80SJamie Gritton error = ENOENT; 1126c050ea80SJamie Gritton vfs_opterror(opts, 1127c050ea80SJamie Gritton "jail \"%s\" is dying", name); 1128c050ea80SJamie Gritton goto done_deref; 1129c050ea80SJamie Gritton } 1130b6f47c23SJamie Gritton *namelc = '.'; 11310304c731SJamie Gritton } 1132b6f47c23SJamie Gritton namelc++; 11330304c731SJamie Gritton } 1134b6f47c23SJamie Gritton if (namelc[0] != '\0') { 1135b6f47c23SJamie Gritton pnamelen = 11360304c731SJamie Gritton (ppr == &prison0) ? 0 : strlen(ppr->pr_name) + 1; 11370304c731SJamie Gritton deadpr = NULL; 11380304c731SJamie Gritton FOREACH_PRISON_CHILD(ppr, tpr) { 11396754ae25SJamie Gritton if (tpr != pr && 1140b6f47c23SJamie Gritton !strcmp(tpr->pr_name + pnamelen, namelc)) { 114176ad42abSJamie Gritton if (prison_isalive(tpr)) { 1142b38ff370SJamie Gritton if (pr == NULL && 1143b38ff370SJamie Gritton cuflags != JAIL_CREATE) { 1144b38ff370SJamie Gritton /* 1145b38ff370SJamie Gritton * Use this jail 1146b38ff370SJamie Gritton * for updates. 
1147b38ff370SJamie Gritton */ 1148b38ff370SJamie Gritton pr = tpr; 1149f7496dcaSJamie Gritton mtx_lock(&pr->pr_mtx); 115083bc72a0SJamie Gritton drflags |= PD_LOCKED; 1151b38ff370SJamie Gritton break; 1152b38ff370SJamie Gritton } 1153b38ff370SJamie Gritton /* 1154b38ff370SJamie Gritton * Create, or update(jid): 1155b38ff370SJamie Gritton * name must not exist in an 11560304c731SJamie Gritton * active sibling jail. 1157b38ff370SJamie Gritton */ 1158b38ff370SJamie Gritton error = EEXIST; 1159b38ff370SJamie Gritton vfs_opterror(opts, 1160b38ff370SJamie Gritton "jail \"%s\" already exists", 1161b38ff370SJamie Gritton name); 11622a4b2251SJamie Gritton goto done_deref; 1163b38ff370SJamie Gritton } 116476ad42abSJamie Gritton if (pr == NULL && 1165f7496dcaSJamie Gritton cuflags != JAIL_CREATE) { 116676ad42abSJamie Gritton deadpr = tpr; 1167f7496dcaSJamie Gritton } 1168b38ff370SJamie Gritton } 1169b38ff370SJamie Gritton } 1170b38ff370SJamie Gritton /* If no active jail is found, use a dying one. */ 1171b38ff370SJamie Gritton if (deadpr != NULL && pr == NULL) { 1172b38ff370SJamie Gritton if (flags & JAIL_DYING) { 1173b38ff370SJamie Gritton pr = deadpr; 1174f7496dcaSJamie Gritton mtx_lock(&pr->pr_mtx); 11752a4b2251SJamie Gritton drflags |= PD_LOCKED; 1176b38ff370SJamie Gritton } else if (cuflags == JAIL_UPDATE) { 1177b38ff370SJamie Gritton error = ENOENT; 1178b38ff370SJamie Gritton vfs_opterror(opts, 1179b38ff370SJamie Gritton "jail \"%s\" is dying", name); 11802a4b2251SJamie Gritton goto done_deref; 1181b38ff370SJamie Gritton } 1182b38ff370SJamie Gritton } 1183b38ff370SJamie Gritton /* Update: name must exist if no jid. 
*/ 1184b38ff370SJamie Gritton else if (cuflags == JAIL_UPDATE && pr == NULL) { 1185b38ff370SJamie Gritton error = ENOENT; 1186b38ff370SJamie Gritton vfs_opterror(opts, "jail \"%s\" not found", 1187b38ff370SJamie Gritton name); 11882a4b2251SJamie Gritton goto done_deref; 1189b38ff370SJamie Gritton } 1190b38ff370SJamie Gritton } 1191b38ff370SJamie Gritton } 1192b38ff370SJamie Gritton /* Update: must provide a jid or name. */ 1193b38ff370SJamie Gritton else if (cuflags == JAIL_UPDATE && pr == NULL) { 1194b38ff370SJamie Gritton error = ENOENT; 1195b38ff370SJamie Gritton vfs_opterror(opts, "update specified no jail"); 11962a4b2251SJamie Gritton goto done_deref; 1197b38ff370SJamie Gritton } 1198b38ff370SJamie Gritton 1199b38ff370SJamie Gritton /* If there's no prison to update, create a new one and link it in. */ 12002a4b2251SJamie Gritton created = pr == NULL; 12012a4b2251SJamie Gritton if (created) { 1202b97457e2SJamie Gritton for (tpr = mypr; tpr != NULL; tpr = tpr->pr_parent) 1203b97457e2SJamie Gritton if (tpr->pr_childcount >= tpr->pr_childmax) { 1204b97457e2SJamie Gritton error = EPERM; 1205b97457e2SJamie Gritton vfs_opterror(opts, "prison limit exceeded"); 12062a4b2251SJamie Gritton goto done_deref; 1207b97457e2SJamie Gritton } 12087de883c8SJamie Gritton if (jid == 0 && (jid = get_next_prid(&inspr)) == 0) { 1209b38ff370SJamie Gritton error = EAGAIN; 12107de883c8SJamie Gritton vfs_opterror(opts, "no available jail IDs"); 12112a4b2251SJamie Gritton goto done_deref; 1212b38ff370SJamie Gritton } 12132a4b2251SJamie Gritton 12142a4b2251SJamie Gritton pr = malloc(sizeof(*pr), M_PRISON, M_WAITOK | M_ZERO); 12151158508aSJamie Gritton pr->pr_state = PRISON_STATE_INVALID; 12161158508aSJamie Gritton refcount_init(&pr->pr_ref, 1); 1217f7496dcaSJamie Gritton refcount_init(&pr->pr_uref, 0); 12181158508aSJamie Gritton drflags |= PD_DEREF; 12192a4b2251SJamie Gritton LIST_INIT(&pr->pr_children); 12202a4b2251SJamie Gritton mtx_init(&pr->pr_mtx, "jail mutex", NULL, MTX_DEF | 
MTX_DUPOK); 12212a4b2251SJamie Gritton TASK_INIT(&pr->pr_task, 0, prison_complete, pr); 12222a4b2251SJamie Gritton 12237de883c8SJamie Gritton pr->pr_id = jid; 12247de883c8SJamie Gritton if (inspr != NULL) 12257de883c8SJamie Gritton TAILQ_INSERT_BEFORE(inspr, pr, pr_list); 12267de883c8SJamie Gritton else 1227b38ff370SJamie Gritton TAILQ_INSERT_TAIL(&allprison, pr, pr_list); 12287de883c8SJamie Gritton 12297de883c8SJamie Gritton pr->pr_parent = ppr; 12300a2a96f3SJamie Gritton prison_hold(ppr); 12310a2a96f3SJamie Gritton prison_proc_hold(ppr); 12320304c731SJamie Gritton LIST_INSERT_HEAD(&ppr->pr_children, pr, pr_sibling); 12330304c731SJamie Gritton for (tpr = ppr; tpr != NULL; tpr = tpr->pr_parent) 1234b97457e2SJamie Gritton tpr->pr_childcount++; 1235b38ff370SJamie Gritton 12360304c731SJamie Gritton /* Set some default values, and inherit some from the parent. */ 1237b6f47c23SJamie Gritton if (namelc == NULL) 1238b6f47c23SJamie Gritton namelc = ""; 1239b38ff370SJamie Gritton if (path == NULL) { 1240b38ff370SJamie Gritton path = "/"; 12410304c731SJamie Gritton root = mypr->pr_root; 1242b38ff370SJamie Gritton vref(root); 1243b38ff370SJamie Gritton } 12448986e3a0SJamie Gritton strlcpy(pr->pr_hostuuid, DEFAULT_HOSTUUID, HOSTUUIDLEN); 12458986e3a0SJamie Gritton pr->pr_flags |= PR_HOST; 1246bdfc8cc4SJamie Gritton #if defined(INET) || defined(INET6) 1247bdfc8cc4SJamie Gritton #ifdef VIMAGE 1248bdfc8cc4SJamie Gritton if (!(pr_flags & PR_VNET)) 1249bdfc8cc4SJamie Gritton #endif 1250bdfc8cc4SJamie Gritton { 12510304c731SJamie Gritton #ifdef INET 12522b0d6f81SJamie Gritton if (!(ch_flags & PR_IP4_USER)) 12536a3f2779SJamie Gritton pr->pr_flags |= PR_IP4 | PR_IP4_USER; 12542b0d6f81SJamie Gritton else if (!(pr_flags & PR_IP4_USER)) { 12552b0d6f81SJamie Gritton pr->pr_flags |= ppr->pr_flags & PR_IP4; 12562b0d6f81SJamie Gritton if (ppr->pr_ip4 != NULL) { 12572b0d6f81SJamie Gritton pr->pr_ip4s = ppr->pr_ip4s; 12582b0d6f81SJamie Gritton pr->pr_ip4 = malloc(pr->pr_ip4s * 
12592b0d6f81SJamie Gritton sizeof(struct in_addr), M_PRISON, 12602b0d6f81SJamie Gritton M_WAITOK); 12612b0d6f81SJamie Gritton bcopy(ppr->pr_ip4, pr->pr_ip4, 12622b0d6f81SJamie Gritton pr->pr_ip4s * sizeof(*pr->pr_ip4)); 12632b0d6f81SJamie Gritton } 12642b0d6f81SJamie Gritton } 12650304c731SJamie Gritton #endif 12660304c731SJamie Gritton #ifdef INET6 12672b0d6f81SJamie Gritton if (!(ch_flags & PR_IP6_USER)) 12686a3f2779SJamie Gritton pr->pr_flags |= PR_IP6 | PR_IP6_USER; 12692b0d6f81SJamie Gritton else if (!(pr_flags & PR_IP6_USER)) { 12702b0d6f81SJamie Gritton pr->pr_flags |= ppr->pr_flags & PR_IP6; 12712b0d6f81SJamie Gritton if (ppr->pr_ip6 != NULL) { 12722b0d6f81SJamie Gritton pr->pr_ip6s = ppr->pr_ip6s; 12732b0d6f81SJamie Gritton pr->pr_ip6 = malloc(pr->pr_ip6s * 12742b0d6f81SJamie Gritton sizeof(struct in6_addr), M_PRISON, 12752b0d6f81SJamie Gritton M_WAITOK); 12762b0d6f81SJamie Gritton bcopy(ppr->pr_ip6, pr->pr_ip6, 12772b0d6f81SJamie Gritton pr->pr_ip6s * sizeof(*pr->pr_ip6)); 12782b0d6f81SJamie Gritton } 12792b0d6f81SJamie Gritton } 12800304c731SJamie Gritton #endif 1281bdfc8cc4SJamie Gritton } 1282bdfc8cc4SJamie Gritton #endif 1283592bcae8SBjoern A. Zeeb /* Source address selection is always on by default. */ 1284592bcae8SBjoern A. Zeeb pr->pr_flags |= _PR_IP_SADDRSEL; 1285592bcae8SBjoern A. Zeeb 12860304c731SJamie Gritton pr->pr_securelevel = ppr->pr_securelevel; 12870304c731SJamie Gritton pr->pr_allow = JAIL_DEFAULT_ALLOW & ppr->pr_allow; 1288af10bf05SBjoern A. Zeeb pr->pr_enforce_statfs = jail_default_enforce_statfs; 1289bf3db8aaSMartin Matuska pr->pr_devfs_rsnum = ppr->pr_devfs_rsnum; 1290b38ff370SJamie Gritton 1291b96bd95bSIan Lepore pr->pr_osreldate = osreldt ? osreldt : ppr->pr_osreldate; 1292b96bd95bSIan Lepore if (osrelstr == NULL) 12931b786d01SBjoern A. Zeeb strlcpy(pr->pr_osrelease, ppr->pr_osrelease, 12941b786d01SBjoern A. Zeeb sizeof(pr->pr_osrelease)); 1295b96bd95bSIan Lepore else 12961b786d01SBjoern A. 
Zeeb strlcpy(pr->pr_osrelease, osrelstr, 12971b786d01SBjoern A. Zeeb sizeof(pr->pr_osrelease)); 1298b96bd95bSIan Lepore 1299679e1390SJamie Gritton #ifdef VIMAGE 1300679e1390SJamie Gritton /* Allocate a new vnet if specified. */ 1301679e1390SJamie Gritton pr->pr_vnet = (pr_flags & PR_VNET) 1302679e1390SJamie Gritton ? vnet_alloc() : ppr->pr_vnet; 1303679e1390SJamie Gritton #endif 1304b38ff370SJamie Gritton /* 1305b38ff370SJamie Gritton * Allocate a dedicated cpuset for each jail. 13068771ff75SGordon Bergling * Unlike other initial settings, this may return an error. 1307b38ff370SJamie Gritton */ 13080304c731SJamie Gritton error = cpuset_create_root(ppr, &pr->pr_cpuset); 13092a4b2251SJamie Gritton if (error) 13102a4b2251SJamie Gritton goto done_deref; 1311b38ff370SJamie Gritton 1312b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 13132a4b2251SJamie Gritton drflags |= PD_LOCKED; 1314b38ff370SJamie Gritton } else { 13152b0d6f81SJamie Gritton /* 13162b0d6f81SJamie Gritton * Grab a reference for existing prisons, to ensure they 13172b0d6f81SJamie Gritton * continue to exist for the duration of the call. 
13182b0d6f81SJamie Gritton */ 13196754ae25SJamie Gritton prison_hold(pr); 13202a4b2251SJamie Gritton drflags |= PD_DEREF; 1321bdfc8cc4SJamie Gritton #if defined(VIMAGE) && (defined(INET) || defined(INET6)) 1322bdfc8cc4SJamie Gritton if ((pr->pr_flags & PR_VNET) && 1323bdfc8cc4SJamie Gritton (ch_flags & (PR_IP4_USER | PR_IP6_USER))) { 1324bdfc8cc4SJamie Gritton error = EINVAL; 1325bdfc8cc4SJamie Gritton vfs_opterror(opts, 1326bdfc8cc4SJamie Gritton "vnet jails cannot have IP address restrictions"); 13272a4b2251SJamie Gritton goto done_deref; 1328bdfc8cc4SJamie Gritton } 1329bdfc8cc4SJamie Gritton #endif 13302b0d6f81SJamie Gritton #ifdef INET 13312b0d6f81SJamie Gritton if (PR_IP4_USER & ch_flags & (pr_flags ^ pr->pr_flags)) { 13322b0d6f81SJamie Gritton error = EINVAL; 13332b0d6f81SJamie Gritton vfs_opterror(opts, 13342b0d6f81SJamie Gritton "ip4 cannot be changed after creation"); 13352a4b2251SJamie Gritton goto done_deref; 13362b0d6f81SJamie Gritton } 13372b0d6f81SJamie Gritton #endif 13382b0d6f81SJamie Gritton #ifdef INET6 13392b0d6f81SJamie Gritton if (PR_IP6_USER & ch_flags & (pr_flags ^ pr->pr_flags)) { 13402b0d6f81SJamie Gritton error = EINVAL; 13412b0d6f81SJamie Gritton vfs_opterror(opts, 13422b0d6f81SJamie Gritton "ip6 cannot be changed after creation"); 13432a4b2251SJamie Gritton goto done_deref; 13442b0d6f81SJamie Gritton } 13452b0d6f81SJamie Gritton #endif 1346b38ff370SJamie Gritton } 1347b38ff370SJamie Gritton 1348b38ff370SJamie Gritton /* Do final error checking before setting anything. 
*/ 13490304c731SJamie Gritton if (gotslevel) { 13500304c731SJamie Gritton if (slevel < ppr->pr_securelevel) { 13510304c731SJamie Gritton error = EPERM; 13522a4b2251SJamie Gritton goto done_deref; 13530304c731SJamie Gritton } 13540304c731SJamie Gritton } 1355b97457e2SJamie Gritton if (gotchildmax) { 1356b97457e2SJamie Gritton if (childmax >= ppr->pr_childmax) { 1357b97457e2SJamie Gritton error = EPERM; 13582a4b2251SJamie Gritton goto done_deref; 1359b97457e2SJamie Gritton } 1360b97457e2SJamie Gritton } 13610304c731SJamie Gritton if (gotenforce) { 13620304c731SJamie Gritton if (enforce < ppr->pr_enforce_statfs) { 13630304c731SJamie Gritton error = EPERM; 13642a4b2251SJamie Gritton goto done_deref; 13650304c731SJamie Gritton } 13660304c731SJamie Gritton } 13670cc207a6SMartin Matuska if (gotrsnum) { 13680cc207a6SMartin Matuska /* 13690cc207a6SMartin Matuska * devfs_rsnum is a uint16_t 13700cc207a6SMartin Matuska */ 1371bf3db8aaSMartin Matuska if (rsnum < 0 || rsnum > 65535) { 13720cc207a6SMartin Matuska error = EINVAL; 13732a4b2251SJamie Gritton goto done_deref; 13740cc207a6SMartin Matuska } 13750cc207a6SMartin Matuska /* 1376bf3db8aaSMartin Matuska * Nested jails always inherit parent's devfs ruleset 13770cc207a6SMartin Matuska */ 13780cc207a6SMartin Matuska if (jailed(td->td_ucred)) { 13790cc207a6SMartin Matuska if (rsnum > 0 && rsnum != ppr->pr_devfs_rsnum) { 13800cc207a6SMartin Matuska error = EPERM; 13812a4b2251SJamie Gritton goto done_deref; 1382bf3db8aaSMartin Matuska } else 13830cc207a6SMartin Matuska rsnum = ppr->pr_devfs_rsnum; 13840cc207a6SMartin Matuska } 13850cc207a6SMartin Matuska } 1386b38ff370SJamie Gritton #ifdef INET 13872b0d6f81SJamie Gritton if (ip4s > 0) { 13880304c731SJamie Gritton if (ppr->pr_flags & PR_IP4) { 13890304c731SJamie Gritton /* 13900304c731SJamie Gritton * Make sure the new set of IP addresses is a 13910304c731SJamie Gritton * subset of the parent's list. 
Don't worry 13920304c731SJamie Gritton * about the parent being unlocked, as any 13930304c731SJamie Gritton * setting is done with allprison_lock held. 13940304c731SJamie Gritton */ 13950304c731SJamie Gritton for (ij = 0; ij < ppr->pr_ip4s; ij++) 13962b0d6f81SJamie Gritton if (ip4[0].s_addr == ppr->pr_ip4[ij].s_addr) 13970304c731SJamie Gritton break; 13980304c731SJamie Gritton if (ij == ppr->pr_ip4s) { 13990304c731SJamie Gritton error = EPERM; 14002a4b2251SJamie Gritton goto done_deref; 14010304c731SJamie Gritton } 14020304c731SJamie Gritton if (ip4s > 1) { 14030304c731SJamie Gritton for (ii = ij = 1; ii < ip4s; ii++) { 14040304c731SJamie Gritton if (ip4[ii].s_addr == 14050304c731SJamie Gritton ppr->pr_ip4[0].s_addr) 1406b38ff370SJamie Gritton continue; 14070304c731SJamie Gritton for (; ij < ppr->pr_ip4s; ij++) 14080304c731SJamie Gritton if (ip4[ii].s_addr == 14090304c731SJamie Gritton ppr->pr_ip4[ij].s_addr) 14100304c731SJamie Gritton break; 14110304c731SJamie Gritton if (ij == ppr->pr_ip4s) 14120304c731SJamie Gritton break; 14130304c731SJamie Gritton } 14140304c731SJamie Gritton if (ij == ppr->pr_ip4s) { 14150304c731SJamie Gritton error = EPERM; 14162a4b2251SJamie Gritton goto done_deref; 14170304c731SJamie Gritton } 14180304c731SJamie Gritton } 14190304c731SJamie Gritton } 14200304c731SJamie Gritton /* 14210304c731SJamie Gritton * Check for conflicting IP addresses. We permit them 14220304c731SJamie Gritton * if there is no more than one IP on each jail. If 14230304c731SJamie Gritton * there is a duplicate on a jail with more than one 14240304c731SJamie Gritton * IP stop checking and return error. 
14250304c731SJamie Gritton */ 1426bdfc8cc4SJamie Gritton #ifdef VIMAGE 142708b43333SJamie Gritton for (tppr = ppr; tppr != &prison0; tppr = tppr->pr_parent) 1428bdfc8cc4SJamie Gritton if (tppr->pr_flags & PR_VNET) 1429bdfc8cc4SJamie Gritton break; 143008b43333SJamie Gritton #else 143108b43333SJamie Gritton tppr = &prison0; 1432bdfc8cc4SJamie Gritton #endif 1433bdfc8cc4SJamie Gritton FOREACH_PRISON_DESCENDANT(tppr, tpr, descend) { 1434bdfc8cc4SJamie Gritton if (tpr == pr || 1435bdfc8cc4SJamie Gritton #ifdef VIMAGE 14362b0d6f81SJamie Gritton (tpr != tppr && (tpr->pr_flags & PR_VNET)) || 1437bdfc8cc4SJamie Gritton #endif 1438f7496dcaSJamie Gritton !prison_isalive(tpr)) { 14390304c731SJamie Gritton descend = 0; 14400304c731SJamie Gritton continue; 14410304c731SJamie Gritton } 14420304c731SJamie Gritton if (!(tpr->pr_flags & PR_IP4_USER)) 14430304c731SJamie Gritton continue; 14440304c731SJamie Gritton descend = 0; 14450304c731SJamie Gritton if (tpr->pr_ip4 == NULL || 14460304c731SJamie Gritton (ip4s == 1 && tpr->pr_ip4s == 1)) 14470304c731SJamie Gritton continue; 14480304c731SJamie Gritton for (ii = 0; ii < ip4s; ii++) { 14490ce1624dSStephen J. Kiernan if (prison_check_ip4_locked(tpr, &ip4[ii]) == 14500ce1624dSStephen J. Kiernan 0) { 14510304c731SJamie Gritton error = EADDRINUSE; 1452b38ff370SJamie Gritton vfs_opterror(opts, 1453b38ff370SJamie Gritton "IPv4 addresses clash"); 14542a4b2251SJamie Gritton goto done_deref; 1455b38ff370SJamie Gritton } 14560304c731SJamie Gritton } 14570304c731SJamie Gritton } 14580304c731SJamie Gritton } 1459b38ff370SJamie Gritton #endif 1460b38ff370SJamie Gritton #ifdef INET6 14612b0d6f81SJamie Gritton if (ip6s > 0) { 14620304c731SJamie Gritton if (ppr->pr_flags & PR_IP6) { 14630304c731SJamie Gritton /* 14640304c731SJamie Gritton * Make sure the new set of IP addresses is a 14650304c731SJamie Gritton * subset of the parent's list. 
14660304c731SJamie Gritton */ 14670304c731SJamie Gritton for (ij = 0; ij < ppr->pr_ip6s; ij++) 14680304c731SJamie Gritton if (IN6_ARE_ADDR_EQUAL(&ip6[0], 14690304c731SJamie Gritton &ppr->pr_ip6[ij])) 14700304c731SJamie Gritton break; 14710304c731SJamie Gritton if (ij == ppr->pr_ip6s) { 14720304c731SJamie Gritton error = EPERM; 14732a4b2251SJamie Gritton goto done_deref; 14740304c731SJamie Gritton } 14750304c731SJamie Gritton if (ip6s > 1) { 14760304c731SJamie Gritton for (ii = ij = 1; ii < ip6s; ii++) { 14770304c731SJamie Gritton if (IN6_ARE_ADDR_EQUAL(&ip6[ii], 14780304c731SJamie Gritton &ppr->pr_ip6[0])) 14790304c731SJamie Gritton continue; 14800304c731SJamie Gritton for (; ij < ppr->pr_ip6s; ij++) 14810304c731SJamie Gritton if (IN6_ARE_ADDR_EQUAL( 14822b0d6f81SJamie Gritton &ip6[ii], &ppr->pr_ip6[ij])) 14830304c731SJamie Gritton break; 14840304c731SJamie Gritton if (ij == ppr->pr_ip6s) 14850304c731SJamie Gritton break; 14860304c731SJamie Gritton } 14870304c731SJamie Gritton if (ij == ppr->pr_ip6s) { 14880304c731SJamie Gritton error = EPERM; 14892a4b2251SJamie Gritton goto done_deref; 14900304c731SJamie Gritton } 14910304c731SJamie Gritton } 14920304c731SJamie Gritton } 14930304c731SJamie Gritton /* Check for conflicting IP addresses. 
*/ 1494bdfc8cc4SJamie Gritton #ifdef VIMAGE 149508b43333SJamie Gritton for (tppr = ppr; tppr != &prison0; tppr = tppr->pr_parent) 1496bdfc8cc4SJamie Gritton if (tppr->pr_flags & PR_VNET) 1497bdfc8cc4SJamie Gritton break; 149808b43333SJamie Gritton #else 149908b43333SJamie Gritton tppr = &prison0; 1500bdfc8cc4SJamie Gritton #endif 1501bdfc8cc4SJamie Gritton FOREACH_PRISON_DESCENDANT(tppr, tpr, descend) { 1502bdfc8cc4SJamie Gritton if (tpr == pr || 1503bdfc8cc4SJamie Gritton #ifdef VIMAGE 15042b0d6f81SJamie Gritton (tpr != tppr && (tpr->pr_flags & PR_VNET)) || 1505bdfc8cc4SJamie Gritton #endif 1506f7496dcaSJamie Gritton !prison_isalive(tpr)) { 15070304c731SJamie Gritton descend = 0; 15080304c731SJamie Gritton continue; 15090304c731SJamie Gritton } 15100304c731SJamie Gritton if (!(tpr->pr_flags & PR_IP6_USER)) 15110304c731SJamie Gritton continue; 15120304c731SJamie Gritton descend = 0; 15130304c731SJamie Gritton if (tpr->pr_ip6 == NULL || 15140304c731SJamie Gritton (ip6s == 1 && tpr->pr_ip6s == 1)) 15150304c731SJamie Gritton continue; 15160304c731SJamie Gritton for (ii = 0; ii < ip6s; ii++) { 15170ce1624dSStephen J. Kiernan if (prison_check_ip6_locked(tpr, &ip6[ii]) == 15180ce1624dSStephen J. Kiernan 0) { 15190304c731SJamie Gritton error = EADDRINUSE; 1520b38ff370SJamie Gritton vfs_opterror(opts, 1521b38ff370SJamie Gritton "IPv6 addresses clash"); 15222a4b2251SJamie Gritton goto done_deref; 1523b38ff370SJamie Gritton } 15240304c731SJamie Gritton } 15250304c731SJamie Gritton } 15260304c731SJamie Gritton } 1527b38ff370SJamie Gritton #endif 15280304c731SJamie Gritton onamelen = namelen = 0; 1529b6f47c23SJamie Gritton if (namelc != NULL) { 15306ab6058eSJamie Gritton /* Give a default name of the jid. Also allow the name to be 15316ab6058eSJamie Gritton * explicitly the jid - but not any other number, and only in 15326ab6058eSJamie Gritton * normal form (no leading zero/etc). 
15336ab6058eSJamie Gritton */ 1534b6f47c23SJamie Gritton if (namelc[0] == '\0') 1535b6f47c23SJamie Gritton snprintf(namelc = numbuf, sizeof(numbuf), "%d", jid); 15366ab6058eSJamie Gritton else if ((strtoul(namelc, &p, 10) != jid || 15376ab6058eSJamie Gritton namelc[0] < '1' || namelc[0] > '9') && *p == '\0') { 1538b38ff370SJamie Gritton error = EINVAL; 1539babbbb9cSJamie Gritton vfs_opterror(opts, 1540babbbb9cSJamie Gritton "name cannot be numeric (unless it is the jid)"); 15412a4b2251SJamie Gritton goto done_deref; 1542b38ff370SJamie Gritton } 1543b38ff370SJamie Gritton /* 15440304c731SJamie Gritton * Make sure the name isn't too long for the prison or its 15450304c731SJamie Gritton * children. 1546b38ff370SJamie Gritton */ 1547b6f47c23SJamie Gritton pnamelen = (ppr == &prison0) ? 0 : strlen(ppr->pr_name) + 1; 1548b6f47c23SJamie Gritton onamelen = strlen(pr->pr_name + pnamelen); 1549b6f47c23SJamie Gritton namelen = strlen(namelc); 1550b6f47c23SJamie Gritton if (pnamelen + namelen + 1 > sizeof(pr->pr_name)) { 15510304c731SJamie Gritton error = ENAMETOOLONG; 15522a4b2251SJamie Gritton goto done_deref; 15530304c731SJamie Gritton } 15540304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(pr, tpr, descend) { 15550304c731SJamie Gritton if (strlen(tpr->pr_name) + (namelen - onamelen) >= 15560304c731SJamie Gritton sizeof(pr->pr_name)) { 15570304c731SJamie Gritton error = ENAMETOOLONG; 15582a4b2251SJamie Gritton goto done_deref; 15590304c731SJamie Gritton } 15600304c731SJamie Gritton } 15610304c731SJamie Gritton } 1562b3079544SJamie Gritton pr_allow_diff = pr_allow & ~ppr->pr_allow; 1563b3079544SJamie Gritton if (pr_allow_diff & ~PR_ALLOW_DIFFERENCES) { 15640304c731SJamie Gritton error = EPERM; 15652a4b2251SJamie Gritton goto done_deref; 1566b38ff370SJamie Gritton } 1567b38ff370SJamie Gritton 1568b6f47c23SJamie Gritton /* 1569b6f47c23SJamie Gritton * Let modules check their parameters. 
This requires unlocking and 1570b6f47c23SJamie Gritton * then re-locking the prison, but this is still a valid state as long 1571b6f47c23SJamie Gritton * as allprison_lock remains xlocked. 1572b6f47c23SJamie Gritton */ 1573b6f47c23SJamie Gritton mtx_unlock(&pr->pr_mtx); 15742a4b2251SJamie Gritton drflags &= ~PD_LOCKED; 1575b6f47c23SJamie Gritton error = osd_jail_call(pr, PR_METHOD_CHECK, opts); 15762a4b2251SJamie Gritton if (error != 0) 15772a4b2251SJamie Gritton goto done_deref; 1578b6f47c23SJamie Gritton mtx_lock(&pr->pr_mtx); 15792a4b2251SJamie Gritton drflags |= PD_LOCKED; 1580b6f47c23SJamie Gritton 1581b6f47c23SJamie Gritton /* At this point, all valid parameters should have been noted. */ 1582b6f47c23SJamie Gritton TAILQ_FOREACH(opt, opts, link) { 1583b6f47c23SJamie Gritton if (!opt->seen && strcmp(opt->name, "errmsg")) { 1584b6f47c23SJamie Gritton error = EINVAL; 1585b6f47c23SJamie Gritton vfs_opterror(opts, "unknown parameter: %s", opt->name); 15862a4b2251SJamie Gritton goto done_deref; 1587b6f47c23SJamie Gritton } 1588b6f47c23SJamie Gritton } 1589b6f47c23SJamie Gritton 1590b38ff370SJamie Gritton /* Set the parameters of the prison. 
*/ 1591b38ff370SJamie Gritton #ifdef INET 15920304c731SJamie Gritton redo_ip4 = 0; 15930304c731SJamie Gritton if (pr_flags & PR_IP4_USER) { 15940304c731SJamie Gritton pr->pr_flags |= PR_IP4; 1595b38ff370SJamie Gritton free(pr->pr_ip4, M_PRISON); 15960304c731SJamie Gritton pr->pr_ip4s = ip4s; 1597b38ff370SJamie Gritton pr->pr_ip4 = ip4; 1598b38ff370SJamie Gritton ip4 = NULL; 15990304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1600bdfc8cc4SJamie Gritton #ifdef VIMAGE 1601bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1602bdfc8cc4SJamie Gritton descend = 0; 1603bdfc8cc4SJamie Gritton continue; 1604bdfc8cc4SJamie Gritton } 1605bdfc8cc4SJamie Gritton #endif 16060304c731SJamie Gritton if (prison_restrict_ip4(tpr, NULL)) { 16070304c731SJamie Gritton redo_ip4 = 1; 16080304c731SJamie Gritton descend = 0; 16090304c731SJamie Gritton } 16100304c731SJamie Gritton } 16110304c731SJamie Gritton } 1612b38ff370SJamie Gritton #endif 1613b38ff370SJamie Gritton #ifdef INET6 16140304c731SJamie Gritton redo_ip6 = 0; 16150304c731SJamie Gritton if (pr_flags & PR_IP6_USER) { 16160304c731SJamie Gritton pr->pr_flags |= PR_IP6; 1617b38ff370SJamie Gritton free(pr->pr_ip6, M_PRISON); 16180304c731SJamie Gritton pr->pr_ip6s = ip6s; 1619b38ff370SJamie Gritton pr->pr_ip6 = ip6; 1620b38ff370SJamie Gritton ip6 = NULL; 16210304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1622bdfc8cc4SJamie Gritton #ifdef VIMAGE 1623bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1624bdfc8cc4SJamie Gritton descend = 0; 1625bdfc8cc4SJamie Gritton continue; 1626bdfc8cc4SJamie Gritton } 1627bdfc8cc4SJamie Gritton #endif 16280304c731SJamie Gritton if (prison_restrict_ip6(tpr, NULL)) { 16290304c731SJamie Gritton redo_ip6 = 1; 16300304c731SJamie Gritton descend = 0; 16310304c731SJamie Gritton } 16320304c731SJamie Gritton } 16330304c731SJamie Gritton } 1634b38ff370SJamie Gritton #endif 16350304c731SJamie Gritton if (gotslevel) { 1636b38ff370SJamie Gritton 
pr->pr_securelevel = slevel; 16370304c731SJamie Gritton /* Set all child jails to be at least this level. */ 16380304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16390304c731SJamie Gritton if (tpr->pr_securelevel < slevel) 16400304c731SJamie Gritton tpr->pr_securelevel = slevel; 16410304c731SJamie Gritton } 1642b97457e2SJamie Gritton if (gotchildmax) { 1643b97457e2SJamie Gritton pr->pr_childmax = childmax; 1644b97457e2SJamie Gritton /* Set all child jails to under this limit. */ 1645b97457e2SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED_LEVEL(pr, tpr, descend, level) 1646b97457e2SJamie Gritton if (tpr->pr_childmax > childmax - level) 1647b97457e2SJamie Gritton tpr->pr_childmax = childmax > level 1648b97457e2SJamie Gritton ? childmax - level : 0; 1649b97457e2SJamie Gritton } 16500304c731SJamie Gritton if (gotenforce) { 16510304c731SJamie Gritton pr->pr_enforce_statfs = enforce; 16520304c731SJamie Gritton /* Pass this restriction on to the children. */ 16530304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16540304c731SJamie Gritton if (tpr->pr_enforce_statfs < enforce) 16550304c731SJamie Gritton tpr->pr_enforce_statfs = enforce; 16560304c731SJamie Gritton } 16570cc207a6SMartin Matuska if (gotrsnum) { 16580cc207a6SMartin Matuska pr->pr_devfs_rsnum = rsnum; 16590cc207a6SMartin Matuska /* Pass this restriction on to the children. */ 16600cc207a6SMartin Matuska FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) 16610cc207a6SMartin Matuska tpr->pr_devfs_rsnum = rsnum; 16620cc207a6SMartin Matuska } 1663b6f47c23SJamie Gritton if (namelc != NULL) { 16640304c731SJamie Gritton if (ppr == &prison0) 1665b6f47c23SJamie Gritton strlcpy(pr->pr_name, namelc, sizeof(pr->pr_name)); 16660304c731SJamie Gritton else 16670304c731SJamie Gritton snprintf(pr->pr_name, sizeof(pr->pr_name), "%s.%s", 1668b6f47c23SJamie Gritton ppr->pr_name, namelc); 16690304c731SJamie Gritton /* Change this component of child names. 
*/ 16700304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 16710304c731SJamie Gritton bcopy(tpr->pr_name + onamelen, tpr->pr_name + namelen, 16720304c731SJamie Gritton strlen(tpr->pr_name + onamelen) + 1); 16730304c731SJamie Gritton bcopy(pr->pr_name, tpr->pr_name, namelen); 16740304c731SJamie Gritton } 16750304c731SJamie Gritton } 1676b38ff370SJamie Gritton if (path != NULL) { 16770304c731SJamie Gritton /* Try to keep a real-rooted full pathname. */ 1678b38ff370SJamie Gritton strlcpy(pr->pr_path, path, sizeof(pr->pr_path)); 1679b38ff370SJamie Gritton pr->pr_root = root; 16802a4b2251SJamie Gritton root = NULL; 1681b38ff370SJamie Gritton } 168276ca6f88SJamie Gritton if (PR_HOST & ch_flags & ~pr_flags) { 168376ca6f88SJamie Gritton if (pr->pr_flags & PR_HOST) { 168476ca6f88SJamie Gritton /* 168576ca6f88SJamie Gritton * Copy the parent's host info. As with pr_ip4 above, 168676ca6f88SJamie Gritton * the lack of a lock on the parent is not a problem; 168776ca6f88SJamie Gritton * it is always set with allprison_lock at least 168876ca6f88SJamie Gritton * shared, and is held exclusively here. 168976ca6f88SJamie Gritton */ 1690c1f19219SJamie Gritton strlcpy(pr->pr_hostname, pr->pr_parent->pr_hostname, 1691c1f19219SJamie Gritton sizeof(pr->pr_hostname)); 1692c1f19219SJamie Gritton strlcpy(pr->pr_domainname, pr->pr_parent->pr_domainname, 1693c1f19219SJamie Gritton sizeof(pr->pr_domainname)); 1694c1f19219SJamie Gritton strlcpy(pr->pr_hostuuid, pr->pr_parent->pr_hostuuid, 1695c1f19219SJamie Gritton sizeof(pr->pr_hostuuid)); 169676ca6f88SJamie Gritton pr->pr_hostid = pr->pr_parent->pr_hostid; 169776ca6f88SJamie Gritton } 169876ca6f88SJamie Gritton } else if (host != NULL || domain != NULL || uuid != NULL || gothid) { 169976ca6f88SJamie Gritton /* Set this prison, and any descendants without PR_HOST. 
*/ 1700b38ff370SJamie Gritton if (host != NULL) 1701c1f19219SJamie Gritton strlcpy(pr->pr_hostname, host, sizeof(pr->pr_hostname)); 170276ca6f88SJamie Gritton if (domain != NULL) 1703c1f19219SJamie Gritton strlcpy(pr->pr_domainname, domain, 1704c1f19219SJamie Gritton sizeof(pr->pr_domainname)); 170576ca6f88SJamie Gritton if (uuid != NULL) 1706c1f19219SJamie Gritton strlcpy(pr->pr_hostuuid, uuid, sizeof(pr->pr_hostuuid)); 170776ca6f88SJamie Gritton if (gothid) 170876ca6f88SJamie Gritton pr->pr_hostid = hid; 170976ca6f88SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 171076ca6f88SJamie Gritton if (tpr->pr_flags & PR_HOST) 171176ca6f88SJamie Gritton descend = 0; 171276ca6f88SJamie Gritton else { 171376ca6f88SJamie Gritton if (host != NULL) 1714c1f19219SJamie Gritton strlcpy(tpr->pr_hostname, 1715c1f19219SJamie Gritton pr->pr_hostname, 1716c1f19219SJamie Gritton sizeof(tpr->pr_hostname)); 171776ca6f88SJamie Gritton if (domain != NULL) 1718c1f19219SJamie Gritton strlcpy(tpr->pr_domainname, 1719c1f19219SJamie Gritton pr->pr_domainname, 1720c1f19219SJamie Gritton sizeof(tpr->pr_domainname)); 172176ca6f88SJamie Gritton if (uuid != NULL) 1722c1f19219SJamie Gritton strlcpy(tpr->pr_hostuuid, 1723c1f19219SJamie Gritton pr->pr_hostuuid, 1724c1f19219SJamie Gritton sizeof(tpr->pr_hostuuid)); 172576ca6f88SJamie Gritton if (gothid) 172676ca6f88SJamie Gritton tpr->pr_hostid = hid; 172776ca6f88SJamie Gritton } 172876ca6f88SJamie Gritton } 172976ca6f88SJamie Gritton } 17300304c731SJamie Gritton pr->pr_allow = (pr->pr_allow & ~ch_allow) | pr_allow; 17310fe74ae6SJamie Gritton if ((tallow = ch_allow & ~pr_allow)) 17320fe74ae6SJamie Gritton prison_set_allow_locked(pr, tallow, 0); 1733b38ff370SJamie Gritton /* 1734b38ff370SJamie Gritton * Persistent prisons get an extra reference, and prisons losing their 17351158508aSJamie Gritton * persist flag lose that reference. 
1736b38ff370SJamie Gritton */ 173776ad42abSJamie Gritton born = !prison_isalive(pr); 17381158508aSJamie Gritton if (ch_flags & PR_PERSIST & (pr_flags ^ pr->pr_flags)) { 1739b38ff370SJamie Gritton if (pr_flags & PR_PERSIST) { 17406754ae25SJamie Gritton prison_hold(pr); 17411158508aSJamie Gritton /* 17421158508aSJamie Gritton * This may make a dead prison alive again, but wait 17431158508aSJamie Gritton * to label it as such until after OSD calls have had 17441158508aSJamie Gritton * a chance to run (and perhaps to fail). 17451158508aSJamie Gritton */ 17466754ae25SJamie Gritton refcount_acquire(&pr->pr_uref); 1747b38ff370SJamie Gritton } else { 174839c8ef90SJamie Gritton drflags |= PD_DEUREF; 1749f7496dcaSJamie Gritton prison_free_not_last(pr); 1750b38ff370SJamie Gritton } 1751b38ff370SJamie Gritton } 1752b38ff370SJamie Gritton pr->pr_flags = (pr->pr_flags & ~ch_flags) | pr_flags; 1753b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 17542a4b2251SJamie Gritton drflags &= ~PD_LOCKED; 1755c861373bSJamie Gritton /* 1756c861373bSJamie Gritton * Any errors past this point will need to de-persist newly created 1757c861373bSJamie Gritton * prisons, as well as call remove methods. 1758c861373bSJamie Gritton */ 1759c861373bSJamie Gritton if (born) 1760c861373bSJamie Gritton drflags |= PD_KILL; 1761b38ff370SJamie Gritton 1762a7ad07bfSEdward Tomasz Napierala #ifdef RACCT 17634b5c9cf6SEdward Tomasz Napierala if (racct_enable && created) 1764a7ad07bfSEdward Tomasz Napierala prison_racct_attach(pr); 1765a7ad07bfSEdward Tomasz Napierala #endif 1766a7ad07bfSEdward Tomasz Napierala 17670304c731SJamie Gritton /* Locks may have prevented a complete restriction of child IP 17680304c731SJamie Gritton * addresses. If so, allocate some more memory and try again. 
17690304c731SJamie Gritton */ 17700304c731SJamie Gritton #ifdef INET 17710304c731SJamie Gritton while (redo_ip4) { 17720304c731SJamie Gritton ip4s = pr->pr_ip4s; 17730304c731SJamie Gritton ip4 = malloc(ip4s * sizeof(*ip4), M_PRISON, M_WAITOK); 17740304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 17750304c731SJamie Gritton redo_ip4 = 0; 17760304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1777bdfc8cc4SJamie Gritton #ifdef VIMAGE 1778bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1779bdfc8cc4SJamie Gritton descend = 0; 1780bdfc8cc4SJamie Gritton continue; 1781bdfc8cc4SJamie Gritton } 1782bdfc8cc4SJamie Gritton #endif 17830304c731SJamie Gritton if (prison_restrict_ip4(tpr, ip4)) { 17840304c731SJamie Gritton if (ip4 != NULL) 17850304c731SJamie Gritton ip4 = NULL; 17860304c731SJamie Gritton else 17870304c731SJamie Gritton redo_ip4 = 1; 17880304c731SJamie Gritton } 17890304c731SJamie Gritton } 17900304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 17910304c731SJamie Gritton } 17920304c731SJamie Gritton #endif 17930304c731SJamie Gritton #ifdef INET6 17940304c731SJamie Gritton while (redo_ip6) { 17950304c731SJamie Gritton ip6s = pr->pr_ip6s; 17960304c731SJamie Gritton ip6 = malloc(ip6s * sizeof(*ip6), M_PRISON, M_WAITOK); 17970304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 17980304c731SJamie Gritton redo_ip6 = 0; 17990304c731SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, tpr, descend) { 1800bdfc8cc4SJamie Gritton #ifdef VIMAGE 1801bdfc8cc4SJamie Gritton if (tpr->pr_flags & PR_VNET) { 1802bdfc8cc4SJamie Gritton descend = 0; 1803bdfc8cc4SJamie Gritton continue; 1804bdfc8cc4SJamie Gritton } 1805bdfc8cc4SJamie Gritton #endif 18060304c731SJamie Gritton if (prison_restrict_ip6(tpr, ip6)) { 18070304c731SJamie Gritton if (ip6 != NULL) 18080304c731SJamie Gritton ip6 = NULL; 18090304c731SJamie Gritton else 18100304c731SJamie Gritton redo_ip6 = 1; 18110304c731SJamie Gritton } 18120304c731SJamie Gritton } 18130304c731SJamie Gritton 
mtx_unlock(&pr->pr_mtx); 18140304c731SJamie Gritton } 18150304c731SJamie Gritton #endif 18160304c731SJamie Gritton 1817b38ff370SJamie Gritton /* Let the modules do their work. */ 1818cc5fd8c7SJamie Gritton if (born) { 1819b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_CREATE, opts); 1820c861373bSJamie Gritton if (error) 18212a4b2251SJamie Gritton goto done_deref; 1822b38ff370SJamie Gritton } 1823b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_SET, opts); 1824c861373bSJamie Gritton if (error) 18252a4b2251SJamie Gritton goto done_deref; 1826b38ff370SJamie Gritton 18271158508aSJamie Gritton /* 18281158508aSJamie Gritton * A new prison is now ready to be seen; either it has gained a user 18291158508aSJamie Gritton * reference via persistence, or is about to gain one via attachment. 18301158508aSJamie Gritton */ 18311158508aSJamie Gritton if (born) { 18321158508aSJamie Gritton drflags = prison_lock_xlock(pr, drflags); 18331158508aSJamie Gritton pr->pr_state = PRISON_STATE_ALIVE; 18341158508aSJamie Gritton } 18351158508aSJamie Gritton 1836b38ff370SJamie Gritton /* Attach this process to the prison if requested. 
*/ 1837b38ff370SJamie Gritton if (flags & JAIL_ATTACH) { 1838c861373bSJamie Gritton error = do_jail_attach(td, pr, 1839589e4c1dSJamie Gritton prison_lock_xlock(pr, drflags & PD_LOCK_FLAGS)); 1840f7496dcaSJamie Gritton drflags &= ~(PD_LOCKED | PD_LIST_XLOCKED); 1841b38ff370SJamie Gritton if (error) { 1842b38ff370SJamie Gritton vfs_opterror(opts, "attach failed"); 18432a4b2251SJamie Gritton goto done_deref; 1844b38ff370SJamie Gritton } 1845b38ff370SJamie Gritton } 1846b38ff370SJamie Gritton 18471fb24974SEdward Tomasz Napierala #ifdef RACCT 18484b5c9cf6SEdward Tomasz Napierala if (racct_enable && !created) { 1849701d6b50SJamie Gritton if (drflags & PD_LOCKED) { 1850701d6b50SJamie Gritton mtx_unlock(&pr->pr_mtx); 1851701d6b50SJamie Gritton drflags &= ~PD_LOCKED; 1852701d6b50SJamie Gritton } 1853f7496dcaSJamie Gritton if (drflags & PD_LIST_XLOCKED) { 1854f7496dcaSJamie Gritton sx_xunlock(&allprison_lock); 1855f7496dcaSJamie Gritton drflags &= ~PD_LIST_XLOCKED; 1856b4e87a63SJamie Gritton } 18571fb24974SEdward Tomasz Napierala prison_racct_modify(pr); 18581fb24974SEdward Tomasz Napierala } 18591fb24974SEdward Tomasz Napierala #endif 18601fb24974SEdward Tomasz Napierala 1861c861373bSJamie Gritton drflags &= ~PD_KILL; 18621fb24974SEdward Tomasz Napierala td->td_retval[0] = pr->pr_id; 18631fb24974SEdward Tomasz Napierala 18642a4b2251SJamie Gritton done_deref: 18652a4b2251SJamie Gritton /* Release any temporary prison holds and/or locks. 
*/ 18662a4b2251SJamie Gritton if (pr != NULL) 18672a4b2251SJamie Gritton prison_deref(pr, drflags); 18682a4b2251SJamie Gritton else if (drflags & PD_LIST_SLOCKED) 1869b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 18702a4b2251SJamie Gritton else if (drflags & PD_LIST_XLOCKED) 1871b38ff370SJamie Gritton sx_xunlock(&allprison_lock); 18725050aa86SKonstantin Belousov if (root != NULL) 1873b38ff370SJamie Gritton vrele(root); 1874b38ff370SJamie Gritton done_errmsg: 1875b38ff370SJamie Gritton if (error) { 18762a4b2251SJamie Gritton /* Write the error message back to userspace. */ 1877176ff3a0SJamie Gritton if (vfs_getopt(opts, "errmsg", (void **)&errmsg, 1878176ff3a0SJamie Gritton &errmsg_len) == 0 && errmsg_len > 0) { 1879b38ff370SJamie Gritton errmsg_pos = 2 * vfs_getopt_pos(opts, "errmsg") + 1; 1880b38ff370SJamie Gritton if (optuio->uio_segflg == UIO_SYSSPACE) 1881b38ff370SJamie Gritton bcopy(errmsg, 1882b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 1883b38ff370SJamie Gritton errmsg_len); 1884b38ff370SJamie Gritton else 1885b38ff370SJamie Gritton copyout(errmsg, 1886b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 1887b38ff370SJamie Gritton errmsg_len); 1888b38ff370SJamie Gritton } 1889b38ff370SJamie Gritton } 1890b38ff370SJamie Gritton done_free: 1891b38ff370SJamie Gritton #ifdef INET 1892b38ff370SJamie Gritton free(ip4, M_PRISON); 1893b38ff370SJamie Gritton #endif 1894b38ff370SJamie Gritton #ifdef INET6 1895b38ff370SJamie Gritton free(ip6, M_PRISON); 1896b38ff370SJamie Gritton #endif 18976dfe0a3dSMartin Matuska if (g_path != NULL) 18986dfe0a3dSMartin Matuska free(g_path, M_TEMP); 1899b38ff370SJamie Gritton vfs_freeopts(opts); 1900b38ff370SJamie Gritton return (error); 1901b38ff370SJamie Gritton } 1902b38ff370SJamie Gritton 1903b38ff370SJamie Gritton /* 19047de883c8SJamie Gritton * Find the next available prison ID. Return the ID on success, or zero 19057de883c8SJamie Gritton * on failure. 
Also set a pointer to the allprison list entry the prison 19067de883c8SJamie Gritton * should be inserted before. 19077de883c8SJamie Gritton */ 19087de883c8SJamie Gritton static int 19097de883c8SJamie Gritton get_next_prid(struct prison **insprp) 19107de883c8SJamie Gritton { 19117de883c8SJamie Gritton struct prison *inspr; 19127de883c8SJamie Gritton int jid, maxid; 19137de883c8SJamie Gritton 19147de883c8SJamie Gritton jid = lastprid % JAIL_MAX + 1; 19157de883c8SJamie Gritton if (TAILQ_EMPTY(&allprison) || 19167de883c8SJamie Gritton TAILQ_LAST(&allprison, prisonlist)->pr_id < jid) { 19177de883c8SJamie Gritton /* 19187de883c8SJamie Gritton * A common case is for all jails to be implicitly numbered, 19197de883c8SJamie Gritton * which means they'll go on the end of the list, at least 19207de883c8SJamie Gritton * for the first JAIL_MAX times. 19217de883c8SJamie Gritton */ 19227de883c8SJamie Gritton inspr = NULL; 19237de883c8SJamie Gritton } else { 19247de883c8SJamie Gritton /* 19257de883c8SJamie Gritton * Take two passes through the allprison list: first starting 19267de883c8SJamie Gritton * with the proposed jid, then ending with it. 19277de883c8SJamie Gritton */ 19287de883c8SJamie Gritton for (maxid = JAIL_MAX; maxid != 0; ) { 19297de883c8SJamie Gritton TAILQ_FOREACH(inspr, &allprison, pr_list) { 19307de883c8SJamie Gritton if (inspr->pr_id < jid) 19317de883c8SJamie Gritton continue; 1932f7496dcaSJamie Gritton if (inspr->pr_id > jid) { 1933f7496dcaSJamie Gritton /* Found an opening. 
*/ 19347de883c8SJamie Gritton maxid = 0; 19357de883c8SJamie Gritton break; 19367de883c8SJamie Gritton } 19377de883c8SJamie Gritton if (++jid > maxid) { 19387de883c8SJamie Gritton if (lastprid == maxid || lastprid == 0) 19397de883c8SJamie Gritton { 19407de883c8SJamie Gritton /* 19417de883c8SJamie Gritton * The entire legal range 19427de883c8SJamie Gritton * has been traversed 19437de883c8SJamie Gritton */ 19447de883c8SJamie Gritton return 0; 19457de883c8SJamie Gritton } 19467de883c8SJamie Gritton /* Try again from the start. */ 19477de883c8SJamie Gritton jid = 1; 19487de883c8SJamie Gritton maxid = lastprid; 19497de883c8SJamie Gritton break; 19507de883c8SJamie Gritton } 19517de883c8SJamie Gritton } 19527de883c8SJamie Gritton if (inspr == NULL) { 19537de883c8SJamie Gritton /* Found room at the end of the list. */ 19547de883c8SJamie Gritton break; 19557de883c8SJamie Gritton } 19567de883c8SJamie Gritton } 19577de883c8SJamie Gritton } 19587de883c8SJamie Gritton *insprp = inspr; 19597de883c8SJamie Gritton lastprid = jid; 19607de883c8SJamie Gritton return (jid); 19617de883c8SJamie Gritton } 19627de883c8SJamie Gritton 19637de883c8SJamie Gritton /* 1964b38ff370SJamie Gritton * struct jail_get_args { 1965b38ff370SJamie Gritton * struct iovec *iovp; 1966b38ff370SJamie Gritton * unsigned int iovcnt; 1967b38ff370SJamie Gritton * int flags; 1968b38ff370SJamie Gritton * }; 1969b38ff370SJamie Gritton */ 1970b38ff370SJamie Gritton int 19718451d0ddSKip Macy sys_jail_get(struct thread *td, struct jail_get_args *uap) 1972b38ff370SJamie Gritton { 1973b38ff370SJamie Gritton struct uio *auio; 1974b38ff370SJamie Gritton int error; 1975b38ff370SJamie Gritton 1976b38ff370SJamie Gritton /* Check that we have an even number of iovecs. 
*/ 1977b38ff370SJamie Gritton if (uap->iovcnt & 1) 1978b38ff370SJamie Gritton return (EINVAL); 1979b38ff370SJamie Gritton 1980b38ff370SJamie Gritton error = copyinuio(uap->iovp, uap->iovcnt, &auio); 1981b38ff370SJamie Gritton if (error) 1982b38ff370SJamie Gritton return (error); 1983b38ff370SJamie Gritton error = kern_jail_get(td, auio, uap->flags); 1984b38ff370SJamie Gritton if (error == 0) 1985b38ff370SJamie Gritton error = copyout(auio->uio_iov, uap->iovp, 1986b38ff370SJamie Gritton uap->iovcnt * sizeof (struct iovec)); 1987b38ff370SJamie Gritton free(auio, M_IOV); 1988b38ff370SJamie Gritton return (error); 1989b38ff370SJamie Gritton } 1990b38ff370SJamie Gritton 1991b38ff370SJamie Gritton int 1992b38ff370SJamie Gritton kern_jail_get(struct thread *td, struct uio *optuio, int flags) 1993b38ff370SJamie Gritton { 1994672756aaSJamie Gritton struct bool_flags *bf; 1995672756aaSJamie Gritton struct jailsys_flags *jsf; 19960304c731SJamie Gritton struct prison *pr, *mypr; 1997b38ff370SJamie Gritton struct vfsopt *opt; 1998b38ff370SJamie Gritton struct vfsoptlist *opts; 1999b38ff370SJamie Gritton char *errmsg, *name; 20002a4b2251SJamie Gritton int drflags, error, errmsg_len, errmsg_pos, i, jid, len, pos; 2001672756aaSJamie Gritton unsigned f; 2002b38ff370SJamie Gritton 2003b38ff370SJamie Gritton if (flags & ~JAIL_GET_MASK) 2004b38ff370SJamie Gritton return (EINVAL); 2005b38ff370SJamie Gritton 2006b38ff370SJamie Gritton /* Get the parameter list. */ 2007b38ff370SJamie Gritton error = vfs_buildopts(optuio, &opts); 2008b38ff370SJamie Gritton if (error) 2009b38ff370SJamie Gritton return (error); 2010b38ff370SJamie Gritton errmsg_pos = vfs_getopt_pos(opts, "errmsg"); 20110304c731SJamie Gritton mypr = td->td_ucred->cr_prison; 20122a4b2251SJamie Gritton pr = NULL; 20131e2a13e6SJamie Gritton 2014b38ff370SJamie Gritton /* 2015b38ff370SJamie Gritton * Find the prison specified by one of: lastjid, jid, name. 
2016b38ff370SJamie Gritton */ 2017b38ff370SJamie Gritton sx_slock(&allprison_lock); 20182a4b2251SJamie Gritton drflags = PD_LIST_SLOCKED; 2019b38ff370SJamie Gritton error = vfs_copyopt(opts, "lastjid", &jid, sizeof(jid)); 2020b38ff370SJamie Gritton if (error == 0) { 2021b38ff370SJamie Gritton TAILQ_FOREACH(pr, &allprison, pr_list) { 2022f7496dcaSJamie Gritton if (pr->pr_id > jid && 2023f7496dcaSJamie Gritton ((flags & JAIL_DYING) || prison_isalive(pr)) && 2024f7496dcaSJamie Gritton prison_ischild(mypr, pr)) { 2025b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 20262a4b2251SJamie Gritton drflags |= PD_LOCKED; 2027b38ff370SJamie Gritton goto found_prison; 20282a4b2251SJamie Gritton } 2029f7496dcaSJamie Gritton } 2030b38ff370SJamie Gritton error = ENOENT; 2031b38ff370SJamie Gritton vfs_opterror(opts, "no jail after %d", jid); 20322a4b2251SJamie Gritton goto done; 2033b38ff370SJamie Gritton } else if (error != ENOENT) 20342a4b2251SJamie Gritton goto done; 2035b38ff370SJamie Gritton 2036b38ff370SJamie Gritton error = vfs_copyopt(opts, "jid", &jid, sizeof(jid)); 2037b38ff370SJamie Gritton if (error == 0) { 2038b38ff370SJamie Gritton if (jid != 0) { 20390304c731SJamie Gritton pr = prison_find_child(mypr, jid); 2040b38ff370SJamie Gritton if (pr != NULL) { 20412a4b2251SJamie Gritton drflags |= PD_LOCKED; 204276ad42abSJamie Gritton if (!(prison_isalive(pr) || 204376ad42abSJamie Gritton (flags & JAIL_DYING))) { 2044b38ff370SJamie Gritton error = ENOENT; 2045b38ff370SJamie Gritton vfs_opterror(opts, "jail %d is dying", 2046b38ff370SJamie Gritton jid); 20472a4b2251SJamie Gritton goto done; 2048b38ff370SJamie Gritton } 2049b38ff370SJamie Gritton goto found_prison; 2050b38ff370SJamie Gritton } 2051b38ff370SJamie Gritton error = ENOENT; 2052b38ff370SJamie Gritton vfs_opterror(opts, "jail %d not found", jid); 20532a4b2251SJamie Gritton goto done; 2054b38ff370SJamie Gritton } 2055b38ff370SJamie Gritton } else if (error != ENOENT) 20562a4b2251SJamie Gritton goto done; 
2057b38ff370SJamie Gritton 2058b38ff370SJamie Gritton error = vfs_getopt(opts, "name", (void **)&name, &len); 2059b38ff370SJamie Gritton if (error == 0) { 2060b38ff370SJamie Gritton if (len == 0 || name[len - 1] != '\0') { 2061b38ff370SJamie Gritton error = EINVAL; 20622a4b2251SJamie Gritton goto done; 2063b38ff370SJamie Gritton } 20640304c731SJamie Gritton pr = prison_find_name(mypr, name); 2065b38ff370SJamie Gritton if (pr != NULL) { 20662a4b2251SJamie Gritton drflags |= PD_LOCKED; 206776ad42abSJamie Gritton if (!(prison_isalive(pr) || (flags & JAIL_DYING))) { 2068b38ff370SJamie Gritton error = ENOENT; 2069b38ff370SJamie Gritton vfs_opterror(opts, "jail \"%s\" is dying", 2070b38ff370SJamie Gritton name); 20712a4b2251SJamie Gritton goto done; 2072b38ff370SJamie Gritton } 2073b38ff370SJamie Gritton goto found_prison; 2074b38ff370SJamie Gritton } 2075b38ff370SJamie Gritton error = ENOENT; 2076b38ff370SJamie Gritton vfs_opterror(opts, "jail \"%s\" not found", name); 20772a4b2251SJamie Gritton goto done; 2078b38ff370SJamie Gritton } else if (error != ENOENT) 20792a4b2251SJamie Gritton goto done; 2080b38ff370SJamie Gritton 2081b38ff370SJamie Gritton vfs_opterror(opts, "no jail specified"); 2082b38ff370SJamie Gritton error = ENOENT; 20832a4b2251SJamie Gritton goto done; 2084b38ff370SJamie Gritton 2085b38ff370SJamie Gritton found_prison: 2086b38ff370SJamie Gritton /* Get the parameters of the prison. */ 20876754ae25SJamie Gritton prison_hold(pr); 20882a4b2251SJamie Gritton drflags |= PD_DEREF; 2089b38ff370SJamie Gritton td->td_retval[0] = pr->pr_id; 2090b38ff370SJamie Gritton error = vfs_setopt(opts, "jid", &pr->pr_id, sizeof(pr->pr_id)); 2091b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 20922a4b2251SJamie Gritton goto done; 20930304c731SJamie Gritton i = (pr->pr_parent == mypr) ? 
0 : pr->pr_parent->pr_id; 20940304c731SJamie Gritton error = vfs_setopt(opts, "parent", &i, sizeof(i)); 2095b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 20962a4b2251SJamie Gritton goto done; 20970304c731SJamie Gritton error = vfs_setopts(opts, "name", prison_name(mypr, pr)); 20980304c731SJamie Gritton if (error != 0 && error != ENOENT) 20992a4b2251SJamie Gritton goto done; 21000304c731SJamie Gritton error = vfs_setopt(opts, "cpuset.id", &pr->pr_cpuset->cs_id, 2101b38ff370SJamie Gritton sizeof(pr->pr_cpuset->cs_id)); 2102b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21032a4b2251SJamie Gritton goto done; 21040304c731SJamie Gritton error = vfs_setopts(opts, "path", prison_path(mypr, pr)); 2105b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21062a4b2251SJamie Gritton goto done; 2107b38ff370SJamie Gritton #ifdef INET 2108b38ff370SJamie Gritton error = vfs_setopt_part(opts, "ip4.addr", pr->pr_ip4, 2109b38ff370SJamie Gritton pr->pr_ip4s * sizeof(*pr->pr_ip4)); 2110b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21112a4b2251SJamie Gritton goto done; 2112b38ff370SJamie Gritton #endif 2113b38ff370SJamie Gritton #ifdef INET6 2114b38ff370SJamie Gritton error = vfs_setopt_part(opts, "ip6.addr", pr->pr_ip6, 2115b38ff370SJamie Gritton pr->pr_ip6s * sizeof(*pr->pr_ip6)); 2116b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21172a4b2251SJamie Gritton goto done; 2118b38ff370SJamie Gritton #endif 2119b38ff370SJamie Gritton error = vfs_setopt(opts, "securelevel", &pr->pr_securelevel, 2120b38ff370SJamie Gritton sizeof(pr->pr_securelevel)); 2121b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21222a4b2251SJamie Gritton goto done; 2123b97457e2SJamie Gritton error = vfs_setopt(opts, "children.cur", &pr->pr_childcount, 2124b97457e2SJamie Gritton sizeof(pr->pr_childcount)); 2125b97457e2SJamie Gritton if (error != 0 && error != ENOENT) 21262a4b2251SJamie Gritton goto done; 2127b97457e2SJamie Gritton error = vfs_setopt(opts, 
"children.max", &pr->pr_childmax, 2128b97457e2SJamie Gritton sizeof(pr->pr_childmax)); 2129b97457e2SJamie Gritton if (error != 0 && error != ENOENT) 21302a4b2251SJamie Gritton goto done; 2131c1f19219SJamie Gritton error = vfs_setopts(opts, "host.hostname", pr->pr_hostname); 2132b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21332a4b2251SJamie Gritton goto done; 2134c1f19219SJamie Gritton error = vfs_setopts(opts, "host.domainname", pr->pr_domainname); 213576ca6f88SJamie Gritton if (error != 0 && error != ENOENT) 21362a4b2251SJamie Gritton goto done; 2137c1f19219SJamie Gritton error = vfs_setopts(opts, "host.hostuuid", pr->pr_hostuuid); 213876ca6f88SJamie Gritton if (error != 0 && error != ENOENT) 21392a4b2251SJamie Gritton goto done; 2140841c0c7eSNathan Whitehorn #ifdef COMPAT_FREEBSD32 2141a5c1afadSDmitry Chagin if (SV_PROC_FLAG(td->td_proc, SV_ILP32)) { 214276ca6f88SJamie Gritton uint32_t hid32 = pr->pr_hostid; 214376ca6f88SJamie Gritton 214476ca6f88SJamie Gritton error = vfs_setopt(opts, "host.hostid", &hid32, sizeof(hid32)); 214576ca6f88SJamie Gritton } else 214676ca6f88SJamie Gritton #endif 214776ca6f88SJamie Gritton error = vfs_setopt(opts, "host.hostid", &pr->pr_hostid, 214876ca6f88SJamie Gritton sizeof(pr->pr_hostid)); 214976ca6f88SJamie Gritton if (error != 0 && error != ENOENT) 21502a4b2251SJamie Gritton goto done; 21510304c731SJamie Gritton error = vfs_setopt(opts, "enforce_statfs", &pr->pr_enforce_statfs, 21520304c731SJamie Gritton sizeof(pr->pr_enforce_statfs)); 21530304c731SJamie Gritton if (error != 0 && error != ENOENT) 21542a4b2251SJamie Gritton goto done; 21550cc207a6SMartin Matuska error = vfs_setopt(opts, "devfs_ruleset", &pr->pr_devfs_rsnum, 21560cc207a6SMartin Matuska sizeof(pr->pr_devfs_rsnum)); 21570cc207a6SMartin Matuska if (error != 0 && error != ENOENT) 21582a4b2251SJamie Gritton goto done; 2159672756aaSJamie Gritton for (bf = pr_flag_bool; 2160672756aaSJamie Gritton bf < pr_flag_bool + nitems(pr_flag_bool); 2161672756aaSJamie 
Gritton bf++) { 2162672756aaSJamie Gritton i = (pr->pr_flags & bf->flag) ? 1 : 0; 2163672756aaSJamie Gritton error = vfs_setopt(opts, bf->name, &i, sizeof(i)); 2164b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21652a4b2251SJamie Gritton goto done; 2166b38ff370SJamie Gritton i = !i; 2167672756aaSJamie Gritton error = vfs_setopt(opts, bf->noname, &i, sizeof(i)); 2168b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21692a4b2251SJamie Gritton goto done; 21700304c731SJamie Gritton } 2171672756aaSJamie Gritton for (jsf = pr_flag_jailsys; 2172672756aaSJamie Gritton jsf < pr_flag_jailsys + nitems(pr_flag_jailsys); 2173672756aaSJamie Gritton jsf++) { 2174672756aaSJamie Gritton f = pr->pr_flags & (jsf->disable | jsf->new); 2175672756aaSJamie Gritton i = (f != 0 && f == jsf->disable) ? JAIL_SYS_DISABLE 2176672756aaSJamie Gritton : (f == jsf->new) ? JAIL_SYS_NEW 21777cbf7213SJamie Gritton : JAIL_SYS_INHERIT; 2178672756aaSJamie Gritton error = vfs_setopt(opts, jsf->name, &i, sizeof(i)); 21797cbf7213SJamie Gritton if (error != 0 && error != ENOENT) 21802a4b2251SJamie Gritton goto done; 21817cbf7213SJamie Gritton } 2182672756aaSJamie Gritton for (bf = pr_flag_allow; 21835d58f959SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && 21845d58f959SJamie Gritton atomic_load_int(&bf->flag) != 0; 2185672756aaSJamie Gritton bf++) { 2186672756aaSJamie Gritton i = (pr->pr_allow & bf->flag) ? 
1 : 0; 2187672756aaSJamie Gritton error = vfs_setopt(opts, bf->name, &i, sizeof(i)); 21880304c731SJamie Gritton if (error != 0 && error != ENOENT) 21892a4b2251SJamie Gritton goto done; 21900304c731SJamie Gritton i = !i; 2191672756aaSJamie Gritton error = vfs_setopt(opts, bf->noname, &i, sizeof(i)); 21920304c731SJamie Gritton if (error != 0 && error != ENOENT) 21932a4b2251SJamie Gritton goto done; 21940304c731SJamie Gritton } 219576ad42abSJamie Gritton i = !prison_isalive(pr); 2196b38ff370SJamie Gritton error = vfs_setopt(opts, "dying", &i, sizeof(i)); 2197b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 21982a4b2251SJamie Gritton goto done; 2199b38ff370SJamie Gritton i = !i; 2200b38ff370SJamie Gritton error = vfs_setopt(opts, "nodying", &i, sizeof(i)); 2201b38ff370SJamie Gritton if (error != 0 && error != ENOENT) 22022a4b2251SJamie Gritton goto done; 2203bd96bd15SIan Lepore error = vfs_setopt(opts, "osreldate", &pr->pr_osreldate, 2204bd96bd15SIan Lepore sizeof(pr->pr_osreldate)); 2205a1a4c1b0SIan Lepore if (error != 0 && error != ENOENT) 22062a4b2251SJamie Gritton goto done; 2207a1a4c1b0SIan Lepore error = vfs_setopts(opts, "osrelease", pr->pr_osrelease); 2208a1a4c1b0SIan Lepore if (error != 0 && error != ENOENT) 22092a4b2251SJamie Gritton goto done; 2210b38ff370SJamie Gritton 2211b38ff370SJamie Gritton /* Get the module parameters. */ 2212b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 22132a4b2251SJamie Gritton drflags &= ~PD_LOCKED; 2214b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_GET, opts); 2215b38ff370SJamie Gritton if (error) 22162a4b2251SJamie Gritton goto done; 22172a4b2251SJamie Gritton prison_deref(pr, drflags); 22182a4b2251SJamie Gritton pr = NULL; 22192a4b2251SJamie Gritton drflags = 0; 2220b38ff370SJamie Gritton 2221b38ff370SJamie Gritton /* By now, all parameters should have been noted. 
*/ 2222b38ff370SJamie Gritton TAILQ_FOREACH(opt, opts, link) { 2223b38ff370SJamie Gritton if (!opt->seen && strcmp(opt->name, "errmsg")) { 2224b38ff370SJamie Gritton error = EINVAL; 2225b38ff370SJamie Gritton vfs_opterror(opts, "unknown parameter: %s", opt->name); 22262a4b2251SJamie Gritton goto done; 2227b38ff370SJamie Gritton } 2228b38ff370SJamie Gritton } 2229b38ff370SJamie Gritton 2230b38ff370SJamie Gritton /* Write the fetched parameters back to userspace. */ 2231b38ff370SJamie Gritton error = 0; 2232b38ff370SJamie Gritton TAILQ_FOREACH(opt, opts, link) { 2233b38ff370SJamie Gritton if (opt->pos >= 0 && opt->pos != errmsg_pos) { 2234b38ff370SJamie Gritton pos = 2 * opt->pos + 1; 2235b38ff370SJamie Gritton optuio->uio_iov[pos].iov_len = opt->len; 2236b38ff370SJamie Gritton if (opt->value != NULL) { 2237b38ff370SJamie Gritton if (optuio->uio_segflg == UIO_SYSSPACE) { 2238b38ff370SJamie Gritton bcopy(opt->value, 2239b38ff370SJamie Gritton optuio->uio_iov[pos].iov_base, 2240b38ff370SJamie Gritton opt->len); 2241b38ff370SJamie Gritton } else { 2242b38ff370SJamie Gritton error = copyout(opt->value, 2243b38ff370SJamie Gritton optuio->uio_iov[pos].iov_base, 2244b38ff370SJamie Gritton opt->len); 2245b38ff370SJamie Gritton if (error) 2246b38ff370SJamie Gritton break; 2247b38ff370SJamie Gritton } 2248b38ff370SJamie Gritton } 2249b38ff370SJamie Gritton } 2250b38ff370SJamie Gritton } 2251b38ff370SJamie Gritton 22522a4b2251SJamie Gritton done: 22532a4b2251SJamie Gritton /* Release any temporary prison holds and/or locks. */ 22542a4b2251SJamie Gritton if (pr != NULL) 22552a4b2251SJamie Gritton prison_deref(pr, drflags); 22562a4b2251SJamie Gritton else if (drflags & PD_LIST_SLOCKED) 2257b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 2258b38ff370SJamie Gritton if (error && errmsg_pos >= 0) { 22592a4b2251SJamie Gritton /* Write the error message back to userspace. 
*/ 2260b38ff370SJamie Gritton vfs_getopt(opts, "errmsg", (void **)&errmsg, &errmsg_len); 2261b38ff370SJamie Gritton errmsg_pos = 2 * errmsg_pos + 1; 2262b38ff370SJamie Gritton if (errmsg_len > 0) { 2263b38ff370SJamie Gritton if (optuio->uio_segflg == UIO_SYSSPACE) 2264b38ff370SJamie Gritton bcopy(errmsg, 2265b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 2266b38ff370SJamie Gritton errmsg_len); 2267b38ff370SJamie Gritton else 2268b38ff370SJamie Gritton copyout(errmsg, 2269b38ff370SJamie Gritton optuio->uio_iov[errmsg_pos].iov_base, 2270b38ff370SJamie Gritton errmsg_len); 2271b38ff370SJamie Gritton } 2272b38ff370SJamie Gritton } 2273b38ff370SJamie Gritton vfs_freeopts(opts); 2274b38ff370SJamie Gritton return (error); 2275b38ff370SJamie Gritton } 2276b38ff370SJamie Gritton 2277b38ff370SJamie Gritton /* 2278b38ff370SJamie Gritton * struct jail_remove_args { 2279b38ff370SJamie Gritton * int jid; 2280b38ff370SJamie Gritton * }; 2281b38ff370SJamie Gritton */ 2282b38ff370SJamie Gritton int 22838451d0ddSKip Macy sys_jail_remove(struct thread *td, struct jail_remove_args *uap) 2284b38ff370SJamie Gritton { 2285c861373bSJamie Gritton struct prison *pr; 2286c861373bSJamie Gritton int error; 2287b38ff370SJamie Gritton 2288b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_REMOVE); 2289b38ff370SJamie Gritton if (error) 2290b38ff370SJamie Gritton return (error); 2291b38ff370SJamie Gritton 2292b38ff370SJamie Gritton sx_xlock(&allprison_lock); 22930304c731SJamie Gritton pr = prison_find_child(td->td_ucred->cr_prison, uap->jid); 2294b38ff370SJamie Gritton if (pr == NULL) { 2295b38ff370SJamie Gritton sx_xunlock(&allprison_lock); 2296b38ff370SJamie Gritton return (EINVAL); 2297b38ff370SJamie Gritton } 2298c861373bSJamie Gritton if (!prison_isalive(pr)) { 2299c861373bSJamie Gritton /* Silently ignore already-dying prisons. 
*/ 23000304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 2301c861373bSJamie Gritton sx_xunlock(&allprison_lock); 23020304c731SJamie Gritton return (0); 23030304c731SJamie Gritton } 2304c861373bSJamie Gritton prison_deref(pr, PD_KILL | PD_LOCKED | PD_LIST_XLOCKED); 2305c861373bSJamie Gritton return (0); 230675c13541SPoul-Henning Kamp } 230775c13541SPoul-Henning Kamp 2308fd7a8150SMike Barcroft /* 23099ddb7954SMike Barcroft * struct jail_attach_args { 23109ddb7954SMike Barcroft * int jid; 23119ddb7954SMike Barcroft * }; 2312fd7a8150SMike Barcroft */ 2313fd7a8150SMike Barcroft int 23148451d0ddSKip Macy sys_jail_attach(struct thread *td, struct jail_attach_args *uap) 2315fd7a8150SMike Barcroft { 2316b38ff370SJamie Gritton struct prison *pr; 2317b38ff370SJamie Gritton int error; 2318b38ff370SJamie Gritton 2319b38ff370SJamie Gritton error = priv_check(td, PRIV_JAIL_ATTACH); 2320b38ff370SJamie Gritton if (error) 2321b38ff370SJamie Gritton return (error); 2322b38ff370SJamie Gritton 2323f7496dcaSJamie Gritton sx_slock(&allprison_lock); 23240304c731SJamie Gritton pr = prison_find_child(td->td_ucred->cr_prison, uap->jid); 2325b38ff370SJamie Gritton if (pr == NULL) { 2326b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 2327b38ff370SJamie Gritton return (EINVAL); 2328b38ff370SJamie Gritton } 2329b38ff370SJamie Gritton 233076ad42abSJamie Gritton /* Do not allow a process to attach to a prison that is not alive. 
*/ 233176ad42abSJamie Gritton if (!prison_isalive(pr)) { 2332b38ff370SJamie Gritton mtx_unlock(&pr->pr_mtx); 2333b38ff370SJamie Gritton sx_sunlock(&allprison_lock); 2334b38ff370SJamie Gritton return (EINVAL); 2335b38ff370SJamie Gritton } 2336b38ff370SJamie Gritton 2337f7496dcaSJamie Gritton return (do_jail_attach(td, pr, PD_LOCKED | PD_LIST_SLOCKED)); 2338b38ff370SJamie Gritton } 2339b38ff370SJamie Gritton 2340b38ff370SJamie Gritton static int 2341f7496dcaSJamie Gritton do_jail_attach(struct thread *td, struct prison *pr, int drflags) 2342b38ff370SJamie Gritton { 2343fd7a8150SMike Barcroft struct proc *p; 2344fd7a8150SMike Barcroft struct ucred *newcred, *oldcred; 23455050aa86SKonstantin Belousov int error; 2346fd7a8150SMike Barcroft 2347f7496dcaSJamie Gritton mtx_assert(&pr->pr_mtx, MA_OWNED); 2348f7496dcaSJamie Gritton sx_assert(&allprison_lock, SX_LOCKED); 2349589e4c1dSJamie Gritton drflags &= PD_LOCK_FLAGS; 235057f22bd4SJacques Vidrine /* 235157f22bd4SJacques Vidrine * XXX: Note that there is a slight race here if two threads 235257f22bd4SJacques Vidrine * in the same privileged process attempt to attach to two 235357f22bd4SJacques Vidrine * different jails at the same time. It is important for 235457f22bd4SJacques Vidrine * user processes not to do this, or they might end up with 235557f22bd4SJacques Vidrine * a process root from one prison, but attached to the jail 235657f22bd4SJacques Vidrine * of another. 235757f22bd4SJacques Vidrine */ 23581158508aSJamie Gritton prison_hold(pr); 23596754ae25SJamie Gritton refcount_acquire(&pr->pr_uref); 2360f7496dcaSJamie Gritton drflags |= PD_DEREF | PD_DEUREF; 2361fd7a8150SMike Barcroft mtx_unlock(&pr->pr_mtx); 2362f7496dcaSJamie Gritton drflags &= ~PD_LOCKED; 2363b38ff370SJamie Gritton 2364b38ff370SJamie Gritton /* Let modules do whatever they need to prepare for attaching. 
*/ 2365b38ff370SJamie Gritton error = osd_jail_call(pr, PR_METHOD_ATTACH, td); 2366b38ff370SJamie Gritton if (error) { 2367f7496dcaSJamie Gritton prison_deref(pr, drflags); 2368b38ff370SJamie Gritton return (error); 2369b38ff370SJamie Gritton } 2370f7496dcaSJamie Gritton sx_unlock(&allprison_lock); 2371f7496dcaSJamie Gritton drflags &= ~(PD_LIST_SLOCKED | PD_LIST_XLOCKED); 2372fd7a8150SMike Barcroft 2373413628a7SBjoern A. Zeeb /* 2374413628a7SBjoern A. Zeeb * Reparent the newly attached process to this jail. 2375413628a7SBjoern A. Zeeb */ 2376b38ff370SJamie Gritton p = td->td_proc; 2377413628a7SBjoern A. Zeeb error = cpuset_setproc_update_set(p, pr->pr_cpuset); 2378413628a7SBjoern A. Zeeb if (error) 2379b38ff370SJamie Gritton goto e_revert_osd; 2380413628a7SBjoern A. Zeeb 2381cb05b60aSAttilio Rao vn_lock(pr->pr_root, LK_EXCLUSIVE | LK_RETRY); 2382fd7a8150SMike Barcroft if ((error = change_dir(pr->pr_root, td)) != 0) 2383fd7a8150SMike Barcroft goto e_unlock; 2384fd7a8150SMike Barcroft #ifdef MAC 238530d239bcSRobert Watson if ((error = mac_vnode_check_chroot(td->td_ucred, pr->pr_root))) 2386fd7a8150SMike Barcroft goto e_unlock; 2387fd7a8150SMike Barcroft #endif 2388b249ce48SMateusz Guzik VOP_UNLOCK(pr->pr_root); 2389d4380c0cSJamie Gritton if ((error = pwd_chroot_chdir(td, pr->pr_root))) 23905050aa86SKonstantin Belousov goto e_revert_osd; 2391fd7a8150SMike Barcroft 2392fd7a8150SMike Barcroft newcred = crget(); 2393fd7a8150SMike Barcroft PROC_LOCK(p); 23941fb6767dSJamie Gritton oldcred = crcopysafe(p, newcred); 239569c4ee54SJohn Baldwin newcred->cr_prison = pr; 2396daf63fd2SMateusz Guzik proc_set_cred(p, newcred); 23971fb6767dSJamie Gritton setsugid(p); 2398097055e2SEdward Tomasz Napierala #ifdef RACCT 2399097055e2SEdward Tomasz Napierala racct_proc_ucred_changed(p, oldcred, newcred); 2400f87beb93SAndriy Gapon crhold(newcred); 2401f87beb93SAndriy Gapon #endif 2402f87beb93SAndriy Gapon PROC_UNLOCK(p); 2403f87beb93SAndriy Gapon #ifdef RCTL 2404f87beb93SAndriy Gapon 
rctl_proc_ucred_changed(p, newcred); 2405f87beb93SAndriy Gapon crfree(newcred); 2406097055e2SEdward Tomasz Napierala #endif 2407f7496dcaSJamie Gritton prison_deref(oldcred->cr_prison, drflags); 2408fd7a8150SMike Barcroft crfree(oldcred); 2409cc7b7306SJamie Gritton 2410cc7b7306SJamie Gritton /* 2411cc7b7306SJamie Gritton * If the prison was killed while changing credentials, die along 2412cc7b7306SJamie Gritton * with it. 2413cc7b7306SJamie Gritton */ 2414cc7b7306SJamie Gritton if (!prison_isalive(pr)) { 2415cc7b7306SJamie Gritton PROC_LOCK(p); 2416cc7b7306SJamie Gritton kern_psignal(p, SIGKILL); 2417cc7b7306SJamie Gritton PROC_UNLOCK(p); 2418cc7b7306SJamie Gritton } 2419cc7b7306SJamie Gritton 2420fd7a8150SMike Barcroft return (0); 24211fb6767dSJamie Gritton 2422fd7a8150SMike Barcroft e_unlock: 2423b249ce48SMateusz Guzik VOP_UNLOCK(pr->pr_root); 2424b38ff370SJamie Gritton e_revert_osd: 2425b38ff370SJamie Gritton /* Tell modules this thread is still in its old jail after all. */ 24267f4e7248SJamie Gritton sx_slock(&allprison_lock); 2427f7496dcaSJamie Gritton drflags |= PD_LIST_SLOCKED; 24281fb6767dSJamie Gritton (void)osd_jail_call(td->td_ucred->cr_prison, PR_METHOD_ATTACH, td); 2429f7496dcaSJamie Gritton prison_deref(pr, drflags); 2430fd7a8150SMike Barcroft return (error); 2431fd7a8150SMike Barcroft } 2432fd7a8150SMike Barcroft 2433fd7a8150SMike Barcroft /* 2434fd7a8150SMike Barcroft * Returns a locked prison instance, or NULL on failure. 
2435fd7a8150SMike Barcroft */ 243654b369c1SPawel Jakub Dawidek struct prison * 2437fd7a8150SMike Barcroft prison_find(int prid) 2438fd7a8150SMike Barcroft { 2439fd7a8150SMike Barcroft struct prison *pr; 2440fd7a8150SMike Barcroft 2441dc68a633SPawel Jakub Dawidek sx_assert(&allprison_lock, SX_LOCKED); 2442b38ff370SJamie Gritton TAILQ_FOREACH(pr, &allprison, pr_list) { 2443f7496dcaSJamie Gritton if (pr->pr_id < prid) 2444f7496dcaSJamie Gritton continue; 24457de883c8SJamie Gritton if (pr->pr_id > prid) 24467de883c8SJamie Gritton break; 2447f7496dcaSJamie Gritton KASSERT(prison_isvalid(pr), ("Found invalid prison %p", pr)); 2448f7496dcaSJamie Gritton mtx_lock(&pr->pr_mtx); 2449f7496dcaSJamie Gritton return (pr); 2450fd7a8150SMike Barcroft } 2451fd7a8150SMike Barcroft return (NULL); 2452fd7a8150SMike Barcroft } 2453fd7a8150SMike Barcroft 2454b38ff370SJamie Gritton /* 24550304c731SJamie Gritton * Find a prison that is a descendant of mypr. Returns a locked prison or NULL. 2456b38ff370SJamie Gritton */ 2457b38ff370SJamie Gritton struct prison * 24580304c731SJamie Gritton prison_find_child(struct prison *mypr, int prid) 2459b38ff370SJamie Gritton { 24600304c731SJamie Gritton struct prison *pr; 24610304c731SJamie Gritton int descend; 2462b38ff370SJamie Gritton 2463b38ff370SJamie Gritton sx_assert(&allprison_lock, SX_LOCKED); 24640304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(mypr, pr, descend) { 24650304c731SJamie Gritton if (pr->pr_id == prid) { 2466f7496dcaSJamie Gritton KASSERT(prison_isvalid(pr), 2467f7496dcaSJamie Gritton ("Found invalid prison %p", pr)); 24680304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 24690304c731SJamie Gritton return (pr); 24700304c731SJamie Gritton } 24710304c731SJamie Gritton } 24720304c731SJamie Gritton return (NULL); 24730304c731SJamie Gritton } 24740304c731SJamie Gritton 24750304c731SJamie Gritton /* 24760304c731SJamie Gritton * Look for the name relative to mypr. Returns a locked prison or NULL. 
24770304c731SJamie Gritton */ 24780304c731SJamie Gritton struct prison * 24790304c731SJamie Gritton prison_find_name(struct prison *mypr, const char *name) 24800304c731SJamie Gritton { 24810304c731SJamie Gritton struct prison *pr, *deadpr; 24820304c731SJamie Gritton size_t mylen; 24830304c731SJamie Gritton int descend; 24840304c731SJamie Gritton 24850304c731SJamie Gritton sx_assert(&allprison_lock, SX_LOCKED); 24860304c731SJamie Gritton mylen = (mypr == &prison0) ? 0 : strlen(mypr->pr_name) + 1; 2487b38ff370SJamie Gritton deadpr = NULL; 24880304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(mypr, pr, descend) { 24890304c731SJamie Gritton if (!strcmp(pr->pr_name + mylen, name)) { 2490f7496dcaSJamie Gritton KASSERT(prison_isvalid(pr), 2491f7496dcaSJamie Gritton ("Found invalid prison %p", pr)); 2492f7496dcaSJamie Gritton if (prison_isalive(pr)) { 2493b38ff370SJamie Gritton mtx_lock(&pr->pr_mtx); 2494b38ff370SJamie Gritton return (pr); 2495f7496dcaSJamie Gritton } 2496b38ff370SJamie Gritton deadpr = pr; 2497b38ff370SJamie Gritton } 2498b38ff370SJamie Gritton } 24990304c731SJamie Gritton /* There was no valid prison - perhaps there was a dying one. */ 2500f7496dcaSJamie Gritton if (deadpr != NULL) 2501b38ff370SJamie Gritton mtx_lock(&deadpr->pr_mtx); 2502b38ff370SJamie Gritton return (deadpr); 2503b38ff370SJamie Gritton } 2504b38ff370SJamie Gritton 2505b38ff370SJamie Gritton /* 25060fe74ae6SJamie Gritton * See if a prison has the specific flag set. The prison should be locked, 25070fe74ae6SJamie Gritton * unless checking for flags that are only set at jail creation (such as 25080fe74ae6SJamie Gritton * PR_IP4 and PR_IP6), or only the single bit is examined, without regard 25090fe74ae6SJamie Gritton * to any other prison data. 
25100304c731SJamie Gritton */ 25110304c731SJamie Gritton int 25120304c731SJamie Gritton prison_flag(struct ucred *cred, unsigned flag) 25130304c731SJamie Gritton { 25140304c731SJamie Gritton 25150304c731SJamie Gritton return (cred->cr_prison->pr_flags & flag); 25160304c731SJamie Gritton } 25170304c731SJamie Gritton 25180304c731SJamie Gritton int 25190304c731SJamie Gritton prison_allow(struct ucred *cred, unsigned flag) 25200304c731SJamie Gritton { 25210304c731SJamie Gritton 25220fe74ae6SJamie Gritton return ((cred->cr_prison->pr_allow & flag) != 0); 25230304c731SJamie Gritton } 25240304c731SJamie Gritton 25250304c731SJamie Gritton /* 2526effad35eSJamie Gritton * Hold a prison reference, by incrementing pr_ref. It is generally 2527effad35eSJamie Gritton * an error to hold a prison that does not already have a reference. 2528effad35eSJamie Gritton * A prison record will remain valid as long as it has at least one 2529effad35eSJamie Gritton * reference, and will not be removed as long as either the prison 2530effad35eSJamie Gritton * mutex or the allprison lock is held (allprison_lock may be shared). 2531effad35eSJamie Gritton */ 2532effad35eSJamie Gritton void 2533effad35eSJamie Gritton prison_hold_locked(struct prison *pr) 2534effad35eSJamie Gritton { 2535effad35eSJamie Gritton 25366754ae25SJamie Gritton /* Locking is no longer required. 
*/ 25376754ae25SJamie Gritton prison_hold(pr); 2538effad35eSJamie Gritton } 2539effad35eSJamie Gritton 2540effad35eSJamie Gritton void 2541effad35eSJamie Gritton prison_hold(struct prison *pr) 2542effad35eSJamie Gritton { 25436754ae25SJamie Gritton #ifdef INVARIANTS 25446754ae25SJamie Gritton int was_valid = refcount_acquire_if_not_zero(&pr->pr_ref); 2545effad35eSJamie Gritton 25466754ae25SJamie Gritton KASSERT(was_valid, 25476754ae25SJamie Gritton ("Trying to hold dead prison %p (jid=%d).", pr, pr->pr_id)); 25486754ae25SJamie Gritton #else 25496754ae25SJamie Gritton refcount_acquire(&pr->pr_ref); 25506754ae25SJamie Gritton #endif 2551effad35eSJamie Gritton } 2552effad35eSJamie Gritton 2553effad35eSJamie Gritton /* 2554effad35eSJamie Gritton * Remove a prison reference. If that was the last reference, the 2555f7496dcaSJamie Gritton * prison will be removed (at a later time). 2556b38ff370SJamie Gritton */ 255791421ba2SRobert Watson void 25581ba4a712SPawel Jakub Dawidek prison_free_locked(struct prison *pr) 255991421ba2SRobert Watson { 256091421ba2SRobert Watson 25611ba4a712SPawel Jakub Dawidek mtx_assert(&pr->pr_mtx, MA_OWNED); 2562effad35eSJamie Gritton /* 2563f7496dcaSJamie Gritton * Locking is no longer required, but unlock because the caller 2564f7496dcaSJamie Gritton * expects it. 
2565effad35eSJamie Gritton */ 2566f7496dcaSJamie Gritton mtx_unlock(&pr->pr_mtx); 2567f7496dcaSJamie Gritton prison_free(pr); 2568effad35eSJamie Gritton } 2569c2cda609SPawel Jakub Dawidek 25701ba4a712SPawel Jakub Dawidek void 25711ba4a712SPawel Jakub Dawidek prison_free(struct prison *pr) 25721ba4a712SPawel Jakub Dawidek { 25731ba4a712SPawel Jakub Dawidek 25746754ae25SJamie Gritton KASSERT(refcount_load(&pr->pr_ref) > 0, 25756754ae25SJamie Gritton ("Trying to free dead prison %p (jid=%d).", 25766754ae25SJamie Gritton pr, pr->pr_id)); 2577f7496dcaSJamie Gritton if (!refcount_release_if_not_last(&pr->pr_ref)) { 2578f7496dcaSJamie Gritton /* 2579f7496dcaSJamie Gritton * Don't remove the last reference in this context, 2580f7496dcaSJamie Gritton * in case there are locks held. 2581f7496dcaSJamie Gritton */ 2582f7496dcaSJamie Gritton taskqueue_enqueue(taskqueue_thread, &pr->pr_task); 2583f7496dcaSJamie Gritton } 2584f7496dcaSJamie Gritton } 2585f7496dcaSJamie Gritton 2586f7496dcaSJamie Gritton static void 2587f7496dcaSJamie Gritton prison_free_not_last(struct prison *pr) 2588f7496dcaSJamie Gritton { 2589f7496dcaSJamie Gritton #ifdef INVARIANTS 2590f7496dcaSJamie Gritton int lastref; 2591f7496dcaSJamie Gritton 2592f7496dcaSJamie Gritton KASSERT(refcount_load(&pr->pr_ref) > 0, 2593f7496dcaSJamie Gritton ("Trying to free dead prison %p (jid=%d).", 2594f7496dcaSJamie Gritton pr, pr->pr_id)); 2595f7496dcaSJamie Gritton lastref = refcount_release(&pr->pr_ref); 2596f7496dcaSJamie Gritton KASSERT(!lastref, 2597f7496dcaSJamie Gritton ("prison_free_not_last freed last ref on prison %p (jid=%d).", 2598f7496dcaSJamie Gritton pr, pr->pr_id)); 2599f7496dcaSJamie Gritton #else 2600ee9b37aeSMateusz Guzik refcount_release(&pr->pr_ref); 2601f7496dcaSJamie Gritton #endif 26021ba4a712SPawel Jakub Dawidek } 26031ba4a712SPawel Jakub Dawidek 260473d9e52dSJamie Gritton /* 2605effad35eSJamie Gritton * Hold a a prison for user visibility, by incrementing pr_uref. 
2606effad35eSJamie Gritton * It is generally an error to hold a prison that isn't already 2607effad35eSJamie Gritton * user-visible, except through the the jail system calls. It is also 2608effad35eSJamie Gritton * an error to hold an invalid prison. A prison record will remain 2609effad35eSJamie Gritton * alive as long as it has at least one user reference, and will not 2610f7496dcaSJamie Gritton * be set to the dying state until the prison mutex and allprison_lock 2611f7496dcaSJamie Gritton * are both freed. 2612effad35eSJamie Gritton */ 2613effad35eSJamie Gritton void 2614effad35eSJamie Gritton prison_proc_hold(struct prison *pr) 2615effad35eSJamie Gritton { 26166754ae25SJamie Gritton #ifdef INVARIANTS 26176754ae25SJamie Gritton int was_alive = refcount_acquire_if_not_zero(&pr->pr_uref); 2618effad35eSJamie Gritton 26196754ae25SJamie Gritton KASSERT(was_alive, 2620effad35eSJamie Gritton ("Cannot add a process to a non-alive prison (jid=%d)", pr->pr_id)); 26216754ae25SJamie Gritton #else 26226754ae25SJamie Gritton refcount_acquire(&pr->pr_uref); 26236754ae25SJamie Gritton #endif 2624effad35eSJamie Gritton } 2625effad35eSJamie Gritton 2626effad35eSJamie Gritton /* 2627effad35eSJamie Gritton * Remove a prison user reference. If it was the last reference, the 2628effad35eSJamie Gritton * prison will be considered "dying", and may be removed once all of 2629effad35eSJamie Gritton * its references are dropped. 2630effad35eSJamie Gritton */ 2631effad35eSJamie Gritton void 2632effad35eSJamie Gritton prison_proc_free(struct prison *pr) 2633effad35eSJamie Gritton { 2634effad35eSJamie Gritton 26356754ae25SJamie Gritton /* 26366754ae25SJamie Gritton * Locking is only required when releasing the last reference. 26376754ae25SJamie Gritton * This allows assurance that a locked prison will remain alive 26386754ae25SJamie Gritton * until it is unlocked. 
26396754ae25SJamie Gritton */ 26406754ae25SJamie Gritton KASSERT(refcount_load(&pr->pr_uref) > 0, 2641effad35eSJamie Gritton ("Trying to kill a process in a dead prison (jid=%d)", pr->pr_id)); 2642195cd6aeSJamie Gritton if (!refcount_release_if_not_last(&pr->pr_uref)) { 2643effad35eSJamie Gritton /* 2644effad35eSJamie Gritton * Don't remove the last user reference in this context, 2645effad35eSJamie Gritton * which is expected to be a process that is not only locked, 2646effad35eSJamie Gritton * but also half dead. Add a reference so any calls to 2647effad35eSJamie Gritton * prison_free() won't re-submit the task. 2648effad35eSJamie Gritton */ 2649f7496dcaSJamie Gritton prison_hold(pr); 26501158508aSJamie Gritton mtx_lock(&pr->pr_mtx); 26511158508aSJamie Gritton KASSERT(!(pr->pr_flags & PR_COMPLETE_PROC), 26521158508aSJamie Gritton ("Redundant last reference in prison_proc_free (jid=%d)", 26531158508aSJamie Gritton pr->pr_id)); 26541158508aSJamie Gritton pr->pr_flags |= PR_COMPLETE_PROC; 26551158508aSJamie Gritton mtx_unlock(&pr->pr_mtx); 2656effad35eSJamie Gritton taskqueue_enqueue(taskqueue_thread, &pr->pr_task); 2657effad35eSJamie Gritton } 2658effad35eSJamie Gritton } 2659effad35eSJamie Gritton 2660c861373bSJamie Gritton static void 2661c861373bSJamie Gritton prison_proc_free_not_last(struct prison *pr) 2662c861373bSJamie Gritton { 2663c861373bSJamie Gritton #ifdef INVARIANTS 2664c861373bSJamie Gritton int lastref; 2665c861373bSJamie Gritton 2666c861373bSJamie Gritton KASSERT(refcount_load(&pr->pr_uref) > 0, 2667c861373bSJamie Gritton ("Trying to free dead prison %p (jid=%d).", 2668c861373bSJamie Gritton pr, pr->pr_id)); 2669c861373bSJamie Gritton lastref = refcount_release(&pr->pr_uref); 2670c861373bSJamie Gritton KASSERT(!lastref, 2671c861373bSJamie Gritton ("prison_proc_free_not_last freed last uref on prison %p (jid=%d).", 2672c861373bSJamie Gritton pr, pr->pr_id)); 2673c861373bSJamie Gritton #else 2674c861373bSJamie Gritton refcount_release(&pr->pr_uref); 
2675c861373bSJamie Gritton #endif 2676c861373bSJamie Gritton } 2677c861373bSJamie Gritton 2678effad35eSJamie Gritton /* 267973d9e52dSJamie Gritton * Complete a call to either prison_free or prison_proc_free. 268073d9e52dSJamie Gritton */ 2681c2cda609SPawel Jakub Dawidek static void 2682c2cda609SPawel Jakub Dawidek prison_complete(void *context, int pending) 2683c2cda609SPawel Jakub Dawidek { 268473d9e52dSJamie Gritton struct prison *pr = context; 2685f7496dcaSJamie Gritton int drflags; 2686b38ff370SJamie Gritton 2687effad35eSJamie Gritton /* 26881158508aSJamie Gritton * This could be called to release the last reference, or the last 26891158508aSJamie Gritton * user reference (plus the reference held in prison_proc_free). 2690effad35eSJamie Gritton */ 2691f7496dcaSJamie Gritton drflags = prison_lock_xlock(pr, PD_DEREF); 26921158508aSJamie Gritton if (pr->pr_flags & PR_COMPLETE_PROC) { 26931158508aSJamie Gritton pr->pr_flags &= ~PR_COMPLETE_PROC; 2694f7496dcaSJamie Gritton drflags |= PD_DEUREF; 26951158508aSJamie Gritton } 2696f7496dcaSJamie Gritton prison_deref(pr, drflags); 2697b38ff370SJamie Gritton } 2698b38ff370SJamie Gritton 2699b38ff370SJamie Gritton /* 2700effad35eSJamie Gritton * Remove a prison reference and/or user reference (usually). 2701effad35eSJamie Gritton * This assumes context that allows sleeping (for allprison_lock), 2702effad35eSJamie Gritton * with no non-sleeping locks held, except perhaps the prison itself. 2703effad35eSJamie Gritton * If there are no more references, release and delist the prison. 2704effad35eSJamie Gritton * On completion, the prison lock and the allprison lock are both 2705effad35eSJamie Gritton * unlocked. 
2706b38ff370SJamie Gritton */ 2707b38ff370SJamie Gritton static void 2708b38ff370SJamie Gritton prison_deref(struct prison *pr, int flags) 2709b38ff370SJamie Gritton { 27106e1d1bfcSJamie Gritton struct prisonlist freeprison; 2711c861373bSJamie Gritton struct prison *killpr, *rpr, *ppr, *tpr; 2712c861373bSJamie Gritton struct proc *p; 2713c2cda609SPawel Jakub Dawidek 2714c861373bSJamie Gritton killpr = NULL; 27156e1d1bfcSJamie Gritton TAILQ_INIT(&freeprison); 27166e1d1bfcSJamie Gritton /* 27176e1d1bfcSJamie Gritton * Release this prison as requested, which may cause its parent 27186e1d1bfcSJamie Gritton * to be released, and then maybe its grandparent, etc. 27196e1d1bfcSJamie Gritton */ 27200304c731SJamie Gritton for (;;) { 2721c861373bSJamie Gritton if (flags & PD_KILL) { 2722c861373bSJamie Gritton /* Kill the prison and its descendents. */ 2723589e4c1dSJamie Gritton KASSERT(pr != &prison0, 2724589e4c1dSJamie Gritton ("prison_deref trying to kill prison0")); 2725c861373bSJamie Gritton if (!(flags & PD_DEREF)) { 2726c861373bSJamie Gritton prison_hold(pr); 2727c861373bSJamie Gritton flags |= PD_DEREF; 2728c861373bSJamie Gritton } 2729c861373bSJamie Gritton flags = prison_lock_xlock(pr, flags); 2730c861373bSJamie Gritton prison_deref_kill(pr, &freeprison); 2731c861373bSJamie Gritton } 2732e6d5cb63SJamie Gritton if (flags & PD_DEUREF) { 2733f7496dcaSJamie Gritton /* Drop a user reference. 
*/ 27346754ae25SJamie Gritton KASSERT(refcount_load(&pr->pr_uref) > 0, 273573d9e52dSJamie Gritton ("prison_deref PD_DEUREF on a dead prison (jid=%d)", 273673d9e52dSJamie Gritton pr->pr_id)); 2737f7496dcaSJamie Gritton if (!refcount_release_if_not_last(&pr->pr_uref)) { 2738f7496dcaSJamie Gritton if (!(flags & PD_DEREF)) { 2739f7496dcaSJamie Gritton prison_hold(pr); 2740f7496dcaSJamie Gritton flags |= PD_DEREF; 2741f7496dcaSJamie Gritton } 2742f7496dcaSJamie Gritton flags = prison_lock_xlock(pr, flags); 27431158508aSJamie Gritton if (refcount_release(&pr->pr_uref) && 27441158508aSJamie Gritton pr->pr_state == PRISON_STATE_ALIVE) { 2745f7496dcaSJamie Gritton /* 2746f7496dcaSJamie Gritton * When the last user references goes, 2747f7496dcaSJamie Gritton * this becomes a dying prison. 2748f7496dcaSJamie Gritton */ 2749f7496dcaSJamie Gritton KASSERT( 2750f7496dcaSJamie Gritton refcount_load(&prison0.pr_uref) > 0, 27516754ae25SJamie Gritton ("prison0 pr_uref=0")); 27521158508aSJamie Gritton pr->pr_state = PRISON_STATE_DYING; 2753f7496dcaSJamie Gritton mtx_unlock(&pr->pr_mtx); 2754f7496dcaSJamie Gritton flags &= ~PD_LOCKED; 2755f7496dcaSJamie Gritton (void)osd_jail_call(pr, 2756f7496dcaSJamie Gritton PR_METHOD_REMOVE, NULL); 2757f7496dcaSJamie Gritton } 2758f7496dcaSJamie Gritton } 2759f7496dcaSJamie Gritton } 2760c861373bSJamie Gritton if (flags & PD_KILL) { 2761c861373bSJamie Gritton /* 2762c861373bSJamie Gritton * Any remaining user references are probably processes 2763c861373bSJamie Gritton * that need to be killed, either in this prison or its 2764c861373bSJamie Gritton * descendants. 2765c861373bSJamie Gritton */ 2766c861373bSJamie Gritton if (refcount_load(&pr->pr_uref) > 0) 2767c861373bSJamie Gritton killpr = pr; 2768589e4c1dSJamie Gritton /* Make sure the parent prison doesn't get killed. */ 2769589e4c1dSJamie Gritton flags &= ~PD_KILL; 2770c861373bSJamie Gritton } 277173d9e52dSJamie Gritton if (flags & PD_DEREF) { 2772f7496dcaSJamie Gritton /* Drop a reference. 
*/ 27736754ae25SJamie Gritton KASSERT(refcount_load(&pr->pr_ref) > 0, 277473d9e52dSJamie Gritton ("prison_deref PD_DEREF on a dead prison (jid=%d)", 277573d9e52dSJamie Gritton pr->pr_id)); 2776f7496dcaSJamie Gritton if (!refcount_release_if_not_last(&pr->pr_ref)) { 2777f7496dcaSJamie Gritton flags = prison_lock_xlock(pr, flags); 2778f7496dcaSJamie Gritton if (refcount_release(&pr->pr_ref)) { 2779cc5fd8c7SJamie Gritton /* 2780f7496dcaSJamie Gritton * When the last reference goes, 2781f7496dcaSJamie Gritton * unlink the prison and set it aside. 2782cc5fd8c7SJamie Gritton */ 2783f7496dcaSJamie Gritton KASSERT( 2784f7496dcaSJamie Gritton refcount_load(&pr->pr_uref) == 0, 2785f7496dcaSJamie Gritton ("prison_deref: last ref, " 2786f7496dcaSJamie Gritton "but still has %d urefs (jid=%d)", 2787f7496dcaSJamie Gritton pr->pr_uref, pr->pr_id)); 2788f7496dcaSJamie Gritton KASSERT( 2789f7496dcaSJamie Gritton refcount_load(&prison0.pr_ref) != 0, 2790f7496dcaSJamie Gritton ("prison0 pr_ref=0")); 27911158508aSJamie Gritton pr->pr_state = PRISON_STATE_INVALID; 2792b38ff370SJamie Gritton TAILQ_REMOVE(&allprison, pr, pr_list); 27930304c731SJamie Gritton LIST_REMOVE(pr, pr_sibling); 2794f7496dcaSJamie Gritton TAILQ_INSERT_TAIL(&freeprison, pr, 2795f7496dcaSJamie Gritton pr_list); 2796f7496dcaSJamie Gritton for (ppr = pr->pr_parent; 2797f7496dcaSJamie Gritton ppr != NULL; 2798f7496dcaSJamie Gritton ppr = ppr->pr_parent) 2799f7496dcaSJamie Gritton ppr->pr_childcount--; 2800f7496dcaSJamie Gritton /* 2801f7496dcaSJamie Gritton * Removing a prison frees references 2802f7496dcaSJamie Gritton * from its parent. 
2803f7496dcaSJamie Gritton */ 2804f7496dcaSJamie Gritton mtx_unlock(&pr->pr_mtx); 2805f7496dcaSJamie Gritton flags &= ~PD_LOCKED; 28066e1d1bfcSJamie Gritton pr = pr->pr_parent; 28076e1d1bfcSJamie Gritton flags |= PD_DEREF | PD_DEUREF; 2808f7496dcaSJamie Gritton continue; 2809f7496dcaSJamie Gritton } 2810f7496dcaSJamie Gritton } 2811f7496dcaSJamie Gritton } 2812f7496dcaSJamie Gritton break; 28136e1d1bfcSJamie Gritton } 28146e1d1bfcSJamie Gritton 28156e1d1bfcSJamie Gritton /* Release all the prison locks. */ 2816f7496dcaSJamie Gritton if (flags & PD_LOCKED) 2817f7496dcaSJamie Gritton mtx_unlock(&pr->pr_mtx); 28186e1d1bfcSJamie Gritton if (flags & PD_LIST_SLOCKED) 28196e1d1bfcSJamie Gritton sx_sunlock(&allprison_lock); 28206e1d1bfcSJamie Gritton else if (flags & PD_LIST_XLOCKED) 28216e1d1bfcSJamie Gritton sx_xunlock(&allprison_lock); 28226e1d1bfcSJamie Gritton 2823c861373bSJamie Gritton /* Kill any processes attached to a killed prison. */ 2824c861373bSJamie Gritton if (killpr != NULL) { 2825c861373bSJamie Gritton sx_slock(&allproc_lock); 2826c861373bSJamie Gritton FOREACH_PROC_IN_SYSTEM(p) { 2827c861373bSJamie Gritton PROC_LOCK(p); 2828c861373bSJamie Gritton if (p->p_state != PRS_NEW && p->p_ucred != NULL) { 2829c861373bSJamie Gritton for (ppr = p->p_ucred->cr_prison; 2830c861373bSJamie Gritton ppr != &prison0; 2831c861373bSJamie Gritton ppr = ppr->pr_parent) 2832c861373bSJamie Gritton if (ppr == killpr) { 2833c861373bSJamie Gritton kern_psignal(p, SIGKILL); 2834c861373bSJamie Gritton break; 2835c861373bSJamie Gritton } 2836c861373bSJamie Gritton } 2837c861373bSJamie Gritton PROC_UNLOCK(p); 2838c861373bSJamie Gritton } 2839c861373bSJamie Gritton sx_sunlock(&allproc_lock); 2840c861373bSJamie Gritton } 2841c861373bSJamie Gritton 28426e1d1bfcSJamie Gritton /* 28436e1d1bfcSJamie Gritton * Finish removing any unreferenced prisons, which couldn't happen 28446e1d1bfcSJamie Gritton * while allprison_lock was held (to avoid a LOR on vrele). 
28456e1d1bfcSJamie Gritton */ 28466e1d1bfcSJamie Gritton TAILQ_FOREACH_SAFE(rpr, &freeprison, pr_list, tpr) { 28476e1d1bfcSJamie Gritton #ifdef VIMAGE 28486e1d1bfcSJamie Gritton if (rpr->pr_vnet != rpr->pr_parent->pr_vnet) 28496e1d1bfcSJamie Gritton vnet_destroy(rpr->pr_vnet); 28506e1d1bfcSJamie Gritton #endif 28516e1d1bfcSJamie Gritton if (rpr->pr_root != NULL) 28526e1d1bfcSJamie Gritton vrele(rpr->pr_root); 28536e1d1bfcSJamie Gritton mtx_destroy(&rpr->pr_mtx); 28546e1d1bfcSJamie Gritton #ifdef INET 28556e1d1bfcSJamie Gritton free(rpr->pr_ip4, M_PRISON); 28566e1d1bfcSJamie Gritton #endif 28576e1d1bfcSJamie Gritton #ifdef INET6 28586e1d1bfcSJamie Gritton free(rpr->pr_ip6, M_PRISON); 28596e1d1bfcSJamie Gritton #endif 28606e1d1bfcSJamie Gritton if (rpr->pr_cpuset != NULL) 28616e1d1bfcSJamie Gritton cpuset_rel(rpr->pr_cpuset); 28626e1d1bfcSJamie Gritton osd_jail_exit(rpr); 28636e1d1bfcSJamie Gritton #ifdef RACCT 28646e1d1bfcSJamie Gritton if (racct_enable) 28656e1d1bfcSJamie Gritton prison_racct_detach(rpr); 28666e1d1bfcSJamie Gritton #endif 2867f7496dcaSJamie Gritton TAILQ_REMOVE(&freeprison, rpr, pr_list); 28686e1d1bfcSJamie Gritton free(rpr, M_PRISON); 28690304c731SJamie Gritton } 2870b3059e09SRobert Watson } 2871b3059e09SRobert Watson 2872413628a7SBjoern A. Zeeb /* 2873c861373bSJamie Gritton * Kill the prison and its descendants. Mark them as dying, clear the 2874c861373bSJamie Gritton * persist flag, and call module remove methods. 2875c861373bSJamie Gritton */ 2876c861373bSJamie Gritton static void 2877c861373bSJamie Gritton prison_deref_kill(struct prison *pr, struct prisonlist *freeprison) 2878c861373bSJamie Gritton { 2879c861373bSJamie Gritton struct prison *cpr, *ppr, *rpr; 2880c861373bSJamie Gritton bool descend; 2881c861373bSJamie Gritton 2882c861373bSJamie Gritton /* 2883c861373bSJamie Gritton * Unlike the descendants, the target prison can be killed 2884c861373bSJamie Gritton * even if it is currently dying. 
This is useful for failed 2885c861373bSJamie Gritton * creation in jail_set(2). 2886c861373bSJamie Gritton */ 2887c861373bSJamie Gritton KASSERT(refcount_load(&pr->pr_ref) > 0, 2888c861373bSJamie Gritton ("Trying to kill dead prison %p (jid=%d).", 2889c861373bSJamie Gritton pr, pr->pr_id)); 2890c861373bSJamie Gritton refcount_acquire(&pr->pr_uref); 2891c861373bSJamie Gritton pr->pr_state = PRISON_STATE_DYING; 2892c861373bSJamie Gritton mtx_unlock(&pr->pr_mtx); 2893c861373bSJamie Gritton 2894c861373bSJamie Gritton rpr = NULL; 2895c861373bSJamie Gritton FOREACH_PRISON_DESCENDANT_PRE_POST(pr, cpr, descend) { 2896c861373bSJamie Gritton if (descend) { 2897c861373bSJamie Gritton if (!prison_isalive(cpr)) { 2898c861373bSJamie Gritton descend = false; 2899c861373bSJamie Gritton continue; 2900c861373bSJamie Gritton } 2901c861373bSJamie Gritton prison_hold(cpr); 2902c861373bSJamie Gritton prison_proc_hold(cpr); 2903c861373bSJamie Gritton mtx_lock(&cpr->pr_mtx); 2904c861373bSJamie Gritton cpr->pr_state = PRISON_STATE_DYING; 2905c861373bSJamie Gritton cpr->pr_flags |= PR_REMOVE; 2906c861373bSJamie Gritton mtx_unlock(&cpr->pr_mtx); 2907c861373bSJamie Gritton continue; 2908c861373bSJamie Gritton } 2909c861373bSJamie Gritton if (!(cpr->pr_flags & PR_REMOVE)) 2910c861373bSJamie Gritton continue; 2911c861373bSJamie Gritton (void)osd_jail_call(cpr, PR_METHOD_REMOVE, NULL); 2912c861373bSJamie Gritton mtx_lock(&cpr->pr_mtx); 2913c861373bSJamie Gritton cpr->pr_flags &= ~PR_REMOVE; 2914c861373bSJamie Gritton if (cpr->pr_flags & PR_PERSIST) { 2915c861373bSJamie Gritton cpr->pr_flags &= ~PR_PERSIST; 2916c861373bSJamie Gritton prison_proc_free_not_last(cpr); 2917c861373bSJamie Gritton prison_free_not_last(cpr); 2918c861373bSJamie Gritton } 2919c861373bSJamie Gritton (void)refcount_release(&cpr->pr_uref); 2920c861373bSJamie Gritton if (refcount_release(&cpr->pr_ref)) { 2921c861373bSJamie Gritton /* 2922c861373bSJamie Gritton * When the last reference goes, unlink the prison 
2923c861373bSJamie Gritton * and set it aside for prison_deref() to handle. 2924c861373bSJamie Gritton * Delay unlinking the sibling list to keep the loop 2925c861373bSJamie Gritton * safe. 2926c861373bSJamie Gritton */ 2927c861373bSJamie Gritton if (rpr != NULL) 2928c861373bSJamie Gritton LIST_REMOVE(rpr, pr_sibling); 2929c861373bSJamie Gritton rpr = cpr; 2930c861373bSJamie Gritton rpr->pr_state = PRISON_STATE_INVALID; 2931c861373bSJamie Gritton TAILQ_REMOVE(&allprison, rpr, pr_list); 2932c861373bSJamie Gritton TAILQ_INSERT_TAIL(freeprison, rpr, pr_list); 2933c861373bSJamie Gritton /* 2934c861373bSJamie Gritton * Removing a prison frees references from its parent. 2935c861373bSJamie Gritton */ 2936c861373bSJamie Gritton ppr = rpr->pr_parent; 2937c861373bSJamie Gritton prison_proc_free_not_last(ppr); 2938c861373bSJamie Gritton prison_free_not_last(ppr); 2939c861373bSJamie Gritton for (; ppr != NULL; ppr = ppr->pr_parent) 2940c861373bSJamie Gritton ppr->pr_childcount--; 2941c861373bSJamie Gritton } 2942c861373bSJamie Gritton mtx_unlock(&cpr->pr_mtx); 2943c861373bSJamie Gritton } 2944c861373bSJamie Gritton if (rpr != NULL) 2945c861373bSJamie Gritton LIST_REMOVE(rpr, pr_sibling); 2946c861373bSJamie Gritton 2947c861373bSJamie Gritton (void)osd_jail_call(pr, PR_METHOD_REMOVE, NULL); 2948c861373bSJamie Gritton mtx_lock(&pr->pr_mtx); 2949c861373bSJamie Gritton if (pr->pr_flags & PR_PERSIST) { 2950c861373bSJamie Gritton pr->pr_flags &= ~PR_PERSIST; 2951c861373bSJamie Gritton prison_proc_free_not_last(pr); 2952c861373bSJamie Gritton prison_free_not_last(pr); 2953c861373bSJamie Gritton } 2954c861373bSJamie Gritton (void)refcount_release(&pr->pr_uref); 2955c861373bSJamie Gritton } 2956c861373bSJamie Gritton 2957c861373bSJamie Gritton /* 2958f7496dcaSJamie Gritton * Given the current locking state in the flags, make sure allprison_lock 2959f7496dcaSJamie Gritton * is held exclusive, and the prison is locked. Return flags indicating 2960f7496dcaSJamie Gritton * the new state. 
2961f7496dcaSJamie Gritton */ 2962f7496dcaSJamie Gritton static int 2963f7496dcaSJamie Gritton prison_lock_xlock(struct prison *pr, int flags) 2964f7496dcaSJamie Gritton { 2965f7496dcaSJamie Gritton 2966f7496dcaSJamie Gritton if (!(flags & PD_LIST_XLOCKED)) { 2967f7496dcaSJamie Gritton /* 2968f7496dcaSJamie Gritton * Get allprison_lock, which may be an upgrade, 2969f7496dcaSJamie Gritton * and may require unlocking the prison. 2970f7496dcaSJamie Gritton */ 2971f7496dcaSJamie Gritton if (flags & PD_LOCKED) { 2972f7496dcaSJamie Gritton mtx_unlock(&pr->pr_mtx); 2973f7496dcaSJamie Gritton flags &= ~PD_LOCKED; 2974f7496dcaSJamie Gritton } 2975f7496dcaSJamie Gritton if (flags & PD_LIST_SLOCKED) { 2976f7496dcaSJamie Gritton if (!sx_try_upgrade(&allprison_lock)) { 2977f7496dcaSJamie Gritton sx_sunlock(&allprison_lock); 2978f7496dcaSJamie Gritton sx_xlock(&allprison_lock); 2979f7496dcaSJamie Gritton } 2980f7496dcaSJamie Gritton flags &= ~PD_LIST_SLOCKED; 2981f7496dcaSJamie Gritton } else 2982f7496dcaSJamie Gritton sx_xlock(&allprison_lock); 2983f7496dcaSJamie Gritton flags |= PD_LIST_XLOCKED; 2984f7496dcaSJamie Gritton } 2985f7496dcaSJamie Gritton if (!(flags & PD_LOCKED)) { 2986f7496dcaSJamie Gritton /* Lock the prison mutex. */ 2987f7496dcaSJamie Gritton mtx_lock(&pr->pr_mtx); 2988f7496dcaSJamie Gritton flags |= PD_LOCKED; 2989f7496dcaSJamie Gritton } 2990f7496dcaSJamie Gritton return flags; 2991f7496dcaSJamie Gritton } 2992f7496dcaSJamie Gritton 2993f7496dcaSJamie Gritton /* 29940fe74ae6SJamie Gritton * Set or clear a permission bit in the pr_allow field, passing restrictions 29950fe74ae6SJamie Gritton * (cleared permission) down to child jails. 
29960fe74ae6SJamie Gritton */ 29970fe74ae6SJamie Gritton void 29980fe74ae6SJamie Gritton prison_set_allow(struct ucred *cred, unsigned flag, int enable) 29990fe74ae6SJamie Gritton { 30000fe74ae6SJamie Gritton struct prison *pr; 30010fe74ae6SJamie Gritton 30020fe74ae6SJamie Gritton pr = cred->cr_prison; 30030fe74ae6SJamie Gritton sx_slock(&allprison_lock); 30040fe74ae6SJamie Gritton mtx_lock(&pr->pr_mtx); 30050fe74ae6SJamie Gritton prison_set_allow_locked(pr, flag, enable); 30060fe74ae6SJamie Gritton mtx_unlock(&pr->pr_mtx); 30070fe74ae6SJamie Gritton sx_sunlock(&allprison_lock); 30080fe74ae6SJamie Gritton } 30090fe74ae6SJamie Gritton 30100fe74ae6SJamie Gritton static void 30110fe74ae6SJamie Gritton prison_set_allow_locked(struct prison *pr, unsigned flag, int enable) 30120fe74ae6SJamie Gritton { 30130fe74ae6SJamie Gritton struct prison *cpr; 30140fe74ae6SJamie Gritton int descend; 30150fe74ae6SJamie Gritton 30160fe74ae6SJamie Gritton if (enable != 0) 30170fe74ae6SJamie Gritton pr->pr_allow |= flag; 30180fe74ae6SJamie Gritton else { 30190fe74ae6SJamie Gritton pr->pr_allow &= ~flag; 30200fe74ae6SJamie Gritton FOREACH_PRISON_DESCENDANT_LOCKED(pr, cpr, descend) 30210fe74ae6SJamie Gritton cpr->pr_allow &= ~flag; 30220fe74ae6SJamie Gritton } 30230fe74ae6SJamie Gritton } 30240fe74ae6SJamie Gritton 30250fe74ae6SJamie Gritton /* 3026ca04ba64SJamie Gritton * Check if a jail supports the given address family. 3027ca04ba64SJamie Gritton * 3028ca04ba64SJamie Gritton * Returns 0 if not jailed or the address family is supported, EAFNOSUPPORT 3029ca04ba64SJamie Gritton * if not. 
3030ca04ba64SJamie Gritton */ 3031ca04ba64SJamie Gritton int 3032ca04ba64SJamie Gritton prison_check_af(struct ucred *cred, int af) 3033ca04ba64SJamie Gritton { 30340304c731SJamie Gritton struct prison *pr; 3035ca04ba64SJamie Gritton int error; 3036ca04ba64SJamie Gritton 3037ca04ba64SJamie Gritton KASSERT(cred != NULL, ("%s: cred is NULL", __func__)); 3038ca04ba64SJamie Gritton 30390304c731SJamie Gritton pr = cred->cr_prison; 3040499650a0SJamie Gritton #ifdef VIMAGE 30416bb79563SJamie Gritton /* Prisons with their own network stack are not limited. */ 3042de0bd6f7SBjoern A. Zeeb if (prison_owns_vnet(cred)) 30436bb79563SJamie Gritton return (0); 3044499650a0SJamie Gritton #endif 30456bb79563SJamie Gritton 3046ca04ba64SJamie Gritton error = 0; 3047ca04ba64SJamie Gritton switch (af) 3048ca04ba64SJamie Gritton { 3049ca04ba64SJamie Gritton #ifdef INET 3050ca04ba64SJamie Gritton case AF_INET: 30510304c731SJamie Gritton if (pr->pr_flags & PR_IP4) 30520304c731SJamie Gritton { 30530304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 30540304c731SJamie Gritton if ((pr->pr_flags & PR_IP4) && pr->pr_ip4 == NULL) 3055ca04ba64SJamie Gritton error = EAFNOSUPPORT; 30560304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 30570304c731SJamie Gritton } 3058ca04ba64SJamie Gritton break; 3059ca04ba64SJamie Gritton #endif 3060ca04ba64SJamie Gritton #ifdef INET6 3061ca04ba64SJamie Gritton case AF_INET6: 30620304c731SJamie Gritton if (pr->pr_flags & PR_IP6) 30630304c731SJamie Gritton { 30640304c731SJamie Gritton mtx_lock(&pr->pr_mtx); 30650304c731SJamie Gritton if ((pr->pr_flags & PR_IP6) && pr->pr_ip6 == NULL) 3066ca04ba64SJamie Gritton error = EAFNOSUPPORT; 30670304c731SJamie Gritton mtx_unlock(&pr->pr_mtx); 30680304c731SJamie Gritton } 3069ca04ba64SJamie Gritton break; 3070ca04ba64SJamie Gritton #endif 3071ca04ba64SJamie Gritton case AF_LOCAL: 3072ca04ba64SJamie Gritton case AF_ROUTE: 3073ca04ba64SJamie Gritton break; 3074ca04ba64SJamie Gritton default: 30750304c731SJamie Gritton if (!(pr->pr_allow 
& PR_ALLOW_SOCKET_AF)) 3076ca04ba64SJamie Gritton error = EAFNOSUPPORT; 3077ca04ba64SJamie Gritton } 3078ca04ba64SJamie Gritton return (error); 3079ca04ba64SJamie Gritton } 3080ca04ba64SJamie Gritton 3081ca04ba64SJamie Gritton /* 3082413628a7SBjoern A. Zeeb * Check if given address belongs to the jail referenced by cred (wrapper to 3083413628a7SBjoern A. Zeeb * prison_check_ip[46]). 3084413628a7SBjoern A. Zeeb * 30850304c731SJamie Gritton * Returns 0 if jail doesn't restrict the address family or if address belongs 30860304c731SJamie Gritton * to jail, EADDRNOTAVAIL if the address doesn't belong, or EAFNOSUPPORT if 30870304c731SJamie Gritton * the jail doesn't allow the address family. IPv4 Address passed in in NBO. 3088413628a7SBjoern A. Zeeb */ 3089413628a7SBjoern A. Zeeb int 3090c83dda36SAlexander V. Chernikov prison_if(struct ucred *cred, const struct sockaddr *sa) 309175c13541SPoul-Henning Kamp { 3092413628a7SBjoern A. Zeeb #ifdef INET 3093c83dda36SAlexander V. Chernikov const struct sockaddr_in *sai; 3094413628a7SBjoern A. Zeeb #endif 3095413628a7SBjoern A. Zeeb #ifdef INET6 3096c83dda36SAlexander V. Chernikov const struct sockaddr_in6 *sai6; 3097413628a7SBjoern A. Zeeb #endif 3098b89e82ddSJamie Gritton int error; 309975c13541SPoul-Henning Kamp 3100413628a7SBjoern A. Zeeb KASSERT(cred != NULL, ("%s: cred is NULL", __func__)); 3101413628a7SBjoern A. Zeeb KASSERT(sa != NULL, ("%s: sa is NULL", __func__)); 3102413628a7SBjoern A. Zeeb 3103de0bd6f7SBjoern A. Zeeb #ifdef VIMAGE 3104de0bd6f7SBjoern A. Zeeb if (prison_owns_vnet(cred)) 3105de0bd6f7SBjoern A. Zeeb return (0); 3106de0bd6f7SBjoern A. Zeeb #endif 3107de0bd6f7SBjoern A. Zeeb 3108b89e82ddSJamie Gritton error = 0; 3109413628a7SBjoern A. Zeeb switch (sa->sa_family) 3110413628a7SBjoern A. Zeeb { 3111413628a7SBjoern A. Zeeb #ifdef INET 3112413628a7SBjoern A. Zeeb case AF_INET: 3113c83dda36SAlexander V. 
Chernikov sai = (const struct sockaddr_in *)sa; 3114b89e82ddSJamie Gritton error = prison_check_ip4(cred, &sai->sin_addr); 3115413628a7SBjoern A. Zeeb break; 3116413628a7SBjoern A. Zeeb #endif 3117413628a7SBjoern A. Zeeb #ifdef INET6 3118413628a7SBjoern A. Zeeb case AF_INET6: 3119c83dda36SAlexander V. Chernikov sai6 = (const struct sockaddr_in6 *)sa; 3120b89e82ddSJamie Gritton error = prison_check_ip6(cred, &sai6->sin6_addr); 3121413628a7SBjoern A. Zeeb break; 3122413628a7SBjoern A. Zeeb #endif 3123413628a7SBjoern A. Zeeb default: 31240304c731SJamie Gritton if (!(cred->cr_prison->pr_allow & PR_ALLOW_SOCKET_AF)) 3125b89e82ddSJamie Gritton error = EAFNOSUPPORT; 3126413628a7SBjoern A. Zeeb } 3127b89e82ddSJamie Gritton return (error); 312875c13541SPoul-Henning Kamp } 312991421ba2SRobert Watson 313091421ba2SRobert Watson /* 313191421ba2SRobert Watson * Return 0 if jails permit p1 to frob p2, otherwise ESRCH. 313291421ba2SRobert Watson */ 313391421ba2SRobert Watson int 31349ddb7954SMike Barcroft prison_check(struct ucred *cred1, struct ucred *cred2) 313591421ba2SRobert Watson { 313691421ba2SRobert Watson 31370304c731SJamie Gritton return ((cred1->cr_prison == cred2->cr_prison || 31380304c731SJamie Gritton prison_ischild(cred1->cr_prison, cred2->cr_prison)) ? 0 : ESRCH); 31390304c731SJamie Gritton } 314091421ba2SRobert Watson 31410304c731SJamie Gritton /* 31420304c731SJamie Gritton * Return 1 if p2 is a child of p1, otherwise 0. 
31430304c731SJamie Gritton */ 31440304c731SJamie Gritton int 31450304c731SJamie Gritton prison_ischild(struct prison *pr1, struct prison *pr2) 31460304c731SJamie Gritton { 31470304c731SJamie Gritton 31480304c731SJamie Gritton for (pr2 = pr2->pr_parent; pr2 != NULL; pr2 = pr2->pr_parent) 31490304c731SJamie Gritton if (pr1 == pr2) 31500304c731SJamie Gritton return (1); 315191421ba2SRobert Watson return (0); 315291421ba2SRobert Watson } 315391421ba2SRobert Watson 315491421ba2SRobert Watson /* 3155f7496dcaSJamie Gritton * Return true if the prison is currently alive. A prison is alive if it 3156f7496dcaSJamie Gritton * holds user references and it isn't being removed. 315776ad42abSJamie Gritton */ 315876ad42abSJamie Gritton bool 315976ad42abSJamie Gritton prison_isalive(struct prison *pr) 316076ad42abSJamie Gritton { 316176ad42abSJamie Gritton 31621158508aSJamie Gritton if (__predict_false(pr->pr_state != PRISON_STATE_ALIVE)) 3163cc7b7306SJamie Gritton return (false); 316476ad42abSJamie Gritton return (true); 316576ad42abSJamie Gritton } 316676ad42abSJamie Gritton 316776ad42abSJamie Gritton /* 316876ad42abSJamie Gritton * Return true if the prison is currently valid. A prison is valid if it has 316976ad42abSJamie Gritton * been fully created, and is not being destroyed. Note that dying prisons 3170f7496dcaSJamie Gritton * are still considered valid. Invalid prisons won't be found under normal 3171f7496dcaSJamie Gritton * circumstances, as they're only put in that state by functions that have 3172f7496dcaSJamie Gritton * an exclusive hold on allprison_lock. 
317376ad42abSJamie Gritton */ 317476ad42abSJamie Gritton bool 317576ad42abSJamie Gritton prison_isvalid(struct prison *pr) 317676ad42abSJamie Gritton { 317776ad42abSJamie Gritton 31781158508aSJamie Gritton if (__predict_false(pr->pr_state == PRISON_STATE_INVALID)) 31791158508aSJamie Gritton return (false); 31806754ae25SJamie Gritton if (__predict_false(refcount_load(&pr->pr_ref) == 0)) 318176ad42abSJamie Gritton return (false); 318276ad42abSJamie Gritton return (true); 318376ad42abSJamie Gritton } 318476ad42abSJamie Gritton 318576ad42abSJamie Gritton /* 3186de0bd6f7SBjoern A. Zeeb * Return 1 if the passed credential is in a jail and that jail does not 3187de0bd6f7SBjoern A. Zeeb * have its own virtual network stack, otherwise 0. 3188de0bd6f7SBjoern A. Zeeb */ 3189de0bd6f7SBjoern A. Zeeb int 3190de0bd6f7SBjoern A. Zeeb jailed_without_vnet(struct ucred *cred) 3191de0bd6f7SBjoern A. Zeeb { 3192de0bd6f7SBjoern A. Zeeb 3193de0bd6f7SBjoern A. Zeeb if (!jailed(cred)) 3194de0bd6f7SBjoern A. Zeeb return (0); 3195de0bd6f7SBjoern A. Zeeb #ifdef VIMAGE 3196de0bd6f7SBjoern A. Zeeb if (prison_owns_vnet(cred)) 3197de0bd6f7SBjoern A. Zeeb return (0); 3198de0bd6f7SBjoern A. Zeeb #endif 3199de0bd6f7SBjoern A. Zeeb 3200de0bd6f7SBjoern A. Zeeb return (1); 3201de0bd6f7SBjoern A. Zeeb } 3202de0bd6f7SBjoern A. Zeeb 3203de0bd6f7SBjoern A. Zeeb /* 32047455b100SJamie Gritton * Return the correct hostname (domainname, et al) for the passed credential. 32059484d0c0SRobert Drehmel */ 3206ad1ff099SRobert Drehmel void 32079ddb7954SMike Barcroft getcredhostname(struct ucred *cred, char *buf, size_t size) 32089484d0c0SRobert Drehmel { 320976ca6f88SJamie Gritton struct prison *pr; 32109484d0c0SRobert Drehmel 32117455b100SJamie Gritton /* 32127455b100SJamie Gritton * A NULL credential can be used to shortcut to the physical 32137455b100SJamie Gritton * system's hostname. 32147455b100SJamie Gritton */ 321576ca6f88SJamie Gritton pr = (cred != NULL) ? 
cred->cr_prison : &prison0; 321676ca6f88SJamie Gritton mtx_lock(&pr->pr_mtx); 3217c1f19219SJamie Gritton strlcpy(buf, pr->pr_hostname, size); 321876ca6f88SJamie Gritton mtx_unlock(&pr->pr_mtx); 32199484d0c0SRobert Drehmel } 3220fd7a8150SMike Barcroft 32217455b100SJamie Gritton void 32227455b100SJamie Gritton getcreddomainname(struct ucred *cred, char *buf, size_t size) 32237455b100SJamie Gritton { 32247455b100SJamie Gritton 32257455b100SJamie Gritton mtx_lock(&cred->cr_prison->pr_mtx); 3226c1f19219SJamie Gritton strlcpy(buf, cred->cr_prison->pr_domainname, size); 32277455b100SJamie Gritton mtx_unlock(&cred->cr_prison->pr_mtx); 32287455b100SJamie Gritton } 32297455b100SJamie Gritton 32307455b100SJamie Gritton void 32317455b100SJamie Gritton getcredhostuuid(struct ucred *cred, char *buf, size_t size) 32327455b100SJamie Gritton { 32337455b100SJamie Gritton 32347455b100SJamie Gritton mtx_lock(&cred->cr_prison->pr_mtx); 3235c1f19219SJamie Gritton strlcpy(buf, cred->cr_prison->pr_hostuuid, size); 32367455b100SJamie Gritton mtx_unlock(&cred->cr_prison->pr_mtx); 32377455b100SJamie Gritton } 32387455b100SJamie Gritton 32397455b100SJamie Gritton void 32407455b100SJamie Gritton getcredhostid(struct ucred *cred, unsigned long *hostid) 32417455b100SJamie Gritton { 32427455b100SJamie Gritton 32437455b100SJamie Gritton mtx_lock(&cred->cr_prison->pr_mtx); 32447455b100SJamie Gritton *hostid = cred->cr_prison->pr_hostid; 32457455b100SJamie Gritton mtx_unlock(&cred->cr_prison->pr_mtx); 32467455b100SJamie Gritton } 32477455b100SJamie Gritton 32483f8bc99cSKristof Provost void 32493f8bc99cSKristof Provost getjailname(struct ucred *cred, char *name, size_t len) 32503f8bc99cSKristof Provost { 32513f8bc99cSKristof Provost 32523f8bc99cSKristof Provost mtx_lock(&cred->cr_prison->pr_mtx); 32533f8bc99cSKristof Provost strlcpy(name, cred->cr_prison->pr_name, len); 32543f8bc99cSKristof Provost mtx_unlock(&cred->cr_prison->pr_mtx); 32553f8bc99cSKristof Provost } 32563f8bc99cSKristof Provost 
3257eb79e1c7SBjoern A. Zeeb #ifdef VIMAGE 3258eb79e1c7SBjoern A. Zeeb /* 3259eb79e1c7SBjoern A. Zeeb * Determine whether the prison represented by cred owns 3260eb79e1c7SBjoern A. Zeeb * its vnet rather than having it inherited. 3261eb79e1c7SBjoern A. Zeeb * 3262eb79e1c7SBjoern A. Zeeb * Returns 1 in case the prison owns the vnet, 0 otherwise. 3263eb79e1c7SBjoern A. Zeeb */ 3264eb79e1c7SBjoern A. Zeeb int 3265eb79e1c7SBjoern A. Zeeb prison_owns_vnet(struct ucred *cred) 3266eb79e1c7SBjoern A. Zeeb { 3267eb79e1c7SBjoern A. Zeeb 3268eb79e1c7SBjoern A. Zeeb /* 3269eb79e1c7SBjoern A. Zeeb * vnets cannot be added/removed after jail creation, 3270eb79e1c7SBjoern A. Zeeb * so no need to lock here. 3271eb79e1c7SBjoern A. Zeeb */ 3272eb79e1c7SBjoern A. Zeeb return (cred->cr_prison->pr_flags & PR_VNET ? 1 : 0); 3273eb79e1c7SBjoern A. Zeeb } 3274eb79e1c7SBjoern A. Zeeb #endif 3275eb79e1c7SBjoern A. Zeeb 3276f08df373SRobert Watson /* 3277820a0de9SPawel Jakub Dawidek * Determine whether the subject represented by cred can "see" 3278820a0de9SPawel Jakub Dawidek * status of a mount point. 3279820a0de9SPawel Jakub Dawidek * Returns: 0 for permitted, ENOENT otherwise. 3280820a0de9SPawel Jakub Dawidek * XXX: This function should be called cr_canseemount() and should be 3281820a0de9SPawel Jakub Dawidek * placed in kern_prot.c. 
3282f08df373SRobert Watson */ 3283f08df373SRobert Watson int 3284820a0de9SPawel Jakub Dawidek prison_canseemount(struct ucred *cred, struct mount *mp) 3285f08df373SRobert Watson { 3286820a0de9SPawel Jakub Dawidek struct prison *pr; 3287820a0de9SPawel Jakub Dawidek struct statfs *sp; 3288820a0de9SPawel Jakub Dawidek size_t len; 3289f08df373SRobert Watson 3290820a0de9SPawel Jakub Dawidek pr = cred->cr_prison; 32910304c731SJamie Gritton if (pr->pr_enforce_statfs == 0) 32920304c731SJamie Gritton return (0); 3293820a0de9SPawel Jakub Dawidek if (pr->pr_root->v_mount == mp) 3294820a0de9SPawel Jakub Dawidek return (0); 32950304c731SJamie Gritton if (pr->pr_enforce_statfs == 2) 3296820a0de9SPawel Jakub Dawidek return (ENOENT); 3297820a0de9SPawel Jakub Dawidek /* 3298820a0de9SPawel Jakub Dawidek * If jail's chroot directory is set to "/" we should be able to see 3299820a0de9SPawel Jakub Dawidek * all mount-points from inside a jail. 3300820a0de9SPawel Jakub Dawidek * This is ugly check, but this is the only situation when jail's 3301820a0de9SPawel Jakub Dawidek * directory ends with '/'. 3302820a0de9SPawel Jakub Dawidek */ 3303820a0de9SPawel Jakub Dawidek if (strcmp(pr->pr_path, "/") == 0) 3304820a0de9SPawel Jakub Dawidek return (0); 3305820a0de9SPawel Jakub Dawidek len = strlen(pr->pr_path); 3306820a0de9SPawel Jakub Dawidek sp = &mp->mnt_stat; 3307820a0de9SPawel Jakub Dawidek if (strncmp(pr->pr_path, sp->f_mntonname, len) != 0) 3308820a0de9SPawel Jakub Dawidek return (ENOENT); 3309820a0de9SPawel Jakub Dawidek /* 3310820a0de9SPawel Jakub Dawidek * Be sure that we don't have situation where jail's root directory 3311820a0de9SPawel Jakub Dawidek * is "/some/path" and mount point is "/some/pathpath". 
3312820a0de9SPawel Jakub Dawidek */ 3313820a0de9SPawel Jakub Dawidek if (sp->f_mntonname[len] != '\0' && sp->f_mntonname[len] != '/') 3314820a0de9SPawel Jakub Dawidek return (ENOENT); 3315f08df373SRobert Watson return (0); 3316f08df373SRobert Watson } 3317820a0de9SPawel Jakub Dawidek 3318820a0de9SPawel Jakub Dawidek void 3319820a0de9SPawel Jakub Dawidek prison_enforce_statfs(struct ucred *cred, struct mount *mp, struct statfs *sp) 3320820a0de9SPawel Jakub Dawidek { 3321820a0de9SPawel Jakub Dawidek char jpath[MAXPATHLEN]; 3322820a0de9SPawel Jakub Dawidek struct prison *pr; 3323820a0de9SPawel Jakub Dawidek size_t len; 3324820a0de9SPawel Jakub Dawidek 3325820a0de9SPawel Jakub Dawidek pr = cred->cr_prison; 33260304c731SJamie Gritton if (pr->pr_enforce_statfs == 0) 33270304c731SJamie Gritton return; 3328820a0de9SPawel Jakub Dawidek if (prison_canseemount(cred, mp) != 0) { 3329820a0de9SPawel Jakub Dawidek bzero(sp->f_mntonname, sizeof(sp->f_mntonname)); 3330820a0de9SPawel Jakub Dawidek strlcpy(sp->f_mntonname, "[restricted]", 3331820a0de9SPawel Jakub Dawidek sizeof(sp->f_mntonname)); 3332820a0de9SPawel Jakub Dawidek return; 3333820a0de9SPawel Jakub Dawidek } 3334820a0de9SPawel Jakub Dawidek if (pr->pr_root->v_mount == mp) { 3335820a0de9SPawel Jakub Dawidek /* 3336820a0de9SPawel Jakub Dawidek * Clear current buffer data, so we are sure nothing from 3337820a0de9SPawel Jakub Dawidek * the valid path left there. 3338820a0de9SPawel Jakub Dawidek */ 3339820a0de9SPawel Jakub Dawidek bzero(sp->f_mntonname, sizeof(sp->f_mntonname)); 3340820a0de9SPawel Jakub Dawidek *sp->f_mntonname = '/'; 3341820a0de9SPawel Jakub Dawidek return; 3342820a0de9SPawel Jakub Dawidek } 3343820a0de9SPawel Jakub Dawidek /* 3344820a0de9SPawel Jakub Dawidek * If jail's chroot directory is set to "/" we should be able to see 3345820a0de9SPawel Jakub Dawidek * all mount-points from inside a jail. 
3346820a0de9SPawel Jakub Dawidek */ 3347820a0de9SPawel Jakub Dawidek if (strcmp(pr->pr_path, "/") == 0) 3348820a0de9SPawel Jakub Dawidek return; 3349820a0de9SPawel Jakub Dawidek len = strlen(pr->pr_path); 3350820a0de9SPawel Jakub Dawidek strlcpy(jpath, sp->f_mntonname + len, sizeof(jpath)); 3351820a0de9SPawel Jakub Dawidek /* 3352820a0de9SPawel Jakub Dawidek * Clear current buffer data, so we are sure nothing from 3353820a0de9SPawel Jakub Dawidek * the valid path left there. 3354820a0de9SPawel Jakub Dawidek */ 3355820a0de9SPawel Jakub Dawidek bzero(sp->f_mntonname, sizeof(sp->f_mntonname)); 3356820a0de9SPawel Jakub Dawidek if (*jpath == '\0') { 3357820a0de9SPawel Jakub Dawidek /* Should never happen. */ 3358820a0de9SPawel Jakub Dawidek *sp->f_mntonname = '/'; 3359820a0de9SPawel Jakub Dawidek } else { 3360820a0de9SPawel Jakub Dawidek strlcpy(sp->f_mntonname, jpath, sizeof(sp->f_mntonname)); 3361820a0de9SPawel Jakub Dawidek } 3362f08df373SRobert Watson } 3363f08df373SRobert Watson 3364800c9408SRobert Watson /* 3365800c9408SRobert Watson * Check with permission for a specific privilege is granted within jail. We 3366800c9408SRobert Watson * have a specific list of accepted privileges; the rest are denied. 3367800c9408SRobert Watson */ 3368800c9408SRobert Watson int 3369800c9408SRobert Watson prison_priv_check(struct ucred *cred, int priv) 3370800c9408SRobert Watson { 33710fe74ae6SJamie Gritton struct prison *pr; 33720fe74ae6SJamie Gritton int error; 3373800c9408SRobert Watson 33747b2ff0dcSMateusz Guzik /* 33757b2ff0dcSMateusz Guzik * Some policies have custom handlers. This routine should not be 33767b2ff0dcSMateusz Guzik * called for them. See priv_check_cred(). 
33777b2ff0dcSMateusz Guzik */ 33787b2ff0dcSMateusz Guzik switch (priv) { 3379a459a6cfSMateusz Guzik case PRIV_VFS_LOOKUP: 33807b2ff0dcSMateusz Guzik case PRIV_VFS_GENERATION: 33817b2ff0dcSMateusz Guzik KASSERT(0, ("prison_priv_check instead of a custom handler " 33827b2ff0dcSMateusz Guzik "called for %d\n", priv)); 33837b2ff0dcSMateusz Guzik } 33847b2ff0dcSMateusz Guzik 3385800c9408SRobert Watson if (!jailed(cred)) 3386800c9408SRobert Watson return (0); 3387800c9408SRobert Watson 33886bb79563SJamie Gritton #ifdef VIMAGE 33896bb79563SJamie Gritton /* 33906bb79563SJamie Gritton * Privileges specific to prisons with a virtual network stack. 33916bb79563SJamie Gritton * There might be a duplicate entry here in case the privilege 33926bb79563SJamie Gritton * is only granted conditionally in the legacy jail case. 33936bb79563SJamie Gritton */ 33946bb79563SJamie Gritton switch (priv) { 33956bb79563SJamie Gritton #ifdef notyet 33966bb79563SJamie Gritton /* 33976bb79563SJamie Gritton * NFS-specific privileges. 33986bb79563SJamie Gritton */ 33996bb79563SJamie Gritton case PRIV_NFS_DAEMON: 34006bb79563SJamie Gritton case PRIV_NFS_LOCKD: 34016bb79563SJamie Gritton #endif 34026bb79563SJamie Gritton /* 34036bb79563SJamie Gritton * Network stack privileges. 34046bb79563SJamie Gritton */ 34056bb79563SJamie Gritton case PRIV_NET_BRIDGE: 34066bb79563SJamie Gritton case PRIV_NET_GRE: 34076bb79563SJamie Gritton case PRIV_NET_BPF: 34086bb79563SJamie Gritton case PRIV_NET_RAW: /* Dup, cond. in legacy jail case. 
*/ 34096bb79563SJamie Gritton case PRIV_NET_ROUTE: 34106bb79563SJamie Gritton case PRIV_NET_TAP: 34116bb79563SJamie Gritton case PRIV_NET_SETIFMTU: 34126bb79563SJamie Gritton case PRIV_NET_SETIFFLAGS: 34136bb79563SJamie Gritton case PRIV_NET_SETIFCAP: 3414215940b3SXin LI case PRIV_NET_SETIFDESCR: 34156bb79563SJamie Gritton case PRIV_NET_SETIFNAME : 34166bb79563SJamie Gritton case PRIV_NET_SETIFMETRIC: 34176bb79563SJamie Gritton case PRIV_NET_SETIFPHYS: 34186bb79563SJamie Gritton case PRIV_NET_SETIFMAC: 3419389474c1SKonstantin Belousov case PRIV_NET_SETLANPCP: 34206bb79563SJamie Gritton case PRIV_NET_ADDMULTI: 34216bb79563SJamie Gritton case PRIV_NET_DELMULTI: 34226bb79563SJamie Gritton case PRIV_NET_HWIOCTL: 34236bb79563SJamie Gritton case PRIV_NET_SETLLADDR: 34246bb79563SJamie Gritton case PRIV_NET_ADDIFGROUP: 34256bb79563SJamie Gritton case PRIV_NET_DELIFGROUP: 34266bb79563SJamie Gritton case PRIV_NET_IFCREATE: 34276bb79563SJamie Gritton case PRIV_NET_IFDESTROY: 34286bb79563SJamie Gritton case PRIV_NET_ADDIFADDR: 34296bb79563SJamie Gritton case PRIV_NET_DELIFADDR: 34306bb79563SJamie Gritton case PRIV_NET_LAGG: 34316bb79563SJamie Gritton case PRIV_NET_GIF: 34326bb79563SJamie Gritton case PRIV_NET_SETIFVNET: 343335fd7bc0SBjoern A. Zeeb case PRIV_NET_SETIFFIB: 34346bb79563SJamie Gritton 34356bb79563SJamie Gritton /* 34366bb79563SJamie Gritton * 802.11-related privileges. 34376bb79563SJamie Gritton */ 3438f7d38a13SAdrian Chadd case PRIV_NET80211_VAP_GETKEY: 3439f7d38a13SAdrian Chadd case PRIV_NET80211_VAP_MANAGE: 34406bb79563SJamie Gritton 34416bb79563SJamie Gritton #ifdef notyet 34426bb79563SJamie Gritton /* 34436bb79563SJamie Gritton * ATM privileges. 
34446bb79563SJamie Gritton */ 34456bb79563SJamie Gritton case PRIV_NETATM_CFG: 34466bb79563SJamie Gritton case PRIV_NETATM_ADD: 34476bb79563SJamie Gritton case PRIV_NETATM_DEL: 34486bb79563SJamie Gritton case PRIV_NETATM_SET: 34496bb79563SJamie Gritton 34506bb79563SJamie Gritton /* 34516bb79563SJamie Gritton * Bluetooth privileges. 34526bb79563SJamie Gritton */ 34536bb79563SJamie Gritton case PRIV_NETBLUETOOTH_RAW: 34546bb79563SJamie Gritton #endif 34556bb79563SJamie Gritton 34566bb79563SJamie Gritton /* 34576bb79563SJamie Gritton * Netgraph and netgraph module privileges. 34586bb79563SJamie Gritton */ 34596bb79563SJamie Gritton case PRIV_NETGRAPH_CONTROL: 34606bb79563SJamie Gritton #ifdef notyet 34616bb79563SJamie Gritton case PRIV_NETGRAPH_TTY: 34626bb79563SJamie Gritton #endif 34636bb79563SJamie Gritton 34646bb79563SJamie Gritton /* 34656bb79563SJamie Gritton * IPv4 and IPv6 privileges. 34666bb79563SJamie Gritton */ 34676bb79563SJamie Gritton case PRIV_NETINET_IPFW: 34686bb79563SJamie Gritton case PRIV_NETINET_DIVERT: 34696bb79563SJamie Gritton case PRIV_NETINET_PF: 34706bb79563SJamie Gritton case PRIV_NETINET_DUMMYNET: 34716bb79563SJamie Gritton case PRIV_NETINET_CARP: 34726bb79563SJamie Gritton case PRIV_NETINET_MROUTE: 34736bb79563SJamie Gritton case PRIV_NETINET_RAW: 34746bb79563SJamie Gritton case PRIV_NETINET_ADDRCTRL6: 34756bb79563SJamie Gritton case PRIV_NETINET_ND6: 34766bb79563SJamie Gritton case PRIV_NETINET_SCOPE6: 34776bb79563SJamie Gritton case PRIV_NETINET_ALIFETIME6: 34786bb79563SJamie Gritton case PRIV_NETINET_IPSEC: 34796bb79563SJamie Gritton case PRIV_NETINET_BINDANY: 34806bb79563SJamie Gritton 34816bb79563SJamie Gritton #ifdef notyet 34826bb79563SJamie Gritton /* 34836bb79563SJamie Gritton * NCP privileges. 34846bb79563SJamie Gritton */ 34856bb79563SJamie Gritton case PRIV_NETNCP: 34866bb79563SJamie Gritton 34876bb79563SJamie Gritton /* 34886bb79563SJamie Gritton * SMB privileges. 
34896bb79563SJamie Gritton */ 34906bb79563SJamie Gritton case PRIV_NETSMB: 34916bb79563SJamie Gritton #endif 34926bb79563SJamie Gritton 34936bb79563SJamie Gritton /* 34946bb79563SJamie Gritton * No default: or deny here. 34956bb79563SJamie Gritton * In case of no permit fall through to next switch(). 34966bb79563SJamie Gritton */ 34976bb79563SJamie Gritton if (cred->cr_prison->pr_flags & PR_VNET) 34986bb79563SJamie Gritton return (0); 34996bb79563SJamie Gritton } 35006bb79563SJamie Gritton #endif /* VIMAGE */ 35016bb79563SJamie Gritton 3502800c9408SRobert Watson switch (priv) { 3503800c9408SRobert Watson /* 3504800c9408SRobert Watson * Allow ktrace privileges for root in jail. 3505800c9408SRobert Watson */ 3506800c9408SRobert Watson case PRIV_KTRACE: 3507800c9408SRobert Watson 3508c3c1b5e6SRobert Watson #if 0 3509800c9408SRobert Watson /* 3510800c9408SRobert Watson * Allow jailed processes to configure audit identity and 3511800c9408SRobert Watson * submit audit records (login, etc). In the future we may 3512800c9408SRobert Watson * want to further refine the relationship between audit and 3513800c9408SRobert Watson * jail. 3514800c9408SRobert Watson */ 3515800c9408SRobert Watson case PRIV_AUDIT_GETAUDIT: 3516800c9408SRobert Watson case PRIV_AUDIT_SETAUDIT: 3517800c9408SRobert Watson case PRIV_AUDIT_SUBMIT: 3518c3c1b5e6SRobert Watson #endif 3519800c9408SRobert Watson 3520800c9408SRobert Watson /* 3521800c9408SRobert Watson * Allow jailed processes to manipulate process UNIX 3522800c9408SRobert Watson * credentials in any way they see fit. 
3523800c9408SRobert Watson */ 3524800c9408SRobert Watson case PRIV_CRED_SETUID: 3525800c9408SRobert Watson case PRIV_CRED_SETEUID: 3526800c9408SRobert Watson case PRIV_CRED_SETGID: 3527800c9408SRobert Watson case PRIV_CRED_SETEGID: 3528800c9408SRobert Watson case PRIV_CRED_SETGROUPS: 3529800c9408SRobert Watson case PRIV_CRED_SETREUID: 3530800c9408SRobert Watson case PRIV_CRED_SETREGID: 3531800c9408SRobert Watson case PRIV_CRED_SETRESUID: 3532800c9408SRobert Watson case PRIV_CRED_SETRESGID: 3533800c9408SRobert Watson 3534800c9408SRobert Watson /* 3535800c9408SRobert Watson * Jail implements visibility constraints already, so allow 3536800c9408SRobert Watson * jailed root to override uid/gid-based constraints. 3537800c9408SRobert Watson */ 3538800c9408SRobert Watson case PRIV_SEEOTHERGIDS: 3539800c9408SRobert Watson case PRIV_SEEOTHERUIDS: 3540800c9408SRobert Watson 3541800c9408SRobert Watson /* 3542800c9408SRobert Watson * Jail implements inter-process debugging limits already, so 3543800c9408SRobert Watson * allow jailed root various debugging privileges. 3544800c9408SRobert Watson */ 3545800c9408SRobert Watson case PRIV_DEBUG_DIFFCRED: 3546800c9408SRobert Watson case PRIV_DEBUG_SUGID: 3547800c9408SRobert Watson case PRIV_DEBUG_UNPRIV: 3548800c9408SRobert Watson 3549800c9408SRobert Watson /* 3550800c9408SRobert Watson * Allow jail to set various resource limits and login 3551800c9408SRobert Watson * properties, and for now, exceed process resource limits. 3552800c9408SRobert Watson */ 3553800c9408SRobert Watson case PRIV_PROC_LIMIT: 3554800c9408SRobert Watson case PRIV_PROC_SETLOGIN: 3555800c9408SRobert Watson case PRIV_PROC_SETRLIMIT: 3556800c9408SRobert Watson 3557800c9408SRobert Watson /* 3558800c9408SRobert Watson * System V and POSIX IPC privileges are granted in jail. 
3559800c9408SRobert Watson */ 3560800c9408SRobert Watson case PRIV_IPC_READ: 3561800c9408SRobert Watson case PRIV_IPC_WRITE: 3562800c9408SRobert Watson case PRIV_IPC_ADMIN: 3563800c9408SRobert Watson case PRIV_IPC_MSGSIZE: 3564800c9408SRobert Watson case PRIV_MQ_ADMIN: 3565800c9408SRobert Watson 3566800c9408SRobert Watson /* 35670304c731SJamie Gritton * Jail operations within a jail work on child jails. 35680304c731SJamie Gritton */ 35690304c731SJamie Gritton case PRIV_JAIL_ATTACH: 35700304c731SJamie Gritton case PRIV_JAIL_SET: 35710304c731SJamie Gritton case PRIV_JAIL_REMOVE: 35720304c731SJamie Gritton 35730304c731SJamie Gritton /* 3574800c9408SRobert Watson * Jail implements its own inter-process limits, so allow 3575800c9408SRobert Watson * root processes in jail to change scheduling on other 3576800c9408SRobert Watson * processes in the same jail. Likewise for signalling. 3577800c9408SRobert Watson */ 3578800c9408SRobert Watson case PRIV_SCHED_DIFFCRED: 3579413628a7SBjoern A. Zeeb case PRIV_SCHED_CPUSET: 3580800c9408SRobert Watson case PRIV_SIGNAL_DIFFCRED: 3581800c9408SRobert Watson case PRIV_SIGNAL_SUGID: 3582800c9408SRobert Watson 3583800c9408SRobert Watson /* 3584800c9408SRobert Watson * Allow jailed processes to write to sysctls marked as jail 3585800c9408SRobert Watson * writable. 3586800c9408SRobert Watson */ 3587800c9408SRobert Watson case PRIV_SYSCTL_WRITEJAIL: 3588800c9408SRobert Watson 3589800c9408SRobert Watson /* 3590800c9408SRobert Watson * Allow root in jail to manage a variety of quota 3591e82d0201SRobert Watson * properties. These should likely be conditional on a 3592e82d0201SRobert Watson * configuration option. 
3593800c9408SRobert Watson */ 359495b091d2SRobert Watson case PRIV_VFS_GETQUOTA: 359595b091d2SRobert Watson case PRIV_VFS_SETQUOTA: 3596800c9408SRobert Watson 3597800c9408SRobert Watson /* 3598800c9408SRobert Watson * Since Jail relies on chroot() to implement file system 3599800c9408SRobert Watson * protections, grant many VFS privileges to root in jail. 3600800c9408SRobert Watson * Be careful to exclude mount-related and NFS-related 3601800c9408SRobert Watson * privileges. 3602800c9408SRobert Watson */ 3603800c9408SRobert Watson case PRIV_VFS_READ: 3604800c9408SRobert Watson case PRIV_VFS_WRITE: 3605800c9408SRobert Watson case PRIV_VFS_ADMIN: 3606800c9408SRobert Watson case PRIV_VFS_EXEC: 3607800c9408SRobert Watson case PRIV_VFS_BLOCKRESERVE: /* XXXRW: Slightly surprising. */ 3608800c9408SRobert Watson case PRIV_VFS_CHFLAGS_DEV: 3609800c9408SRobert Watson case PRIV_VFS_CHOWN: 3610800c9408SRobert Watson case PRIV_VFS_CHROOT: 3611bb531912SPawel Jakub Dawidek case PRIV_VFS_RETAINSUGID: 3612800c9408SRobert Watson case PRIV_VFS_FCHROOT: 3613800c9408SRobert Watson case PRIV_VFS_LINK: 3614800c9408SRobert Watson case PRIV_VFS_SETGID: 3615e41966dcSRobert Watson case PRIV_VFS_STAT: 3616800c9408SRobert Watson case PRIV_VFS_STICKYFILE: 3617bb56d716SJamie Gritton 3618bb56d716SJamie Gritton /* 3619bb56d716SJamie Gritton * As in the non-jail case, non-root users are expected to be 362070de1003SGordon Bergling * able to read kernel/physical memory (provided /dev/[k]mem 3621bb56d716SJamie Gritton * exists in the jail and they have permission to access it). 3622bb56d716SJamie Gritton */ 3623bb56d716SJamie Gritton case PRIV_KMEM_READ: 3624800c9408SRobert Watson return (0); 3625800c9408SRobert Watson 3626800c9408SRobert Watson /* 3627800c9408SRobert Watson * Depending on the global setting, allow privilege of 3628800c9408SRobert Watson * setting system flags. 
3629800c9408SRobert Watson */ 3630800c9408SRobert Watson case PRIV_VFS_SYSFLAGS: 36310304c731SJamie Gritton if (cred->cr_prison->pr_allow & PR_ALLOW_CHFLAGS) 3632800c9408SRobert Watson return (0); 3633800c9408SRobert Watson else 3634800c9408SRobert Watson return (EPERM); 3635800c9408SRobert Watson 3636800c9408SRobert Watson /* 3637f3a8d2f9SPawel Jakub Dawidek * Depending on the global setting, allow privilege of 3638f3a8d2f9SPawel Jakub Dawidek * mounting/unmounting file systems. 3639f3a8d2f9SPawel Jakub Dawidek */ 3640f3a8d2f9SPawel Jakub Dawidek case PRIV_VFS_MOUNT: 3641f3a8d2f9SPawel Jakub Dawidek case PRIV_VFS_UNMOUNT: 3642f3a8d2f9SPawel Jakub Dawidek case PRIV_VFS_MOUNT_NONUSER: 364324b0502eSPawel Jakub Dawidek case PRIV_VFS_MOUNT_OWNER: 36440fe74ae6SJamie Gritton pr = cred->cr_prison; 36450fe74ae6SJamie Gritton prison_lock(pr); 36460fe74ae6SJamie Gritton if (pr->pr_allow & PR_ALLOW_MOUNT && pr->pr_enforce_statfs < 2) 36470fe74ae6SJamie Gritton error = 0; 3648f3a8d2f9SPawel Jakub Dawidek else 36490fe74ae6SJamie Gritton error = EPERM; 36500fe74ae6SJamie Gritton prison_unlock(pr); 36510fe74ae6SJamie Gritton return (error); 3652f3a8d2f9SPawel Jakub Dawidek 3653f3a8d2f9SPawel Jakub Dawidek /* 365463619b6dSKyle Evans * Jails should hold no disposition on the PRIV_VFS_READ_DIR 365563619b6dSKyle Evans * policy. priv_check_cred will not specifically allow it, and 365663619b6dSKyle Evans * we may want a MAC policy to allow it. 365763619b6dSKyle Evans */ 365863619b6dSKyle Evans case PRIV_VFS_READ_DIR: 365963619b6dSKyle Evans return (0); 366063619b6dSKyle Evans 366163619b6dSKyle Evans /* 3662ccd6ac9fSAntoine Brodin * Conditionnaly allow locking (unlocking) physical pages 3663ccd6ac9fSAntoine Brodin * in memory. 
3664ccd6ac9fSAntoine Brodin */ 3665ccd6ac9fSAntoine Brodin case PRIV_VM_MLOCK: 3666ccd6ac9fSAntoine Brodin case PRIV_VM_MUNLOCK: 3667ccd6ac9fSAntoine Brodin if (cred->cr_prison->pr_allow & PR_ALLOW_MLOCK) 3668ccd6ac9fSAntoine Brodin return (0); 3669ccd6ac9fSAntoine Brodin else 3670ccd6ac9fSAntoine Brodin return (EPERM); 3671ccd6ac9fSAntoine Brodin 3672ccd6ac9fSAntoine Brodin /* 3673e28f9b7dSAllan Jude * Conditionally allow jailed root to bind reserved ports. 3674800c9408SRobert Watson */ 3675800c9408SRobert Watson case PRIV_NETINET_RESERVEDPORT: 3676e28f9b7dSAllan Jude if (cred->cr_prison->pr_allow & PR_ALLOW_RESERVED_PORTS) 3677e28f9b7dSAllan Jude return (0); 3678e28f9b7dSAllan Jude else 3679e28f9b7dSAllan Jude return (EPERM); 3680e28f9b7dSAllan Jude 3681e28f9b7dSAllan Jude /* 3682e28f9b7dSAllan Jude * Allow jailed root to reuse in-use ports. 3683e28f9b7dSAllan Jude */ 36844b084056SRobert Watson case PRIV_NETINET_REUSEPORT: 3685800c9408SRobert Watson return (0); 3686800c9408SRobert Watson 3687800c9408SRobert Watson /* 3688e3043798SPedro F. Giffuni * Allow jailed root to set certain IPv4/6 (option) headers. 368979ba3952SBjoern A. Zeeb */ 369079ba3952SBjoern A. Zeeb case PRIV_NETINET_SETHDROPTS: 369179ba3952SBjoern A. Zeeb return (0); 369279ba3952SBjoern A. Zeeb 369379ba3952SBjoern A. Zeeb /* 3694800c9408SRobert Watson * Conditionally allow creating raw sockets in jail. 3695800c9408SRobert Watson */ 3696800c9408SRobert Watson case PRIV_NETINET_RAW: 36970304c731SJamie Gritton if (cred->cr_prison->pr_allow & PR_ALLOW_RAW_SOCKETS) 3698800c9408SRobert Watson return (0); 3699800c9408SRobert Watson else 3700800c9408SRobert Watson return (EPERM); 3701800c9408SRobert Watson 3702800c9408SRobert Watson /* 3703800c9408SRobert Watson * Since jail implements its own visibility limits on netstat 3704800c9408SRobert Watson * sysctls, allow getcred. This allows identd to work in 3705800c9408SRobert Watson * jail. 
3706800c9408SRobert Watson */ 3707800c9408SRobert Watson case PRIV_NETINET_GETCRED: 3708800c9408SRobert Watson return (0); 3709800c9408SRobert Watson 37102bfc50bcSEdward Tomasz Napierala /* 37112bfc50bcSEdward Tomasz Napierala * Allow jailed root to set loginclass. 37122bfc50bcSEdward Tomasz Napierala */ 37132bfc50bcSEdward Tomasz Napierala case PRIV_PROC_SETLOGINCLASS: 37142bfc50bcSEdward Tomasz Napierala return (0); 37152bfc50bcSEdward Tomasz Napierala 3716b19d66fdSJamie Gritton /* 37174520f617SJamie Gritton * Do not allow a process inside a jail to read the kernel 3718b19d66fdSJamie Gritton * message buffer unless explicitly permitted. 3719b19d66fdSJamie Gritton */ 3720b19d66fdSJamie Gritton case PRIV_MSGBUF: 3721b19d66fdSJamie Gritton if (cred->cr_prison->pr_allow & PR_ALLOW_READ_MSGBUF) 3722b19d66fdSJamie Gritton return (0); 3723b19d66fdSJamie Gritton return (EPERM); 3724b19d66fdSJamie Gritton 3725800c9408SRobert Watson default: 3726800c9408SRobert Watson /* 3727800c9408SRobert Watson * In all remaining cases, deny the privilege request. This 3728800c9408SRobert Watson * includes almost all network privileges, many system 3729800c9408SRobert Watson * configuration privileges. 3730800c9408SRobert Watson */ 3731800c9408SRobert Watson return (EPERM); 3732800c9408SRobert Watson } 3733800c9408SRobert Watson } 3734800c9408SRobert Watson 37350304c731SJamie Gritton /* 37360304c731SJamie Gritton * Return the part of pr2's name that is relative to pr1, or the whole name 37370304c731SJamie Gritton * if it does not directly follow. 37380304c731SJamie Gritton */ 37390304c731SJamie Gritton 37400304c731SJamie Gritton char * 37410304c731SJamie Gritton prison_name(struct prison *pr1, struct prison *pr2) 37420304c731SJamie Gritton { 37430304c731SJamie Gritton char *name; 37440304c731SJamie Gritton 37450304c731SJamie Gritton /* Jails see themselves as "0" (if they see themselves at all). 
*/ 37460304c731SJamie Gritton if (pr1 == pr2) 37470304c731SJamie Gritton return "0"; 37480304c731SJamie Gritton name = pr2->pr_name; 37490304c731SJamie Gritton if (prison_ischild(pr1, pr2)) { 37500304c731SJamie Gritton /* 37510304c731SJamie Gritton * pr1 isn't locked (and allprison_lock may not be either) 37520304c731SJamie Gritton * so its length can't be counted on. But the number of dots 37530304c731SJamie Gritton * can be counted on - and counted. 37540304c731SJamie Gritton */ 37550304c731SJamie Gritton for (; pr1 != &prison0; pr1 = pr1->pr_parent) 37560304c731SJamie Gritton name = strchr(name, '.') + 1; 37570304c731SJamie Gritton } 37580304c731SJamie Gritton return (name); 37590304c731SJamie Gritton } 37600304c731SJamie Gritton 37610304c731SJamie Gritton /* 37620304c731SJamie Gritton * Return the part of pr2's path that is relative to pr1, or the whole path 37630304c731SJamie Gritton * if it does not directly follow. 37640304c731SJamie Gritton */ 37650304c731SJamie Gritton static char * 37660304c731SJamie Gritton prison_path(struct prison *pr1, struct prison *pr2) 37670304c731SJamie Gritton { 37680304c731SJamie Gritton char *path1, *path2; 37690304c731SJamie Gritton int len1; 37700304c731SJamie Gritton 37710304c731SJamie Gritton path1 = pr1->pr_path; 37720304c731SJamie Gritton path2 = pr2->pr_path; 37730304c731SJamie Gritton if (!strcmp(path1, "/")) 37740304c731SJamie Gritton return (path2); 37750304c731SJamie Gritton len1 = strlen(path1); 37760304c731SJamie Gritton if (strncmp(path1, path2, len1)) 37770304c731SJamie Gritton return (path2); 37780304c731SJamie Gritton if (path2[len1] == '\0') 37790304c731SJamie Gritton return "/"; 37800304c731SJamie Gritton if (path2[len1] == '/') 37810304c731SJamie Gritton return (path2 + len1); 37820304c731SJamie Gritton return (path2); 37830304c731SJamie Gritton } 37840304c731SJamie Gritton 37850304c731SJamie Gritton /* 37860304c731SJamie Gritton * Jail-related sysctls. 
37870304c731SJamie Gritton */ 37887029da5cSPawel Biernacki static SYSCTL_NODE(_security, OID_AUTO, jail, CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 37890304c731SJamie Gritton "Jails"); 37900304c731SJamie Gritton 3791fd7a8150SMike Barcroft static int 3792fd7a8150SMike Barcroft sysctl_jail_list(SYSCTL_HANDLER_ARGS) 3793fd7a8150SMike Barcroft { 3794b38ff370SJamie Gritton struct xprison *xp; 37950304c731SJamie Gritton struct prison *pr, *cpr; 3796b38ff370SJamie Gritton #ifdef INET 3797b38ff370SJamie Gritton struct in_addr *ip4 = NULL; 3798b38ff370SJamie Gritton int ip4s = 0; 3799b38ff370SJamie Gritton #endif 3800b38ff370SJamie Gritton #ifdef INET6 38013beefaedSColin Percival struct in6_addr *ip6 = NULL; 3802b38ff370SJamie Gritton int ip6s = 0; 3803b38ff370SJamie Gritton #endif 38040304c731SJamie Gritton int descend, error; 3805fd7a8150SMike Barcroft 3806b38ff370SJamie Gritton xp = malloc(sizeof(*xp), M_TEMP, M_WAITOK); 38070304c731SJamie Gritton pr = req->td->td_ucred->cr_prison; 3808b38ff370SJamie Gritton error = 0; 3809dc68a633SPawel Jakub Dawidek sx_slock(&allprison_lock); 38100304c731SJamie Gritton FOREACH_PRISON_DESCENDANT(pr, cpr, descend) { 38110304c731SJamie Gritton #if defined(INET) || defined(INET6) 3812b38ff370SJamie Gritton again: 38130304c731SJamie Gritton #endif 38140304c731SJamie Gritton mtx_lock(&cpr->pr_mtx); 3815413628a7SBjoern A. Zeeb #ifdef INET 38160304c731SJamie Gritton if (cpr->pr_ip4s > 0) { 38170304c731SJamie Gritton if (ip4s < cpr->pr_ip4s) { 38180304c731SJamie Gritton ip4s = cpr->pr_ip4s; 38190304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3820b38ff370SJamie Gritton ip4 = realloc(ip4, ip4s * 3821b38ff370SJamie Gritton sizeof(struct in_addr), M_TEMP, M_WAITOK); 3822b38ff370SJamie Gritton goto again; 3823b38ff370SJamie Gritton } 38240304c731SJamie Gritton bcopy(cpr->pr_ip4, ip4, 38250304c731SJamie Gritton cpr->pr_ip4s * sizeof(struct in_addr)); 3826b38ff370SJamie Gritton } 3827413628a7SBjoern A. Zeeb #endif 3828413628a7SBjoern A. 
Zeeb #ifdef INET6 38290304c731SJamie Gritton if (cpr->pr_ip6s > 0) { 38300304c731SJamie Gritton if (ip6s < cpr->pr_ip6s) { 38310304c731SJamie Gritton ip6s = cpr->pr_ip6s; 38320304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3833b38ff370SJamie Gritton ip6 = realloc(ip6, ip6s * 3834b38ff370SJamie Gritton sizeof(struct in6_addr), M_TEMP, M_WAITOK); 3835b38ff370SJamie Gritton goto again; 3836413628a7SBjoern A. Zeeb } 38370304c731SJamie Gritton bcopy(cpr->pr_ip6, ip6, 38380304c731SJamie Gritton cpr->pr_ip6s * sizeof(struct in6_addr)); 3839b38ff370SJamie Gritton } 3840b38ff370SJamie Gritton #endif 3841b38ff370SJamie Gritton bzero(xp, sizeof(*xp)); 3842fd7a8150SMike Barcroft xp->pr_version = XPRISON_VERSION; 38430304c731SJamie Gritton xp->pr_id = cpr->pr_id; 38441158508aSJamie Gritton xp->pr_state = cpr->pr_state; 38450304c731SJamie Gritton strlcpy(xp->pr_path, prison_path(pr, cpr), sizeof(xp->pr_path)); 3846c1f19219SJamie Gritton strlcpy(xp->pr_host, cpr->pr_hostname, sizeof(xp->pr_host)); 38470304c731SJamie Gritton strlcpy(xp->pr_name, prison_name(pr, cpr), sizeof(xp->pr_name)); 3848413628a7SBjoern A. Zeeb #ifdef INET 38490304c731SJamie Gritton xp->pr_ip4s = cpr->pr_ip4s; 3850413628a7SBjoern A. Zeeb #endif 3851413628a7SBjoern A. Zeeb #ifdef INET6 38520304c731SJamie Gritton xp->pr_ip6s = cpr->pr_ip6s; 3853413628a7SBjoern A. Zeeb #endif 38540304c731SJamie Gritton mtx_unlock(&cpr->pr_mtx); 3855b38ff370SJamie Gritton error = SYSCTL_OUT(req, xp, sizeof(*xp)); 3856b38ff370SJamie Gritton if (error) 3857b38ff370SJamie Gritton break; 3858413628a7SBjoern A. Zeeb #ifdef INET 3859b38ff370SJamie Gritton if (xp->pr_ip4s > 0) { 3860b38ff370SJamie Gritton error = SYSCTL_OUT(req, ip4, 3861b38ff370SJamie Gritton xp->pr_ip4s * sizeof(struct in_addr)); 3862b38ff370SJamie Gritton if (error) 3863b38ff370SJamie Gritton break; 3864413628a7SBjoern A. Zeeb } 3865413628a7SBjoern A. Zeeb #endif 3866413628a7SBjoern A. 
Zeeb #ifdef INET6 3867b38ff370SJamie Gritton if (xp->pr_ip6s > 0) { 3868b38ff370SJamie Gritton error = SYSCTL_OUT(req, ip6, 3869b38ff370SJamie Gritton xp->pr_ip6s * sizeof(struct in6_addr)); 3870b38ff370SJamie Gritton if (error) 3871b38ff370SJamie Gritton break; 3872413628a7SBjoern A. Zeeb } 3873413628a7SBjoern A. Zeeb #endif 3874fd7a8150SMike Barcroft } 3875dc68a633SPawel Jakub Dawidek sx_sunlock(&allprison_lock); 3876b38ff370SJamie Gritton free(xp, M_TEMP); 3877b38ff370SJamie Gritton #ifdef INET 3878b38ff370SJamie Gritton free(ip4, M_TEMP); 3879b38ff370SJamie Gritton #endif 3880b38ff370SJamie Gritton #ifdef INET6 3881b38ff370SJamie Gritton free(ip6, M_TEMP); 3882b38ff370SJamie Gritton #endif 3883fd7a8150SMike Barcroft return (error); 3884fd7a8150SMike Barcroft } 3885fd7a8150SMike Barcroft 3886f3b86a5fSEd Schouten SYSCTL_OID(_security_jail, OID_AUTO, list, 3887f3b86a5fSEd Schouten CTLTYPE_STRUCT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0, 3888f3b86a5fSEd Schouten sysctl_jail_list, "S", "List of active jails"); 3889461167c2SPawel Jakub Dawidek 3890461167c2SPawel Jakub Dawidek static int 3891461167c2SPawel Jakub Dawidek sysctl_jail_jailed(SYSCTL_HANDLER_ARGS) 3892461167c2SPawel Jakub Dawidek { 3893461167c2SPawel Jakub Dawidek int error, injail; 3894461167c2SPawel Jakub Dawidek 3895461167c2SPawel Jakub Dawidek injail = jailed(req->td->td_ucred); 3896461167c2SPawel Jakub Dawidek error = SYSCTL_OUT(req, &injail, sizeof(injail)); 3897461167c2SPawel Jakub Dawidek 3898461167c2SPawel Jakub Dawidek return (error); 3899461167c2SPawel Jakub Dawidek } 39000304c731SJamie Gritton 3901f3b86a5fSEd Schouten SYSCTL_PROC(_security_jail, OID_AUTO, jailed, 3902f3b86a5fSEd Schouten CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0, 3903f3b86a5fSEd Schouten sysctl_jail_jailed, "I", "Process in jail?"); 3904413628a7SBjoern A. 
Zeeb 3905761d2bb5SJamie Gritton static int 3906761d2bb5SJamie Gritton sysctl_jail_vnet(SYSCTL_HANDLER_ARGS) 3907761d2bb5SJamie Gritton { 3908761d2bb5SJamie Gritton int error, havevnet; 3909761d2bb5SJamie Gritton #ifdef VIMAGE 3910761d2bb5SJamie Gritton struct ucred *cred = req->td->td_ucred; 3911761d2bb5SJamie Gritton 3912761d2bb5SJamie Gritton havevnet = jailed(cred) && prison_owns_vnet(cred); 3913761d2bb5SJamie Gritton #else 3914761d2bb5SJamie Gritton havevnet = 0; 3915761d2bb5SJamie Gritton #endif 3916761d2bb5SJamie Gritton error = SYSCTL_OUT(req, &havevnet, sizeof(havevnet)); 3917761d2bb5SJamie Gritton 3918761d2bb5SJamie Gritton return (error); 3919761d2bb5SJamie Gritton } 3920761d2bb5SJamie Gritton 3921761d2bb5SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, vnet, 3922761d2bb5SJamie Gritton CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, NULL, 0, 3923bb8f1623SBjoern A. Zeeb sysctl_jail_vnet, "I", "Jail owns vnet?"); 3924761d2bb5SJamie Gritton 39250304c731SJamie Gritton #if defined(INET) || defined(INET6) 3926e92e0574SJamie Gritton SYSCTL_UINT(_security_jail, OID_AUTO, jail_max_af_ips, CTLFLAG_RW, 39270304c731SJamie Gritton &jail_max_af_ips, 0, 3928c542c43eSJamie Gritton "Number of IP addresses a jail may have at most per address family (deprecated)"); 39290304c731SJamie Gritton #endif 39300304c731SJamie Gritton 39310304c731SJamie Gritton /* 3932c542c43eSJamie Gritton * Default parameters for jail(2) compatibility. For historical reasons, 3933c542c43eSJamie Gritton * the sysctl names have varying similarity to the parameter names. Prisons 3934c542c43eSJamie Gritton * just see their own parameters, and can't change them. 39350304c731SJamie Gritton */ 39360304c731SJamie Gritton static int 39370304c731SJamie Gritton sysctl_jail_default_allow(SYSCTL_HANDLER_ARGS) 39380304c731SJamie Gritton { 39390fe74ae6SJamie Gritton int error, i; 39400304c731SJamie Gritton 39410304c731SJamie Gritton /* Get the current flag value, and convert it to a boolean. 
*/ 39420fe74ae6SJamie Gritton if (req->td->td_ucred->cr_prison == &prison0) { 39430fe74ae6SJamie Gritton mtx_lock(&prison0.pr_mtx); 39440fe74ae6SJamie Gritton i = (jail_default_allow & arg2) != 0; 39450fe74ae6SJamie Gritton mtx_unlock(&prison0.pr_mtx); 39460fe74ae6SJamie Gritton } else 39470fe74ae6SJamie Gritton i = prison_allow(req->td->td_ucred, arg2); 39480fe74ae6SJamie Gritton 39490304c731SJamie Gritton if (arg1 != NULL) 39500304c731SJamie Gritton i = !i; 39510304c731SJamie Gritton error = sysctl_handle_int(oidp, &i, 0, req); 3952c542c43eSJamie Gritton if (error || !req->newptr) 39530304c731SJamie Gritton return (error); 39540304c731SJamie Gritton i = i ? arg2 : 0; 39550304c731SJamie Gritton if (arg1 != NULL) 39560304c731SJamie Gritton i ^= arg2; 39570304c731SJamie Gritton /* 39580304c731SJamie Gritton * The sysctls don't have CTLFLAGS_PRISON, so assume prison0 39590304c731SJamie Gritton * for writing. 39600304c731SJamie Gritton */ 39610304c731SJamie Gritton mtx_lock(&prison0.pr_mtx); 39620304c731SJamie Gritton jail_default_allow = (jail_default_allow & ~arg2) | i; 39630304c731SJamie Gritton mtx_unlock(&prison0.pr_mtx); 39640304c731SJamie Gritton return (0); 39650304c731SJamie Gritton } 39660304c731SJamie Gritton 39670304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, set_hostname_allowed, 3968c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 39690304c731SJamie Gritton NULL, PR_ALLOW_SET_HOSTNAME, sysctl_jail_default_allow, "I", 3970c542c43eSJamie Gritton "Processes in jail can set their hostnames (deprecated)"); 39710304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, socket_unixiproute_only, 3972c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 39730304c731SJamie Gritton (void *)1, PR_ALLOW_SOCKET_AF, sysctl_jail_default_allow, "I", 3974c542c43eSJamie Gritton "Processes in jail are limited to creating UNIX/IP/route sockets only (deprecated)"); 39750304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, 
sysvipc_allowed, 3976c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 39770304c731SJamie Gritton NULL, PR_ALLOW_SYSVIPC, sysctl_jail_default_allow, "I", 3978c542c43eSJamie Gritton "Processes in jail can use System V IPC primitives (deprecated)"); 39790304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, allow_raw_sockets, 3980c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 39810304c731SJamie Gritton NULL, PR_ALLOW_RAW_SOCKETS, sysctl_jail_default_allow, "I", 3982c542c43eSJamie Gritton "Prison root can create raw sockets (deprecated)"); 39830304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, chflags_allowed, 3984c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 39850304c731SJamie Gritton NULL, PR_ALLOW_CHFLAGS, sysctl_jail_default_allow, "I", 3986c542c43eSJamie Gritton "Processes in jail can alter system file flags (deprecated)"); 39870304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, mount_allowed, 3988c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 39890304c731SJamie Gritton NULL, PR_ALLOW_MOUNT, sysctl_jail_default_allow, "I", 3990c542c43eSJamie Gritton "Processes in jail can mount/unmount jail-friendly file systems (deprecated)"); 39910304c731SJamie Gritton 39920304c731SJamie Gritton static int 39930304c731SJamie Gritton sysctl_jail_default_level(SYSCTL_HANDLER_ARGS) 39940304c731SJamie Gritton { 39950304c731SJamie Gritton struct prison *pr; 39960304c731SJamie Gritton int level, error; 39970304c731SJamie Gritton 39980304c731SJamie Gritton pr = req->td->td_ucred->cr_prison; 39990304c731SJamie Gritton level = (pr == &prison0) ? 
*(int *)arg1 : *(int *)((char *)pr + arg2); 40000304c731SJamie Gritton error = sysctl_handle_int(oidp, &level, 0, req); 4001c542c43eSJamie Gritton if (error || !req->newptr) 40020304c731SJamie Gritton return (error); 40030304c731SJamie Gritton *(int *)arg1 = level; 40040304c731SJamie Gritton return (0); 40050304c731SJamie Gritton } 40060304c731SJamie Gritton 40070304c731SJamie Gritton SYSCTL_PROC(_security_jail, OID_AUTO, enforce_statfs, 4008c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 4009c542c43eSJamie Gritton &jail_default_enforce_statfs, offsetof(struct prison, pr_enforce_statfs), 40100304c731SJamie Gritton sysctl_jail_default_level, "I", 4011c542c43eSJamie Gritton "Processes in jail cannot see all mounted file systems (deprecated)"); 4012c542c43eSJamie Gritton 40130cc207a6SMartin Matuska SYSCTL_PROC(_security_jail, OID_AUTO, devfs_ruleset, 4014c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, 4015c542c43eSJamie Gritton &jail_default_devfs_rsnum, offsetof(struct prison, pr_devfs_rsnum), 40160cc207a6SMartin Matuska sysctl_jail_default_level, "I", 4017c542c43eSJamie Gritton "Ruleset for the devfs filesystem in jail (deprecated)"); 40180cc207a6SMartin Matuska 40190304c731SJamie Gritton /* 40200304c731SJamie Gritton * Nodes to describe jail parameters. Maximum length of string parameters 40210304c731SJamie Gritton * is returned in the string itself, and the other parameters exist merely 40220304c731SJamie Gritton * to make themselves and their types known. 
40230304c731SJamie Gritton */ 40247029da5cSPawel Biernacki SYSCTL_NODE(_security_jail, OID_AUTO, param, CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 40250304c731SJamie Gritton "Jail parameters"); 40260304c731SJamie Gritton 40270304c731SJamie Gritton int 40280304c731SJamie Gritton sysctl_jail_param(SYSCTL_HANDLER_ARGS) 40290304c731SJamie Gritton { 40300304c731SJamie Gritton int i; 40310304c731SJamie Gritton long l; 40320304c731SJamie Gritton size_t s; 40330304c731SJamie Gritton char numbuf[12]; 40340304c731SJamie Gritton 40350304c731SJamie Gritton switch (oidp->oid_kind & CTLTYPE) 40360304c731SJamie Gritton { 40370304c731SJamie Gritton case CTLTYPE_LONG: 40380304c731SJamie Gritton case CTLTYPE_ULONG: 40390304c731SJamie Gritton l = 0; 40400304c731SJamie Gritton #ifdef SCTL_MASK32 40410304c731SJamie Gritton if (!(req->flags & SCTL_MASK32)) 40420304c731SJamie Gritton #endif 40430304c731SJamie Gritton return (SYSCTL_OUT(req, &l, sizeof(l))); 40440304c731SJamie Gritton case CTLTYPE_INT: 40450304c731SJamie Gritton case CTLTYPE_UINT: 40460304c731SJamie Gritton i = 0; 40470304c731SJamie Gritton return (SYSCTL_OUT(req, &i, sizeof(i))); 40480304c731SJamie Gritton case CTLTYPE_STRING: 4049e4cd31ddSJeff Roberson snprintf(numbuf, sizeof(numbuf), "%jd", (intmax_t)arg2); 40500304c731SJamie Gritton return 40510304c731SJamie Gritton (sysctl_handle_string(oidp, numbuf, sizeof(numbuf), req)); 40520304c731SJamie Gritton case CTLTYPE_STRUCT: 40530304c731SJamie Gritton s = (size_t)arg2; 40540304c731SJamie Gritton return (SYSCTL_OUT(req, &s, sizeof(s))); 40550304c731SJamie Gritton } 40560304c731SJamie Gritton return (0); 40570304c731SJamie Gritton } 40580304c731SJamie Gritton 4059b96bd95bSIan Lepore /* 4060b96bd95bSIan Lepore * CTLFLAG_RDTUN in the following indicates jail parameters that can be set at 4061b96bd95bSIan Lepore * jail creation time but cannot be changed in an existing jail. 
4062b96bd95bSIan Lepore */ 40630304c731SJamie Gritton SYSCTL_JAIL_PARAM(, jid, CTLTYPE_INT | CTLFLAG_RDTUN, "I", "Jail ID"); 40640304c731SJamie Gritton SYSCTL_JAIL_PARAM(, parent, CTLTYPE_INT | CTLFLAG_RD, "I", "Jail parent ID"); 40650304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRING(, name, CTLFLAG_RW, MAXHOSTNAMELEN, "Jail name"); 40660304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRING(, path, CTLFLAG_RDTUN, MAXPATHLEN, "Jail root path"); 40670304c731SJamie Gritton SYSCTL_JAIL_PARAM(, securelevel, CTLTYPE_INT | CTLFLAG_RW, 40680304c731SJamie Gritton "I", "Jail secure level"); 4069b96bd95bSIan Lepore SYSCTL_JAIL_PARAM(, osreldate, CTLTYPE_INT | CTLFLAG_RDTUN, "I", 4070b96bd95bSIan Lepore "Jail value for kern.osreldate and uname -K"); 4071b96bd95bSIan Lepore SYSCTL_JAIL_PARAM_STRING(, osrelease, CTLFLAG_RDTUN, OSRELEASELEN, 4072b96bd95bSIan Lepore "Jail value for kern.osrelease and uname -r"); 40730304c731SJamie Gritton SYSCTL_JAIL_PARAM(, enforce_statfs, CTLTYPE_INT | CTLFLAG_RW, 40740304c731SJamie Gritton "I", "Jail cannot see all mounted file systems"); 40750cc207a6SMartin Matuska SYSCTL_JAIL_PARAM(, devfs_ruleset, CTLTYPE_INT | CTLFLAG_RW, 40760cc207a6SMartin Matuska "I", "Ruleset for in-jail devfs mounts"); 40770304c731SJamie Gritton SYSCTL_JAIL_PARAM(, persist, CTLTYPE_INT | CTLFLAG_RW, 40780304c731SJamie Gritton "B", "Jail persistence"); 4079679e1390SJamie Gritton #ifdef VIMAGE 4080679e1390SJamie Gritton SYSCTL_JAIL_PARAM(, vnet, CTLTYPE_INT | CTLFLAG_RDTUN, 40817cbf7213SJamie Gritton "E,jailsys", "Virtual network stack"); 4082679e1390SJamie Gritton #endif 40830304c731SJamie Gritton SYSCTL_JAIL_PARAM(, dying, CTLTYPE_INT | CTLFLAG_RD, 40840304c731SJamie Gritton "B", "Jail is in the process of shutting down"); 40850304c731SJamie Gritton 4086b97457e2SJamie Gritton SYSCTL_JAIL_PARAM_NODE(children, "Number of child jails"); 4087b97457e2SJamie Gritton SYSCTL_JAIL_PARAM(_children, cur, CTLTYPE_INT | CTLFLAG_RD, 4088b97457e2SJamie Gritton "I", "Current number of child 
jails"); 4089b97457e2SJamie Gritton SYSCTL_JAIL_PARAM(_children, max, CTLTYPE_INT | CTLFLAG_RW, 4090b97457e2SJamie Gritton "I", "Maximum number of child jails"); 4091b97457e2SJamie Gritton 40927cbf7213SJamie Gritton SYSCTL_JAIL_PARAM_SYS_NODE(host, CTLFLAG_RW, "Jail host info"); 40930304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRING(_host, hostname, CTLFLAG_RW, MAXHOSTNAMELEN, 40940304c731SJamie Gritton "Jail hostname"); 409576ca6f88SJamie Gritton SYSCTL_JAIL_PARAM_STRING(_host, domainname, CTLFLAG_RW, MAXHOSTNAMELEN, 409676ca6f88SJamie Gritton "Jail NIS domainname"); 409776ca6f88SJamie Gritton SYSCTL_JAIL_PARAM_STRING(_host, hostuuid, CTLFLAG_RW, HOSTUUIDLEN, 409876ca6f88SJamie Gritton "Jail host UUID"); 409976ca6f88SJamie Gritton SYSCTL_JAIL_PARAM(_host, hostid, CTLTYPE_ULONG | CTLFLAG_RW, 410076ca6f88SJamie Gritton "LU", "Jail host ID"); 41010304c731SJamie Gritton 41020304c731SJamie Gritton SYSCTL_JAIL_PARAM_NODE(cpuset, "Jail cpuset"); 41030304c731SJamie Gritton SYSCTL_JAIL_PARAM(_cpuset, id, CTLTYPE_INT | CTLFLAG_RD, "I", "Jail cpuset ID"); 41040304c731SJamie Gritton 41050304c731SJamie Gritton #ifdef INET 41062b0d6f81SJamie Gritton SYSCTL_JAIL_PARAM_SYS_NODE(ip4, CTLFLAG_RDTUN, 41072b0d6f81SJamie Gritton "Jail IPv4 address virtualization"); 41080304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRUCT(_ip4, addr, CTLFLAG_RW, sizeof(struct in_addr), 41090304c731SJamie Gritton "S,in_addr,a", "Jail IPv4 addresses"); 4110592bcae8SBjoern A. Zeeb SYSCTL_JAIL_PARAM(_ip4, saddrsel, CTLTYPE_INT | CTLFLAG_RW, 4111592bcae8SBjoern A. Zeeb "B", "Do (not) use IPv4 source address selection rather than the " 4112592bcae8SBjoern A. 
Zeeb "primary jail IPv4 address."); 41130304c731SJamie Gritton #endif 41140304c731SJamie Gritton #ifdef INET6 41152b0d6f81SJamie Gritton SYSCTL_JAIL_PARAM_SYS_NODE(ip6, CTLFLAG_RDTUN, 41162b0d6f81SJamie Gritton "Jail IPv6 address virtualization"); 41170304c731SJamie Gritton SYSCTL_JAIL_PARAM_STRUCT(_ip6, addr, CTLFLAG_RW, sizeof(struct in6_addr), 41180304c731SJamie Gritton "S,in6_addr,a", "Jail IPv6 addresses"); 4119592bcae8SBjoern A. Zeeb SYSCTL_JAIL_PARAM(_ip6, saddrsel, CTLTYPE_INT | CTLFLAG_RW, 4120592bcae8SBjoern A. Zeeb "B", "Do (not) use IPv6 source address selection rather than the " 4121592bcae8SBjoern A. Zeeb "primary jail IPv6 address."); 41220304c731SJamie Gritton #endif 41230304c731SJamie Gritton 41240304c731SJamie Gritton SYSCTL_JAIL_PARAM_NODE(allow, "Jail permission flags"); 41250304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, set_hostname, CTLTYPE_INT | CTLFLAG_RW, 41260304c731SJamie Gritton "B", "Jail may set hostname"); 41270304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, sysvipc, CTLTYPE_INT | CTLFLAG_RW, 41280304c731SJamie Gritton "B", "Jail may use SYSV IPC"); 41290304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, raw_sockets, CTLTYPE_INT | CTLFLAG_RW, 41300304c731SJamie Gritton "B", "Jail may create raw sockets"); 41310304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, chflags, CTLTYPE_INT | CTLFLAG_RW, 41320304c731SJamie Gritton "B", "Jail may alter system file flags"); 41330304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, quotas, CTLTYPE_INT | CTLFLAG_RW, 41340304c731SJamie Gritton "B", "Jail may set file quotas"); 41350304c731SJamie Gritton SYSCTL_JAIL_PARAM(_allow, socket_af, CTLTYPE_INT | CTLFLAG_RW, 41360304c731SJamie Gritton "B", "Jail may create sockets other than just UNIX/IPv4/IPv6/route"); 4137ccd6ac9fSAntoine Brodin SYSCTL_JAIL_PARAM(_allow, mlock, CTLTYPE_INT | CTLFLAG_RW, 4138ccd6ac9fSAntoine Brodin "B", "Jail may lock (unlock) physical pages in memory"); 4139e28f9b7dSAllan Jude SYSCTL_JAIL_PARAM(_allow, reserved_ports, CTLTYPE_INT | 
CTLFLAG_RW, 4140e28f9b7dSAllan Jude "B", "Jail may bind sockets to reserved ports"); 4141b19d66fdSJamie Gritton SYSCTL_JAIL_PARAM(_allow, read_msgbuf, CTLTYPE_INT | CTLFLAG_RW, 4142b19d66fdSJamie Gritton "B", "Jail may read the kernel message buffer"); 4143b3079544SJamie Gritton SYSCTL_JAIL_PARAM(_allow, unprivileged_proc_debug, CTLTYPE_INT | CTLFLAG_RW, 4144b3079544SJamie Gritton "B", "Unprivileged processes may use process debugging facilities"); 414505e1e482SMariusz Zaborski SYSCTL_JAIL_PARAM(_allow, suser, CTLTYPE_INT | CTLFLAG_RW, 414605e1e482SMariusz Zaborski "B", "Processes in jail with uid 0 have privilege"); 41470304c731SJamie Gritton 4148bf3db8aaSMartin Matuska SYSCTL_JAIL_PARAM_SUBNODE(allow, mount, "Jail mount/unmount permission flags"); 4149bf3db8aaSMartin Matuska SYSCTL_JAIL_PARAM(_allow_mount, , CTLTYPE_INT | CTLFLAG_RW, 4150bf3db8aaSMartin Matuska "B", "Jail may mount/unmount jail-friendly file systems in general"); 41510e5c6bd4SJamie Gritton 41520e5c6bd4SJamie Gritton /* 41530a172404SJamie Gritton * Add a dynamic parameter allow.<name>, or allow.<prefix>.<name>. Return 41540a172404SJamie Gritton * its associated bit in the pr_allow bitmask, or zero if the parameter was 41550a172404SJamie Gritton * not created. 41560e5c6bd4SJamie Gritton */ 41570a172404SJamie Gritton unsigned 41580a172404SJamie Gritton prison_add_allow(const char *prefix, const char *name, const char *prefix_descr, 41590a172404SJamie Gritton const char *descr) 41600e5c6bd4SJamie Gritton { 41610e5c6bd4SJamie Gritton struct bool_flags *bf; 41620a172404SJamie Gritton struct sysctl_oid *parent; 41630a172404SJamie Gritton char *allow_name, *allow_noname, *allowed; 4164c542c43eSJamie Gritton #ifndef NO_SYSCTL_DESCR 4165c542c43eSJamie Gritton char *descr_deprecated; 4166c542c43eSJamie Gritton #endif 41675d58f959SJamie Gritton u_int allow_flag; 41680e5c6bd4SJamie Gritton 41690a172404SJamie Gritton if (prefix 41700a172404SJamie Gritton ? 
asprintf(&allow_name, M_PRISON, "allow.%s.%s", prefix, name) 41710a172404SJamie Gritton < 0 || 41720a172404SJamie Gritton asprintf(&allow_noname, M_PRISON, "allow.%s.no%s", prefix, name) 41730a172404SJamie Gritton < 0 41740a172404SJamie Gritton : asprintf(&allow_name, M_PRISON, "allow.%s", name) < 0 || 41750a172404SJamie Gritton asprintf(&allow_noname, M_PRISON, "allow.no%s", name) < 0) { 41760e5c6bd4SJamie Gritton free(allow_name, M_PRISON); 41770a172404SJamie Gritton return 0; 41780e5c6bd4SJamie Gritton } 41790e5c6bd4SJamie Gritton 41800e5c6bd4SJamie Gritton /* 41810a172404SJamie Gritton * See if this parameter has already beed added, i.e. a module was 41820a172404SJamie Gritton * previously loaded/unloaded. 41830e5c6bd4SJamie Gritton */ 41840e5c6bd4SJamie Gritton mtx_lock(&prison0.pr_mtx); 41850e5c6bd4SJamie Gritton for (bf = pr_flag_allow; 41865d58f959SJamie Gritton bf < pr_flag_allow + nitems(pr_flag_allow) && 41875d58f959SJamie Gritton atomic_load_int(&bf->flag) != 0; 41880e5c6bd4SJamie Gritton bf++) { 41890e5c6bd4SJamie Gritton if (strcmp(bf->name, allow_name) == 0) { 41900a172404SJamie Gritton allow_flag = bf->flag; 41910e5c6bd4SJamie Gritton goto no_add; 41920e5c6bd4SJamie Gritton } 41930e5c6bd4SJamie Gritton } 41940e5c6bd4SJamie Gritton 41950e5c6bd4SJamie Gritton /* 41965d58f959SJamie Gritton * Find a free bit in pr_allow_all, failing if there are none 41970e5c6bd4SJamie Gritton * (which shouldn't happen as long as we keep track of how many 41980a172404SJamie Gritton * potential dynamic flags exist). 41990e5c6bd4SJamie Gritton */ 42000e5c6bd4SJamie Gritton for (allow_flag = 1;; allow_flag <<= 1) { 42010e5c6bd4SJamie Gritton if (allow_flag == 0) 42020e5c6bd4SJamie Gritton goto no_add; 42035d58f959SJamie Gritton if ((pr_allow_all & allow_flag) == 0) 42040e5c6bd4SJamie Gritton break; 42050e5c6bd4SJamie Gritton } 42060e5c6bd4SJamie Gritton 42075d58f959SJamie Gritton /* Note the parameter in the next open slot in pr_flag_allow. 
*/ 42085d58f959SJamie Gritton for (bf = pr_flag_allow; ; bf++) { 42090e5c6bd4SJamie Gritton if (bf == pr_flag_allow + nitems(pr_flag_allow)) { 42100e5c6bd4SJamie Gritton /* This should never happen, but is not fatal. */ 42110a172404SJamie Gritton allow_flag = 0; 42120e5c6bd4SJamie Gritton goto no_add; 42130e5c6bd4SJamie Gritton } 42145d58f959SJamie Gritton if (atomic_load_int(&bf->flag) == 0) 42155d58f959SJamie Gritton break; 42165d58f959SJamie Gritton } 42170e5c6bd4SJamie Gritton bf->name = allow_name; 42180e5c6bd4SJamie Gritton bf->noname = allow_noname; 42195d58f959SJamie Gritton pr_allow_all |= allow_flag; 42205d58f959SJamie Gritton /* 42215d58f959SJamie Gritton * prison0 always has permission for the new parameter. 42225d58f959SJamie Gritton * Other jails must have it granted to them. 42235d58f959SJamie Gritton */ 42245d58f959SJamie Gritton prison0.pr_allow |= allow_flag; 42255d58f959SJamie Gritton /* The flag indicates a valid entry, so make sure it is set last. */ 42265d58f959SJamie Gritton atomic_store_rel_int(&bf->flag, allow_flag); 42270e5c6bd4SJamie Gritton mtx_unlock(&prison0.pr_mtx); 42280e5c6bd4SJamie Gritton 4229c542c43eSJamie Gritton /* 4230c542c43eSJamie Gritton * Create sysctls for the paramter, and the back-compat global 4231c542c43eSJamie Gritton * permission. 4232c542c43eSJamie Gritton */ 42330a172404SJamie Gritton parent = prefix 42340a172404SJamie Gritton ? SYSCTL_ADD_NODE(NULL, 42350a172404SJamie Gritton SYSCTL_CHILDREN(&sysctl___security_jail_param_allow), 42367029da5cSPawel Biernacki OID_AUTO, prefix, CTLFLAG_MPSAFE, 0, prefix_descr) 42370a172404SJamie Gritton : &sysctl___security_jail_param_allow; 42380a172404SJamie Gritton (void)SYSCTL_ADD_PROC(NULL, SYSCTL_CHILDREN(parent), OID_AUTO, 42390a172404SJamie Gritton name, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, 42400e5c6bd4SJamie Gritton NULL, 0, sysctl_jail_param, "B", descr); 42410a172404SJamie Gritton if ((prefix 42420a172404SJamie Gritton ? 
asprintf(&allowed, M_TEMP, "%s_%s_allowed", prefix, name) 42430a172404SJamie Gritton : asprintf(&allowed, M_TEMP, "%s_allowed", name)) >= 0) { 4244c542c43eSJamie Gritton #ifndef NO_SYSCTL_DESCR 4245c542c43eSJamie Gritton (void)asprintf(&descr_deprecated, M_TEMP, "%s (deprecated)", 4246c542c43eSJamie Gritton descr); 4247c542c43eSJamie Gritton #endif 42480e5c6bd4SJamie Gritton (void)SYSCTL_ADD_PROC(NULL, 42490a172404SJamie Gritton SYSCTL_CHILDREN(&sysctl___security_jail), OID_AUTO, allowed, 4250c542c43eSJamie Gritton CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, NULL, allow_flag, 4251c542c43eSJamie Gritton sysctl_jail_default_allow, "I", descr_deprecated); 4252c542c43eSJamie Gritton #ifndef NO_SYSCTL_DESCR 4253c542c43eSJamie Gritton free(descr_deprecated, M_TEMP); 4254c542c43eSJamie Gritton #endif 42550a172404SJamie Gritton free(allowed, M_TEMP); 42560e5c6bd4SJamie Gritton } 42570a172404SJamie Gritton return allow_flag; 42580e5c6bd4SJamie Gritton 42590e5c6bd4SJamie Gritton no_add: 42600e5c6bd4SJamie Gritton mtx_unlock(&prison0.pr_mtx); 42610e5c6bd4SJamie Gritton free(allow_name, M_PRISON); 42620e5c6bd4SJamie Gritton free(allow_noname, M_PRISON); 42630a172404SJamie Gritton return allow_flag; 42640a172404SJamie Gritton } 42650a172404SJamie Gritton 42660a172404SJamie Gritton /* 42670a172404SJamie Gritton * The VFS system will register jail-aware filesystems here. They each get 42680a172404SJamie Gritton * a parameter allow.mount.xxxfs and a flag to check when a jailed user 42690a172404SJamie Gritton * attempts to mount. 
42700a172404SJamie Gritton */ 42710a172404SJamie Gritton void 42720a172404SJamie Gritton prison_add_vfs(struct vfsconf *vfsp) 42730a172404SJamie Gritton { 42740a172404SJamie Gritton #ifdef NO_SYSCTL_DESCR 42750a172404SJamie Gritton 42760a172404SJamie Gritton vfsp->vfc_prison_flag = prison_add_allow("mount", vfsp->vfc_name, 42770a172404SJamie Gritton NULL, NULL); 42780a172404SJamie Gritton #else 42790a172404SJamie Gritton char *descr; 42800a172404SJamie Gritton 42810a172404SJamie Gritton (void)asprintf(&descr, M_TEMP, "Jail may mount the %s file system", 42820a172404SJamie Gritton vfsp->vfc_name); 42830a172404SJamie Gritton vfsp->vfc_prison_flag = prison_add_allow("mount", vfsp->vfc_name, 42840a172404SJamie Gritton NULL, descr); 42850a172404SJamie Gritton free(descr, M_TEMP); 42860a172404SJamie Gritton #endif 42870e5c6bd4SJamie Gritton } 4288bf3db8aaSMartin Matuska 42894b5c9cf6SEdward Tomasz Napierala #ifdef RACCT 4290097055e2SEdward Tomasz Napierala void 4291097055e2SEdward Tomasz Napierala prison_racct_foreach(void (*callback)(struct racct *racct, 429215db3c07SEdward Tomasz Napierala void *arg2, void *arg3), void (*pre)(void), void (*post)(void), 429315db3c07SEdward Tomasz Napierala void *arg2, void *arg3) 4294097055e2SEdward Tomasz Napierala { 4295a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 4296097055e2SEdward Tomasz Napierala 42974b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 42984b5c9cf6SEdward Tomasz Napierala 4299097055e2SEdward Tomasz Napierala sx_slock(&allprison_lock); 430015db3c07SEdward Tomasz Napierala if (pre != NULL) 430115db3c07SEdward Tomasz Napierala (pre)(); 4302a7ad07bfSEdward Tomasz Napierala LIST_FOREACH(prr, &allprison_racct, prr_next) 4303a7ad07bfSEdward Tomasz Napierala (callback)(prr->prr_racct, arg2, arg3); 430415db3c07SEdward Tomasz Napierala if (post != NULL) 430515db3c07SEdward Tomasz Napierala (post)(); 4306097055e2SEdward Tomasz Napierala sx_sunlock(&allprison_lock); 4307097055e2SEdward Tomasz Napierala } 
43080304c731SJamie Gritton 4309a7ad07bfSEdward Tomasz Napierala static struct prison_racct * 4310a7ad07bfSEdward Tomasz Napierala prison_racct_find_locked(const char *name) 4311a7ad07bfSEdward Tomasz Napierala { 4312a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 4313a7ad07bfSEdward Tomasz Napierala 43144b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4315a7ad07bfSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_XLOCKED); 4316a7ad07bfSEdward Tomasz Napierala 4317a7ad07bfSEdward Tomasz Napierala if (name[0] == '\0' || strlen(name) >= MAXHOSTNAMELEN) 4318a7ad07bfSEdward Tomasz Napierala return (NULL); 4319a7ad07bfSEdward Tomasz Napierala 4320a7ad07bfSEdward Tomasz Napierala LIST_FOREACH(prr, &allprison_racct, prr_next) { 4321a7ad07bfSEdward Tomasz Napierala if (strcmp(name, prr->prr_name) != 0) 4322a7ad07bfSEdward Tomasz Napierala continue; 4323a7ad07bfSEdward Tomasz Napierala 4324a7ad07bfSEdward Tomasz Napierala /* Found prison_racct with a matching name? */ 4325a7ad07bfSEdward Tomasz Napierala prison_racct_hold(prr); 4326a7ad07bfSEdward Tomasz Napierala return (prr); 4327a7ad07bfSEdward Tomasz Napierala } 4328a7ad07bfSEdward Tomasz Napierala 4329a7ad07bfSEdward Tomasz Napierala /* Add new prison_racct. 
*/ 4330a7ad07bfSEdward Tomasz Napierala prr = malloc(sizeof(*prr), M_PRISON_RACCT, M_ZERO | M_WAITOK); 4331a7ad07bfSEdward Tomasz Napierala racct_create(&prr->prr_racct); 4332a7ad07bfSEdward Tomasz Napierala 4333a7ad07bfSEdward Tomasz Napierala strcpy(prr->prr_name, name); 4334a7ad07bfSEdward Tomasz Napierala refcount_init(&prr->prr_refcount, 1); 4335a7ad07bfSEdward Tomasz Napierala LIST_INSERT_HEAD(&allprison_racct, prr, prr_next); 4336a7ad07bfSEdward Tomasz Napierala 4337a7ad07bfSEdward Tomasz Napierala return (prr); 4338a7ad07bfSEdward Tomasz Napierala } 4339a7ad07bfSEdward Tomasz Napierala 4340a7ad07bfSEdward Tomasz Napierala struct prison_racct * 4341a7ad07bfSEdward Tomasz Napierala prison_racct_find(const char *name) 4342a7ad07bfSEdward Tomasz Napierala { 4343a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 4344a7ad07bfSEdward Tomasz Napierala 43454b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 43464b5c9cf6SEdward Tomasz Napierala 4347a7ad07bfSEdward Tomasz Napierala sx_xlock(&allprison_lock); 4348a7ad07bfSEdward Tomasz Napierala prr = prison_racct_find_locked(name); 4349a7ad07bfSEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4350a7ad07bfSEdward Tomasz Napierala return (prr); 4351a7ad07bfSEdward Tomasz Napierala } 4352a7ad07bfSEdward Tomasz Napierala 4353a7ad07bfSEdward Tomasz Napierala void 4354a7ad07bfSEdward Tomasz Napierala prison_racct_hold(struct prison_racct *prr) 4355a7ad07bfSEdward Tomasz Napierala { 4356a7ad07bfSEdward Tomasz Napierala 43574b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 43584b5c9cf6SEdward Tomasz Napierala 4359a7ad07bfSEdward Tomasz Napierala refcount_acquire(&prr->prr_refcount); 4360a7ad07bfSEdward Tomasz Napierala } 4361a7ad07bfSEdward Tomasz Napierala 4362c34bbd2aSEdward Tomasz Napierala static void 4363c34bbd2aSEdward Tomasz Napierala prison_racct_free_locked(struct prison_racct *prr) 4364c34bbd2aSEdward Tomasz Napierala { 4365c34bbd2aSEdward Tomasz Napierala 43664b5c9cf6SEdward Tomasz Napierala 
ASSERT_RACCT_ENABLED(); 4367c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_XLOCKED); 4368c34bbd2aSEdward Tomasz Napierala 4369c34bbd2aSEdward Tomasz Napierala if (refcount_release(&prr->prr_refcount)) { 4370c34bbd2aSEdward Tomasz Napierala racct_destroy(&prr->prr_racct); 4371c34bbd2aSEdward Tomasz Napierala LIST_REMOVE(prr, prr_next); 4372c34bbd2aSEdward Tomasz Napierala free(prr, M_PRISON_RACCT); 4373c34bbd2aSEdward Tomasz Napierala } 4374c34bbd2aSEdward Tomasz Napierala } 4375c34bbd2aSEdward Tomasz Napierala 4376a7ad07bfSEdward Tomasz Napierala void 4377a7ad07bfSEdward Tomasz Napierala prison_racct_free(struct prison_racct *prr) 4378a7ad07bfSEdward Tomasz Napierala { 4379a7ad07bfSEdward Tomasz Napierala 43804b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4381c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_UNLOCKED); 4382c34bbd2aSEdward Tomasz Napierala 43836ff4688bSMateusz Guzik if (refcount_release_if_not_last(&prr->prr_refcount)) 4384a7ad07bfSEdward Tomasz Napierala return; 4385a7ad07bfSEdward Tomasz Napierala 4386a7ad07bfSEdward Tomasz Napierala sx_xlock(&allprison_lock); 4387c34bbd2aSEdward Tomasz Napierala prison_racct_free_locked(prr); 4388a7ad07bfSEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4389a7ad07bfSEdward Tomasz Napierala } 4390a7ad07bfSEdward Tomasz Napierala 4391a7ad07bfSEdward Tomasz Napierala static void 4392a7ad07bfSEdward Tomasz Napierala prison_racct_attach(struct prison *pr) 4393a7ad07bfSEdward Tomasz Napierala { 4394a7ad07bfSEdward Tomasz Napierala struct prison_racct *prr; 4395a7ad07bfSEdward Tomasz Napierala 43964b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4397c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_XLOCKED); 4398c34bbd2aSEdward Tomasz Napierala 4399a7ad07bfSEdward Tomasz Napierala prr = prison_racct_find_locked(pr->pr_name); 4400a7ad07bfSEdward Tomasz Napierala KASSERT(prr != NULL, ("cannot find prison_racct")); 4401a7ad07bfSEdward Tomasz Napierala 
4402a7ad07bfSEdward Tomasz Napierala pr->pr_prison_racct = prr; 4403a7ad07bfSEdward Tomasz Napierala } 4404a7ad07bfSEdward Tomasz Napierala 4405c34bbd2aSEdward Tomasz Napierala /* 4406c34bbd2aSEdward Tomasz Napierala * Handle jail renaming. From the racct point of view, renaming means 4407c34bbd2aSEdward Tomasz Napierala * moving from one prison_racct to another. 4408c34bbd2aSEdward Tomasz Napierala */ 4409c34bbd2aSEdward Tomasz Napierala static void 4410c34bbd2aSEdward Tomasz Napierala prison_racct_modify(struct prison *pr) 4411c34bbd2aSEdward Tomasz Napierala { 4412dbadb015SKonstantin Belousov #ifdef RCTL 4413c34bbd2aSEdward Tomasz Napierala struct proc *p; 4414c34bbd2aSEdward Tomasz Napierala struct ucred *cred; 4415dbadb015SKonstantin Belousov #endif 4416c34bbd2aSEdward Tomasz Napierala struct prison_racct *oldprr; 4417c34bbd2aSEdward Tomasz Napierala 44184b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 44194b5c9cf6SEdward Tomasz Napierala 4420c34bbd2aSEdward Tomasz Napierala sx_slock(&allproc_lock); 4421c34bbd2aSEdward Tomasz Napierala sx_xlock(&allprison_lock); 4422c34bbd2aSEdward Tomasz Napierala 4423e30345e7SEdward Tomasz Napierala if (strcmp(pr->pr_name, pr->pr_prison_racct->prr_name) == 0) { 4424e30345e7SEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4425e30345e7SEdward Tomasz Napierala sx_sunlock(&allproc_lock); 4426c34bbd2aSEdward Tomasz Napierala return; 4427e30345e7SEdward Tomasz Napierala } 4428c34bbd2aSEdward Tomasz Napierala 4429c34bbd2aSEdward Tomasz Napierala oldprr = pr->pr_prison_racct; 4430c34bbd2aSEdward Tomasz Napierala pr->pr_prison_racct = NULL; 4431c34bbd2aSEdward Tomasz Napierala 4432c34bbd2aSEdward Tomasz Napierala prison_racct_attach(pr); 4433c34bbd2aSEdward Tomasz Napierala 4434c34bbd2aSEdward Tomasz Napierala /* 4435c34bbd2aSEdward Tomasz Napierala * Move resource utilisation records. 
4436c34bbd2aSEdward Tomasz Napierala */ 4437c34bbd2aSEdward Tomasz Napierala racct_move(pr->pr_prison_racct->prr_racct, oldprr->prr_racct); 4438c34bbd2aSEdward Tomasz Napierala 4439f87beb93SAndriy Gapon #ifdef RCTL 4440c34bbd2aSEdward Tomasz Napierala /* 4441c34bbd2aSEdward Tomasz Napierala * Force rctl to reattach rules to processes. 4442c34bbd2aSEdward Tomasz Napierala */ 4443c34bbd2aSEdward Tomasz Napierala FOREACH_PROC_IN_SYSTEM(p) { 4444c34bbd2aSEdward Tomasz Napierala PROC_LOCK(p); 4445c34bbd2aSEdward Tomasz Napierala cred = crhold(p->p_ucred); 4446c34bbd2aSEdward Tomasz Napierala PROC_UNLOCK(p); 4447f87beb93SAndriy Gapon rctl_proc_ucred_changed(p, cred); 4448c34bbd2aSEdward Tomasz Napierala crfree(cred); 4449c34bbd2aSEdward Tomasz Napierala } 4450f87beb93SAndriy Gapon #endif 4451c34bbd2aSEdward Tomasz Napierala 4452c34bbd2aSEdward Tomasz Napierala sx_sunlock(&allproc_lock); 4453c34bbd2aSEdward Tomasz Napierala prison_racct_free_locked(oldprr); 4454c34bbd2aSEdward Tomasz Napierala sx_xunlock(&allprison_lock); 4455c34bbd2aSEdward Tomasz Napierala } 4456c34bbd2aSEdward Tomasz Napierala 4457a7ad07bfSEdward Tomasz Napierala static void 4458a7ad07bfSEdward Tomasz Napierala prison_racct_detach(struct prison *pr) 4459a7ad07bfSEdward Tomasz Napierala { 4460c34bbd2aSEdward Tomasz Napierala 44614b5c9cf6SEdward Tomasz Napierala ASSERT_RACCT_ENABLED(); 4462c34bbd2aSEdward Tomasz Napierala sx_assert(&allprison_lock, SA_UNLOCKED); 4463c34bbd2aSEdward Tomasz Napierala 4464af3c786cSMateusz Guzik if (pr->pr_prison_racct == NULL) 4465af3c786cSMateusz Guzik return; 4466a7ad07bfSEdward Tomasz Napierala prison_racct_free(pr->pr_prison_racct); 4467a7ad07bfSEdward Tomasz Napierala pr->pr_prison_racct = NULL; 4468a7ad07bfSEdward Tomasz Napierala } 4469a7ad07bfSEdward Tomasz Napierala #endif /* RACCT */ 4470a7ad07bfSEdward Tomasz Napierala 4471413628a7SBjoern A. 
#ifdef DDB

/*
 * Print one prison to the debugger console: its address, jid, name,
 * parent, reference counts, state, path, cpuset id, root, securelevel,
 * devfs ruleset number, child limits and links, flag and allow bits
 * (with their names), host information and, when INET/INET6 are
 * compiled in, its IPv4/IPv6 address lists.
 */
static void
db_show_prison(struct prison *pr)
{
	struct bool_flags *bf;
	struct jailsys_flags *jsf;
#if defined(INET) || defined(INET6)
	int ii;
#endif
	unsigned f;
#ifdef INET
	char ip4buf[INET_ADDRSTRLEN];
#endif
#ifdef INET6
	char ip6buf[INET6_ADDRSTRLEN];
#endif

	db_printf("prison %p:\n", pr);
	db_printf(" jid = %d\n", pr->pr_id);
	db_printf(" name = %s\n", pr->pr_name);
	db_printf(" parent = %p\n", pr->pr_parent);
	db_printf(" ref = %d\n", pr->pr_ref);
	db_printf(" uref = %d\n", pr->pr_uref);
	db_printf(" state = %s\n",
	    pr->pr_state == PRISON_STATE_ALIVE ? "alive" :
	    pr->pr_state == PRISON_STATE_DYING ? "dying" :
	    "invalid");
	db_printf(" path = %s\n", pr->pr_path);
	/* A prison without a cpuset is reported with id -1. */
	db_printf(" cpuset = %d\n", pr->pr_cpuset
	    ? pr->pr_cpuset->cs_id : -1);
#ifdef VIMAGE
	db_printf(" vnet = %p\n", pr->pr_vnet);
#endif
	db_printf(" root = %p\n", pr->pr_root);
	db_printf(" securelevel = %d\n", pr->pr_securelevel);
	db_printf(" devfs_rsnum = %d\n", pr->pr_devfs_rsnum);
	db_printf(" children.max = %d\n", pr->pr_childmax);
	db_printf(" children.cur = %d\n", pr->pr_childcount);
	db_printf(" child = %p\n", LIST_FIRST(&pr->pr_children));
	db_printf(" sibling = %p\n", LIST_NEXT(pr, pr_sibling));

	/* Raw flag word, followed on the same line by each set flag's name. */
	db_printf(" flags = 0x%x", pr->pr_flags);
	for (bf = pr_flag_bool; bf < pr_flag_bool + nitems(pr_flag_bool); bf++)
		if (pr->pr_flags & bf->flag)
			db_printf(" %s", bf->name);
	/*
	 * Terminate the flags line.  Without this the first jailsys entry
	 * printed below would be appended to it; the "allow" line further
	 * down is terminated the same way.
	 */
	db_printf("\n");

	/*
	 * One line per jailsys parameter.  f is the subset of the entry's
	 * disable/new bits set in pr_flags: exactly the disable mask (and
	 * non-zero) prints "disable", exactly the new mask prints "new",
	 * anything else prints "inherit".
	 */
	for (jsf = pr_flag_jailsys;
	    jsf < pr_flag_jailsys + nitems(pr_flag_jailsys);
	    jsf++) {
		f = pr->pr_flags & (jsf->disable | jsf->new);
		db_printf(" %-16s= %s\n", jsf->name,
		    (f != 0 && f == jsf->disable) ? "disable"
		    : (f == jsf->new) ? "new"
		    : "inherit");
	}

	/*
	 * Raw allow word, followed by the name of each set permission.
	 * The walk stops at the first table entry whose flag reads as
	 * zero, or at the end of the table.
	 */
	db_printf(" allow = 0x%x", pr->pr_allow);
	for (bf = pr_flag_allow;
	    bf < pr_flag_allow + nitems(pr_flag_allow) &&
	    atomic_load_int(&bf->flag) != 0;
	    bf++)
		if (pr->pr_allow & bf->flag)
			db_printf(" %s", bf->name);
	db_printf("\n");

	db_printf(" enforce_statfs = %d\n", pr->pr_enforce_statfs);
	db_printf(" host.hostname = %s\n", pr->pr_hostname);
	db_printf(" host.domainname = %s\n", pr->pr_domainname);
	db_printf(" host.hostuuid = %s\n", pr->pr_hostuuid);
	db_printf(" host.hostid = %lu\n", pr->pr_hostid);
#ifdef INET
	/* Address count, then one line per address; only the first is labelled. */
	db_printf(" ip4s = %d\n", pr->pr_ip4s);
	for (ii = 0; ii < pr->pr_ip4s; ii++)
		db_printf(" %s %s\n",
		    ii == 0 ? "ip4.addr =" : " ",
		    inet_ntoa_r(pr->pr_ip4[ii], ip4buf));
#endif
#ifdef INET6
	/* Same layout as the IPv4 list above. */
	db_printf(" ip6s = %d\n", pr->pr_ip6s);
	for (ii = 0; ii < pr->pr_ip6s; ii++)
		db_printf(" %s %s\n",
		    ii == 0 ? "ip6.addr =" : " ",
		    ip6_sprintf(ip6buf, &pr->pr_ip6[ii]));
#endif
}

/*
 * "show prison" debugger command.
 *
 * With no address, print prison0 and then every prison on the allprison
 * list, stopping as soon as db_pager_quit is set.
 *
 * With an address: 0 selects prison0.  Any other value is looked up as a
 * jail ID, preferring a prison that still has references (pr_ref > 0),
 * then any prison with that ID; if neither lookup matches, the value is
 * taken to be the address of a struct prison.
 *
 * NOTE(review): have_addr and addr are not declared in this block;
 * presumably they are supplied by the DB_SHOW_COMMAND macro -- confirm.
 */
DB_SHOW_COMMAND(prison, db_show_prison_command)
{
	struct prison *pr;

	if (!have_addr) {
		/*
		 * Show all prisons in the list, and prison0 which is not
		 * listed.
		 */
		db_show_prison(&prison0);
		if (!db_pager_quit) {
			TAILQ_FOREACH(pr, &allprison, pr_list) {
				db_show_prison(pr);
				if (db_pager_quit)
					break;
			}
		}
		return;
	}

	if (addr == 0)
		pr = &prison0;
	else {
		/* Look for a prison with the ID and with references. */
		TAILQ_FOREACH(pr, &allprison, pr_list)
			if (pr->pr_id == addr && pr->pr_ref > 0)
				break;
		/* pr is NULL here when the walk above found no match. */
		if (pr == NULL)
			/* Look again, without requiring a reference. */
			TAILQ_FOREACH(pr, &allprison, pr_list)
				if (pr->pr_id == addr)
					break;
		if (pr == NULL)
			/* Assume address points to a valid prison. */
			pr = (struct prison *)addr;
	}
	db_show_prison(pr);
}

#endif /* DDB */