14c3df794SDoug Rabson /*- 28a36da99SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 38a36da99SPedro F. Giffuni * 44c3df794SDoug Rabson * Copyright (c) 1999 Assar Westerlund 54c3df794SDoug Rabson * All rights reserved. 64c3df794SDoug Rabson * 74c3df794SDoug Rabson * Redistribution and use in source and binary forms, with or without 84c3df794SDoug Rabson * modification, are permitted provided that the following conditions 94c3df794SDoug Rabson * are met: 104c3df794SDoug Rabson * 1. Redistributions of source code must retain the above copyright 114c3df794SDoug Rabson * notice, this list of conditions and the following disclaimer. 124c3df794SDoug Rabson * 2. Redistributions in binary form must reproduce the above copyright 134c3df794SDoug Rabson * notice, this list of conditions and the following disclaimer in the 144c3df794SDoug Rabson * documentation and/or other materials provided with the distribution. 154c3df794SDoug Rabson * 164c3df794SDoug Rabson * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 174c3df794SDoug Rabson * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 184c3df794SDoug Rabson * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 194c3df794SDoug Rabson * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 204c3df794SDoug Rabson * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 214c3df794SDoug Rabson * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 224c3df794SDoug Rabson * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 234c3df794SDoug Rabson * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 244c3df794SDoug Rabson * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 254c3df794SDoug Rabson * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 264c3df794SDoug Rabson * SUCH DAMAGE. 274c3df794SDoug Rabson */ 284c3df794SDoug Rabson 29677b542eSDavid E. O'Brien #include <sys/cdefs.h> 30677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 31677b542eSDavid E. O'Brien 324c3df794SDoug Rabson #include <sys/param.h> 33153ac44cSKonstantin Belousov #include <sys/kernel.h> 349b3851e9SAndrew R. Reiter #include <sys/lock.h> 354c3df794SDoug Rabson #include <sys/module.h> 364ea6a9a2SMateusz Guzik #include <sys/mutex.h> 374ea6a9a2SMateusz Guzik #include <sys/proc.h> 38f6f6d240SMateusz Guzik #include <sys/resourcevar.h> 39da672ec2SJohn Baldwin #include <sys/sx.h> 40da672ec2SJohn Baldwin #include <sys/syscall.h> 41da672ec2SJohn Baldwin #include <sys/sysent.h> 42da672ec2SJohn Baldwin #include <sys/sysproto.h> 43153ac44cSKonstantin Belousov #include <sys/systm.h> 44153ac44cSKonstantin Belousov #include <machine/atomic.h> 454c3df794SDoug Rabson 4646db4836SPeter Wemm /* 4746db4836SPeter Wemm * Acts like "nosys" but can be identified in sysent for dynamic call 4846db4836SPeter Wemm * number assignment for a limited number of calls. 4946db4836SPeter Wemm * 5046db4836SPeter Wemm * Place holder for system call slots reserved for loadable modules. 5146db4836SPeter Wemm */ 5246db4836SPeter Wemm int 53b40ce416SJulian Elischer lkmnosys(struct thread *td, struct nosys_args *args) 5446db4836SPeter Wemm { 55da672ec2SJohn Baldwin 56b40ce416SJulian Elischer return (nosys(td, args)); 5746db4836SPeter Wemm } 5846db4836SPeter Wemm 594c3df794SDoug Rabson int 60b40ce416SJulian Elischer lkmressys(struct thread *td, struct nosys_args *args) 6178525ce3SAlfred Perlstein { 62da672ec2SJohn Baldwin 63b40ce416SJulian Elischer return (nosys(td, args)); 6478525ce3SAlfred Perlstein } 6578525ce3SAlfred Perlstein 66153ac44cSKonstantin Belousov static void 67153ac44cSKonstantin Belousov syscall_thread_drain(struct sysent *se) 68153ac44cSKonstantin Belousov { 69153ac44cSKonstantin Belousov u_int32_t cnt, oldcnt; 70153ac44cSKonstantin Belousov 71153ac44cSKonstantin Belousov do { 72153ac44cSKonstantin Belousov oldcnt = se->sy_thrcnt; 73153ac44cSKonstantin Belousov KASSERT((oldcnt & SY_THR_STATIC) == 0, 74153ac44cSKonstantin Belousov ("drain on static syscall")); 75153ac44cSKonstantin Belousov cnt = oldcnt | SY_THR_DRAINING; 76153ac44cSKonstantin Belousov } while (atomic_cmpset_acq_32(&se->sy_thrcnt, oldcnt, cnt) == 0); 77153ac44cSKonstantin Belousov while (atomic_cmpset_32(&se->sy_thrcnt, SY_THR_DRAINING, 78153ac44cSKonstantin Belousov SY_THR_ABSENT) == 0) 79153ac44cSKonstantin Belousov pause("scdrn", hz/2); 80153ac44cSKonstantin Belousov } 81153ac44cSKonstantin Belousov 82153ac44cSKonstantin Belousov int 83153ac44cSKonstantin Belousov syscall_thread_enter(struct thread *td, struct sysent *se) 84153ac44cSKonstantin Belousov { 85153ac44cSKonstantin Belousov u_int32_t cnt, oldcnt; 86153ac44cSKonstantin Belousov 87153ac44cSKonstantin Belousov do { 88153ac44cSKonstantin Belousov oldcnt = se->sy_thrcnt; 89153ac44cSKonstantin Belousov if ((oldcnt & SY_THR_STATIC) != 0) 90153ac44cSKonstantin Belousov return (0); 91153ac44cSKonstantin Belousov if ((oldcnt & (SY_THR_DRAINING | SY_THR_ABSENT)) != 0) 92153ac44cSKonstantin Belousov return (ENOSYS); 93153ac44cSKonstantin Belousov cnt = oldcnt + SY_THR_INCR; 94153ac44cSKonstantin Belousov } while (atomic_cmpset_acq_32(&se->sy_thrcnt, oldcnt, cnt) == 0); 95153ac44cSKonstantin Belousov return (0); 96153ac44cSKonstantin Belousov } 97153ac44cSKonstantin Belousov 98153ac44cSKonstantin Belousov void 99153ac44cSKonstantin Belousov syscall_thread_exit(struct thread *td, struct sysent *se) 100153ac44cSKonstantin Belousov { 101153ac44cSKonstantin Belousov u_int32_t cnt, oldcnt; 102153ac44cSKonstantin Belousov 103153ac44cSKonstantin Belousov do { 104153ac44cSKonstantin Belousov oldcnt = se->sy_thrcnt; 105153ac44cSKonstantin Belousov if ((oldcnt & SY_THR_STATIC) != 0) 106153ac44cSKonstantin Belousov return; 107153ac44cSKonstantin Belousov cnt = oldcnt - SY_THR_INCR; 108153ac44cSKonstantin Belousov } while (atomic_cmpset_rel_32(&se->sy_thrcnt, oldcnt, cnt) == 0); 109153ac44cSKonstantin Belousov } 110153ac44cSKonstantin Belousov 11178525ce3SAlfred Perlstein int 112*b81e88d2SBrooks Davis kern_syscall_register(struct sysent *sysents, int *offset, 113*b81e88d2SBrooks Davis struct sysent *new_sysent, struct sysent *old_sysent, int flags) 1144c3df794SDoug Rabson { 1154c3df794SDoug Rabson int i; 1164c3df794SDoug Rabson 117e015b1abSMateusz Guzik if ((flags & ~SY_THR_STATIC) != 0) 118e015b1abSMateusz Guzik return (EINVAL); 119e015b1abSMateusz Guzik 120da672ec2SJohn Baldwin if (*offset == NO_SYSCALL) { 1214c3df794SDoug Rabson for (i = 1; i < SYS_MAXSYSCALL; ++i) 122*b81e88d2SBrooks Davis if (sysents[i].sy_call == (sy_call_t *)lkmnosys) 1234c3df794SDoug Rabson break; 1244c3df794SDoug Rabson if (i == SYS_MAXSYSCALL) 125da672ec2SJohn Baldwin return (ENFILE); 1264c3df794SDoug Rabson *offset = i; 1274c3df794SDoug Rabson } else if (*offset < 0 || *offset >= SYS_MAXSYSCALL) 128da672ec2SJohn Baldwin return (EINVAL); 129*b81e88d2SBrooks Davis else if (sysents[*offset].sy_call != (sy_call_t *)lkmnosys && 130*b81e88d2SBrooks Davis sysents[*offset].sy_call != (sy_call_t *)lkmressys) 131da672ec2SJohn Baldwin return (EEXIST); 1324c3df794SDoug Rabson 133*b81e88d2SBrooks Davis KASSERT(sysents[*offset].sy_thrcnt == SY_THR_ABSENT, 134153ac44cSKonstantin Belousov ("dynamic syscall is not protected")); 135*b81e88d2SBrooks Davis *old_sysent = sysents[*offset]; 136153ac44cSKonstantin Belousov new_sysent->sy_thrcnt = SY_THR_ABSENT; 137*b81e88d2SBrooks Davis sysents[*offset] = *new_sysent; 138*b81e88d2SBrooks Davis atomic_store_rel_32(&sysents[*offset].sy_thrcnt, flags); 139da672ec2SJohn Baldwin return (0); 1404c3df794SDoug Rabson } 1414c3df794SDoug Rabson 1424c3df794SDoug Rabson int 143*b81e88d2SBrooks Davis kern_syscall_deregister(struct sysent *sysents, int offset, 144*b81e88d2SBrooks Davis const struct sysent *old_sysent) 1454c3df794SDoug Rabson { 146e015b1abSMateusz Guzik struct sysent *se; 147da672ec2SJohn Baldwin 148*b81e88d2SBrooks Davis if (offset == 0) 149e015b1abSMateusz Guzik return (0); /* XXX? */ 150e015b1abSMateusz Guzik 151*b81e88d2SBrooks Davis se = &sysents[offset]; 152e015b1abSMateusz Guzik if ((se->sy_thrcnt & SY_THR_STATIC) != 0) 153e015b1abSMateusz Guzik return (EINVAL); 154e015b1abSMateusz Guzik syscall_thread_drain(se); 155*b81e88d2SBrooks Davis sysent[offset] = *old_sysent; 156da672ec2SJohn Baldwin return (0); 1574c3df794SDoug Rabson } 1584c3df794SDoug Rabson 1594c3df794SDoug Rabson int 1604c3df794SDoug Rabson syscall_module_handler(struct module *mod, int what, void *arg) 1614c3df794SDoug Rabson { 162*b81e88d2SBrooks Davis 163*b81e88d2SBrooks Davis return (kern_syscall_module_handler(sysent, mod, what, arg)); 164*b81e88d2SBrooks Davis } 165*b81e88d2SBrooks Davis 166*b81e88d2SBrooks Davis int 167*b81e88d2SBrooks Davis kern_syscall_module_handler(struct sysent *sysents, struct module *mod, 168*b81e88d2SBrooks Davis int what, void *arg) 169*b81e88d2SBrooks Davis { 170da672ec2SJohn Baldwin struct syscall_module_data *data = arg; 171a35261efSDoug Rabson modspecific_t ms; 1724c3df794SDoug Rabson int error; 1734c3df794SDoug Rabson 1744c3df794SDoug Rabson switch (what) { 1754c3df794SDoug Rabson case MOD_LOAD: 176*b81e88d2SBrooks Davis error = kern_syscall_register(sysents, data->offset, 177*b81e88d2SBrooks Davis data->new_sysent, &data->old_sysent, data->flags); 17803e161fdSJohn Baldwin if (error) { 17903e161fdSJohn Baldwin /* Leave a mark so we know to safely unload below. */ 18003e161fdSJohn Baldwin data->offset = NULL; 181da672ec2SJohn Baldwin return (error); 18203e161fdSJohn Baldwin } 183a35261efSDoug Rabson ms.intval = *data->offset; 1849b3851e9SAndrew R. Reiter MOD_XLOCK; 185a35261efSDoug Rabson module_setspecific(mod, &ms); 1869b3851e9SAndrew R. Reiter MOD_XUNLOCK; 187c049aba8SDoug Rabson if (data->chainevh) 188c049aba8SDoug Rabson error = data->chainevh(mod, what, data->chainarg); 189da672ec2SJohn Baldwin return (error); 1904c3df794SDoug Rabson case MOD_UNLOAD: 19103e161fdSJohn Baldwin /* 19203e161fdSJohn Baldwin * MOD_LOAD failed, so just return without calling the 19303e161fdSJohn Baldwin * chained handler since we didn't pass along the MOD_LOAD 19403e161fdSJohn Baldwin * event. 19503e161fdSJohn Baldwin */ 19603e161fdSJohn Baldwin if (data->offset == NULL) 19703e161fdSJohn Baldwin return (0); 198c049aba8SDoug Rabson if (data->chainevh) { 199c049aba8SDoug Rabson error = data->chainevh(mod, what, data->chainarg); 2004c3df794SDoug Rabson if (error) 2014c3df794SDoug Rabson return error; 2024c3df794SDoug Rabson } 203*b81e88d2SBrooks Davis error = kern_syscall_deregister(sysents, *data->offset, 204*b81e88d2SBrooks Davis &data->old_sysent); 205da672ec2SJohn Baldwin return (error); 2063e019deaSPoul-Henning Kamp default: 2075e5fd037SXin LI if (data->chainevh) 2085e5fd037SXin LI return (data->chainevh(mod, what, data->chainarg)); 2095e5fd037SXin LI return (EOPNOTSUPP); 210c049aba8SDoug Rabson } 211c049aba8SDoug Rabson 21200e3c12eSXin LI /* NOTREACHED */ 2134c3df794SDoug Rabson } 2140687ba3eSKonstantin Belousov 2150687ba3eSKonstantin Belousov int 216e015b1abSMateusz Guzik syscall_helper_register(struct syscall_helper_data *sd, int flags) 2170687ba3eSKonstantin Belousov { 218*b81e88d2SBrooks Davis 219*b81e88d2SBrooks Davis return (kern_syscall_helper_register(sysent, sd, flags)); 220*b81e88d2SBrooks Davis } 221*b81e88d2SBrooks Davis 222*b81e88d2SBrooks Davis int 223*b81e88d2SBrooks Davis kern_syscall_helper_register(struct sysent *sysents, 224*b81e88d2SBrooks Davis struct syscall_helper_data *sd, int flags) 225*b81e88d2SBrooks Davis { 2260687ba3eSKonstantin Belousov struct syscall_helper_data *sd1; 2270687ba3eSKonstantin Belousov int error; 2280687ba3eSKonstantin Belousov 2290687ba3eSKonstantin Belousov for (sd1 = sd; sd1->syscall_no != NO_SYSCALL; sd1++) { 230*b81e88d2SBrooks Davis error = kern_syscall_register(sysents, &sd1->syscall_no, 231*b81e88d2SBrooks Davis &sd1->new_sysent, &sd1->old_sysent, flags); 2320687ba3eSKonstantin Belousov if (error != 0) { 233*b81e88d2SBrooks Davis kern_syscall_helper_unregister(sysents, sd); 2340687ba3eSKonstantin Belousov return (error); 2350687ba3eSKonstantin Belousov } 2360687ba3eSKonstantin Belousov sd1->registered = 1; 2370687ba3eSKonstantin Belousov } 2380687ba3eSKonstantin Belousov return (0); 2390687ba3eSKonstantin Belousov } 2400687ba3eSKonstantin Belousov 2410687ba3eSKonstantin Belousov int 2420687ba3eSKonstantin Belousov syscall_helper_unregister(struct syscall_helper_data *sd) 2430687ba3eSKonstantin Belousov { 244*b81e88d2SBrooks Davis 245*b81e88d2SBrooks Davis return (kern_syscall_helper_unregister(sysent, sd)); 246*b81e88d2SBrooks Davis } 247*b81e88d2SBrooks Davis 248*b81e88d2SBrooks Davis int 249*b81e88d2SBrooks Davis kern_syscall_helper_unregister(struct sysent *sysents, 250*b81e88d2SBrooks Davis struct syscall_helper_data *sd) 251*b81e88d2SBrooks Davis { 2520687ba3eSKonstantin Belousov struct syscall_helper_data *sd1; 2530687ba3eSKonstantin Belousov 2540687ba3eSKonstantin Belousov for (sd1 = sd; sd1->registered != 0; sd1++) { 255*b81e88d2SBrooks Davis kern_syscall_deregister(sysents, sd1->syscall_no, 256*b81e88d2SBrooks Davis &sd1->old_sysent); 2570687ba3eSKonstantin Belousov sd1->registered = 0; 2580687ba3eSKonstantin Belousov } 2590687ba3eSKonstantin Belousov return (0); 2600687ba3eSKonstantin Belousov } 261