xref: /freebsd/sys/kern/kern_syscalls.c (revision 8a36da99deb0e19363ec04e4d3facd869c1028f5)
14c3df794SDoug Rabson /*-
2*8a36da99SPedro F. Giffuni  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3*8a36da99SPedro F. Giffuni  *
44c3df794SDoug Rabson  * Copyright (c) 1999 Assar Westerlund
54c3df794SDoug Rabson  * All rights reserved.
64c3df794SDoug Rabson  *
74c3df794SDoug Rabson  * Redistribution and use in source and binary forms, with or without
84c3df794SDoug Rabson  * modification, are permitted provided that the following conditions
94c3df794SDoug Rabson  * are met:
104c3df794SDoug Rabson  * 1. Redistributions of source code must retain the above copyright
114c3df794SDoug Rabson  *    notice, this list of conditions and the following disclaimer.
124c3df794SDoug Rabson  * 2. Redistributions in binary form must reproduce the above copyright
134c3df794SDoug Rabson  *    notice, this list of conditions and the following disclaimer in the
144c3df794SDoug Rabson  *    documentation and/or other materials provided with the distribution.
154c3df794SDoug Rabson  *
164c3df794SDoug Rabson  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
174c3df794SDoug Rabson  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
184c3df794SDoug Rabson  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
194c3df794SDoug Rabson  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
204c3df794SDoug Rabson  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
214c3df794SDoug Rabson  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
224c3df794SDoug Rabson  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
234c3df794SDoug Rabson  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
244c3df794SDoug Rabson  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
254c3df794SDoug Rabson  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
264c3df794SDoug Rabson  * SUCH DAMAGE.
274c3df794SDoug Rabson  */
284c3df794SDoug Rabson 
29677b542eSDavid E. O'Brien #include <sys/cdefs.h>
30677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
31677b542eSDavid E. O'Brien 
324c3df794SDoug Rabson #include <sys/param.h>
33153ac44cSKonstantin Belousov #include <sys/kernel.h>
349b3851e9SAndrew R. Reiter #include <sys/lock.h>
354c3df794SDoug Rabson #include <sys/module.h>
364ea6a9a2SMateusz Guzik #include <sys/mutex.h>
374ea6a9a2SMateusz Guzik #include <sys/proc.h>
38f6f6d240SMateusz Guzik #include <sys/resourcevar.h>
39da672ec2SJohn Baldwin #include <sys/sx.h>
40da672ec2SJohn Baldwin #include <sys/syscall.h>
41da672ec2SJohn Baldwin #include <sys/sysent.h>
42da672ec2SJohn Baldwin #include <sys/sysproto.h>
43153ac44cSKonstantin Belousov #include <sys/systm.h>
44153ac44cSKonstantin Belousov #include <machine/atomic.h>
454c3df794SDoug Rabson 
/*
 * Placeholder handler for system call slots that are reserved for
 * loadable modules.
 *
 * The call itself is simply forwarded to nosys(), but because this is a
 * distinct function its address can be recognised in the sysent table,
 * which is how a free slot is found when a call number has to be
 * assigned dynamically (only a limited number of such slots exist).
 */
int
lkmnosys(struct thread *td, struct nosys_args *args)
{
	int error;

	error = nosys(td, args);
	return (error);
}
5846db4836SPeter Wemm 
/*
 * Second placeholder handler that forwards to nosys().
 *
 * syscall_register() accepts a slot holding this handler only when the
 * caller asks for that slot number explicitly; the dynamic search for a
 * free slot looks for lkmnosys only and therefore skips these entries.
 */
int
lkmressys(struct thread *td, struct nosys_args *args)
{
	int error;

	error = nosys(td, args);
	return (error);
}
6578525ce3SAlfred Perlstein 
66153ac44cSKonstantin Belousov static void
67153ac44cSKonstantin Belousov syscall_thread_drain(struct sysent *se)
68153ac44cSKonstantin Belousov {
69153ac44cSKonstantin Belousov 	u_int32_t cnt, oldcnt;
70153ac44cSKonstantin Belousov 
71153ac44cSKonstantin Belousov 	do {
72153ac44cSKonstantin Belousov 		oldcnt = se->sy_thrcnt;
73153ac44cSKonstantin Belousov 		KASSERT((oldcnt & SY_THR_STATIC) == 0,
74153ac44cSKonstantin Belousov 		    ("drain on static syscall"));
75153ac44cSKonstantin Belousov 		cnt = oldcnt | SY_THR_DRAINING;
76153ac44cSKonstantin Belousov 	} while (atomic_cmpset_acq_32(&se->sy_thrcnt, oldcnt, cnt) == 0);
77153ac44cSKonstantin Belousov 	while (atomic_cmpset_32(&se->sy_thrcnt, SY_THR_DRAINING,
78153ac44cSKonstantin Belousov 	    SY_THR_ABSENT) == 0)
79153ac44cSKonstantin Belousov 		pause("scdrn", hz/2);
80153ac44cSKonstantin Belousov }
81153ac44cSKonstantin Belousov 
82153ac44cSKonstantin Belousov int
83153ac44cSKonstantin Belousov syscall_thread_enter(struct thread *td, struct sysent *se)
84153ac44cSKonstantin Belousov {
85153ac44cSKonstantin Belousov 	u_int32_t cnt, oldcnt;
86153ac44cSKonstantin Belousov 
87153ac44cSKonstantin Belousov 	do {
88153ac44cSKonstantin Belousov 		oldcnt = se->sy_thrcnt;
89153ac44cSKonstantin Belousov 		if ((oldcnt & SY_THR_STATIC) != 0)
90153ac44cSKonstantin Belousov 			return (0);
91153ac44cSKonstantin Belousov 		if ((oldcnt & (SY_THR_DRAINING | SY_THR_ABSENT)) != 0)
92153ac44cSKonstantin Belousov 			return (ENOSYS);
93153ac44cSKonstantin Belousov 		cnt = oldcnt + SY_THR_INCR;
94153ac44cSKonstantin Belousov 	} while (atomic_cmpset_acq_32(&se->sy_thrcnt, oldcnt, cnt) == 0);
95153ac44cSKonstantin Belousov 	return (0);
96153ac44cSKonstantin Belousov }
97153ac44cSKonstantin Belousov 
98153ac44cSKonstantin Belousov void
99153ac44cSKonstantin Belousov syscall_thread_exit(struct thread *td, struct sysent *se)
100153ac44cSKonstantin Belousov {
101153ac44cSKonstantin Belousov 	u_int32_t cnt, oldcnt;
102153ac44cSKonstantin Belousov 
103153ac44cSKonstantin Belousov 	do {
104153ac44cSKonstantin Belousov 		oldcnt = se->sy_thrcnt;
105153ac44cSKonstantin Belousov 		if ((oldcnt & SY_THR_STATIC) != 0)
106153ac44cSKonstantin Belousov 			return;
107153ac44cSKonstantin Belousov 		cnt = oldcnt - SY_THR_INCR;
108153ac44cSKonstantin Belousov 	} while (atomic_cmpset_rel_32(&se->sy_thrcnt, oldcnt, cnt) == 0);
109153ac44cSKonstantin Belousov }
110153ac44cSKonstantin Belousov 
11178525ce3SAlfred Perlstein int
1124c3df794SDoug Rabson syscall_register(int *offset, struct sysent *new_sysent,
113e015b1abSMateusz Guzik     struct sysent *old_sysent, int flags)
1144c3df794SDoug Rabson {
1154c3df794SDoug Rabson 	int i;
1164c3df794SDoug Rabson 
117e015b1abSMateusz Guzik 	if ((flags & ~SY_THR_STATIC) != 0)
118e015b1abSMateusz Guzik 		return (EINVAL);
119e015b1abSMateusz Guzik 
120da672ec2SJohn Baldwin 	if (*offset == NO_SYSCALL) {
1214c3df794SDoug Rabson 		for (i = 1; i < SYS_MAXSYSCALL; ++i)
1224c3df794SDoug Rabson 			if (sysent[i].sy_call == (sy_call_t *)lkmnosys)
1234c3df794SDoug Rabson 				break;
1244c3df794SDoug Rabson 		if (i == SYS_MAXSYSCALL)
125da672ec2SJohn Baldwin 			return (ENFILE);
1264c3df794SDoug Rabson 		*offset = i;
1274c3df794SDoug Rabson 	} else if (*offset < 0 || *offset >= SYS_MAXSYSCALL)
128da672ec2SJohn Baldwin 		return (EINVAL);
12978525ce3SAlfred Perlstein 	else if (sysent[*offset].sy_call != (sy_call_t *)lkmnosys &&
13078525ce3SAlfred Perlstein 	    sysent[*offset].sy_call != (sy_call_t *)lkmressys)
131da672ec2SJohn Baldwin 		return (EEXIST);
1324c3df794SDoug Rabson 
133153ac44cSKonstantin Belousov 	KASSERT(sysent[*offset].sy_thrcnt == SY_THR_ABSENT,
134153ac44cSKonstantin Belousov 	    ("dynamic syscall is not protected"));
1354c3df794SDoug Rabson 	*old_sysent = sysent[*offset];
136153ac44cSKonstantin Belousov 	new_sysent->sy_thrcnt = SY_THR_ABSENT;
1374c3df794SDoug Rabson 	sysent[*offset] = *new_sysent;
138e015b1abSMateusz Guzik 	atomic_store_rel_32(&sysent[*offset].sy_thrcnt, flags);
139da672ec2SJohn Baldwin 	return (0);
1404c3df794SDoug Rabson }
1414c3df794SDoug Rabson 
1424c3df794SDoug Rabson int
1434c3df794SDoug Rabson syscall_deregister(int *offset, struct sysent *old_sysent)
1444c3df794SDoug Rabson {
145e015b1abSMateusz Guzik 	struct sysent *se;
146da672ec2SJohn Baldwin 
147e015b1abSMateusz Guzik 	if (*offset == 0)
148e015b1abSMateusz Guzik 		return (0); /* XXX? */
149e015b1abSMateusz Guzik 
150e015b1abSMateusz Guzik 	se = &sysent[*offset];
151e015b1abSMateusz Guzik 	if ((se->sy_thrcnt & SY_THR_STATIC) != 0)
152e015b1abSMateusz Guzik 		return (EINVAL);
153e015b1abSMateusz Guzik 	syscall_thread_drain(se);
1544c3df794SDoug Rabson 	sysent[*offset] = *old_sysent;
155da672ec2SJohn Baldwin 	return (0);
1564c3df794SDoug Rabson }
1574c3df794SDoug Rabson 
1584c3df794SDoug Rabson int
1594c3df794SDoug Rabson syscall_module_handler(struct module *mod, int what, void *arg)
1604c3df794SDoug Rabson {
161da672ec2SJohn Baldwin 	struct syscall_module_data *data = arg;
162a35261efSDoug Rabson 	modspecific_t ms;
1634c3df794SDoug Rabson 	int error;
1644c3df794SDoug Rabson 
1654c3df794SDoug Rabson 	switch (what) {
1664c3df794SDoug Rabson 	case MOD_LOAD:
1674c3df794SDoug Rabson 		error = syscall_register(data->offset, data->new_sysent,
168cdcf2428SMateusz Guzik 		    &data->old_sysent, data->flags);
16903e161fdSJohn Baldwin 		if (error) {
17003e161fdSJohn Baldwin 			/* Leave a mark so we know to safely unload below. */
17103e161fdSJohn Baldwin 			data->offset = NULL;
172da672ec2SJohn Baldwin 			return (error);
17303e161fdSJohn Baldwin 		}
174a35261efSDoug Rabson 		ms.intval = *data->offset;
1759b3851e9SAndrew R. Reiter 		MOD_XLOCK;
176a35261efSDoug Rabson 		module_setspecific(mod, &ms);
1779b3851e9SAndrew R. Reiter 		MOD_XUNLOCK;
178c049aba8SDoug Rabson 		if (data->chainevh)
179c049aba8SDoug Rabson 			error = data->chainevh(mod, what, data->chainarg);
180da672ec2SJohn Baldwin 		return (error);
1814c3df794SDoug Rabson 	case MOD_UNLOAD:
18203e161fdSJohn Baldwin 		/*
18303e161fdSJohn Baldwin 		 * MOD_LOAD failed, so just return without calling the
18403e161fdSJohn Baldwin 		 * chained handler since we didn't pass along the MOD_LOAD
18503e161fdSJohn Baldwin 		 * event.
18603e161fdSJohn Baldwin 		 */
18703e161fdSJohn Baldwin 		if (data->offset == NULL)
18803e161fdSJohn Baldwin 			return (0);
189c049aba8SDoug Rabson 		if (data->chainevh) {
190c049aba8SDoug Rabson 			error = data->chainevh(mod, what, data->chainarg);
1914c3df794SDoug Rabson 			if (error)
1924c3df794SDoug Rabson 				return error;
1934c3df794SDoug Rabson 		}
194c049aba8SDoug Rabson 		error = syscall_deregister(data->offset, &data->old_sysent);
195da672ec2SJohn Baldwin 		return (error);
1963e019deaSPoul-Henning Kamp 	default:
1975e5fd037SXin LI 		if (data->chainevh)
1985e5fd037SXin LI 			return (data->chainevh(mod, what, data->chainarg));
1995e5fd037SXin LI 		return (EOPNOTSUPP);
200c049aba8SDoug Rabson 	}
201c049aba8SDoug Rabson 
20200e3c12eSXin LI 	/* NOTREACHED */
2034c3df794SDoug Rabson }
2040687ba3eSKonstantin Belousov 
2050687ba3eSKonstantin Belousov int
206e015b1abSMateusz Guzik syscall_helper_register(struct syscall_helper_data *sd, int flags)
2070687ba3eSKonstantin Belousov {
2080687ba3eSKonstantin Belousov 	struct syscall_helper_data *sd1;
2090687ba3eSKonstantin Belousov 	int error;
2100687ba3eSKonstantin Belousov 
2110687ba3eSKonstantin Belousov 	for (sd1 = sd; sd1->syscall_no != NO_SYSCALL; sd1++) {
2120687ba3eSKonstantin Belousov 		error = syscall_register(&sd1->syscall_no, &sd1->new_sysent,
213e015b1abSMateusz Guzik 		    &sd1->old_sysent, flags);
2140687ba3eSKonstantin Belousov 		if (error != 0) {
2150687ba3eSKonstantin Belousov 			syscall_helper_unregister(sd);
2160687ba3eSKonstantin Belousov 			return (error);
2170687ba3eSKonstantin Belousov 		}
2180687ba3eSKonstantin Belousov 		sd1->registered = 1;
2190687ba3eSKonstantin Belousov 	}
2200687ba3eSKonstantin Belousov 	return (0);
2210687ba3eSKonstantin Belousov }
2220687ba3eSKonstantin Belousov 
2230687ba3eSKonstantin Belousov int
2240687ba3eSKonstantin Belousov syscall_helper_unregister(struct syscall_helper_data *sd)
2250687ba3eSKonstantin Belousov {
2260687ba3eSKonstantin Belousov 	struct syscall_helper_data *sd1;
2270687ba3eSKonstantin Belousov 
2280687ba3eSKonstantin Belousov 	for (sd1 = sd; sd1->registered != 0; sd1++) {
2290687ba3eSKonstantin Belousov 		syscall_deregister(&sd1->syscall_no, &sd1->old_sysent);
2300687ba3eSKonstantin Belousov 		sd1->registered = 0;
2310687ba3eSKonstantin Belousov 	}
2320687ba3eSKonstantin Belousov 	return (0);
2330687ba3eSKonstantin Belousov }
234