xref: /freebsd/sys/i386/linux/linux_machdep.c (revision f12c03487461c0d1004e5a8ab7d7796a3ec91e4e)
1146aad74SMarcel Moolenaar /*-
2146aad74SMarcel Moolenaar  * Copyright (c) 2000 Marcel Moolenaar
3146aad74SMarcel Moolenaar  * All rights reserved.
4146aad74SMarcel Moolenaar  *
5146aad74SMarcel Moolenaar  * Redistribution and use in source and binary forms, with or without
6146aad74SMarcel Moolenaar  * modification, are permitted provided that the following conditions
7146aad74SMarcel Moolenaar  * are met:
8146aad74SMarcel Moolenaar  * 1. Redistributions of source code must retain the above copyright
9146aad74SMarcel Moolenaar  *    notice, this list of conditions and the following disclaimer
10146aad74SMarcel Moolenaar  *    in this position and unchanged.
11146aad74SMarcel Moolenaar  * 2. Redistributions in binary form must reproduce the above copyright
12146aad74SMarcel Moolenaar  *    notice, this list of conditions and the following disclaimer in the
13146aad74SMarcel Moolenaar  *    documentation and/or other materials provided with the distribution.
14146aad74SMarcel Moolenaar  * 3. The name of the author may not be used to endorse or promote products
15bc34729cSMarcel Moolenaar  *    derived from this software without specific prior written permission.
16146aad74SMarcel Moolenaar  *
17146aad74SMarcel Moolenaar  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18146aad74SMarcel Moolenaar  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19146aad74SMarcel Moolenaar  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20146aad74SMarcel Moolenaar  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21146aad74SMarcel Moolenaar  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22146aad74SMarcel Moolenaar  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23146aad74SMarcel Moolenaar  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24146aad74SMarcel Moolenaar  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25146aad74SMarcel Moolenaar  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26146aad74SMarcel Moolenaar  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27146aad74SMarcel Moolenaar  */
28146aad74SMarcel Moolenaar 
2927e0099cSDavid E. O'Brien #include <sys/cdefs.h>
3027e0099cSDavid E. O'Brien __FBSDID("$FreeBSD$");
3127e0099cSDavid E. O'Brien 
32146aad74SMarcel Moolenaar #include <sys/param.h>
33146aad74SMarcel Moolenaar #include <sys/systm.h>
34a312f6a3SAlexander Leidinger #include <sys/file.h>
35a312f6a3SAlexander Leidinger #include <sys/fcntl.h>
36610ecfe0SMaxim Sobolev #include <sys/imgact.h>
377106ca0dSJohn Baldwin #include <sys/lock.h>
38610ecfe0SMaxim Sobolev #include <sys/malloc.h>
39fb919e4dSMark Murray #include <sys/mman.h>
40fb919e4dSMark Murray #include <sys/mutex.h>
419b44bfc5SAlexander Leidinger #include <sys/sx.h>
42acd3428bSRobert Watson #include <sys/priv.h>
43fb919e4dSMark Murray #include <sys/proc.h>
449b44bfc5SAlexander Leidinger #include <sys/queue.h>
45242fae60SAndrew Gallatin #include <sys/resource.h>
46242fae60SAndrew Gallatin #include <sys/resourcevar.h>
471bc85c0dSDoug Rabson #include <sys/signalvar.h>
48206a5d3aSIan Dowse #include <sys/syscallsubr.h>
49fb919e4dSMark Murray #include <sys/sysproto.h>
50fb919e4dSMark Murray #include <sys/unistd.h>
519b44bfc5SAlexander Leidinger #include <sys/wait.h>
52f0393f06SJeff Roberson #include <sys/sched.h>
53146aad74SMarcel Moolenaar 
54146aad74SMarcel Moolenaar #include <machine/frame.h>
55146aad74SMarcel Moolenaar #include <machine/psl.h>
56146aad74SMarcel Moolenaar #include <machine/segments.h>
57146aad74SMarcel Moolenaar #include <machine/sysarch.h>
58146aad74SMarcel Moolenaar 
59242fae60SAndrew Gallatin #include <vm/vm.h>
60242fae60SAndrew Gallatin #include <vm/pmap.h>
61242fae60SAndrew Gallatin #include <vm/vm_map.h>
62242fae60SAndrew Gallatin 
63146aad74SMarcel Moolenaar #include <i386/linux/linux.h>
64ebea8660SMarcel Moolenaar #include <i386/linux/linux_proto.h>
65146aad74SMarcel Moolenaar #include <compat/linux/linux_ipc.h>
66146aad74SMarcel Moolenaar #include <compat/linux/linux_signal.h>
67146aad74SMarcel Moolenaar #include <compat/linux/linux_util.h>
689b44bfc5SAlexander Leidinger #include <compat/linux/linux_emul.h>
699b44bfc5SAlexander Leidinger 
709b44bfc5SAlexander Leidinger #include <i386/include/pcb.h>			/* needed for pcb definition in linux_set_thread_area */
719b44bfc5SAlexander Leidinger 
729b44bfc5SAlexander Leidinger #include "opt_posix.h"
739b44bfc5SAlexander Leidinger 
749b44bfc5SAlexander Leidinger extern struct sysentvec elf32_freebsd_sysvec;	/* defined in i386/i386/elf_machdep.c */
75146aad74SMarcel Moolenaar 
765002a60fSMarcel Moolenaar struct l_descriptor {
775002a60fSMarcel Moolenaar 	l_uint		entry_number;
785002a60fSMarcel Moolenaar 	l_ulong		base_addr;
795002a60fSMarcel Moolenaar 	l_uint		limit;
805002a60fSMarcel Moolenaar 	l_uint		seg_32bit:1;
815002a60fSMarcel Moolenaar 	l_uint		contents:2;
825002a60fSMarcel Moolenaar 	l_uint		read_exec_only:1;
835002a60fSMarcel Moolenaar 	l_uint		limit_in_pages:1;
845002a60fSMarcel Moolenaar 	l_uint		seg_not_present:1;
855002a60fSMarcel Moolenaar 	l_uint		useable:1;
86146aad74SMarcel Moolenaar };
87146aad74SMarcel Moolenaar 
885002a60fSMarcel Moolenaar struct l_old_select_argv {
895002a60fSMarcel Moolenaar 	l_int		nfds;
905002a60fSMarcel Moolenaar 	l_fd_set	*readfds;
915002a60fSMarcel Moolenaar 	l_fd_set	*writefds;
925002a60fSMarcel Moolenaar 	l_fd_set	*exceptfds;
935002a60fSMarcel Moolenaar 	struct l_timeval	*timeout;
94146aad74SMarcel Moolenaar };
95146aad74SMarcel Moolenaar 
96f12c0348SJohn Baldwin static int	linux_mmap_common(struct thread *td, l_uintptr_t addr,
97f12c0348SJohn Baldwin 		    l_size_t len, l_int prot, l_int flags, l_int fd,
98f12c0348SJohn Baldwin 		    l_loff_t pos);
99f12c0348SJohn Baldwin 
100146aad74SMarcel Moolenaar int
101931a7258SAndrew Gallatin linux_to_bsd_sigaltstack(int lsa)
102931a7258SAndrew Gallatin {
103931a7258SAndrew Gallatin 	int bsa = 0;
104931a7258SAndrew Gallatin 
105931a7258SAndrew Gallatin 	if (lsa & LINUX_SS_DISABLE)
106931a7258SAndrew Gallatin 		bsa |= SS_DISABLE;
107931a7258SAndrew Gallatin 	if (lsa & LINUX_SS_ONSTACK)
108931a7258SAndrew Gallatin 		bsa |= SS_ONSTACK;
109931a7258SAndrew Gallatin 	return (bsa);
110931a7258SAndrew Gallatin }
111931a7258SAndrew Gallatin 
112931a7258SAndrew Gallatin int
113931a7258SAndrew Gallatin bsd_to_linux_sigaltstack(int bsa)
114931a7258SAndrew Gallatin {
115931a7258SAndrew Gallatin 	int lsa = 0;
116931a7258SAndrew Gallatin 
117931a7258SAndrew Gallatin 	if (bsa & SS_DISABLE)
118931a7258SAndrew Gallatin 		lsa |= LINUX_SS_DISABLE;
119931a7258SAndrew Gallatin 	if (bsa & SS_ONSTACK)
120931a7258SAndrew Gallatin 		lsa |= LINUX_SS_ONSTACK;
121931a7258SAndrew Gallatin 	return (lsa);
122931a7258SAndrew Gallatin }
123931a7258SAndrew Gallatin 
124931a7258SAndrew Gallatin int
125b40ce416SJulian Elischer linux_execve(struct thread *td, struct linux_execve_args *args)
126146aad74SMarcel Moolenaar {
127610ecfe0SMaxim Sobolev 	int error;
128610ecfe0SMaxim Sobolev 	char *newpath;
129610ecfe0SMaxim Sobolev 	struct image_args eargs;
130146aad74SMarcel Moolenaar 
131d9e97471SJohn Baldwin 	LCONVPATHEXIST(td, args->path, &newpath);
132146aad74SMarcel Moolenaar 
133146aad74SMarcel Moolenaar #ifdef DEBUG
13424593369SJonathan Lemon 	if (ldebug(execve))
135610ecfe0SMaxim Sobolev 		printf(ARGS(execve, "%s"), newpath);
136146aad74SMarcel Moolenaar #endif
137146aad74SMarcel Moolenaar 
138610ecfe0SMaxim Sobolev 	error = exec_copyin_args(&eargs, newpath, UIO_SYSSPACE,
139610ecfe0SMaxim Sobolev 	    args->argp, args->envp);
140610ecfe0SMaxim Sobolev 	free(newpath, M_TEMP);
141610ecfe0SMaxim Sobolev 	if (error == 0)
142c035ac04SMaxim Sobolev 		error = kern_execve(td, &eargs, NULL);
1439b44bfc5SAlexander Leidinger 	if (error == 0)
1449b44bfc5SAlexander Leidinger 	   	/* linux process can exec fbsd one, dont attempt
1459b44bfc5SAlexander Leidinger 		 * to create emuldata for such process using
1469b44bfc5SAlexander Leidinger 		 * linux_proc_init, this leads to a panic on KASSERT
1479b44bfc5SAlexander Leidinger 		 * because such process has p->p_emuldata == NULL
1489b44bfc5SAlexander Leidinger 		 */
1499b44bfc5SAlexander Leidinger 	   	if (td->td_proc->p_sysent == &elf_linux_sysvec)
1509b44bfc5SAlexander Leidinger    		   	error = linux_proc_init(td, 0, 0);
151610ecfe0SMaxim Sobolev 	return (error);
152146aad74SMarcel Moolenaar }
153146aad74SMarcel Moolenaar 
1545002a60fSMarcel Moolenaar struct l_ipc_kludge {
1555002a60fSMarcel Moolenaar 	struct l_msgbuf *msgp;
1565002a60fSMarcel Moolenaar 	l_long msgtyp;
1575002a60fSMarcel Moolenaar };
1585002a60fSMarcel Moolenaar 
159146aad74SMarcel Moolenaar int
160b40ce416SJulian Elischer linux_ipc(struct thread *td, struct linux_ipc_args *args)
161146aad74SMarcel Moolenaar {
1625002a60fSMarcel Moolenaar 
1635002a60fSMarcel Moolenaar 	switch (args->what & 0xFFFF) {
1645002a60fSMarcel Moolenaar 	case LINUX_SEMOP: {
1655002a60fSMarcel Moolenaar 		struct linux_semop_args a;
1665002a60fSMarcel Moolenaar 
1675002a60fSMarcel Moolenaar 		a.semid = args->arg1;
1685002a60fSMarcel Moolenaar 		a.tsops = args->ptr;
1695002a60fSMarcel Moolenaar 		a.nsops = args->arg2;
170b40ce416SJulian Elischer 		return (linux_semop(td, &a));
1715002a60fSMarcel Moolenaar 	}
1725002a60fSMarcel Moolenaar 	case LINUX_SEMGET: {
1735002a60fSMarcel Moolenaar 		struct linux_semget_args a;
1745002a60fSMarcel Moolenaar 
1755002a60fSMarcel Moolenaar 		a.key = args->arg1;
1765002a60fSMarcel Moolenaar 		a.nsems = args->arg2;
1775002a60fSMarcel Moolenaar 		a.semflg = args->arg3;
178b40ce416SJulian Elischer 		return (linux_semget(td, &a));
1795002a60fSMarcel Moolenaar 	}
1805002a60fSMarcel Moolenaar 	case LINUX_SEMCTL: {
1815002a60fSMarcel Moolenaar 		struct linux_semctl_args a;
1825002a60fSMarcel Moolenaar 		int error;
1835002a60fSMarcel Moolenaar 
1845002a60fSMarcel Moolenaar 		a.semid = args->arg1;
1855002a60fSMarcel Moolenaar 		a.semnum = args->arg2;
1865002a60fSMarcel Moolenaar 		a.cmd = args->arg3;
1874b7ef73dSDag-Erling Smørgrav 		error = copyin(args->ptr, &a.arg, sizeof(a.arg));
1885002a60fSMarcel Moolenaar 		if (error)
1895002a60fSMarcel Moolenaar 			return (error);
190b40ce416SJulian Elischer 		return (linux_semctl(td, &a));
1915002a60fSMarcel Moolenaar 	}
1925002a60fSMarcel Moolenaar 	case LINUX_MSGSND: {
1935002a60fSMarcel Moolenaar 		struct linux_msgsnd_args a;
1945002a60fSMarcel Moolenaar 
1955002a60fSMarcel Moolenaar 		a.msqid = args->arg1;
1965002a60fSMarcel Moolenaar 		a.msgp = args->ptr;
1975002a60fSMarcel Moolenaar 		a.msgsz = args->arg2;
1985002a60fSMarcel Moolenaar 		a.msgflg = args->arg3;
199b40ce416SJulian Elischer 		return (linux_msgsnd(td, &a));
2005002a60fSMarcel Moolenaar 	}
2015002a60fSMarcel Moolenaar 	case LINUX_MSGRCV: {
2025002a60fSMarcel Moolenaar 		struct linux_msgrcv_args a;
2035002a60fSMarcel Moolenaar 
2045002a60fSMarcel Moolenaar 		a.msqid = args->arg1;
2055002a60fSMarcel Moolenaar 		a.msgsz = args->arg2;
2065002a60fSMarcel Moolenaar 		a.msgflg = args->arg3;
2075002a60fSMarcel Moolenaar 		if ((args->what >> 16) == 0) {
2085002a60fSMarcel Moolenaar 			struct l_ipc_kludge tmp;
2095002a60fSMarcel Moolenaar 			int error;
2105002a60fSMarcel Moolenaar 
2115002a60fSMarcel Moolenaar 			if (args->ptr == NULL)
2125002a60fSMarcel Moolenaar 				return (EINVAL);
2134b7ef73dSDag-Erling Smørgrav 			error = copyin(args->ptr, &tmp, sizeof(tmp));
2145002a60fSMarcel Moolenaar 			if (error)
2155002a60fSMarcel Moolenaar 				return (error);
2165002a60fSMarcel Moolenaar 			a.msgp = tmp.msgp;
2175002a60fSMarcel Moolenaar 			a.msgtyp = tmp.msgtyp;
2185002a60fSMarcel Moolenaar 		} else {
2195002a60fSMarcel Moolenaar 			a.msgp = args->ptr;
2205002a60fSMarcel Moolenaar 			a.msgtyp = args->arg5;
2215002a60fSMarcel Moolenaar 		}
222b40ce416SJulian Elischer 		return (linux_msgrcv(td, &a));
2235002a60fSMarcel Moolenaar 	}
2245002a60fSMarcel Moolenaar 	case LINUX_MSGGET: {
2255002a60fSMarcel Moolenaar 		struct linux_msgget_args a;
2265002a60fSMarcel Moolenaar 
2275002a60fSMarcel Moolenaar 		a.key = args->arg1;
2285002a60fSMarcel Moolenaar 		a.msgflg = args->arg2;
229b40ce416SJulian Elischer 		return (linux_msgget(td, &a));
2305002a60fSMarcel Moolenaar 	}
2315002a60fSMarcel Moolenaar 	case LINUX_MSGCTL: {
2325002a60fSMarcel Moolenaar 		struct linux_msgctl_args a;
2335002a60fSMarcel Moolenaar 
2345002a60fSMarcel Moolenaar 		a.msqid = args->arg1;
2355002a60fSMarcel Moolenaar 		a.cmd = args->arg2;
2365002a60fSMarcel Moolenaar 		a.buf = args->ptr;
237b40ce416SJulian Elischer 		return (linux_msgctl(td, &a));
2385002a60fSMarcel Moolenaar 	}
2395002a60fSMarcel Moolenaar 	case LINUX_SHMAT: {
2405002a60fSMarcel Moolenaar 		struct linux_shmat_args a;
2415002a60fSMarcel Moolenaar 
2425002a60fSMarcel Moolenaar 		a.shmid = args->arg1;
2435002a60fSMarcel Moolenaar 		a.shmaddr = args->ptr;
2445002a60fSMarcel Moolenaar 		a.shmflg = args->arg2;
2455002a60fSMarcel Moolenaar 		a.raddr = (l_ulong *)args->arg3;
246b40ce416SJulian Elischer 		return (linux_shmat(td, &a));
2475002a60fSMarcel Moolenaar 	}
2485002a60fSMarcel Moolenaar 	case LINUX_SHMDT: {
2495002a60fSMarcel Moolenaar 		struct linux_shmdt_args a;
2505002a60fSMarcel Moolenaar 
2515002a60fSMarcel Moolenaar 		a.shmaddr = args->ptr;
252b40ce416SJulian Elischer 		return (linux_shmdt(td, &a));
2535002a60fSMarcel Moolenaar 	}
2545002a60fSMarcel Moolenaar 	case LINUX_SHMGET: {
2555002a60fSMarcel Moolenaar 		struct linux_shmget_args a;
2565002a60fSMarcel Moolenaar 
2575002a60fSMarcel Moolenaar 		a.key = args->arg1;
2585002a60fSMarcel Moolenaar 		a.size = args->arg2;
2595002a60fSMarcel Moolenaar 		a.shmflg = args->arg3;
260b40ce416SJulian Elischer 		return (linux_shmget(td, &a));
2615002a60fSMarcel Moolenaar 	}
2625002a60fSMarcel Moolenaar 	case LINUX_SHMCTL: {
2635002a60fSMarcel Moolenaar 		struct linux_shmctl_args a;
2645002a60fSMarcel Moolenaar 
2655002a60fSMarcel Moolenaar 		a.shmid = args->arg1;
2665002a60fSMarcel Moolenaar 		a.cmd = args->arg2;
2675002a60fSMarcel Moolenaar 		a.buf = args->ptr;
268b40ce416SJulian Elischer 		return (linux_shmctl(td, &a));
2695002a60fSMarcel Moolenaar 	}
2705002a60fSMarcel Moolenaar 	default:
2715002a60fSMarcel Moolenaar 		break;
272146aad74SMarcel Moolenaar 	}
273146aad74SMarcel Moolenaar 
2745002a60fSMarcel Moolenaar 	return (EINVAL);
275146aad74SMarcel Moolenaar }
276146aad74SMarcel Moolenaar 
277146aad74SMarcel Moolenaar int
278b40ce416SJulian Elischer linux_old_select(struct thread *td, struct linux_old_select_args *args)
279146aad74SMarcel Moolenaar {
2805002a60fSMarcel Moolenaar 	struct l_old_select_argv linux_args;
2815002a60fSMarcel Moolenaar 	struct linux_select_args newsel;
282146aad74SMarcel Moolenaar 	int error;
283146aad74SMarcel Moolenaar 
2845002a60fSMarcel Moolenaar #ifdef DEBUG
2855002a60fSMarcel Moolenaar 	if (ldebug(old_select))
2866aea6777SPeter Wemm 		printf(ARGS(old_select, "%p"), args->ptr);
287146aad74SMarcel Moolenaar #endif
288146aad74SMarcel Moolenaar 
2894b7ef73dSDag-Erling Smørgrav 	error = copyin(args->ptr, &linux_args, sizeof(linux_args));
290146aad74SMarcel Moolenaar 	if (error)
291146aad74SMarcel Moolenaar 		return (error);
292146aad74SMarcel Moolenaar 
293146aad74SMarcel Moolenaar 	newsel.nfds = linux_args.nfds;
294146aad74SMarcel Moolenaar 	newsel.readfds = linux_args.readfds;
295146aad74SMarcel Moolenaar 	newsel.writefds = linux_args.writefds;
296146aad74SMarcel Moolenaar 	newsel.exceptfds = linux_args.exceptfds;
297146aad74SMarcel Moolenaar 	newsel.timeout = linux_args.timeout;
298b40ce416SJulian Elischer 	return (linux_select(td, &newsel));
299146aad74SMarcel Moolenaar }
300146aad74SMarcel Moolenaar 
301146aad74SMarcel Moolenaar int
302b40ce416SJulian Elischer linux_fork(struct thread *td, struct linux_fork_args *args)
303146aad74SMarcel Moolenaar {
304146aad74SMarcel Moolenaar 	int error;
305d071f504SAlexander Leidinger 	struct proc *p2;
306d071f504SAlexander Leidinger 	struct thread *td2;
307146aad74SMarcel Moolenaar 
308146aad74SMarcel Moolenaar #ifdef DEBUG
30924593369SJonathan Lemon 	if (ldebug(fork))
31024593369SJonathan Lemon 		printf(ARGS(fork, ""));
311146aad74SMarcel Moolenaar #endif
312146aad74SMarcel Moolenaar 
313d071f504SAlexander Leidinger 	if ((error = fork1(td, RFFDG | RFPROC | RFSTOPPED, 0, &p2)) != 0)
314146aad74SMarcel Moolenaar 		return (error);
315146aad74SMarcel Moolenaar 
316d071f504SAlexander Leidinger 	if (error == 0) {
317d071f504SAlexander Leidinger 		td->td_retval[0] = p2->p_pid;
318d071f504SAlexander Leidinger 		td->td_retval[1] = 0;
319d071f504SAlexander Leidinger 	}
320d071f504SAlexander Leidinger 
321b40ce416SJulian Elischer 	if (td->td_retval[1] == 1)
322b40ce416SJulian Elischer 		td->td_retval[0] = 0;
3239b44bfc5SAlexander Leidinger 	error = linux_proc_init(td, td->td_retval[0], 0);
3249b44bfc5SAlexander Leidinger 	if (error)
3259b44bfc5SAlexander Leidinger 		return (error);
3269b44bfc5SAlexander Leidinger 
327d071f504SAlexander Leidinger 	td2 = FIRST_THREAD_IN_PROC(p2);
328d071f504SAlexander Leidinger 
329d071f504SAlexander Leidinger 	/*
330d071f504SAlexander Leidinger 	 * Make this runnable after we are finished with it.
331d071f504SAlexander Leidinger 	 */
332982d11f8SJeff Roberson 	thread_lock(td2);
333d071f504SAlexander Leidinger 	TD_SET_CAN_RUN(td2);
334f0393f06SJeff Roberson 	sched_add(td2, SRQ_BORING);
335982d11f8SJeff Roberson 	thread_unlock(td2);
336d071f504SAlexander Leidinger 
337146aad74SMarcel Moolenaar 	return (0);
338146aad74SMarcel Moolenaar }
339146aad74SMarcel Moolenaar 
340146aad74SMarcel Moolenaar int
341b40ce416SJulian Elischer linux_vfork(struct thread *td, struct linux_vfork_args *args)
342146aad74SMarcel Moolenaar {
343146aad74SMarcel Moolenaar 	int error;
34440f734ddSAlexander Leidinger 	struct proc *p2;
345d071f504SAlexander Leidinger 	struct thread *td2;
346146aad74SMarcel Moolenaar 
347146aad74SMarcel Moolenaar #ifdef DEBUG
34824593369SJonathan Lemon 	if (ldebug(vfork))
34924593369SJonathan Lemon 		printf(ARGS(vfork, ""));
350146aad74SMarcel Moolenaar #endif
351146aad74SMarcel Moolenaar 
35240f734ddSAlexander Leidinger 	/* exclude RFPPWAIT */
353d071f504SAlexander Leidinger 	if ((error = fork1(td, RFFDG | RFPROC | RFMEM | RFSTOPPED, 0, &p2)) != 0)
354146aad74SMarcel Moolenaar 		return (error);
35540f734ddSAlexander Leidinger 	if (error == 0) {
35640f734ddSAlexander Leidinger 		td->td_retval[0] = p2->p_pid;
35740f734ddSAlexander Leidinger 		td->td_retval[1] = 0;
35840f734ddSAlexander Leidinger 	}
359146aad74SMarcel Moolenaar 	/* Are we the child? */
360b40ce416SJulian Elischer 	if (td->td_retval[1] == 1)
361b40ce416SJulian Elischer 		td->td_retval[0] = 0;
3629b44bfc5SAlexander Leidinger 	error = linux_proc_init(td, td->td_retval[0], 0);
3639b44bfc5SAlexander Leidinger 	if (error)
3649b44bfc5SAlexander Leidinger 		return (error);
365d071f504SAlexander Leidinger 
36640f734ddSAlexander Leidinger 	PROC_LOCK(p2);
367973ac082SAlexander Leidinger 	p2->p_flag |= P_PPWAIT;
368d071f504SAlexander Leidinger 	PROC_UNLOCK(p2);
369d071f504SAlexander Leidinger 
370d071f504SAlexander Leidinger 	td2 = FIRST_THREAD_IN_PROC(p2);
371d071f504SAlexander Leidinger 
372d071f504SAlexander Leidinger 	/*
373d071f504SAlexander Leidinger 	 * Make this runnable after we are finished with it.
374d071f504SAlexander Leidinger 	 */
375982d11f8SJeff Roberson 	thread_lock(td2);
376d071f504SAlexander Leidinger 	TD_SET_CAN_RUN(td2);
377f0393f06SJeff Roberson 	sched_add(td2, SRQ_BORING);
378982d11f8SJeff Roberson 	thread_unlock(td2);
379d071f504SAlexander Leidinger 
380d071f504SAlexander Leidinger 	/* wait for the children to exit, ie. emulate vfork */
381d071f504SAlexander Leidinger 	PROC_LOCK(p2);
38240f734ddSAlexander Leidinger 	while (p2->p_flag & P_PPWAIT)
38399b7f1a1SKonstantin Belousov 		cv_wait(&p2->p_pwait, &p2->p_mtx);
38440f734ddSAlexander Leidinger 	PROC_UNLOCK(p2);
38540f734ddSAlexander Leidinger 
386146aad74SMarcel Moolenaar 	return (0);
387146aad74SMarcel Moolenaar }
388146aad74SMarcel Moolenaar 
389146aad74SMarcel Moolenaar int
390b40ce416SJulian Elischer linux_clone(struct thread *td, struct linux_clone_args *args)
391146aad74SMarcel Moolenaar {
3926ad0e7c5SJohn Baldwin 	int error, ff = RFPROC | RFSTOPPED;
393146aad74SMarcel Moolenaar 	struct proc *p2;
3949eb78fcfSJohn Baldwin 	struct thread *td2;
395146aad74SMarcel Moolenaar 	int exit_signal;
3969b44bfc5SAlexander Leidinger 	struct linux_emuldata *em;
397146aad74SMarcel Moolenaar 
398146aad74SMarcel Moolenaar #ifdef DEBUG
39924593369SJonathan Lemon 	if (ldebug(clone)) {
4009b44bfc5SAlexander Leidinger    	   	printf(ARGS(clone, "flags %x, stack %x, parent tid: %x, child tid: %x"),
4019b44bfc5SAlexander Leidinger 		    (unsigned int)args->flags, (unsigned int)args->stack,
4029b44bfc5SAlexander Leidinger 		    (unsigned int)args->parent_tidptr, (unsigned int)args->child_tidptr);
40324593369SJonathan Lemon 	}
404146aad74SMarcel Moolenaar #endif
405146aad74SMarcel Moolenaar 
406146aad74SMarcel Moolenaar 	exit_signal = args->flags & 0x000000ff;
407ec69a8a6SAlexander Kabaev 	if (LINUX_SIG_VALID(exit_signal)) {
408146aad74SMarcel Moolenaar 		if (exit_signal <= LINUX_SIGTBLSZ)
409ec69a8a6SAlexander Kabaev 			exit_signal =
410ec69a8a6SAlexander Kabaev 			    linux_to_bsd_signal[_SIG_IDX(exit_signal)];
411ec69a8a6SAlexander Kabaev 	} else if (exit_signal != 0)
412ec69a8a6SAlexander Kabaev 		return (EINVAL);
413146aad74SMarcel Moolenaar 
414a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_VM)
415146aad74SMarcel Moolenaar 		ff |= RFMEM;
416a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_SIGHAND)
417146aad74SMarcel Moolenaar 		ff |= RFSIGSHARE;
4184b3583a3SAlexander Leidinger 	/*
4194b3583a3SAlexander Leidinger 	 * XXX: in linux sharing of fs info (chroot/cwd/umask)
4204b3583a3SAlexander Leidinger 	 * and open files is independant. in fbsd its in one
421802e08a3SAlexander Leidinger 	 * structure but in reality it doesn't cause any problems
422802e08a3SAlexander Leidinger 	 * because both of these flags are usually set together.
4234b3583a3SAlexander Leidinger 	 */
424a4e3bad7SJung-uk Kim 	if (!(args->flags & (LINUX_CLONE_FILES | LINUX_CLONE_FS)))
425146aad74SMarcel Moolenaar 		ff |= RFFDG;
426146aad74SMarcel Moolenaar 
4274b178336SMaxim Sobolev 	/*
4284b178336SMaxim Sobolev 	 * Attempt to detect when linux_clone(2) is used for creating
4294b178336SMaxim Sobolev 	 * kernel threads. Unfortunately despite the existence of the
4304b178336SMaxim Sobolev 	 * CLONE_THREAD flag, version of linuxthreads package used in
4314b178336SMaxim Sobolev 	 * most popular distros as of beginning of 2005 doesn't make
432802e08a3SAlexander Leidinger 	 * any use of it. Therefore, this detection relies on
4334b178336SMaxim Sobolev 	 * empirical observation that linuxthreads sets certain
4344b178336SMaxim Sobolev 	 * combination of flags, so that we can make more or less
4354b178336SMaxim Sobolev 	 * precise detection and notify the FreeBSD kernel that several
4364b178336SMaxim Sobolev 	 * processes are in fact part of the same threading group, so
4374b178336SMaxim Sobolev 	 * that special treatment is necessary for signal delivery
4384b178336SMaxim Sobolev 	 * between those processes and fd locking.
4394b178336SMaxim Sobolev 	 */
440a4e3bad7SJung-uk Kim 	if ((args->flags & 0xffffff00) == LINUX_THREADING_FLAGS)
4414b178336SMaxim Sobolev 		ff |= RFTHREAD;
4424b178336SMaxim Sobolev 
443a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_PARENT_SETTID)
4441a26db0aSAlexander Leidinger 		if (args->parent_tidptr == NULL)
4451a26db0aSAlexander Leidinger 			return (EINVAL);
4461a26db0aSAlexander Leidinger 
447316ec49aSScott Long 	error = fork1(td, ff, 0, &p2);
4489eb78fcfSJohn Baldwin 	if (error)
4499eb78fcfSJohn Baldwin 		return (error);
4509eb78fcfSJohn Baldwin 
451a4e3bad7SJung-uk Kim 	if (args->flags & (LINUX_CLONE_PARENT | LINUX_CLONE_THREAD)) {
452a9ccaccfSKonstantin Belousov 	   	sx_xlock(&proctree_lock);
453a9ccaccfSKonstantin Belousov 		PROC_LOCK(p2);
454a9ccaccfSKonstantin Belousov 		proc_reparent(p2, td->td_proc->p_pptr);
455a9ccaccfSKonstantin Belousov 		PROC_UNLOCK(p2);
456a9ccaccfSKonstantin Belousov 		sx_xunlock(&proctree_lock);
457a9ccaccfSKonstantin Belousov 	}
458a9ccaccfSKonstantin Belousov 
4599b44bfc5SAlexander Leidinger 	/* create the emuldata */
4609b44bfc5SAlexander Leidinger 	error = linux_proc_init(td, p2->p_pid, args->flags);
4619b44bfc5SAlexander Leidinger 	/* reference it - no need to check this */
4621c65504cSAlexander Leidinger 	em = em_find(p2, EMUL_DOLOCK);
4639b44bfc5SAlexander Leidinger 	KASSERT(em != NULL, ("clone: emuldata not found.\n"));
4649b44bfc5SAlexander Leidinger 	/* and adjust it */
4659b44bfc5SAlexander Leidinger 
466a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_THREAD) {
4679b44bfc5SAlexander Leidinger 	   	/* XXX: linux mangles pgrp and pptr somehow
4689b44bfc5SAlexander Leidinger 		 * I think it might be this but I am not sure.
4699b44bfc5SAlexander Leidinger 		 */
4709b44bfc5SAlexander Leidinger #ifdef notyet
471a6c5f813SAlexander Leidinger 	   	PROC_LOCK(p2);
4729b44bfc5SAlexander Leidinger 	   	p2->p_pgrp = td->td_proc->p_pgrp;
473a6c5f813SAlexander Leidinger 	   	PROC_UNLOCK(p2);
4749b44bfc5SAlexander Leidinger #endif
4759b44bfc5SAlexander Leidinger 	 	exit_signal = 0;
4769b44bfc5SAlexander Leidinger 	}
4779b44bfc5SAlexander Leidinger 
478a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_CHILD_SETTID)
4799b44bfc5SAlexander Leidinger 		em->child_set_tid = args->child_tidptr;
4809b44bfc5SAlexander Leidinger 	else
4819b44bfc5SAlexander Leidinger 	   	em->child_set_tid = NULL;
4829b44bfc5SAlexander Leidinger 
483a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_CHILD_CLEARTID)
4849b44bfc5SAlexander Leidinger 		em->child_clear_tid = args->child_tidptr;
4859b44bfc5SAlexander Leidinger 	else
4869b44bfc5SAlexander Leidinger 	   	em->child_clear_tid = NULL;
487a6c5f813SAlexander Leidinger 
4889b44bfc5SAlexander Leidinger 	EMUL_UNLOCK(&emul_lock);
489146aad74SMarcel Moolenaar 
490a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_PARENT_SETTID) {
4911a26db0aSAlexander Leidinger 		error = copyout(&p2->p_pid, args->parent_tidptr, sizeof(p2->p_pid));
4921a26db0aSAlexander Leidinger 		if (error)
4931a26db0aSAlexander Leidinger 			printf(LMSG("copyout failed!"));
4941a26db0aSAlexander Leidinger 	}
4951a26db0aSAlexander Leidinger 
496fdfdfb78SJohn Baldwin 	PROC_LOCK(p2);
497146aad74SMarcel Moolenaar 	p2->p_sigparent = exit_signal;
4989eb78fcfSJohn Baldwin 	PROC_UNLOCK(p2);
4999eb78fcfSJohn Baldwin 	td2 = FIRST_THREAD_IN_PROC(p2);
5000eef2f8aSAlexander Leidinger 	/*
5010eef2f8aSAlexander Leidinger 	 * in a case of stack = NULL we are supposed to COW calling process stack
5029b44bfc5SAlexander Leidinger 	 * this is what normal fork() does so we just keep the tf_esp arg intact
5039b44bfc5SAlexander Leidinger 	 */
5049b44bfc5SAlexander Leidinger 	if (args->stack)
5059eb78fcfSJohn Baldwin    	   	td2->td_frame->tf_esp = (unsigned int)args->stack;
506146aad74SMarcel Moolenaar 
507a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_SETTLS) {
5089b44bfc5SAlexander Leidinger    	   	struct l_user_desc info;
5099b44bfc5SAlexander Leidinger    	   	int idx;
5109b44bfc5SAlexander Leidinger 	   	int a[2];
5119b44bfc5SAlexander Leidinger 		struct segment_descriptor sd;
5129b44bfc5SAlexander Leidinger 
5139b44bfc5SAlexander Leidinger 	   	error = copyin((void *)td->td_frame->tf_esi, &info, sizeof(struct l_user_desc));
5141a26db0aSAlexander Leidinger 		if (error) {
5151a26db0aSAlexander Leidinger 			printf(LMSG("copyin failed!"));
5161a26db0aSAlexander Leidinger 		} else {
5179b44bfc5SAlexander Leidinger 
5189b44bfc5SAlexander Leidinger 			idx = info.entry_number;
5199b44bfc5SAlexander Leidinger 
5200eef2f8aSAlexander Leidinger 			/*
5210eef2f8aSAlexander Leidinger 			 * looks like we're getting the idx we returned
5229b44bfc5SAlexander Leidinger 			 * in the set_thread_area() syscall
5239b44bfc5SAlexander Leidinger 			 */
5241a26db0aSAlexander Leidinger 			if (idx != 6 && idx != 3) {
5251a26db0aSAlexander Leidinger 				printf(LMSG("resetting idx!"));
5261a26db0aSAlexander Leidinger 				idx = 3;
5271a26db0aSAlexander Leidinger 			}
5289b44bfc5SAlexander Leidinger 
5299b44bfc5SAlexander Leidinger 			/* this doesnt happen in practice */
5309b44bfc5SAlexander Leidinger 			if (idx == 6) {
5319b44bfc5SAlexander Leidinger 		   		/* we might copy out the entry_number as 3 */
5329b44bfc5SAlexander Leidinger 			   	info.entry_number = 3;
5339b44bfc5SAlexander Leidinger 				error = copyout(&info, (void *) td->td_frame->tf_esi, sizeof(struct l_user_desc));
5349b44bfc5SAlexander Leidinger 				if (error)
5351a26db0aSAlexander Leidinger 					printf(LMSG("copyout failed!"));
5369b44bfc5SAlexander Leidinger 			}
5379b44bfc5SAlexander Leidinger 
538a4e3bad7SJung-uk Kim 			a[0] = LINUX_LDT_entry_a(&info);
539a4e3bad7SJung-uk Kim 			a[1] = LINUX_LDT_entry_b(&info);
5409b44bfc5SAlexander Leidinger 
5419b44bfc5SAlexander Leidinger 			memcpy(&sd, &a, sizeof(a));
5429b44bfc5SAlexander Leidinger #ifdef DEBUG
5439b44bfc5SAlexander Leidinger 		if (ldebug(clone))
5449b44bfc5SAlexander Leidinger 		   	printf("Segment created in clone with CLONE_SETTLS: lobase: %x, hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, def32: %i, gran: %i\n", sd.sd_lobase,
5459b44bfc5SAlexander Leidinger 			sd.sd_hibase,
5469b44bfc5SAlexander Leidinger 			sd.sd_lolimit,
5479b44bfc5SAlexander Leidinger 			sd.sd_hilimit,
5489b44bfc5SAlexander Leidinger 			sd.sd_type,
5499b44bfc5SAlexander Leidinger 			sd.sd_dpl,
5509b44bfc5SAlexander Leidinger 			sd.sd_p,
5519b44bfc5SAlexander Leidinger 			sd.sd_xx,
5529b44bfc5SAlexander Leidinger 			sd.sd_def32,
5539b44bfc5SAlexander Leidinger 			sd.sd_gran);
5549b44bfc5SAlexander Leidinger #endif
5559b44bfc5SAlexander Leidinger 
5569b44bfc5SAlexander Leidinger 			/* set %gs */
5579b44bfc5SAlexander Leidinger 			td2->td_pcb->pcb_gsd = sd;
558a6c5f813SAlexander Leidinger 			td2->td_pcb->pcb_gs = GSEL(GUGS_SEL, SEL_UPL);
5599b44bfc5SAlexander Leidinger 		}
5601a26db0aSAlexander Leidinger 	}
5619b44bfc5SAlexander Leidinger 
562146aad74SMarcel Moolenaar #ifdef DEBUG
56324593369SJonathan Lemon 	if (ldebug(clone))
5649eb78fcfSJohn Baldwin 		printf(LMSG("clone: successful rfork to %ld, stack %p sig = %d"),
5659eb78fcfSJohn Baldwin 		    (long)p2->p_pid, args->stack, exit_signal);
566146aad74SMarcel Moolenaar #endif
567a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_VFORK) {
568d071f504SAlexander Leidinger 	   	PROC_LOCK(p2);
569d071f504SAlexander Leidinger 		p2->p_flag |= P_PPWAIT;
570d071f504SAlexander Leidinger 	   	PROC_UNLOCK(p2);
571d071f504SAlexander Leidinger 	}
572146aad74SMarcel Moolenaar 
5736ad0e7c5SJohn Baldwin 	/*
5746ad0e7c5SJohn Baldwin 	 * Make this runnable after we are finished with it.
5756ad0e7c5SJohn Baldwin 	 */
576982d11f8SJeff Roberson 	thread_lock(td2);
5779eb78fcfSJohn Baldwin 	TD_SET_CAN_RUN(td2);
578f0393f06SJeff Roberson 	sched_add(td2, SRQ_BORING);
579982d11f8SJeff Roberson 	thread_unlock(td2);
5806ad0e7c5SJohn Baldwin 
5819eb78fcfSJohn Baldwin 	td->td_retval[0] = p2->p_pid;
5829eb78fcfSJohn Baldwin 	td->td_retval[1] = 0;
5830a62e035SAlexander Leidinger 
584a4e3bad7SJung-uk Kim 	if (args->flags & LINUX_CLONE_VFORK) {
5850a62e035SAlexander Leidinger    	   	/* wait for the children to exit, ie. emulate vfork */
5860a62e035SAlexander Leidinger    	   	PROC_LOCK(p2);
5870a62e035SAlexander Leidinger 		while (p2->p_flag & P_PPWAIT)
58899b7f1a1SKonstantin Belousov 			cv_wait(&p2->p_pwait, &p2->p_mtx);
5890a62e035SAlexander Leidinger 		PROC_UNLOCK(p2);
5900a62e035SAlexander Leidinger 	}
5910a62e035SAlexander Leidinger 
5929eb78fcfSJohn Baldwin 	return (0);
593146aad74SMarcel Moolenaar }
594146aad74SMarcel Moolenaar 
595146aad74SMarcel Moolenaar #define STACK_SIZE  (2 * 1024 * 1024)
596146aad74SMarcel Moolenaar #define GUARD_SIZE  (4 * PAGE_SIZE)
597146aad74SMarcel Moolenaar 
5983ad9c842SMaxim Sobolev int
5993ad9c842SMaxim Sobolev linux_mmap2(struct thread *td, struct linux_mmap2_args *args)
6003ad9c842SMaxim Sobolev {
6013ad9c842SMaxim Sobolev 
6023ad9c842SMaxim Sobolev #ifdef DEBUG
6033ad9c842SMaxim Sobolev 	if (ldebug(mmap2))
6043ad9c842SMaxim Sobolev 		printf(ARGS(mmap2, "%p, %d, %d, 0x%08x, %d, %d"),
6053ad9c842SMaxim Sobolev 		    (void *)args->addr, args->len, args->prot,
6063ad9c842SMaxim Sobolev 		    args->flags, args->fd, args->pgoff);
6073ad9c842SMaxim Sobolev #endif
6083ad9c842SMaxim Sobolev 
609f12c0348SJohn Baldwin 	return (linux_mmap_common(td, args->addr, args->len, args->prot,
610f12c0348SJohn Baldwin 		args->flags, args->fd, (uint64_t)(uint32_t)args->pgoff *
611f12c0348SJohn Baldwin 		PAGE_SIZE));
6123ad9c842SMaxim Sobolev }
6133ad9c842SMaxim Sobolev 
614146aad74SMarcel Moolenaar int
615b40ce416SJulian Elischer linux_mmap(struct thread *td, struct linux_mmap_args *args)
616146aad74SMarcel Moolenaar {
6173ad9c842SMaxim Sobolev 	int error;
6183ad9c842SMaxim Sobolev 	struct l_mmap_argv linux_args;
6193ad9c842SMaxim Sobolev 
6204b7ef73dSDag-Erling Smørgrav 	error = copyin(args->ptr, &linux_args, sizeof(linux_args));
6213ad9c842SMaxim Sobolev 	if (error)
6223ad9c842SMaxim Sobolev 		return (error);
6233ad9c842SMaxim Sobolev 
6243ad9c842SMaxim Sobolev #ifdef DEBUG
6253ad9c842SMaxim Sobolev 	if (ldebug(mmap))
6263ad9c842SMaxim Sobolev 		printf(ARGS(mmap, "%p, %d, %d, 0x%08x, %d, %d"),
627b45bbfc3SBruce Evans 		    (void *)linux_args.addr, linux_args.len, linux_args.prot,
62810931a46SJung-uk Kim 		    linux_args.flags, linux_args.fd, linux_args.pgoff);
6293ad9c842SMaxim Sobolev #endif
6303ad9c842SMaxim Sobolev 
631f12c0348SJohn Baldwin 	return (linux_mmap_common(td, linux_args.addr, linux_args.len,
632f12c0348SJohn Baldwin 	    linux_args.prot, linux_args.flags, linux_args.fd,
633f12c0348SJohn Baldwin 	    (uint32_t)linux_args.pgoff));
6343ad9c842SMaxim Sobolev }
6353ad9c842SMaxim Sobolev 
6363ad9c842SMaxim Sobolev static int
637f12c0348SJohn Baldwin linux_mmap_common(struct thread *td, l_uintptr_t addr, l_size_t len, l_int prot,
638f12c0348SJohn Baldwin     l_int flags, l_int fd, l_loff_t pos)
6393ad9c842SMaxim Sobolev {
640b40ce416SJulian Elischer 	struct proc *p = td->td_proc;
641146aad74SMarcel Moolenaar 	struct mmap_args /* {
642146aad74SMarcel Moolenaar 		caddr_t addr;
643146aad74SMarcel Moolenaar 		size_t len;
644146aad74SMarcel Moolenaar 		int prot;
645146aad74SMarcel Moolenaar 		int flags;
646146aad74SMarcel Moolenaar 		int fd;
647146aad74SMarcel Moolenaar 		long pad;
648146aad74SMarcel Moolenaar 		off_t pos;
649146aad74SMarcel Moolenaar 	} */ bsd_args;
65091d631e5SMatthew N. Dodd 	int error;
651a312f6a3SAlexander Leidinger 	struct file *fp;
652146aad74SMarcel Moolenaar 
65391d631e5SMatthew N. Dodd 	error = 0;
654146aad74SMarcel Moolenaar 	bsd_args.flags = 0;
655a312f6a3SAlexander Leidinger 	fp = NULL;
656a312f6a3SAlexander Leidinger 
657a312f6a3SAlexander Leidinger 	/*
658a312f6a3SAlexander Leidinger 	 * Linux mmap(2):
659a312f6a3SAlexander Leidinger 	 * You must specify exactly one of MAP_SHARED and MAP_PRIVATE
660a312f6a3SAlexander Leidinger 	 */
661f12c0348SJohn Baldwin 	if (!((flags & LINUX_MAP_SHARED) ^ (flags & LINUX_MAP_PRIVATE)))
6626dc4e810SAlexander Leidinger 		return (EINVAL);
663a312f6a3SAlexander Leidinger 
664f12c0348SJohn Baldwin 	if (flags & LINUX_MAP_SHARED)
665146aad74SMarcel Moolenaar 		bsd_args.flags |= MAP_SHARED;
666f12c0348SJohn Baldwin 	if (flags & LINUX_MAP_PRIVATE)
667146aad74SMarcel Moolenaar 		bsd_args.flags |= MAP_PRIVATE;
668f12c0348SJohn Baldwin 	if (flags & LINUX_MAP_FIXED)
669146aad74SMarcel Moolenaar 		bsd_args.flags |= MAP_FIXED;
670f12c0348SJohn Baldwin 	if (flags & LINUX_MAP_ANON)
671146aad74SMarcel Moolenaar 		bsd_args.flags |= MAP_ANON;
6720cc3ac8bSMatthew Dillon 	else
6730cc3ac8bSMatthew Dillon 		bsd_args.flags |= MAP_NOSYNC;
674f12c0348SJohn Baldwin 	if (flags & LINUX_MAP_GROWSDOWN)
675146aad74SMarcel Moolenaar 		bsd_args.flags |= MAP_STACK;
676146aad74SMarcel Moolenaar 
6770eef2f8aSAlexander Leidinger 	/*
67810931a46SJung-uk Kim 	 * PROT_READ, PROT_WRITE, or PROT_EXEC implies PROT_READ and PROT_EXEC
67910931a46SJung-uk Kim 	 * on Linux/i386. We do this to ensure maximum compatibility.
68010931a46SJung-uk Kim 	 * Linux/ia64 does the same in i386 emulation mode.
68110931a46SJung-uk Kim 	 */
682f12c0348SJohn Baldwin 	bsd_args.prot = prot;
68310931a46SJung-uk Kim 	if (bsd_args.prot & (PROT_READ | PROT_WRITE | PROT_EXEC))
68410931a46SJung-uk Kim 		bsd_args.prot |= PROT_READ | PROT_EXEC;
68510931a46SJung-uk Kim 
6866a5964d3SJung-uk Kim 	/* Linux does not check file descriptor when MAP_ANONYMOUS is set. */
687f12c0348SJohn Baldwin 	bsd_args.fd = (bsd_args.flags & MAP_ANON) ? -1 : fd;
6886a5964d3SJung-uk Kim 	if (bsd_args.fd != -1) {
68910931a46SJung-uk Kim 		/*
69010931a46SJung-uk Kim 		 * Linux follows Solaris mmap(2) description:
69110931a46SJung-uk Kim 		 * The file descriptor fildes is opened with
69210931a46SJung-uk Kim 		 * read permission, regardless of the
69310931a46SJung-uk Kim 		 * protection options specified.
69410931a46SJung-uk Kim 		 */
69510931a46SJung-uk Kim 
6966a5964d3SJung-uk Kim 		if ((error = fget(td, bsd_args.fd, &fp)) != 0)
69710931a46SJung-uk Kim 			return (error);
69810931a46SJung-uk Kim 		if (fp->f_type != DTYPE_VNODE) {
69910931a46SJung-uk Kim 			fdrop(fp, td);
70010931a46SJung-uk Kim 			return (EINVAL);
70110931a46SJung-uk Kim 		}
70210931a46SJung-uk Kim 
70310931a46SJung-uk Kim 		/* Linux mmap() just fails for O_WRONLY files */
70410931a46SJung-uk Kim 		if (!(fp->f_flag & FREAD)) {
70510931a46SJung-uk Kim 			fdrop(fp, td);
70610931a46SJung-uk Kim 			return (EACCES);
70710931a46SJung-uk Kim 		}
70810931a46SJung-uk Kim 
70910931a46SJung-uk Kim 		fdrop(fp, td);
71010931a46SJung-uk Kim 	}
71110931a46SJung-uk Kim 
712f12c0348SJohn Baldwin 	if (flags & LINUX_MAP_GROWSDOWN) {
71310931a46SJung-uk Kim 		/*
714f12c0348SJohn Baldwin 		 * The Linux MAP_GROWSDOWN option does not limit auto
715146aad74SMarcel Moolenaar 		 * growth of the region.  Linux mmap with this option
716146aad74SMarcel Moolenaar 		 * takes as addr the inital BOS, and as len, the initial
717146aad74SMarcel Moolenaar 		 * region size.  It can then grow down from addr without
718146aad74SMarcel Moolenaar 		 * limit.  However, linux threads has an implicit internal
719146aad74SMarcel Moolenaar 		 * limit to stack size of STACK_SIZE.  Its just not
720146aad74SMarcel Moolenaar 		 * enforced explicitly in linux.  But, here we impose
721146aad74SMarcel Moolenaar 		 * a limit of (STACK_SIZE - GUARD_SIZE) on the stack
722146aad74SMarcel Moolenaar 		 * region, since we can do this with our mmap.
723146aad74SMarcel Moolenaar 		 *
724146aad74SMarcel Moolenaar 		 * Our mmap with MAP_STACK takes addr as the maximum
725146aad74SMarcel Moolenaar 		 * downsize limit on BOS, and as len the max size of
726146aad74SMarcel Moolenaar 		 * the region.  It them maps the top SGROWSIZ bytes,
727802e08a3SAlexander Leidinger 		 * and auto grows the region down, up to the limit
728146aad74SMarcel Moolenaar 		 * in addr.
729146aad74SMarcel Moolenaar 		 *
730146aad74SMarcel Moolenaar 		 * If we don't use the MAP_STACK option, the effect
731146aad74SMarcel Moolenaar 		 * of this code is to allocate a stack region of a
732146aad74SMarcel Moolenaar 		 * fixed size of (STACK_SIZE - GUARD_SIZE).
733146aad74SMarcel Moolenaar 		 */
734146aad74SMarcel Moolenaar 
735f12c0348SJohn Baldwin 		if ((caddr_t)PTRIN(addr) + len > p->p_vmspace->vm_maxsaddr) {
7360eef2f8aSAlexander Leidinger 			/*
7370eef2f8aSAlexander Leidinger 			 * Some linux apps will attempt to mmap
738242fae60SAndrew Gallatin 			 * thread stacks near the top of their
739242fae60SAndrew Gallatin 			 * address space.  If their TOS is greater
740242fae60SAndrew Gallatin 			 * than vm_maxsaddr, vm_map_growstack()
741242fae60SAndrew Gallatin 			 * will confuse the thread stack with the
742242fae60SAndrew Gallatin 			 * process stack and deliver a SEGV if they
743242fae60SAndrew Gallatin 			 * attempt to grow the thread stack past their
744242fae60SAndrew Gallatin 			 * current stacksize rlimit.  To avoid this,
745242fae60SAndrew Gallatin 			 * adjust vm_maxsaddr upwards to reflect
746242fae60SAndrew Gallatin 			 * the current stacksize rlimit rather
747242fae60SAndrew Gallatin 			 * than the maximum possible stacksize.
748242fae60SAndrew Gallatin 			 * It would be better to adjust the
749242fae60SAndrew Gallatin 			 * mmap'ed region, but some apps do not check
750242fae60SAndrew Gallatin 			 * mmap's return value.
751242fae60SAndrew Gallatin 			 */
75291d5354aSJohn Baldwin 			PROC_LOCK(p);
753242fae60SAndrew Gallatin 			p->p_vmspace->vm_maxsaddr = (char *)USRSTACK -
75491d5354aSJohn Baldwin 			    lim_cur(p, RLIMIT_STACK);
75591d5354aSJohn Baldwin 			PROC_UNLOCK(p);
756242fae60SAndrew Gallatin 		}
757242fae60SAndrew Gallatin 
7580eef2f8aSAlexander Leidinger 		/*
759865df544SJung-uk Kim 		 * This gives us our maximum stack size and a new BOS.
760865df544SJung-uk Kim 		 * If we're using VM_STACK, then mmap will just map
761865df544SJung-uk Kim 		 * the top SGROWSIZ bytes, and let the stack grow down
762865df544SJung-uk Kim 		 * to the limit at BOS.  If we're not using VM_STACK
763865df544SJung-uk Kim 		 * we map the full stack, since we don't have a way
764865df544SJung-uk Kim 		 * to autogrow it.
765146aad74SMarcel Moolenaar 		 */
766f12c0348SJohn Baldwin 		if (len > STACK_SIZE - GUARD_SIZE) {
767f12c0348SJohn Baldwin 			bsd_args.addr = (caddr_t)PTRIN(addr);
768f12c0348SJohn Baldwin 			bsd_args.len = len;
769865df544SJung-uk Kim 		} else {
770f12c0348SJohn Baldwin 			bsd_args.addr = (caddr_t)PTRIN(addr) -
771f12c0348SJohn Baldwin 			    (STACK_SIZE - GUARD_SIZE - len);
772865df544SJung-uk Kim 			bsd_args.len = STACK_SIZE - GUARD_SIZE;
773865df544SJung-uk Kim 		}
774146aad74SMarcel Moolenaar 	} else {
775f12c0348SJohn Baldwin 		bsd_args.addr = (caddr_t)PTRIN(addr);
776f12c0348SJohn Baldwin 		bsd_args.len  = len;
777146aad74SMarcel Moolenaar 	}
778f12c0348SJohn Baldwin 	bsd_args.pos = pos;
779146aad74SMarcel Moolenaar 
780146aad74SMarcel Moolenaar #ifdef DEBUG
78124593369SJonathan Lemon 	if (ldebug(mmap))
78291d631e5SMatthew N. Dodd 		printf("-> %s(%p, %d, %d, 0x%08x, %d, 0x%x)\n",
78391d631e5SMatthew N. Dodd 		    __func__,
78424593369SJonathan Lemon 		    (void *)bsd_args.addr, bsd_args.len, bsd_args.prot,
78524593369SJonathan Lemon 		    bsd_args.flags, bsd_args.fd, (int)bsd_args.pos);
786146aad74SMarcel Moolenaar #endif
78791d631e5SMatthew N. Dodd 	error = mmap(td, &bsd_args);
78891d631e5SMatthew N. Dodd #ifdef DEBUG
78991d631e5SMatthew N. Dodd 	if (ldebug(mmap))
79091d631e5SMatthew N. Dodd 		printf("-> %s() return: 0x%x (0x%08x)\n",
79191d631e5SMatthew N. Dodd 			__func__, error, (u_int)td->td_retval[0]);
79291d631e5SMatthew N. Dodd #endif
79391d631e5SMatthew N. Dodd 	return (error);
794146aad74SMarcel Moolenaar }
795146aad74SMarcel Moolenaar 
796146aad74SMarcel Moolenaar int
79710931a46SJung-uk Kim linux_mprotect(struct thread *td, struct linux_mprotect_args *uap)
79810931a46SJung-uk Kim {
79910931a46SJung-uk Kim 	struct mprotect_args bsd_args;
80010931a46SJung-uk Kim 
80110931a46SJung-uk Kim 	bsd_args.addr = uap->addr;
80210931a46SJung-uk Kim 	bsd_args.len = uap->len;
80310931a46SJung-uk Kim 	bsd_args.prot = uap->prot;
80410931a46SJung-uk Kim 	if (bsd_args.prot & (PROT_READ | PROT_WRITE | PROT_EXEC))
80510931a46SJung-uk Kim 		bsd_args.prot |= PROT_READ | PROT_EXEC;
80610931a46SJung-uk Kim 	return (mprotect(td, &bsd_args));
80710931a46SJung-uk Kim }
80810931a46SJung-uk Kim 
80910931a46SJung-uk Kim int
810b40ce416SJulian Elischer linux_pipe(struct thread *td, struct linux_pipe_args *args)
811146aad74SMarcel Moolenaar {
812146aad74SMarcel Moolenaar 	int error;
813ab0d10f6SEd Schouten 	int fildes[2];
814146aad74SMarcel Moolenaar 
815146aad74SMarcel Moolenaar #ifdef DEBUG
81624593369SJonathan Lemon 	if (ldebug(pipe))
81724593369SJonathan Lemon 		printf(ARGS(pipe, "*"));
818146aad74SMarcel Moolenaar #endif
819146aad74SMarcel Moolenaar 
820ab0d10f6SEd Schouten 	error = kern_pipe(td, fildes);
821ab0d10f6SEd Schouten 	if (error)
822146aad74SMarcel Moolenaar 		return (error);
823146aad74SMarcel Moolenaar 
824ab0d10f6SEd Schouten 	/* XXX: Close descriptors on error. */
825ab0d10f6SEd Schouten 	return (copyout(fildes, args->pipefds, sizeof fildes));
826146aad74SMarcel Moolenaar }
827146aad74SMarcel Moolenaar 
828146aad74SMarcel Moolenaar int
829b40ce416SJulian Elischer linux_ioperm(struct thread *td, struct linux_ioperm_args *args)
830146aad74SMarcel Moolenaar {
83184569dffSMaxim Sobolev 	int error;
83284569dffSMaxim Sobolev 	struct i386_ioperm_args iia;
833146aad74SMarcel Moolenaar 
83484569dffSMaxim Sobolev 	iia.start = args->start;
83584569dffSMaxim Sobolev 	iia.length = args->length;
83684569dffSMaxim Sobolev 	iia.enable = args->enable;
83784569dffSMaxim Sobolev 	error = i386_set_ioperm(td, &iia);
83884569dffSMaxim Sobolev 	return (error);
839146aad74SMarcel Moolenaar }
840146aad74SMarcel Moolenaar 
841146aad74SMarcel Moolenaar int
842b40ce416SJulian Elischer linux_iopl(struct thread *td, struct linux_iopl_args *args)
843146aad74SMarcel Moolenaar {
844146aad74SMarcel Moolenaar 	int error;
845146aad74SMarcel Moolenaar 
846146aad74SMarcel Moolenaar 	if (args->level < 0 || args->level > 3)
847146aad74SMarcel Moolenaar 		return (EINVAL);
848acd3428bSRobert Watson 	if ((error = priv_check(td, PRIV_IO)) != 0)
849146aad74SMarcel Moolenaar 		return (error);
850a854ed98SJohn Baldwin 	if ((error = securelevel_gt(td->td_ucred, 0)) != 0)
85141c42188SRobert Watson 		return (error);
852b40ce416SJulian Elischer 	td->td_frame->tf_eflags = (td->td_frame->tf_eflags & ~PSL_IOPL) |
853146aad74SMarcel Moolenaar 	    (args->level * (PSL_IOPL / 3));
854146aad74SMarcel Moolenaar 	return (0);
855146aad74SMarcel Moolenaar }
856146aad74SMarcel Moolenaar 
857146aad74SMarcel Moolenaar int
858b07cd97eSMark Murray linux_modify_ldt(struct thread *td, struct linux_modify_ldt_args *uap)
859146aad74SMarcel Moolenaar {
860146aad74SMarcel Moolenaar 	int error;
86184569dffSMaxim Sobolev 	struct i386_ldt_args ldt;
8625002a60fSMarcel Moolenaar 	struct l_descriptor ld;
86384569dffSMaxim Sobolev 	union descriptor desc;
8646259969dSKonstantin Belousov 	int size, written;
865146aad74SMarcel Moolenaar 
866146aad74SMarcel Moolenaar 	switch (uap->func) {
867146aad74SMarcel Moolenaar 	case 0x00: /* read_ldt */
86884569dffSMaxim Sobolev 		ldt.start = 0;
86984569dffSMaxim Sobolev 		ldt.descs = uap->ptr;
87084569dffSMaxim Sobolev 		ldt.num = uap->bytecount / sizeof(union descriptor);
87184569dffSMaxim Sobolev 		error = i386_get_ldt(td, &ldt);
872b40ce416SJulian Elischer 		td->td_retval[0] *= sizeof(union descriptor);
873146aad74SMarcel Moolenaar 		break;
8746259969dSKonstantin Belousov 	case 0x02: /* read_default_ldt = 0 */
8756259969dSKonstantin Belousov 		size = 5*sizeof(struct l_desc_struct);
8766259969dSKonstantin Belousov 		if (size > uap->bytecount)
8776259969dSKonstantin Belousov 			size = uap->bytecount;
8786259969dSKonstantin Belousov 		for (written = error = 0; written < size && error == 0; written++)
8796259969dSKonstantin Belousov 			error = subyte((char *)uap->ptr + written, 0);
8806259969dSKonstantin Belousov 		td->td_retval[0] = written;
8816259969dSKonstantin Belousov 		break;
882146aad74SMarcel Moolenaar 	case 0x01: /* write_ldt */
883146aad74SMarcel Moolenaar 	case 0x11: /* write_ldt */
884146aad74SMarcel Moolenaar 		if (uap->bytecount != sizeof(ld))
885146aad74SMarcel Moolenaar 			return (EINVAL);
886146aad74SMarcel Moolenaar 
887146aad74SMarcel Moolenaar 		error = copyin(uap->ptr, &ld, sizeof(ld));
888146aad74SMarcel Moolenaar 		if (error)
889146aad74SMarcel Moolenaar 			return (error);
890146aad74SMarcel Moolenaar 
89184569dffSMaxim Sobolev 		ldt.start = ld.entry_number;
89284569dffSMaxim Sobolev 		ldt.descs = &desc;
89384569dffSMaxim Sobolev 		ldt.num = 1;
89484569dffSMaxim Sobolev 		desc.sd.sd_lolimit = (ld.limit & 0x0000ffff);
89584569dffSMaxim Sobolev 		desc.sd.sd_hilimit = (ld.limit & 0x000f0000) >> 16;
89684569dffSMaxim Sobolev 		desc.sd.sd_lobase = (ld.base_addr & 0x00ffffff);
89784569dffSMaxim Sobolev 		desc.sd.sd_hibase = (ld.base_addr & 0xff000000) >> 24;
89884569dffSMaxim Sobolev 		desc.sd.sd_type = SDT_MEMRO | ((ld.read_exec_only ^ 1) << 1) |
899146aad74SMarcel Moolenaar 			(ld.contents << 2);
90084569dffSMaxim Sobolev 		desc.sd.sd_dpl = 3;
90184569dffSMaxim Sobolev 		desc.sd.sd_p = (ld.seg_not_present ^ 1);
90284569dffSMaxim Sobolev 		desc.sd.sd_xx = 0;
90384569dffSMaxim Sobolev 		desc.sd.sd_def32 = ld.seg_32bit;
90484569dffSMaxim Sobolev 		desc.sd.sd_gran = ld.limit_in_pages;
90584569dffSMaxim Sobolev 		error = i386_set_ldt(td, &ldt, &desc);
906146aad74SMarcel Moolenaar 		break;
907146aad74SMarcel Moolenaar 	default:
9087c020cbbSJohn Baldwin 		error = ENOSYS;
909146aad74SMarcel Moolenaar 		break;
910146aad74SMarcel Moolenaar 	}
911146aad74SMarcel Moolenaar 
912146aad74SMarcel Moolenaar 	if (error == EOPNOTSUPP) {
913146aad74SMarcel Moolenaar 		printf("linux: modify_ldt needs kernel option USER_LDT\n");
914146aad74SMarcel Moolenaar 		error = ENOSYS;
915146aad74SMarcel Moolenaar 	}
916146aad74SMarcel Moolenaar 
917146aad74SMarcel Moolenaar 	return (error);
918146aad74SMarcel Moolenaar }
919146aad74SMarcel Moolenaar 
920146aad74SMarcel Moolenaar int
921b40ce416SJulian Elischer linux_sigaction(struct thread *td, struct linux_sigaction_args *args)
922146aad74SMarcel Moolenaar {
9235002a60fSMarcel Moolenaar 	l_osigaction_t osa;
9245002a60fSMarcel Moolenaar 	l_sigaction_t act, oact;
925146aad74SMarcel Moolenaar 	int error;
926146aad74SMarcel Moolenaar 
927146aad74SMarcel Moolenaar #ifdef DEBUG
92824593369SJonathan Lemon 	if (ldebug(sigaction))
92924593369SJonathan Lemon 		printf(ARGS(sigaction, "%d, %p, %p"),
930146aad74SMarcel Moolenaar 		    args->sig, (void *)args->nsa, (void *)args->osa);
931146aad74SMarcel Moolenaar #endif
932146aad74SMarcel Moolenaar 
933146aad74SMarcel Moolenaar 	if (args->nsa != NULL) {
9344b7ef73dSDag-Erling Smørgrav 		error = copyin(args->nsa, &osa, sizeof(l_osigaction_t));
935146aad74SMarcel Moolenaar 		if (error)
936146aad74SMarcel Moolenaar 			return (error);
937146aad74SMarcel Moolenaar 		act.lsa_handler = osa.lsa_handler;
938146aad74SMarcel Moolenaar 		act.lsa_flags = osa.lsa_flags;
939146aad74SMarcel Moolenaar 		act.lsa_restorer = osa.lsa_restorer;
940146aad74SMarcel Moolenaar 		LINUX_SIGEMPTYSET(act.lsa_mask);
941146aad74SMarcel Moolenaar 		act.lsa_mask.__bits[0] = osa.lsa_mask;
942146aad74SMarcel Moolenaar 	}
943146aad74SMarcel Moolenaar 
944b40ce416SJulian Elischer 	error = linux_do_sigaction(td, args->sig, args->nsa ? &act : NULL,
945146aad74SMarcel Moolenaar 	    args->osa ? &oact : NULL);
946146aad74SMarcel Moolenaar 
947146aad74SMarcel Moolenaar 	if (args->osa != NULL && !error) {
948146aad74SMarcel Moolenaar 		osa.lsa_handler = oact.lsa_handler;
949146aad74SMarcel Moolenaar 		osa.lsa_flags = oact.lsa_flags;
950146aad74SMarcel Moolenaar 		osa.lsa_restorer = oact.lsa_restorer;
951146aad74SMarcel Moolenaar 		osa.lsa_mask = oact.lsa_mask.__bits[0];
9524b7ef73dSDag-Erling Smørgrav 		error = copyout(&osa, args->osa, sizeof(l_osigaction_t));
953146aad74SMarcel Moolenaar 	}
954146aad74SMarcel Moolenaar 
955146aad74SMarcel Moolenaar 	return (error);
956146aad74SMarcel Moolenaar }
957146aad74SMarcel Moolenaar 
958146aad74SMarcel Moolenaar /*
959146aad74SMarcel Moolenaar  * Linux has two extra args, restart and oldmask.  We dont use these,
960146aad74SMarcel Moolenaar  * but it seems that "restart" is actually a context pointer that
961146aad74SMarcel Moolenaar  * enables the signal to happen with a different register set.
962146aad74SMarcel Moolenaar  */
963146aad74SMarcel Moolenaar int
964b40ce416SJulian Elischer linux_sigsuspend(struct thread *td, struct linux_sigsuspend_args *args)
965146aad74SMarcel Moolenaar {
966206a5d3aSIan Dowse 	sigset_t sigmask;
9675002a60fSMarcel Moolenaar 	l_sigset_t mask;
968146aad74SMarcel Moolenaar 
969146aad74SMarcel Moolenaar #ifdef DEBUG
97024593369SJonathan Lemon 	if (ldebug(sigsuspend))
97124593369SJonathan Lemon 		printf(ARGS(sigsuspend, "%08lx"), (unsigned long)args->mask);
972146aad74SMarcel Moolenaar #endif
973146aad74SMarcel Moolenaar 
974146aad74SMarcel Moolenaar 	LINUX_SIGEMPTYSET(mask);
975146aad74SMarcel Moolenaar 	mask.__bits[0] = args->mask;
976206a5d3aSIan Dowse 	linux_to_bsd_sigset(&mask, &sigmask);
977206a5d3aSIan Dowse 	return (kern_sigsuspend(td, sigmask));
978146aad74SMarcel Moolenaar }
979146aad74SMarcel Moolenaar 
980146aad74SMarcel Moolenaar int
981b07cd97eSMark Murray linux_rt_sigsuspend(struct thread *td, struct linux_rt_sigsuspend_args *uap)
982146aad74SMarcel Moolenaar {
9835002a60fSMarcel Moolenaar 	l_sigset_t lmask;
984206a5d3aSIan Dowse 	sigset_t sigmask;
985146aad74SMarcel Moolenaar 	int error;
986146aad74SMarcel Moolenaar 
987146aad74SMarcel Moolenaar #ifdef DEBUG
98824593369SJonathan Lemon 	if (ldebug(rt_sigsuspend))
98924593369SJonathan Lemon 		printf(ARGS(rt_sigsuspend, "%p, %d"),
990146aad74SMarcel Moolenaar 		    (void *)uap->newset, uap->sigsetsize);
991146aad74SMarcel Moolenaar #endif
992146aad74SMarcel Moolenaar 
9935002a60fSMarcel Moolenaar 	if (uap->sigsetsize != sizeof(l_sigset_t))
994146aad74SMarcel Moolenaar 		return (EINVAL);
995146aad74SMarcel Moolenaar 
9965002a60fSMarcel Moolenaar 	error = copyin(uap->newset, &lmask, sizeof(l_sigset_t));
997146aad74SMarcel Moolenaar 	if (error)
998146aad74SMarcel Moolenaar 		return (error);
999146aad74SMarcel Moolenaar 
1000206a5d3aSIan Dowse 	linux_to_bsd_sigset(&lmask, &sigmask);
1001206a5d3aSIan Dowse 	return (kern_sigsuspend(td, sigmask));
1002146aad74SMarcel Moolenaar }
1003146aad74SMarcel Moolenaar 
1004146aad74SMarcel Moolenaar int
1005b40ce416SJulian Elischer linux_pause(struct thread *td, struct linux_pause_args *args)
1006146aad74SMarcel Moolenaar {
1007b40ce416SJulian Elischer 	struct proc *p = td->td_proc;
1008206a5d3aSIan Dowse 	sigset_t sigmask;
1009146aad74SMarcel Moolenaar 
1010146aad74SMarcel Moolenaar #ifdef DEBUG
101124593369SJonathan Lemon 	if (ldebug(pause))
101224593369SJonathan Lemon 		printf(ARGS(pause, ""));
1013146aad74SMarcel Moolenaar #endif
1014146aad74SMarcel Moolenaar 
1015fdfdfb78SJohn Baldwin 	PROC_LOCK(p);
10164093529dSJeff Roberson 	sigmask = td->td_sigmask;
1017fdfdfb78SJohn Baldwin 	PROC_UNLOCK(p);
1018206a5d3aSIan Dowse 	return (kern_sigsuspend(td, sigmask));
1019146aad74SMarcel Moolenaar }
1020146aad74SMarcel Moolenaar 
1021146aad74SMarcel Moolenaar int
1022b40ce416SJulian Elischer linux_sigaltstack(struct thread *td, struct linux_sigaltstack_args *uap)
1023146aad74SMarcel Moolenaar {
1024206a5d3aSIan Dowse 	stack_t ss, oss;
10255002a60fSMarcel Moolenaar 	l_stack_t lss;
1026146aad74SMarcel Moolenaar 	int error;
1027146aad74SMarcel Moolenaar 
1028146aad74SMarcel Moolenaar #ifdef DEBUG
102924593369SJonathan Lemon 	if (ldebug(sigaltstack))
103024593369SJonathan Lemon 		printf(ARGS(sigaltstack, "%p, %p"), uap->uss, uap->uoss);
1031146aad74SMarcel Moolenaar #endif
1032146aad74SMarcel Moolenaar 
1033206a5d3aSIan Dowse 	if (uap->uss != NULL) {
10345002a60fSMarcel Moolenaar 		error = copyin(uap->uss, &lss, sizeof(l_stack_t));
1035146aad74SMarcel Moolenaar 		if (error)
1036146aad74SMarcel Moolenaar 			return (error);
1037146aad74SMarcel Moolenaar 
1038206a5d3aSIan Dowse 		ss.ss_sp = lss.ss_sp;
1039206a5d3aSIan Dowse 		ss.ss_size = lss.ss_size;
1040206a5d3aSIan Dowse 		ss.ss_flags = linux_to_bsd_sigaltstack(lss.ss_flags);
1041931a7258SAndrew Gallatin 	}
1042ef36ad69SJohn Baldwin 	error = kern_sigaltstack(td, (uap->uss != NULL) ? &ss : NULL,
1043ef36ad69SJohn Baldwin 	    (uap->uoss != NULL) ? &oss : NULL);
1044206a5d3aSIan Dowse 	if (!error && uap->uoss != NULL) {
1045206a5d3aSIan Dowse 		lss.ss_sp = oss.ss_sp;
1046206a5d3aSIan Dowse 		lss.ss_size = oss.ss_size;
1047206a5d3aSIan Dowse 		lss.ss_flags = bsd_to_linux_sigaltstack(oss.ss_flags);
10485002a60fSMarcel Moolenaar 		error = copyout(&lss, uap->uoss, sizeof(l_stack_t));
1049146aad74SMarcel Moolenaar 	}
1050146aad74SMarcel Moolenaar 
1051146aad74SMarcel Moolenaar 	return (error);
1052146aad74SMarcel Moolenaar }
10533ad9c842SMaxim Sobolev 
10543ad9c842SMaxim Sobolev int
10553ad9c842SMaxim Sobolev linux_ftruncate64(struct thread *td, struct linux_ftruncate64_args *args)
10563ad9c842SMaxim Sobolev {
10573ad9c842SMaxim Sobolev 	struct ftruncate_args sa;
10583ad9c842SMaxim Sobolev 
10593ad9c842SMaxim Sobolev #ifdef DEBUG
10603ad9c842SMaxim Sobolev 	if (ldebug(ftruncate64))
1061b45bbfc3SBruce Evans 		printf(ARGS(ftruncate64, "%u, %jd"), args->fd,
1062b45bbfc3SBruce Evans 		    (intmax_t)args->length);
10633ad9c842SMaxim Sobolev #endif
10643ad9c842SMaxim Sobolev 
10653ad9c842SMaxim Sobolev 	sa.fd = args->fd;
10663ad9c842SMaxim Sobolev 	sa.length = args->length;
10673ad9c842SMaxim Sobolev 	return ftruncate(td, &sa);
10683ad9c842SMaxim Sobolev }
10691bc85c0dSDoug Rabson 
10701bc85c0dSDoug Rabson int
10711bc85c0dSDoug Rabson linux_set_thread_area(struct thread *td, struct linux_set_thread_area_args *args)
10721bc85c0dSDoug Rabson {
10739b44bfc5SAlexander Leidinger 	struct l_user_desc info;
10749b44bfc5SAlexander Leidinger 	int error;
10759b44bfc5SAlexander Leidinger 	int idx;
10769b44bfc5SAlexander Leidinger 	int a[2];
10779b44bfc5SAlexander Leidinger 	struct segment_descriptor sd;
10789b44bfc5SAlexander Leidinger 
10799b44bfc5SAlexander Leidinger 	error = copyin(args->desc, &info, sizeof(struct l_user_desc));
10809b44bfc5SAlexander Leidinger 	if (error)
10819b44bfc5SAlexander Leidinger 		return (error);
10829b44bfc5SAlexander Leidinger 
10839b44bfc5SAlexander Leidinger #ifdef DEBUG
10849b44bfc5SAlexander Leidinger 	if (ldebug(set_thread_area))
10859b44bfc5SAlexander Leidinger 	   	printf(ARGS(set_thread_area, "%i, %x, %x, %i, %i, %i, %i, %i, %i\n"),
10869b44bfc5SAlexander Leidinger 		      info.entry_number,
10879b44bfc5SAlexander Leidinger       		      info.base_addr,
10889b44bfc5SAlexander Leidinger       		      info.limit,
10899b44bfc5SAlexander Leidinger       		      info.seg_32bit,
10909b44bfc5SAlexander Leidinger 		      info.contents,
10919b44bfc5SAlexander Leidinger       		      info.read_exec_only,
10929b44bfc5SAlexander Leidinger       		      info.limit_in_pages,
10939b44bfc5SAlexander Leidinger       		      info.seg_not_present,
10949b44bfc5SAlexander Leidinger       		      info.useable);
10959b44bfc5SAlexander Leidinger #endif
10969b44bfc5SAlexander Leidinger 
10979b44bfc5SAlexander Leidinger 	idx = info.entry_number;
10980eef2f8aSAlexander Leidinger 	/*
1099802e08a3SAlexander Leidinger 	 * Semantics of linux version: every thread in the system has array of
1100802e08a3SAlexander Leidinger 	 * 3 tls descriptors. 1st is GLIBC TLS, 2nd is WINE, 3rd unknown. This
1101802e08a3SAlexander Leidinger 	 * syscall loads one of the selected tls decriptors with a value and
1102802e08a3SAlexander Leidinger 	 * also loads GDT descriptors 6, 7 and 8 with the content of the
1103802e08a3SAlexander Leidinger 	 * per-thread descriptors.
11049b44bfc5SAlexander Leidinger 	 *
1105802e08a3SAlexander Leidinger 	 * Semantics of fbsd version: I think we can ignore that linux has 3
1106802e08a3SAlexander Leidinger 	 * per-thread descriptors and use just the 1st one. The tls_array[]
1107802e08a3SAlexander Leidinger 	 * is used only in set/get-thread_area() syscalls and for loading the
1108802e08a3SAlexander Leidinger 	 * GDT descriptors. In fbsd we use just one GDT descriptor for TLS so
1109802e08a3SAlexander Leidinger 	 * we will load just one.
1110802e08a3SAlexander Leidinger 	 *
1111802e08a3SAlexander Leidinger 	 * XXX: this doesn't work when a user space process tries to use more
1112802e08a3SAlexander Leidinger 	 * than 1 TLS segment. Comment in the linux sources says wine might do
1113802e08a3SAlexander Leidinger 	 * this.
11141bc85c0dSDoug Rabson 	 */
11159b44bfc5SAlexander Leidinger 
11160eef2f8aSAlexander Leidinger 	/*
11170eef2f8aSAlexander Leidinger 	 * we support just GLIBC TLS now
11189b44bfc5SAlexander Leidinger 	 * we should let 3 proceed as well because we use this segment so
11199b44bfc5SAlexander Leidinger 	 * if code does two subsequent calls it should succeed
11209b44bfc5SAlexander Leidinger 	 */
11219b44bfc5SAlexander Leidinger 	if (idx != 6 && idx != -1 && idx != 3)
11229b44bfc5SAlexander Leidinger 		return (EINVAL);
11239b44bfc5SAlexander Leidinger 
11240eef2f8aSAlexander Leidinger 	/*
11250eef2f8aSAlexander Leidinger 	 * we have to copy out the GDT entry we use
11269b44bfc5SAlexander Leidinger 	 * FreeBSD uses GDT entry #3 for storing %gs so load that
1127802e08a3SAlexander Leidinger 	 *
1128802e08a3SAlexander Leidinger 	 * XXX: what if a user space program doesn't check this value and tries
11299b44bfc5SAlexander Leidinger 	 * to use 6, 7 or 8?
11309b44bfc5SAlexander Leidinger 	 */
11319b44bfc5SAlexander Leidinger 	idx = info.entry_number = 3;
11329b44bfc5SAlexander Leidinger 	error = copyout(&info, args->desc, sizeof(struct l_user_desc));
11339b44bfc5SAlexander Leidinger 	if (error)
11349b44bfc5SAlexander Leidinger 		return (error);
11359b44bfc5SAlexander Leidinger 
1136a4e3bad7SJung-uk Kim 	if (LINUX_LDT_empty(&info)) {
11379b44bfc5SAlexander Leidinger 		a[0] = 0;
11389b44bfc5SAlexander Leidinger 		a[1] = 0;
11399b44bfc5SAlexander Leidinger 	} else {
1140a4e3bad7SJung-uk Kim 		a[0] = LINUX_LDT_entry_a(&info);
1141a4e3bad7SJung-uk Kim 		a[1] = LINUX_LDT_entry_b(&info);
11421bc85c0dSDoug Rabson 	}
11431bc85c0dSDoug Rabson 
11449b44bfc5SAlexander Leidinger 	memcpy(&sd, &a, sizeof(a));
11459b44bfc5SAlexander Leidinger #ifdef DEBUG
11469b44bfc5SAlexander Leidinger 	if (ldebug(set_thread_area))
11479b44bfc5SAlexander Leidinger 	   	printf("Segment created in set_thread_area: lobase: %x, hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, def32: %i, gran: %i\n", sd.sd_lobase,
11489b44bfc5SAlexander Leidinger 			sd.sd_hibase,
11499b44bfc5SAlexander Leidinger 			sd.sd_lolimit,
11509b44bfc5SAlexander Leidinger 			sd.sd_hilimit,
11519b44bfc5SAlexander Leidinger 			sd.sd_type,
11529b44bfc5SAlexander Leidinger 			sd.sd_dpl,
11539b44bfc5SAlexander Leidinger 			sd.sd_p,
11549b44bfc5SAlexander Leidinger 			sd.sd_xx,
11559b44bfc5SAlexander Leidinger 			sd.sd_def32,
11569b44bfc5SAlexander Leidinger 			sd.sd_gran);
11579b44bfc5SAlexander Leidinger #endif
11581bc85c0dSDoug Rabson 
11599b44bfc5SAlexander Leidinger 	/* this is taken from i386 version of cpu_set_user_tls() */
11609b44bfc5SAlexander Leidinger 	critical_enter();
11619b44bfc5SAlexander Leidinger 	/* set %gs */
11629b44bfc5SAlexander Leidinger 	td->td_pcb->pcb_gsd = sd;
11639b44bfc5SAlexander Leidinger 	PCPU_GET(fsgs_gdt)[1] = sd;
11649b44bfc5SAlexander Leidinger 	load_gs(GSEL(GUGS_SEL, SEL_UPL));
11659b44bfc5SAlexander Leidinger 	critical_exit();
11669b44bfc5SAlexander Leidinger 
11671bc85c0dSDoug Rabson 	return (0);
11681bc85c0dSDoug Rabson }
11691bc85c0dSDoug Rabson 
11701bc85c0dSDoug Rabson int
11719b44bfc5SAlexander Leidinger linux_get_thread_area(struct thread *td, struct linux_get_thread_area_args *args)
11721bc85c0dSDoug Rabson {
11731bc85c0dSDoug Rabson 
11749b44bfc5SAlexander Leidinger 	struct l_user_desc info;
11759b44bfc5SAlexander Leidinger 	int error;
11769b44bfc5SAlexander Leidinger 	int idx;
11779b44bfc5SAlexander Leidinger 	struct l_desc_struct desc;
11789b44bfc5SAlexander Leidinger 	struct segment_descriptor sd;
11799b44bfc5SAlexander Leidinger 
11809b44bfc5SAlexander Leidinger #ifdef DEBUG
11819b44bfc5SAlexander Leidinger 	if (ldebug(get_thread_area))
11829b44bfc5SAlexander Leidinger 		printf(ARGS(get_thread_area, "%p"), args->desc);
11839b44bfc5SAlexander Leidinger #endif
11849b44bfc5SAlexander Leidinger 
11859b44bfc5SAlexander Leidinger 	error = copyin(args->desc, &info, sizeof(struct l_user_desc));
11869b44bfc5SAlexander Leidinger 	if (error)
11879b44bfc5SAlexander Leidinger 		return (error);
11889b44bfc5SAlexander Leidinger 
11899b44bfc5SAlexander Leidinger 	idx = info.entry_number;
11909b44bfc5SAlexander Leidinger 	/* XXX: I am not sure if we want 3 to be allowed too. */
11919b44bfc5SAlexander Leidinger 	if (idx != 6 && idx != 3)
11929b44bfc5SAlexander Leidinger 		return (EINVAL);
11939b44bfc5SAlexander Leidinger 
11949b44bfc5SAlexander Leidinger 	idx = 3;
11959b44bfc5SAlexander Leidinger 
11969b44bfc5SAlexander Leidinger 	memset(&info, 0, sizeof(info));
11979b44bfc5SAlexander Leidinger 
11989b44bfc5SAlexander Leidinger 	sd = PCPU_GET(fsgs_gdt)[1];
11999b44bfc5SAlexander Leidinger 
12009b44bfc5SAlexander Leidinger 	memcpy(&desc, &sd, sizeof(desc));
12019b44bfc5SAlexander Leidinger 
12029b44bfc5SAlexander Leidinger 	info.entry_number = idx;
1203a4e3bad7SJung-uk Kim 	info.base_addr = LINUX_GET_BASE(&desc);
1204a4e3bad7SJung-uk Kim 	info.limit = LINUX_GET_LIMIT(&desc);
1205a4e3bad7SJung-uk Kim 	info.seg_32bit = LINUX_GET_32BIT(&desc);
1206a4e3bad7SJung-uk Kim 	info.contents = LINUX_GET_CONTENTS(&desc);
1207a4e3bad7SJung-uk Kim 	info.read_exec_only = !LINUX_GET_WRITABLE(&desc);
1208a4e3bad7SJung-uk Kim 	info.limit_in_pages = LINUX_GET_LIMIT_PAGES(&desc);
1209a4e3bad7SJung-uk Kim 	info.seg_not_present = !LINUX_GET_PRESENT(&desc);
1210a4e3bad7SJung-uk Kim 	info.useable = LINUX_GET_USEABLE(&desc);
12119b44bfc5SAlexander Leidinger 
12129b44bfc5SAlexander Leidinger 	error = copyout(&info, args->desc, sizeof(struct l_user_desc));
12139b44bfc5SAlexander Leidinger 	if (error)
12149b44bfc5SAlexander Leidinger 	   	return (EFAULT);
12159b44bfc5SAlexander Leidinger 
12169b44bfc5SAlexander Leidinger 	return (0);
12179b44bfc5SAlexander Leidinger }
12189b44bfc5SAlexander Leidinger 
12199b44bfc5SAlexander Leidinger /* copied from kern/kern_time.c */
12209b44bfc5SAlexander Leidinger int
12219b44bfc5SAlexander Leidinger linux_timer_create(struct thread *td, struct linux_timer_create_args *args)
12229b44bfc5SAlexander Leidinger {
12239b44bfc5SAlexander Leidinger    	return ktimer_create(td, (struct ktimer_create_args *) args);
12249b44bfc5SAlexander Leidinger }
12259b44bfc5SAlexander Leidinger 
12269b44bfc5SAlexander Leidinger int
12279b44bfc5SAlexander Leidinger linux_timer_settime(struct thread *td, struct linux_timer_settime_args *args)
12289b44bfc5SAlexander Leidinger {
12299b44bfc5SAlexander Leidinger    	return ktimer_settime(td, (struct ktimer_settime_args *) args);
12309b44bfc5SAlexander Leidinger }
12319b44bfc5SAlexander Leidinger 
12329b44bfc5SAlexander Leidinger int
12339b44bfc5SAlexander Leidinger linux_timer_gettime(struct thread *td, struct linux_timer_gettime_args *args)
12349b44bfc5SAlexander Leidinger {
12359b44bfc5SAlexander Leidinger    	return ktimer_gettime(td, (struct ktimer_gettime_args *) args);
12369b44bfc5SAlexander Leidinger }
12379b44bfc5SAlexander Leidinger 
12389b44bfc5SAlexander Leidinger int
12399b44bfc5SAlexander Leidinger linux_timer_getoverrun(struct thread *td, struct linux_timer_getoverrun_args *args)
12409b44bfc5SAlexander Leidinger {
12419b44bfc5SAlexander Leidinger    	return ktimer_getoverrun(td, (struct ktimer_getoverrun_args *) args);
12429b44bfc5SAlexander Leidinger }
12439b44bfc5SAlexander Leidinger 
12449b44bfc5SAlexander Leidinger int
12459b44bfc5SAlexander Leidinger linux_timer_delete(struct thread *td, struct linux_timer_delete_args *args)
12469b44bfc5SAlexander Leidinger {
12479b44bfc5SAlexander Leidinger    	return ktimer_delete(td, (struct ktimer_delete_args *) args);
12489b44bfc5SAlexander Leidinger }
12499b44bfc5SAlexander Leidinger 
12509b44bfc5SAlexander Leidinger /* XXX: this wont work with module - convert it */
12519b44bfc5SAlexander Leidinger int
12529b44bfc5SAlexander Leidinger linux_mq_open(struct thread *td, struct linux_mq_open_args *args)
12539b44bfc5SAlexander Leidinger {
12549b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE
12559b44bfc5SAlexander Leidinger    	return kmq_open(td, (struct kmq_open_args *) args);
12569b44bfc5SAlexander Leidinger #else
12579b44bfc5SAlexander Leidinger 	return (ENOSYS);
12589b44bfc5SAlexander Leidinger #endif
12599b44bfc5SAlexander Leidinger }
12609b44bfc5SAlexander Leidinger 
12619b44bfc5SAlexander Leidinger int
12629b44bfc5SAlexander Leidinger linux_mq_unlink(struct thread *td, struct linux_mq_unlink_args *args)
12639b44bfc5SAlexander Leidinger {
12649b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE
12659b44bfc5SAlexander Leidinger    	return kmq_unlink(td, (struct kmq_unlink_args *) args);
12669b44bfc5SAlexander Leidinger #else
12679b44bfc5SAlexander Leidinger 	return (ENOSYS);
12689b44bfc5SAlexander Leidinger #endif
12699b44bfc5SAlexander Leidinger }
12709b44bfc5SAlexander Leidinger 
12719b44bfc5SAlexander Leidinger int
12729b44bfc5SAlexander Leidinger linux_mq_timedsend(struct thread *td, struct linux_mq_timedsend_args *args)
12739b44bfc5SAlexander Leidinger {
12749b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE
12759b44bfc5SAlexander Leidinger    	return kmq_timedsend(td, (struct kmq_timedsend_args *) args);
12769b44bfc5SAlexander Leidinger #else
12779b44bfc5SAlexander Leidinger 	return (ENOSYS);
12789b44bfc5SAlexander Leidinger #endif
12799b44bfc5SAlexander Leidinger }
12809b44bfc5SAlexander Leidinger 
12819b44bfc5SAlexander Leidinger int
12829b44bfc5SAlexander Leidinger linux_mq_timedreceive(struct thread *td, struct linux_mq_timedreceive_args *args)
12839b44bfc5SAlexander Leidinger {
12849b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE
12859b44bfc5SAlexander Leidinger    	return kmq_timedreceive(td, (struct kmq_timedreceive_args *) args);
12869b44bfc5SAlexander Leidinger #else
12879b44bfc5SAlexander Leidinger 	return (ENOSYS);
12889b44bfc5SAlexander Leidinger #endif
12899b44bfc5SAlexander Leidinger }
12909b44bfc5SAlexander Leidinger 
12919b44bfc5SAlexander Leidinger int
12929b44bfc5SAlexander Leidinger linux_mq_notify(struct thread *td, struct linux_mq_notify_args *args)
12939b44bfc5SAlexander Leidinger {
12949b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE
12959b44bfc5SAlexander Leidinger 	return kmq_notify(td, (struct kmq_notify_args *) args);
12969b44bfc5SAlexander Leidinger #else
12979b44bfc5SAlexander Leidinger 	return (ENOSYS);
12989b44bfc5SAlexander Leidinger #endif
12999b44bfc5SAlexander Leidinger }
13009b44bfc5SAlexander Leidinger 
13019b44bfc5SAlexander Leidinger int
13029b44bfc5SAlexander Leidinger linux_mq_getsetattr(struct thread *td, struct linux_mq_getsetattr_args *args)
13039b44bfc5SAlexander Leidinger {
13049b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE
13059b44bfc5SAlexander Leidinger    	return kmq_setattr(td, (struct kmq_setattr_args *) args);
13069b44bfc5SAlexander Leidinger #else
13079b44bfc5SAlexander Leidinger 	return (ENOSYS);
13089b44bfc5SAlexander Leidinger #endif
13091bc85c0dSDoug Rabson }
13101bc85c0dSDoug Rabson 
1311