1146aad74SMarcel Moolenaar /*- 2146aad74SMarcel Moolenaar * Copyright (c) 2000 Marcel Moolenaar 3146aad74SMarcel Moolenaar * All rights reserved. 4146aad74SMarcel Moolenaar * 5146aad74SMarcel Moolenaar * Redistribution and use in source and binary forms, with or without 6146aad74SMarcel Moolenaar * modification, are permitted provided that the following conditions 7146aad74SMarcel Moolenaar * are met: 8146aad74SMarcel Moolenaar * 1. Redistributions of source code must retain the above copyright 9146aad74SMarcel Moolenaar * notice, this list of conditions and the following disclaimer 10146aad74SMarcel Moolenaar * in this position and unchanged. 11146aad74SMarcel Moolenaar * 2. Redistributions in binary form must reproduce the above copyright 12146aad74SMarcel Moolenaar * notice, this list of conditions and the following disclaimer in the 13146aad74SMarcel Moolenaar * documentation and/or other materials provided with the distribution. 14146aad74SMarcel Moolenaar * 3. The name of the author may not be used to endorse or promote products 15bc34729cSMarcel Moolenaar * derived from this software without specific prior written permission. 16146aad74SMarcel Moolenaar * 17146aad74SMarcel Moolenaar * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 18146aad74SMarcel Moolenaar * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 19146aad74SMarcel Moolenaar * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 20146aad74SMarcel Moolenaar * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 21146aad74SMarcel Moolenaar * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 22146aad74SMarcel Moolenaar * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 23146aad74SMarcel Moolenaar * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 24146aad74SMarcel Moolenaar * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 25146aad74SMarcel Moolenaar * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 26146aad74SMarcel Moolenaar * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 27146aad74SMarcel Moolenaar */ 28146aad74SMarcel Moolenaar 2927e0099cSDavid E. O'Brien #include <sys/cdefs.h> 3027e0099cSDavid E. O'Brien __FBSDID("$FreeBSD$"); 3127e0099cSDavid E. O'Brien 32146aad74SMarcel Moolenaar #include <sys/param.h> 33146aad74SMarcel Moolenaar #include <sys/systm.h> 34a312f6a3SAlexander Leidinger #include <sys/file.h> 35a312f6a3SAlexander Leidinger #include <sys/fcntl.h> 36610ecfe0SMaxim Sobolev #include <sys/imgact.h> 377106ca0dSJohn Baldwin #include <sys/lock.h> 38610ecfe0SMaxim Sobolev #include <sys/malloc.h> 39fb919e4dSMark Murray #include <sys/mman.h> 40fb919e4dSMark Murray #include <sys/mutex.h> 419b44bfc5SAlexander Leidinger #include <sys/sx.h> 42acd3428bSRobert Watson #include <sys/priv.h> 43fb919e4dSMark Murray #include <sys/proc.h> 449b44bfc5SAlexander Leidinger #include <sys/queue.h> 45242fae60SAndrew Gallatin #include <sys/resource.h> 46242fae60SAndrew Gallatin #include <sys/resourcevar.h> 471bc85c0dSDoug Rabson #include <sys/signalvar.h> 48206a5d3aSIan Dowse #include <sys/syscallsubr.h> 49fb919e4dSMark Murray #include <sys/sysproto.h> 50fb919e4dSMark Murray #include <sys/unistd.h> 519b44bfc5SAlexander Leidinger #include <sys/wait.h> 52f0393f06SJeff Roberson #include <sys/sched.h> 53146aad74SMarcel Moolenaar 54146aad74SMarcel Moolenaar #include <machine/frame.h> 55146aad74SMarcel Moolenaar #include <machine/psl.h> 56146aad74SMarcel Moolenaar #include <machine/segments.h> 57146aad74SMarcel Moolenaar #include <machine/sysarch.h> 58146aad74SMarcel Moolenaar 59242fae60SAndrew Gallatin #include <vm/vm.h> 60242fae60SAndrew Gallatin #include <vm/pmap.h> 61242fae60SAndrew Gallatin #include <vm/vm_map.h> 62242fae60SAndrew Gallatin 63146aad74SMarcel Moolenaar #include <i386/linux/linux.h> 64ebea8660SMarcel Moolenaar #include <i386/linux/linux_proto.h> 65146aad74SMarcel Moolenaar #include <compat/linux/linux_ipc.h> 66146aad74SMarcel Moolenaar #include <compat/linux/linux_signal.h> 67146aad74SMarcel Moolenaar #include <compat/linux/linux_util.h> 689b44bfc5SAlexander Leidinger #include <compat/linux/linux_emul.h> 699b44bfc5SAlexander Leidinger 709b44bfc5SAlexander Leidinger #include <i386/include/pcb.h> /* needed for pcb definition in linux_set_thread_area */ 719b44bfc5SAlexander Leidinger 729b44bfc5SAlexander Leidinger #include "opt_posix.h" 739b44bfc5SAlexander Leidinger 749b44bfc5SAlexander Leidinger extern struct sysentvec elf32_freebsd_sysvec; /* defined in i386/i386/elf_machdep.c */ 75146aad74SMarcel Moolenaar 765002a60fSMarcel Moolenaar struct l_descriptor { 775002a60fSMarcel Moolenaar l_uint entry_number; 785002a60fSMarcel Moolenaar l_ulong base_addr; 795002a60fSMarcel Moolenaar l_uint limit; 805002a60fSMarcel Moolenaar l_uint seg_32bit:1; 815002a60fSMarcel Moolenaar l_uint contents:2; 825002a60fSMarcel Moolenaar l_uint read_exec_only:1; 835002a60fSMarcel Moolenaar l_uint limit_in_pages:1; 845002a60fSMarcel Moolenaar l_uint seg_not_present:1; 855002a60fSMarcel Moolenaar l_uint useable:1; 86146aad74SMarcel Moolenaar }; 87146aad74SMarcel Moolenaar 885002a60fSMarcel Moolenaar struct l_old_select_argv { 895002a60fSMarcel Moolenaar l_int nfds; 905002a60fSMarcel Moolenaar l_fd_set *readfds; 915002a60fSMarcel Moolenaar l_fd_set *writefds; 925002a60fSMarcel Moolenaar l_fd_set *exceptfds; 935002a60fSMarcel Moolenaar struct l_timeval *timeout; 94146aad74SMarcel Moolenaar }; 95146aad74SMarcel Moolenaar 96146aad74SMarcel Moolenaar int 97931a7258SAndrew Gallatin linux_to_bsd_sigaltstack(int lsa) 98931a7258SAndrew Gallatin { 99931a7258SAndrew Gallatin int bsa = 0; 100931a7258SAndrew Gallatin 101931a7258SAndrew Gallatin if (lsa & LINUX_SS_DISABLE) 102931a7258SAndrew Gallatin bsa |= SS_DISABLE; 103931a7258SAndrew Gallatin if (lsa & LINUX_SS_ONSTACK) 104931a7258SAndrew Gallatin bsa |= SS_ONSTACK; 105931a7258SAndrew Gallatin return (bsa); 106931a7258SAndrew Gallatin } 107931a7258SAndrew Gallatin 108931a7258SAndrew Gallatin int 109931a7258SAndrew Gallatin bsd_to_linux_sigaltstack(int bsa) 110931a7258SAndrew Gallatin { 111931a7258SAndrew Gallatin int lsa = 0; 112931a7258SAndrew Gallatin 113931a7258SAndrew Gallatin if (bsa & SS_DISABLE) 114931a7258SAndrew Gallatin lsa |= LINUX_SS_DISABLE; 115931a7258SAndrew Gallatin if (bsa & SS_ONSTACK) 116931a7258SAndrew Gallatin lsa |= LINUX_SS_ONSTACK; 117931a7258SAndrew Gallatin return (lsa); 118931a7258SAndrew Gallatin } 119931a7258SAndrew Gallatin 120931a7258SAndrew Gallatin int 121b40ce416SJulian Elischer linux_execve(struct thread *td, struct linux_execve_args *args) 122146aad74SMarcel Moolenaar { 123610ecfe0SMaxim Sobolev int error; 124610ecfe0SMaxim Sobolev char *newpath; 125610ecfe0SMaxim Sobolev struct image_args eargs; 126146aad74SMarcel Moolenaar 127d9e97471SJohn Baldwin LCONVPATHEXIST(td, args->path, &newpath); 128146aad74SMarcel Moolenaar 129146aad74SMarcel Moolenaar #ifdef DEBUG 13024593369SJonathan Lemon if (ldebug(execve)) 131610ecfe0SMaxim Sobolev printf(ARGS(execve, "%s"), newpath); 132146aad74SMarcel Moolenaar #endif 133146aad74SMarcel Moolenaar 134610ecfe0SMaxim Sobolev error = exec_copyin_args(&eargs, newpath, UIO_SYSSPACE, 135610ecfe0SMaxim Sobolev args->argp, args->envp); 136610ecfe0SMaxim Sobolev free(newpath, M_TEMP); 137610ecfe0SMaxim Sobolev if (error == 0) 138c035ac04SMaxim Sobolev error = kern_execve(td, &eargs, NULL); 1399b44bfc5SAlexander Leidinger if (error == 0) 1409b44bfc5SAlexander Leidinger /* linux process can exec fbsd one, dont attempt 1419b44bfc5SAlexander Leidinger * to create emuldata for such process using 1429b44bfc5SAlexander Leidinger * linux_proc_init, this leads to a panic on KASSERT 1439b44bfc5SAlexander Leidinger * because such process has p->p_emuldata == NULL 1449b44bfc5SAlexander Leidinger */ 1459b44bfc5SAlexander Leidinger if (td->td_proc->p_sysent == &elf_linux_sysvec) 1469b44bfc5SAlexander Leidinger error = linux_proc_init(td, 0, 0); 147610ecfe0SMaxim Sobolev return (error); 148146aad74SMarcel Moolenaar } 149146aad74SMarcel Moolenaar 1505002a60fSMarcel Moolenaar struct l_ipc_kludge { 1515002a60fSMarcel Moolenaar struct l_msgbuf *msgp; 1525002a60fSMarcel Moolenaar l_long msgtyp; 1535002a60fSMarcel Moolenaar }; 1545002a60fSMarcel Moolenaar 155146aad74SMarcel Moolenaar int 156b40ce416SJulian Elischer linux_ipc(struct thread *td, struct linux_ipc_args *args) 157146aad74SMarcel Moolenaar { 1585002a60fSMarcel Moolenaar 1595002a60fSMarcel Moolenaar switch (args->what & 0xFFFF) { 1605002a60fSMarcel Moolenaar case LINUX_SEMOP: { 1615002a60fSMarcel Moolenaar struct linux_semop_args a; 1625002a60fSMarcel Moolenaar 1635002a60fSMarcel Moolenaar a.semid = args->arg1; 1645002a60fSMarcel Moolenaar a.tsops = args->ptr; 1655002a60fSMarcel Moolenaar a.nsops = args->arg2; 166b40ce416SJulian Elischer return (linux_semop(td, &a)); 1675002a60fSMarcel Moolenaar } 1685002a60fSMarcel Moolenaar case LINUX_SEMGET: { 1695002a60fSMarcel Moolenaar struct linux_semget_args a; 1705002a60fSMarcel Moolenaar 1715002a60fSMarcel Moolenaar a.key = args->arg1; 1725002a60fSMarcel Moolenaar a.nsems = args->arg2; 1735002a60fSMarcel Moolenaar a.semflg = args->arg3; 174b40ce416SJulian Elischer return (linux_semget(td, &a)); 1755002a60fSMarcel Moolenaar } 1765002a60fSMarcel Moolenaar case LINUX_SEMCTL: { 1775002a60fSMarcel Moolenaar struct linux_semctl_args a; 1785002a60fSMarcel Moolenaar int error; 1795002a60fSMarcel Moolenaar 1805002a60fSMarcel Moolenaar a.semid = args->arg1; 1815002a60fSMarcel Moolenaar a.semnum = args->arg2; 1825002a60fSMarcel Moolenaar a.cmd = args->arg3; 1834b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &a.arg, sizeof(a.arg)); 1845002a60fSMarcel Moolenaar if (error) 1855002a60fSMarcel Moolenaar return (error); 186b40ce416SJulian Elischer return (linux_semctl(td, &a)); 1875002a60fSMarcel Moolenaar } 1885002a60fSMarcel Moolenaar case LINUX_MSGSND: { 1895002a60fSMarcel Moolenaar struct linux_msgsnd_args a; 1905002a60fSMarcel Moolenaar 1915002a60fSMarcel Moolenaar a.msqid = args->arg1; 1925002a60fSMarcel Moolenaar a.msgp = args->ptr; 1935002a60fSMarcel Moolenaar a.msgsz = args->arg2; 1945002a60fSMarcel Moolenaar a.msgflg = args->arg3; 195b40ce416SJulian Elischer return (linux_msgsnd(td, &a)); 1965002a60fSMarcel Moolenaar } 1975002a60fSMarcel Moolenaar case LINUX_MSGRCV: { 1985002a60fSMarcel Moolenaar struct linux_msgrcv_args a; 1995002a60fSMarcel Moolenaar 2005002a60fSMarcel Moolenaar a.msqid = args->arg1; 2015002a60fSMarcel Moolenaar a.msgsz = args->arg2; 2025002a60fSMarcel Moolenaar a.msgflg = args->arg3; 2035002a60fSMarcel Moolenaar if ((args->what >> 16) == 0) { 2045002a60fSMarcel Moolenaar struct l_ipc_kludge tmp; 2055002a60fSMarcel Moolenaar int error; 2065002a60fSMarcel Moolenaar 2075002a60fSMarcel Moolenaar if (args->ptr == NULL) 2085002a60fSMarcel Moolenaar return (EINVAL); 2094b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &tmp, sizeof(tmp)); 2105002a60fSMarcel Moolenaar if (error) 2115002a60fSMarcel Moolenaar return (error); 2125002a60fSMarcel Moolenaar a.msgp = tmp.msgp; 2135002a60fSMarcel Moolenaar a.msgtyp = tmp.msgtyp; 2145002a60fSMarcel Moolenaar } else { 2155002a60fSMarcel Moolenaar a.msgp = args->ptr; 2165002a60fSMarcel Moolenaar a.msgtyp = args->arg5; 2175002a60fSMarcel Moolenaar } 218b40ce416SJulian Elischer return (linux_msgrcv(td, &a)); 2195002a60fSMarcel Moolenaar } 2205002a60fSMarcel Moolenaar case LINUX_MSGGET: { 2215002a60fSMarcel Moolenaar struct linux_msgget_args a; 2225002a60fSMarcel Moolenaar 2235002a60fSMarcel Moolenaar a.key = args->arg1; 2245002a60fSMarcel Moolenaar a.msgflg = args->arg2; 225b40ce416SJulian Elischer return (linux_msgget(td, &a)); 2265002a60fSMarcel Moolenaar } 2275002a60fSMarcel Moolenaar case LINUX_MSGCTL: { 2285002a60fSMarcel Moolenaar struct linux_msgctl_args a; 2295002a60fSMarcel Moolenaar 2305002a60fSMarcel Moolenaar a.msqid = args->arg1; 2315002a60fSMarcel Moolenaar a.cmd = args->arg2; 2325002a60fSMarcel Moolenaar a.buf = args->ptr; 233b40ce416SJulian Elischer return (linux_msgctl(td, &a)); 2345002a60fSMarcel Moolenaar } 2355002a60fSMarcel Moolenaar case LINUX_SHMAT: { 2365002a60fSMarcel Moolenaar struct linux_shmat_args a; 2375002a60fSMarcel Moolenaar 2385002a60fSMarcel Moolenaar a.shmid = args->arg1; 2395002a60fSMarcel Moolenaar a.shmaddr = args->ptr; 2405002a60fSMarcel Moolenaar a.shmflg = args->arg2; 2415002a60fSMarcel Moolenaar a.raddr = (l_ulong *)args->arg3; 242b40ce416SJulian Elischer return (linux_shmat(td, &a)); 2435002a60fSMarcel Moolenaar } 2445002a60fSMarcel Moolenaar case LINUX_SHMDT: { 2455002a60fSMarcel Moolenaar struct linux_shmdt_args a; 2465002a60fSMarcel Moolenaar 2475002a60fSMarcel Moolenaar a.shmaddr = args->ptr; 248b40ce416SJulian Elischer return (linux_shmdt(td, &a)); 2495002a60fSMarcel Moolenaar } 2505002a60fSMarcel Moolenaar case LINUX_SHMGET: { 2515002a60fSMarcel Moolenaar struct linux_shmget_args a; 2525002a60fSMarcel Moolenaar 2535002a60fSMarcel Moolenaar a.key = args->arg1; 2545002a60fSMarcel Moolenaar a.size = args->arg2; 2555002a60fSMarcel Moolenaar a.shmflg = args->arg3; 256b40ce416SJulian Elischer return (linux_shmget(td, &a)); 2575002a60fSMarcel Moolenaar } 2585002a60fSMarcel Moolenaar case LINUX_SHMCTL: { 2595002a60fSMarcel Moolenaar struct linux_shmctl_args a; 2605002a60fSMarcel Moolenaar 2615002a60fSMarcel Moolenaar a.shmid = args->arg1; 2625002a60fSMarcel Moolenaar a.cmd = args->arg2; 2635002a60fSMarcel Moolenaar a.buf = args->ptr; 264b40ce416SJulian Elischer return (linux_shmctl(td, &a)); 2655002a60fSMarcel Moolenaar } 2665002a60fSMarcel Moolenaar default: 2675002a60fSMarcel Moolenaar break; 268146aad74SMarcel Moolenaar } 269146aad74SMarcel Moolenaar 2705002a60fSMarcel Moolenaar return (EINVAL); 271146aad74SMarcel Moolenaar } 272146aad74SMarcel Moolenaar 273146aad74SMarcel Moolenaar int 274b40ce416SJulian Elischer linux_old_select(struct thread *td, struct linux_old_select_args *args) 275146aad74SMarcel Moolenaar { 2765002a60fSMarcel Moolenaar struct l_old_select_argv linux_args; 2775002a60fSMarcel Moolenaar struct linux_select_args newsel; 278146aad74SMarcel Moolenaar int error; 279146aad74SMarcel Moolenaar 2805002a60fSMarcel Moolenaar #ifdef DEBUG 2815002a60fSMarcel Moolenaar if (ldebug(old_select)) 2826aea6777SPeter Wemm printf(ARGS(old_select, "%p"), args->ptr); 283146aad74SMarcel Moolenaar #endif 284146aad74SMarcel Moolenaar 2854b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &linux_args, sizeof(linux_args)); 286146aad74SMarcel Moolenaar if (error) 287146aad74SMarcel Moolenaar return (error); 288146aad74SMarcel Moolenaar 289146aad74SMarcel Moolenaar newsel.nfds = linux_args.nfds; 290146aad74SMarcel Moolenaar newsel.readfds = linux_args.readfds; 291146aad74SMarcel Moolenaar newsel.writefds = linux_args.writefds; 292146aad74SMarcel Moolenaar newsel.exceptfds = linux_args.exceptfds; 293146aad74SMarcel Moolenaar newsel.timeout = linux_args.timeout; 294b40ce416SJulian Elischer return (linux_select(td, &newsel)); 295146aad74SMarcel Moolenaar } 296146aad74SMarcel Moolenaar 297146aad74SMarcel Moolenaar int 298b40ce416SJulian Elischer linux_fork(struct thread *td, struct linux_fork_args *args) 299146aad74SMarcel Moolenaar { 300146aad74SMarcel Moolenaar int error; 301d071f504SAlexander Leidinger struct proc *p2; 302d071f504SAlexander Leidinger struct thread *td2; 303146aad74SMarcel Moolenaar 304146aad74SMarcel Moolenaar #ifdef DEBUG 30524593369SJonathan Lemon if (ldebug(fork)) 30624593369SJonathan Lemon printf(ARGS(fork, "")); 307146aad74SMarcel Moolenaar #endif 308146aad74SMarcel Moolenaar 309d071f504SAlexander Leidinger if ((error = fork1(td, RFFDG | RFPROC | RFSTOPPED, 0, &p2)) != 0) 310146aad74SMarcel Moolenaar return (error); 311146aad74SMarcel Moolenaar 312d071f504SAlexander Leidinger if (error == 0) { 313d071f504SAlexander Leidinger td->td_retval[0] = p2->p_pid; 314d071f504SAlexander Leidinger td->td_retval[1] = 0; 315d071f504SAlexander Leidinger } 316d071f504SAlexander Leidinger 317b40ce416SJulian Elischer if (td->td_retval[1] == 1) 318b40ce416SJulian Elischer td->td_retval[0] = 0; 3199b44bfc5SAlexander Leidinger error = linux_proc_init(td, td->td_retval[0], 0); 3209b44bfc5SAlexander Leidinger if (error) 3219b44bfc5SAlexander Leidinger return (error); 3229b44bfc5SAlexander Leidinger 323d071f504SAlexander Leidinger td2 = FIRST_THREAD_IN_PROC(p2); 324d071f504SAlexander Leidinger 325d071f504SAlexander Leidinger /* 326d071f504SAlexander Leidinger * Make this runnable after we are finished with it. 327d071f504SAlexander Leidinger */ 328d071f504SAlexander Leidinger mtx_lock_spin(&sched_lock); 329d071f504SAlexander Leidinger TD_SET_CAN_RUN(td2); 330f0393f06SJeff Roberson sched_add(td2, SRQ_BORING); 331d071f504SAlexander Leidinger mtx_unlock_spin(&sched_lock); 332d071f504SAlexander Leidinger 333146aad74SMarcel Moolenaar return (0); 334146aad74SMarcel Moolenaar } 335146aad74SMarcel Moolenaar 336146aad74SMarcel Moolenaar int 337b40ce416SJulian Elischer linux_vfork(struct thread *td, struct linux_vfork_args *args) 338146aad74SMarcel Moolenaar { 339146aad74SMarcel Moolenaar int error; 34040f734ddSAlexander Leidinger struct proc *p2; 341d071f504SAlexander Leidinger struct thread *td2; 342146aad74SMarcel Moolenaar 343146aad74SMarcel Moolenaar #ifdef DEBUG 34424593369SJonathan Lemon if (ldebug(vfork)) 34524593369SJonathan Lemon printf(ARGS(vfork, "")); 346146aad74SMarcel Moolenaar #endif 347146aad74SMarcel Moolenaar 34840f734ddSAlexander Leidinger /* exclude RFPPWAIT */ 349d071f504SAlexander Leidinger if ((error = fork1(td, RFFDG | RFPROC | RFMEM | RFSTOPPED, 0, &p2)) != 0) 350146aad74SMarcel Moolenaar return (error); 35140f734ddSAlexander Leidinger if (error == 0) { 35240f734ddSAlexander Leidinger td->td_retval[0] = p2->p_pid; 35340f734ddSAlexander Leidinger td->td_retval[1] = 0; 35440f734ddSAlexander Leidinger } 355146aad74SMarcel Moolenaar /* Are we the child? */ 356b40ce416SJulian Elischer if (td->td_retval[1] == 1) 357b40ce416SJulian Elischer td->td_retval[0] = 0; 3589b44bfc5SAlexander Leidinger error = linux_proc_init(td, td->td_retval[0], 0); 3599b44bfc5SAlexander Leidinger if (error) 3609b44bfc5SAlexander Leidinger return (error); 361d071f504SAlexander Leidinger 36240f734ddSAlexander Leidinger PROC_LOCK(p2); 363973ac082SAlexander Leidinger p2->p_flag |= P_PPWAIT; 364d071f504SAlexander Leidinger PROC_UNLOCK(p2); 365d071f504SAlexander Leidinger 366d071f504SAlexander Leidinger td2 = FIRST_THREAD_IN_PROC(p2); 367d071f504SAlexander Leidinger 368d071f504SAlexander Leidinger /* 369d071f504SAlexander Leidinger * Make this runnable after we are finished with it. 370d071f504SAlexander Leidinger */ 371d071f504SAlexander Leidinger mtx_lock_spin(&sched_lock); 372d071f504SAlexander Leidinger TD_SET_CAN_RUN(td2); 373f0393f06SJeff Roberson sched_add(td2, SRQ_BORING); 374d071f504SAlexander Leidinger mtx_unlock_spin(&sched_lock); 375d071f504SAlexander Leidinger 376d071f504SAlexander Leidinger /* wait for the children to exit, ie. emulate vfork */ 377d071f504SAlexander Leidinger PROC_LOCK(p2); 37840f734ddSAlexander Leidinger while (p2->p_flag & P_PPWAIT) 37940f734ddSAlexander Leidinger msleep(td->td_proc, &p2->p_mtx, PWAIT, "ppwait", 0); 38040f734ddSAlexander Leidinger PROC_UNLOCK(p2); 38140f734ddSAlexander Leidinger 382146aad74SMarcel Moolenaar return (0); 383146aad74SMarcel Moolenaar } 384146aad74SMarcel Moolenaar 385146aad74SMarcel Moolenaar int 386b40ce416SJulian Elischer linux_clone(struct thread *td, struct linux_clone_args *args) 387146aad74SMarcel Moolenaar { 3886ad0e7c5SJohn Baldwin int error, ff = RFPROC | RFSTOPPED; 389146aad74SMarcel Moolenaar struct proc *p2; 3909eb78fcfSJohn Baldwin struct thread *td2; 391146aad74SMarcel Moolenaar int exit_signal; 3929b44bfc5SAlexander Leidinger struct linux_emuldata *em; 393146aad74SMarcel Moolenaar 394146aad74SMarcel Moolenaar #ifdef DEBUG 39524593369SJonathan Lemon if (ldebug(clone)) { 3969b44bfc5SAlexander Leidinger printf(ARGS(clone, "flags %x, stack %x, parent tid: %x, child tid: %x"), 3979b44bfc5SAlexander Leidinger (unsigned int)args->flags, (unsigned int)args->stack, 3989b44bfc5SAlexander Leidinger (unsigned int)args->parent_tidptr, (unsigned int)args->child_tidptr); 39924593369SJonathan Lemon } 400146aad74SMarcel Moolenaar #endif 401146aad74SMarcel Moolenaar 402146aad74SMarcel Moolenaar exit_signal = args->flags & 0x000000ff; 4030f054958SAlexander Leidinger if (!LINUX_SIG_VALID(exit_signal) && exit_signal != 0) 404146aad74SMarcel Moolenaar return (EINVAL); 405146aad74SMarcel Moolenaar 406146aad74SMarcel Moolenaar if (exit_signal <= LINUX_SIGTBLSZ) 407146aad74SMarcel Moolenaar exit_signal = linux_to_bsd_signal[_SIG_IDX(exit_signal)]; 408146aad74SMarcel Moolenaar 409146aad74SMarcel Moolenaar if (args->flags & CLONE_VM) 410146aad74SMarcel Moolenaar ff |= RFMEM; 411146aad74SMarcel Moolenaar if (args->flags & CLONE_SIGHAND) 412146aad74SMarcel Moolenaar ff |= RFSIGSHARE; 4134b3583a3SAlexander Leidinger /* 4144b3583a3SAlexander Leidinger * XXX: in linux sharing of fs info (chroot/cwd/umask) 4154b3583a3SAlexander Leidinger * and open files is independant. in fbsd its in one 416802e08a3SAlexander Leidinger * structure but in reality it doesn't cause any problems 417802e08a3SAlexander Leidinger * because both of these flags are usually set together. 4184b3583a3SAlexander Leidinger */ 4194b3583a3SAlexander Leidinger if (!(args->flags & (CLONE_FILES | CLONE_FS))) 420146aad74SMarcel Moolenaar ff |= RFFDG; 421146aad74SMarcel Moolenaar 4224b178336SMaxim Sobolev /* 4234b178336SMaxim Sobolev * Attempt to detect when linux_clone(2) is used for creating 4244b178336SMaxim Sobolev * kernel threads. Unfortunately despite the existence of the 4254b178336SMaxim Sobolev * CLONE_THREAD flag, version of linuxthreads package used in 4264b178336SMaxim Sobolev * most popular distros as of beginning of 2005 doesn't make 427802e08a3SAlexander Leidinger * any use of it. Therefore, this detection relies on 4284b178336SMaxim Sobolev * empirical observation that linuxthreads sets certain 4294b178336SMaxim Sobolev * combination of flags, so that we can make more or less 4304b178336SMaxim Sobolev * precise detection and notify the FreeBSD kernel that several 4314b178336SMaxim Sobolev * processes are in fact part of the same threading group, so 4324b178336SMaxim Sobolev * that special treatment is necessary for signal delivery 4334b178336SMaxim Sobolev * between those processes and fd locking. 4344b178336SMaxim Sobolev */ 4354b178336SMaxim Sobolev if ((args->flags & 0xffffff00) == THREADING_FLAGS) 4364b178336SMaxim Sobolev ff |= RFTHREAD; 4374b178336SMaxim Sobolev 4381a26db0aSAlexander Leidinger if (args->flags & CLONE_PARENT_SETTID) 4391a26db0aSAlexander Leidinger if (args->parent_tidptr == NULL) 4401a26db0aSAlexander Leidinger return (EINVAL); 4411a26db0aSAlexander Leidinger 442316ec49aSScott Long error = fork1(td, ff, 0, &p2); 4439eb78fcfSJohn Baldwin if (error) 4449eb78fcfSJohn Baldwin return (error); 4459eb78fcfSJohn Baldwin 446a9ccaccfSKonstantin Belousov if (args->flags & (CLONE_PARENT|CLONE_THREAD)) { 447a9ccaccfSKonstantin Belousov sx_xlock(&proctree_lock); 448a9ccaccfSKonstantin Belousov PROC_LOCK(p2); 449a9ccaccfSKonstantin Belousov proc_reparent(p2, td->td_proc->p_pptr); 450a9ccaccfSKonstantin Belousov PROC_UNLOCK(p2); 451a9ccaccfSKonstantin Belousov sx_xunlock(&proctree_lock); 452a9ccaccfSKonstantin Belousov } 453a9ccaccfSKonstantin Belousov 4549b44bfc5SAlexander Leidinger /* create the emuldata */ 4559b44bfc5SAlexander Leidinger error = linux_proc_init(td, p2->p_pid, args->flags); 4569b44bfc5SAlexander Leidinger /* reference it - no need to check this */ 4571c65504cSAlexander Leidinger em = em_find(p2, EMUL_DOLOCK); 4589b44bfc5SAlexander Leidinger KASSERT(em != NULL, ("clone: emuldata not found.\n")); 4599b44bfc5SAlexander Leidinger /* and adjust it */ 4609b44bfc5SAlexander Leidinger 4619b44bfc5SAlexander Leidinger if (args->flags & CLONE_THREAD) { 4629b44bfc5SAlexander Leidinger /* XXX: linux mangles pgrp and pptr somehow 4639b44bfc5SAlexander Leidinger * I think it might be this but I am not sure. 4649b44bfc5SAlexander Leidinger */ 4659b44bfc5SAlexander Leidinger #ifdef notyet 466a6c5f813SAlexander Leidinger PROC_LOCK(p2); 4679b44bfc5SAlexander Leidinger p2->p_pgrp = td->td_proc->p_pgrp; 468a6c5f813SAlexander Leidinger PROC_UNLOCK(p2); 4699b44bfc5SAlexander Leidinger #endif 4709b44bfc5SAlexander Leidinger exit_signal = 0; 4719b44bfc5SAlexander Leidinger } 4729b44bfc5SAlexander Leidinger 4739b44bfc5SAlexander Leidinger if (args->flags & CLONE_CHILD_SETTID) 4749b44bfc5SAlexander Leidinger em->child_set_tid = args->child_tidptr; 4759b44bfc5SAlexander Leidinger else 4769b44bfc5SAlexander Leidinger em->child_set_tid = NULL; 4779b44bfc5SAlexander Leidinger 4789b44bfc5SAlexander Leidinger if (args->flags & CLONE_CHILD_CLEARTID) 4799b44bfc5SAlexander Leidinger em->child_clear_tid = args->child_tidptr; 4809b44bfc5SAlexander Leidinger else 4819b44bfc5SAlexander Leidinger em->child_clear_tid = NULL; 482a6c5f813SAlexander Leidinger 4839b44bfc5SAlexander Leidinger EMUL_UNLOCK(&emul_lock); 484146aad74SMarcel Moolenaar 4851a26db0aSAlexander Leidinger if (args->flags & CLONE_PARENT_SETTID) { 4861a26db0aSAlexander Leidinger error = copyout(&p2->p_pid, args->parent_tidptr, sizeof(p2->p_pid)); 4871a26db0aSAlexander Leidinger if (error) 4881a26db0aSAlexander Leidinger printf(LMSG("copyout failed!")); 4891a26db0aSAlexander Leidinger } 4901a26db0aSAlexander Leidinger 491fdfdfb78SJohn Baldwin PROC_LOCK(p2); 492146aad74SMarcel Moolenaar p2->p_sigparent = exit_signal; 4939eb78fcfSJohn Baldwin PROC_UNLOCK(p2); 4949eb78fcfSJohn Baldwin td2 = FIRST_THREAD_IN_PROC(p2); 4950eef2f8aSAlexander Leidinger /* 4960eef2f8aSAlexander Leidinger * in a case of stack = NULL we are supposed to COW calling process stack 4979b44bfc5SAlexander Leidinger * this is what normal fork() does so we just keep the tf_esp arg intact 4989b44bfc5SAlexander Leidinger */ 4999b44bfc5SAlexander Leidinger if (args->stack) 5009eb78fcfSJohn Baldwin td2->td_frame->tf_esp = (unsigned int)args->stack; 501146aad74SMarcel Moolenaar 5029b44bfc5SAlexander Leidinger if (args->flags & CLONE_SETTLS) { 5039b44bfc5SAlexander Leidinger struct l_user_desc info; 5049b44bfc5SAlexander Leidinger int idx; 5059b44bfc5SAlexander Leidinger int a[2]; 5069b44bfc5SAlexander Leidinger struct segment_descriptor sd; 5079b44bfc5SAlexander Leidinger 5089b44bfc5SAlexander Leidinger error = copyin((void *)td->td_frame->tf_esi, &info, sizeof(struct l_user_desc)); 5091a26db0aSAlexander Leidinger if (error) { 5101a26db0aSAlexander Leidinger printf(LMSG("copyin failed!")); 5111a26db0aSAlexander Leidinger } else { 5129b44bfc5SAlexander Leidinger 5139b44bfc5SAlexander Leidinger idx = info.entry_number; 5149b44bfc5SAlexander Leidinger 5150eef2f8aSAlexander Leidinger /* 5160eef2f8aSAlexander Leidinger * looks like we're getting the idx we returned 5179b44bfc5SAlexander Leidinger * in the set_thread_area() syscall 5189b44bfc5SAlexander Leidinger */ 5191a26db0aSAlexander Leidinger if (idx != 6 && idx != 3) { 5201a26db0aSAlexander Leidinger printf(LMSG("resetting idx!")); 5211a26db0aSAlexander Leidinger idx = 3; 5221a26db0aSAlexander Leidinger } 5239b44bfc5SAlexander Leidinger 5249b44bfc5SAlexander Leidinger /* this doesnt happen in practice */ 5259b44bfc5SAlexander Leidinger if (idx == 6) { 5269b44bfc5SAlexander Leidinger /* we might copy out the entry_number as 3 */ 5279b44bfc5SAlexander Leidinger info.entry_number = 3; 5289b44bfc5SAlexander Leidinger error = copyout(&info, (void *) td->td_frame->tf_esi, sizeof(struct l_user_desc)); 5299b44bfc5SAlexander Leidinger if (error) 5301a26db0aSAlexander Leidinger printf(LMSG("copyout failed!")); 5319b44bfc5SAlexander Leidinger } 5329b44bfc5SAlexander Leidinger 5339b44bfc5SAlexander Leidinger a[0] = LDT_entry_a(&info); 5349b44bfc5SAlexander Leidinger a[1] = LDT_entry_b(&info); 5359b44bfc5SAlexander Leidinger 5369b44bfc5SAlexander Leidinger memcpy(&sd, &a, sizeof(a)); 5379b44bfc5SAlexander Leidinger #ifdef DEBUG 5389b44bfc5SAlexander Leidinger if (ldebug(clone)) 5399b44bfc5SAlexander Leidinger printf("Segment created in clone with CLONE_SETTLS: lobase: %x, hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, def32: %i, gran: %i\n", sd.sd_lobase, 5409b44bfc5SAlexander Leidinger sd.sd_hibase, 5419b44bfc5SAlexander Leidinger sd.sd_lolimit, 5429b44bfc5SAlexander Leidinger sd.sd_hilimit, 5439b44bfc5SAlexander Leidinger sd.sd_type, 5449b44bfc5SAlexander Leidinger sd.sd_dpl, 5459b44bfc5SAlexander Leidinger sd.sd_p, 5469b44bfc5SAlexander Leidinger sd.sd_xx, 5479b44bfc5SAlexander Leidinger sd.sd_def32, 5489b44bfc5SAlexander Leidinger sd.sd_gran); 5499b44bfc5SAlexander Leidinger #endif 5509b44bfc5SAlexander Leidinger 5519b44bfc5SAlexander Leidinger /* set %gs */ 5529b44bfc5SAlexander Leidinger td2->td_pcb->pcb_gsd = sd; 553a6c5f813SAlexander Leidinger td2->td_pcb->pcb_gs = GSEL(GUGS_SEL, SEL_UPL); 5549b44bfc5SAlexander Leidinger } 5551a26db0aSAlexander Leidinger } 5569b44bfc5SAlexander Leidinger 557146aad74SMarcel Moolenaar #ifdef DEBUG 55824593369SJonathan Lemon if (ldebug(clone)) 5599eb78fcfSJohn Baldwin printf(LMSG("clone: successful rfork to %ld, stack %p sig = %d"), 5609eb78fcfSJohn Baldwin (long)p2->p_pid, args->stack, exit_signal); 561146aad74SMarcel Moolenaar #endif 562d071f504SAlexander Leidinger if (args->flags & CLONE_VFORK) { 563d071f504SAlexander Leidinger PROC_LOCK(p2); 564d071f504SAlexander Leidinger p2->p_flag |= P_PPWAIT; 565d071f504SAlexander Leidinger PROC_UNLOCK(p2); 566d071f504SAlexander Leidinger } 567146aad74SMarcel Moolenaar 5686ad0e7c5SJohn Baldwin /* 5696ad0e7c5SJohn Baldwin * Make this runnable after we are finished with it. 5706ad0e7c5SJohn Baldwin */ 5716ad0e7c5SJohn Baldwin mtx_lock_spin(&sched_lock); 5729eb78fcfSJohn Baldwin TD_SET_CAN_RUN(td2); 573f0393f06SJeff Roberson sched_add(td2, SRQ_BORING); 5746ad0e7c5SJohn Baldwin mtx_unlock_spin(&sched_lock); 5756ad0e7c5SJohn Baldwin 5769eb78fcfSJohn Baldwin td->td_retval[0] = p2->p_pid; 5779eb78fcfSJohn Baldwin td->td_retval[1] = 0; 5780a62e035SAlexander Leidinger 5790a62e035SAlexander Leidinger if (args->flags & CLONE_VFORK) { 5800a62e035SAlexander Leidinger /* wait for the children to exit, ie. emulate vfork */ 5810a62e035SAlexander Leidinger PROC_LOCK(p2); 5820a62e035SAlexander Leidinger while (p2->p_flag & P_PPWAIT) 5830a62e035SAlexander Leidinger msleep(td->td_proc, &p2->p_mtx, PWAIT, "ppwait", 0); 5840a62e035SAlexander Leidinger PROC_UNLOCK(p2); 5850a62e035SAlexander Leidinger } 5860a62e035SAlexander Leidinger 5879eb78fcfSJohn Baldwin return (0); 588146aad74SMarcel Moolenaar } 589146aad74SMarcel Moolenaar 590146aad74SMarcel Moolenaar #define STACK_SIZE (2 * 1024 * 1024) 591146aad74SMarcel Moolenaar #define GUARD_SIZE (4 * PAGE_SIZE) 592146aad74SMarcel Moolenaar 5933ad9c842SMaxim Sobolev static int linux_mmap_common(struct thread *, struct l_mmap_argv *); 5943ad9c842SMaxim Sobolev 5953ad9c842SMaxim Sobolev int 5963ad9c842SMaxim Sobolev linux_mmap2(struct thread *td, struct linux_mmap2_args *args) 5973ad9c842SMaxim Sobolev { 5983ad9c842SMaxim Sobolev struct l_mmap_argv linux_args; 5993ad9c842SMaxim Sobolev 6003ad9c842SMaxim Sobolev #ifdef DEBUG 6013ad9c842SMaxim Sobolev if (ldebug(mmap2)) 6023ad9c842SMaxim Sobolev printf(ARGS(mmap2, "%p, %d, %d, 0x%08x, %d, %d"), 6033ad9c842SMaxim Sobolev (void *)args->addr, args->len, args->prot, 6043ad9c842SMaxim Sobolev args->flags, args->fd, args->pgoff); 6053ad9c842SMaxim Sobolev #endif 6063ad9c842SMaxim Sobolev 60710931a46SJung-uk Kim linux_args.addr = args->addr; 6083ad9c842SMaxim Sobolev linux_args.len = args->len; 6093ad9c842SMaxim Sobolev linux_args.prot = args->prot; 6103ad9c842SMaxim Sobolev linux_args.flags = args->flags; 6113ad9c842SMaxim Sobolev linux_args.fd = args->fd; 61210931a46SJung-uk Kim linux_args.pgoff = args->pgoff * PAGE_SIZE; 6133ad9c842SMaxim Sobolev 6143ad9c842SMaxim Sobolev return (linux_mmap_common(td, &linux_args)); 6153ad9c842SMaxim Sobolev } 6163ad9c842SMaxim Sobolev 617146aad74SMarcel Moolenaar int 618b40ce416SJulian Elischer linux_mmap(struct thread *td, struct linux_mmap_args *args) 619146aad74SMarcel Moolenaar { 6203ad9c842SMaxim Sobolev int error; 6213ad9c842SMaxim Sobolev struct l_mmap_argv linux_args; 6223ad9c842SMaxim Sobolev 6234b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &linux_args, sizeof(linux_args)); 6243ad9c842SMaxim Sobolev if (error) 6253ad9c842SMaxim Sobolev return (error); 6263ad9c842SMaxim Sobolev 6273ad9c842SMaxim Sobolev #ifdef DEBUG 6283ad9c842SMaxim Sobolev if (ldebug(mmap)) 6293ad9c842SMaxim Sobolev printf(ARGS(mmap, "%p, %d, %d, 0x%08x, %d, %d"), 630b45bbfc3SBruce Evans (void *)linux_args.addr, linux_args.len, linux_args.prot, 63110931a46SJung-uk Kim linux_args.flags, linux_args.fd, linux_args.pgoff); 6323ad9c842SMaxim Sobolev #endif 6333ad9c842SMaxim Sobolev 6343ad9c842SMaxim Sobolev return (linux_mmap_common(td, &linux_args)); 6353ad9c842SMaxim Sobolev } 6363ad9c842SMaxim Sobolev 6373ad9c842SMaxim Sobolev static int 6383ad9c842SMaxim Sobolev linux_mmap_common(struct thread *td, struct l_mmap_argv *linux_args) 6393ad9c842SMaxim Sobolev { 640b40ce416SJulian Elischer struct proc *p = td->td_proc; 641146aad74SMarcel Moolenaar struct mmap_args /* { 642146aad74SMarcel Moolenaar caddr_t addr; 643146aad74SMarcel Moolenaar size_t len; 644146aad74SMarcel Moolenaar int prot; 645146aad74SMarcel Moolenaar int flags; 646146aad74SMarcel Moolenaar int fd; 647146aad74SMarcel Moolenaar long pad; 648146aad74SMarcel Moolenaar off_t pos; 649146aad74SMarcel Moolenaar } */ bsd_args; 65091d631e5SMatthew N. Dodd int error; 651a312f6a3SAlexander Leidinger struct file *fp; 652146aad74SMarcel Moolenaar 65391d631e5SMatthew N. Dodd error = 0; 654146aad74SMarcel Moolenaar bsd_args.flags = 0; 655a312f6a3SAlexander Leidinger fp = NULL; 656a312f6a3SAlexander Leidinger 657a312f6a3SAlexander Leidinger /* 658a312f6a3SAlexander Leidinger * Linux mmap(2): 659a312f6a3SAlexander Leidinger * You must specify exactly one of MAP_SHARED and MAP_PRIVATE 660a312f6a3SAlexander Leidinger */ 661a312f6a3SAlexander Leidinger if (! ((linux_args->flags & LINUX_MAP_SHARED) ^ 662a312f6a3SAlexander Leidinger (linux_args->flags & LINUX_MAP_PRIVATE))) 6636dc4e810SAlexander Leidinger return (EINVAL); 664a312f6a3SAlexander Leidinger 6653ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_SHARED) 666146aad74SMarcel Moolenaar bsd_args.flags |= MAP_SHARED; 6673ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_PRIVATE) 668146aad74SMarcel Moolenaar bsd_args.flags |= MAP_PRIVATE; 6693ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_FIXED) 670146aad74SMarcel Moolenaar bsd_args.flags |= MAP_FIXED; 6713ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_ANON) 672146aad74SMarcel Moolenaar bsd_args.flags |= MAP_ANON; 6730cc3ac8bSMatthew Dillon else 6740cc3ac8bSMatthew Dillon bsd_args.flags |= MAP_NOSYNC; 67510931a46SJung-uk Kim if (linux_args->flags & LINUX_MAP_GROWSDOWN) 676146aad74SMarcel Moolenaar bsd_args.flags |= MAP_STACK; 677146aad74SMarcel Moolenaar 6780eef2f8aSAlexander Leidinger /* 67910931a46SJung-uk Kim * PROT_READ, PROT_WRITE, or PROT_EXEC implies PROT_READ and PROT_EXEC 68010931a46SJung-uk Kim * on Linux/i386. We do this to ensure maximum compatibility. 68110931a46SJung-uk Kim * Linux/ia64 does the same in i386 emulation mode. 68210931a46SJung-uk Kim */ 68310931a46SJung-uk Kim bsd_args.prot = linux_args->prot; 68410931a46SJung-uk Kim if (bsd_args.prot & (PROT_READ | PROT_WRITE | PROT_EXEC)) 68510931a46SJung-uk Kim bsd_args.prot |= PROT_READ | PROT_EXEC; 68610931a46SJung-uk Kim 68710931a46SJung-uk Kim if (linux_args->fd != -1) { 68810931a46SJung-uk Kim /* 68910931a46SJung-uk Kim * Linux follows Solaris mmap(2) description: 69010931a46SJung-uk Kim * The file descriptor fildes is opened with 69110931a46SJung-uk Kim * read permission, regardless of the 69210931a46SJung-uk Kim * protection options specified. 69310931a46SJung-uk Kim */ 69410931a46SJung-uk Kim 69510931a46SJung-uk Kim if ((error = fget(td, linux_args->fd, &fp)) != 0) 69610931a46SJung-uk Kim return (error); 69710931a46SJung-uk Kim if (fp->f_type != DTYPE_VNODE) { 69810931a46SJung-uk Kim fdrop(fp, td); 69910931a46SJung-uk Kim return (EINVAL); 70010931a46SJung-uk Kim } 70110931a46SJung-uk Kim 70210931a46SJung-uk Kim /* Linux mmap() just fails for O_WRONLY files */ 70310931a46SJung-uk Kim if (!(fp->f_flag & FREAD)) { 70410931a46SJung-uk Kim fdrop(fp, td); 70510931a46SJung-uk Kim return (EACCES); 70610931a46SJung-uk Kim } 70710931a46SJung-uk Kim 70810931a46SJung-uk Kim fdrop(fp, td); 70910931a46SJung-uk Kim } 71010931a46SJung-uk Kim bsd_args.fd = linux_args->fd; 71110931a46SJung-uk Kim 71210931a46SJung-uk Kim if (linux_args->flags & LINUX_MAP_GROWSDOWN) { 71310931a46SJung-uk Kim /* 7140eef2f8aSAlexander Leidinger * The linux MAP_GROWSDOWN option does not limit auto 715146aad74SMarcel Moolenaar * growth of the region. Linux mmap with this option 716146aad74SMarcel Moolenaar * takes as addr the inital BOS, and as len, the initial 717146aad74SMarcel Moolenaar * region size. It can then grow down from addr without 718146aad74SMarcel Moolenaar * limit. However, linux threads has an implicit internal 719146aad74SMarcel Moolenaar * limit to stack size of STACK_SIZE. Its just not 720146aad74SMarcel Moolenaar * enforced explicitly in linux. But, here we impose 721146aad74SMarcel Moolenaar * a limit of (STACK_SIZE - GUARD_SIZE) on the stack 722146aad74SMarcel Moolenaar * region, since we can do this with our mmap. 723146aad74SMarcel Moolenaar * 724146aad74SMarcel Moolenaar * Our mmap with MAP_STACK takes addr as the maximum 725146aad74SMarcel Moolenaar * downsize limit on BOS, and as len the max size of 726146aad74SMarcel Moolenaar * the region. It them maps the top SGROWSIZ bytes, 727802e08a3SAlexander Leidinger * and auto grows the region down, up to the limit 728146aad74SMarcel Moolenaar * in addr. 729146aad74SMarcel Moolenaar * 730146aad74SMarcel Moolenaar * If we don't use the MAP_STACK option, the effect 731146aad74SMarcel Moolenaar * of this code is to allocate a stack region of a 732146aad74SMarcel Moolenaar * fixed size of (STACK_SIZE - GUARD_SIZE). 733146aad74SMarcel Moolenaar */ 734146aad74SMarcel Moolenaar 73510931a46SJung-uk Kim if ((caddr_t)PTRIN(linux_args->addr) + linux_args->len > 73610931a46SJung-uk Kim p->p_vmspace->vm_maxsaddr) { 7370eef2f8aSAlexander Leidinger /* 7380eef2f8aSAlexander Leidinger * Some linux apps will attempt to mmap 739242fae60SAndrew Gallatin * thread stacks near the top of their 740242fae60SAndrew Gallatin * address space. If their TOS is greater 741242fae60SAndrew Gallatin * than vm_maxsaddr, vm_map_growstack() 742242fae60SAndrew Gallatin * will confuse the thread stack with the 743242fae60SAndrew Gallatin * process stack and deliver a SEGV if they 744242fae60SAndrew Gallatin * attempt to grow the thread stack past their 745242fae60SAndrew Gallatin * current stacksize rlimit. To avoid this, 746242fae60SAndrew Gallatin * adjust vm_maxsaddr upwards to reflect 747242fae60SAndrew Gallatin * the current stacksize rlimit rather 748242fae60SAndrew Gallatin * than the maximum possible stacksize. 749242fae60SAndrew Gallatin * It would be better to adjust the 750242fae60SAndrew Gallatin * mmap'ed region, but some apps do not check 751242fae60SAndrew Gallatin * mmap's return value. 752242fae60SAndrew Gallatin */ 75391d5354aSJohn Baldwin PROC_LOCK(p); 754242fae60SAndrew Gallatin p->p_vmspace->vm_maxsaddr = (char *)USRSTACK - 75591d5354aSJohn Baldwin lim_cur(p, RLIMIT_STACK); 75691d5354aSJohn Baldwin PROC_UNLOCK(p); 757242fae60SAndrew Gallatin } 758242fae60SAndrew Gallatin 759146aad74SMarcel Moolenaar /* This gives us our maximum stack size */ 7603ad9c842SMaxim Sobolev if (linux_args->len > STACK_SIZE - GUARD_SIZE) 7613ad9c842SMaxim Sobolev bsd_args.len = linux_args->len; 762146aad74SMarcel Moolenaar else 763146aad74SMarcel Moolenaar bsd_args.len = STACK_SIZE - GUARD_SIZE; 764146aad74SMarcel Moolenaar 7650eef2f8aSAlexander Leidinger /* 7660eef2f8aSAlexander Leidinger * This gives us a new BOS. If we're using VM_STACK, then 767146aad74SMarcel Moolenaar * mmap will just map the top SGROWSIZ bytes, and let 768146aad74SMarcel Moolenaar * the stack grow down to the limit at BOS. If we're 769146aad74SMarcel Moolenaar * not using VM_STACK we map the full stack, since we 770146aad74SMarcel Moolenaar * don't have a way to autogrow it. 771146aad74SMarcel Moolenaar */ 77210931a46SJung-uk Kim bsd_args.addr = (caddr_t)PTRIN(linux_args->addr) - 77310931a46SJung-uk Kim bsd_args.len; 774146aad74SMarcel Moolenaar } else { 77510931a46SJung-uk Kim bsd_args.addr = (caddr_t)PTRIN(linux_args->addr); 7763ad9c842SMaxim Sobolev bsd_args.len = linux_args->len; 777146aad74SMarcel Moolenaar } 77810931a46SJung-uk Kim bsd_args.pos = linux_args->pgoff; 779146aad74SMarcel Moolenaar bsd_args.pad = 0; 780146aad74SMarcel Moolenaar 781146aad74SMarcel Moolenaar #ifdef DEBUG 78224593369SJonathan Lemon if (ldebug(mmap)) 78391d631e5SMatthew N. Dodd printf("-> %s(%p, %d, %d, 0x%08x, %d, 0x%x)\n", 78491d631e5SMatthew N. Dodd __func__, 78524593369SJonathan Lemon (void *)bsd_args.addr, bsd_args.len, bsd_args.prot, 78624593369SJonathan Lemon bsd_args.flags, bsd_args.fd, (int)bsd_args.pos); 787146aad74SMarcel Moolenaar #endif 78891d631e5SMatthew N. Dodd error = mmap(td, &bsd_args); 78991d631e5SMatthew N. Dodd #ifdef DEBUG 79091d631e5SMatthew N. Dodd if (ldebug(mmap)) 79191d631e5SMatthew N. Dodd printf("-> %s() return: 0x%x (0x%08x)\n", 79291d631e5SMatthew N. Dodd __func__, error, (u_int)td->td_retval[0]); 79391d631e5SMatthew N. Dodd #endif 79491d631e5SMatthew N. Dodd return (error); 795146aad74SMarcel Moolenaar } 796146aad74SMarcel Moolenaar 797146aad74SMarcel Moolenaar int 79810931a46SJung-uk Kim linux_mprotect(struct thread *td, struct linux_mprotect_args *uap) 79910931a46SJung-uk Kim { 80010931a46SJung-uk Kim struct mprotect_args bsd_args; 80110931a46SJung-uk Kim 80210931a46SJung-uk Kim bsd_args.addr = uap->addr; 80310931a46SJung-uk Kim bsd_args.len = uap->len; 80410931a46SJung-uk Kim bsd_args.prot = uap->prot; 80510931a46SJung-uk Kim if (bsd_args.prot & (PROT_READ | PROT_WRITE | PROT_EXEC)) 80610931a46SJung-uk Kim bsd_args.prot |= PROT_READ | PROT_EXEC; 80710931a46SJung-uk Kim return (mprotect(td, &bsd_args)); 80810931a46SJung-uk Kim } 80910931a46SJung-uk Kim 81010931a46SJung-uk Kim int 811b40ce416SJulian Elischer linux_pipe(struct thread *td, struct linux_pipe_args *args) 812146aad74SMarcel Moolenaar { 813146aad74SMarcel Moolenaar int error; 814146aad74SMarcel Moolenaar int reg_edx; 815146aad74SMarcel Moolenaar 816146aad74SMarcel Moolenaar #ifdef DEBUG 81724593369SJonathan Lemon if (ldebug(pipe)) 81824593369SJonathan Lemon printf(ARGS(pipe, "*")); 819146aad74SMarcel Moolenaar #endif 820146aad74SMarcel Moolenaar 821b40ce416SJulian Elischer reg_edx = td->td_retval[1]; 822b40ce416SJulian Elischer error = pipe(td, 0); 823146aad74SMarcel Moolenaar if (error) { 824b40ce416SJulian Elischer td->td_retval[1] = reg_edx; 825146aad74SMarcel Moolenaar return (error); 826146aad74SMarcel Moolenaar } 827146aad74SMarcel Moolenaar 828b40ce416SJulian Elischer error = copyout(td->td_retval, args->pipefds, 2*sizeof(int)); 829146aad74SMarcel Moolenaar if (error) { 830b40ce416SJulian Elischer td->td_retval[1] = reg_edx; 831146aad74SMarcel Moolenaar return (error); 832146aad74SMarcel Moolenaar } 833146aad74SMarcel Moolenaar 834b40ce416SJulian Elischer td->td_retval[1] = reg_edx; 835b40ce416SJulian Elischer td->td_retval[0] = 0; 836146aad74SMarcel Moolenaar return (0); 837146aad74SMarcel Moolenaar } 838146aad74SMarcel Moolenaar 839146aad74SMarcel Moolenaar int 840b40ce416SJulian Elischer linux_ioperm(struct thread *td, struct linux_ioperm_args *args) 841146aad74SMarcel Moolenaar { 84284569dffSMaxim Sobolev int error; 84384569dffSMaxim Sobolev struct i386_ioperm_args iia; 844146aad74SMarcel Moolenaar 84584569dffSMaxim Sobolev iia.start = args->start; 84684569dffSMaxim Sobolev iia.length = args->length; 84784569dffSMaxim Sobolev iia.enable = args->enable; 84884569dffSMaxim Sobolev mtx_lock(&Giant); 84984569dffSMaxim Sobolev error = i386_set_ioperm(td, &iia); 85084569dffSMaxim Sobolev mtx_unlock(&Giant); 85184569dffSMaxim Sobolev return (error); 852146aad74SMarcel Moolenaar } 853146aad74SMarcel Moolenaar 854146aad74SMarcel Moolenaar int 855b40ce416SJulian Elischer linux_iopl(struct thread *td, struct linux_iopl_args *args) 856146aad74SMarcel Moolenaar { 857146aad74SMarcel Moolenaar int error; 858146aad74SMarcel Moolenaar 859146aad74SMarcel Moolenaar if (args->level < 0 || args->level > 3) 860146aad74SMarcel Moolenaar return (EINVAL); 861acd3428bSRobert Watson if ((error = priv_check(td, PRIV_IO)) != 0) 862146aad74SMarcel Moolenaar return (error); 863a854ed98SJohn Baldwin if ((error = securelevel_gt(td->td_ucred, 0)) != 0) 86441c42188SRobert Watson return (error); 865b40ce416SJulian Elischer td->td_frame->tf_eflags = (td->td_frame->tf_eflags & ~PSL_IOPL) | 866146aad74SMarcel Moolenaar (args->level * (PSL_IOPL / 3)); 867146aad74SMarcel Moolenaar return (0); 868146aad74SMarcel Moolenaar } 869146aad74SMarcel Moolenaar 870146aad74SMarcel Moolenaar int 871b07cd97eSMark Murray linux_modify_ldt(struct thread *td, struct linux_modify_ldt_args *uap) 872146aad74SMarcel Moolenaar { 873146aad74SMarcel Moolenaar int error; 87484569dffSMaxim Sobolev struct i386_ldt_args ldt; 8755002a60fSMarcel Moolenaar struct l_descriptor ld; 87684569dffSMaxim Sobolev union descriptor desc; 877146aad74SMarcel Moolenaar 878146aad74SMarcel Moolenaar if (uap->ptr == NULL) 879146aad74SMarcel Moolenaar return (EINVAL); 880146aad74SMarcel Moolenaar 881146aad74SMarcel Moolenaar switch (uap->func) { 882146aad74SMarcel Moolenaar case 0x00: /* read_ldt */ 88384569dffSMaxim Sobolev ldt.start = 0; 88484569dffSMaxim Sobolev ldt.descs = uap->ptr; 88584569dffSMaxim Sobolev ldt.num = uap->bytecount / sizeof(union descriptor); 88684569dffSMaxim Sobolev mtx_lock(&Giant); 88784569dffSMaxim Sobolev error = i386_get_ldt(td, &ldt); 888b40ce416SJulian Elischer td->td_retval[0] *= sizeof(union descriptor); 88984569dffSMaxim Sobolev mtx_unlock(&Giant); 890146aad74SMarcel Moolenaar break; 891146aad74SMarcel Moolenaar case 0x01: /* write_ldt */ 892146aad74SMarcel Moolenaar case 0x11: /* write_ldt */ 893146aad74SMarcel Moolenaar if (uap->bytecount != sizeof(ld)) 894146aad74SMarcel Moolenaar return (EINVAL); 895146aad74SMarcel Moolenaar 896146aad74SMarcel Moolenaar error = copyin(uap->ptr, &ld, sizeof(ld)); 897146aad74SMarcel Moolenaar if (error) 898146aad74SMarcel Moolenaar return (error); 899146aad74SMarcel Moolenaar 90084569dffSMaxim Sobolev ldt.start = ld.entry_number; 90184569dffSMaxim Sobolev ldt.descs = &desc; 90284569dffSMaxim Sobolev ldt.num = 1; 90384569dffSMaxim Sobolev desc.sd.sd_lolimit = (ld.limit & 0x0000ffff); 90484569dffSMaxim Sobolev desc.sd.sd_hilimit = (ld.limit & 0x000f0000) >> 16; 90584569dffSMaxim Sobolev desc.sd.sd_lobase = (ld.base_addr & 0x00ffffff); 90684569dffSMaxim Sobolev desc.sd.sd_hibase = (ld.base_addr & 0xff000000) >> 24; 90784569dffSMaxim Sobolev desc.sd.sd_type = SDT_MEMRO | ((ld.read_exec_only ^ 1) << 1) | 908146aad74SMarcel Moolenaar (ld.contents << 2); 90984569dffSMaxim Sobolev desc.sd.sd_dpl = 3; 91084569dffSMaxim Sobolev desc.sd.sd_p = (ld.seg_not_present ^ 1); 91184569dffSMaxim Sobolev desc.sd.sd_xx = 0; 91284569dffSMaxim Sobolev desc.sd.sd_def32 = ld.seg_32bit; 91384569dffSMaxim Sobolev desc.sd.sd_gran = ld.limit_in_pages; 91484569dffSMaxim Sobolev mtx_lock(&Giant); 91584569dffSMaxim Sobolev error = i386_set_ldt(td, &ldt, &desc); 91684569dffSMaxim Sobolev mtx_unlock(&Giant); 917146aad74SMarcel Moolenaar break; 918146aad74SMarcel Moolenaar default: 919146aad74SMarcel Moolenaar error = EINVAL; 920146aad74SMarcel Moolenaar break; 921146aad74SMarcel Moolenaar } 922146aad74SMarcel Moolenaar 923146aad74SMarcel Moolenaar if (error == EOPNOTSUPP) { 924146aad74SMarcel Moolenaar printf("linux: modify_ldt needs kernel option USER_LDT\n"); 925146aad74SMarcel Moolenaar error = ENOSYS; 926146aad74SMarcel Moolenaar } 927146aad74SMarcel Moolenaar 928146aad74SMarcel Moolenaar return (error); 929146aad74SMarcel Moolenaar } 930146aad74SMarcel Moolenaar 931146aad74SMarcel Moolenaar int 932b40ce416SJulian Elischer linux_sigaction(struct thread *td, struct linux_sigaction_args *args) 933146aad74SMarcel Moolenaar { 9345002a60fSMarcel Moolenaar l_osigaction_t osa; 9355002a60fSMarcel Moolenaar l_sigaction_t act, oact; 936146aad74SMarcel Moolenaar int error; 937146aad74SMarcel Moolenaar 938146aad74SMarcel Moolenaar #ifdef DEBUG 93924593369SJonathan Lemon if (ldebug(sigaction)) 94024593369SJonathan Lemon printf(ARGS(sigaction, "%d, %p, %p"), 941146aad74SMarcel Moolenaar args->sig, (void *)args->nsa, (void *)args->osa); 942146aad74SMarcel Moolenaar #endif 943146aad74SMarcel Moolenaar 944146aad74SMarcel Moolenaar if (args->nsa != NULL) { 9454b7ef73dSDag-Erling Smørgrav error = copyin(args->nsa, &osa, sizeof(l_osigaction_t)); 946146aad74SMarcel Moolenaar if (error) 947146aad74SMarcel Moolenaar return (error); 948146aad74SMarcel Moolenaar act.lsa_handler = osa.lsa_handler; 949146aad74SMarcel Moolenaar act.lsa_flags = osa.lsa_flags; 950146aad74SMarcel Moolenaar act.lsa_restorer = osa.lsa_restorer; 951146aad74SMarcel Moolenaar LINUX_SIGEMPTYSET(act.lsa_mask); 952146aad74SMarcel Moolenaar act.lsa_mask.__bits[0] = osa.lsa_mask; 953146aad74SMarcel Moolenaar } 954146aad74SMarcel Moolenaar 955b40ce416SJulian Elischer error = linux_do_sigaction(td, args->sig, args->nsa ? &act : NULL, 956146aad74SMarcel Moolenaar args->osa ? &oact : NULL); 957146aad74SMarcel Moolenaar 958146aad74SMarcel Moolenaar if (args->osa != NULL && !error) { 959146aad74SMarcel Moolenaar osa.lsa_handler = oact.lsa_handler; 960146aad74SMarcel Moolenaar osa.lsa_flags = oact.lsa_flags; 961146aad74SMarcel Moolenaar osa.lsa_restorer = oact.lsa_restorer; 962146aad74SMarcel Moolenaar osa.lsa_mask = oact.lsa_mask.__bits[0]; 9634b7ef73dSDag-Erling Smørgrav error = copyout(&osa, args->osa, sizeof(l_osigaction_t)); 964146aad74SMarcel Moolenaar } 965146aad74SMarcel Moolenaar 966146aad74SMarcel Moolenaar return (error); 967146aad74SMarcel Moolenaar } 968146aad74SMarcel Moolenaar 969146aad74SMarcel Moolenaar /* 970146aad74SMarcel Moolenaar * Linux has two extra args, restart and oldmask. We dont use these, 971146aad74SMarcel Moolenaar * but it seems that "restart" is actually a context pointer that 972146aad74SMarcel Moolenaar * enables the signal to happen with a different register set. 973146aad74SMarcel Moolenaar */ 974146aad74SMarcel Moolenaar int 975b40ce416SJulian Elischer linux_sigsuspend(struct thread *td, struct linux_sigsuspend_args *args) 976146aad74SMarcel Moolenaar { 977206a5d3aSIan Dowse sigset_t sigmask; 9785002a60fSMarcel Moolenaar l_sigset_t mask; 979146aad74SMarcel Moolenaar 980146aad74SMarcel Moolenaar #ifdef DEBUG 98124593369SJonathan Lemon if (ldebug(sigsuspend)) 98224593369SJonathan Lemon printf(ARGS(sigsuspend, "%08lx"), (unsigned long)args->mask); 983146aad74SMarcel Moolenaar #endif 984146aad74SMarcel Moolenaar 985146aad74SMarcel Moolenaar LINUX_SIGEMPTYSET(mask); 986146aad74SMarcel Moolenaar mask.__bits[0] = args->mask; 987206a5d3aSIan Dowse linux_to_bsd_sigset(&mask, &sigmask); 988206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 989146aad74SMarcel Moolenaar } 990146aad74SMarcel Moolenaar 991146aad74SMarcel Moolenaar int 992b07cd97eSMark Murray linux_rt_sigsuspend(struct thread *td, struct linux_rt_sigsuspend_args *uap) 993146aad74SMarcel Moolenaar { 9945002a60fSMarcel Moolenaar l_sigset_t lmask; 995206a5d3aSIan Dowse sigset_t sigmask; 996146aad74SMarcel Moolenaar int error; 997146aad74SMarcel Moolenaar 998146aad74SMarcel Moolenaar #ifdef DEBUG 99924593369SJonathan Lemon if (ldebug(rt_sigsuspend)) 100024593369SJonathan Lemon printf(ARGS(rt_sigsuspend, "%p, %d"), 1001146aad74SMarcel Moolenaar (void *)uap->newset, uap->sigsetsize); 1002146aad74SMarcel Moolenaar #endif 1003146aad74SMarcel Moolenaar 10045002a60fSMarcel Moolenaar if (uap->sigsetsize != sizeof(l_sigset_t)) 1005146aad74SMarcel Moolenaar return (EINVAL); 1006146aad74SMarcel Moolenaar 10075002a60fSMarcel Moolenaar error = copyin(uap->newset, &lmask, sizeof(l_sigset_t)); 1008146aad74SMarcel Moolenaar if (error) 1009146aad74SMarcel Moolenaar return (error); 1010146aad74SMarcel Moolenaar 1011206a5d3aSIan Dowse linux_to_bsd_sigset(&lmask, &sigmask); 1012206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 1013146aad74SMarcel Moolenaar } 1014146aad74SMarcel Moolenaar 1015146aad74SMarcel Moolenaar int 1016b40ce416SJulian Elischer linux_pause(struct thread *td, struct linux_pause_args *args) 1017146aad74SMarcel Moolenaar { 1018b40ce416SJulian Elischer struct proc *p = td->td_proc; 1019206a5d3aSIan Dowse sigset_t sigmask; 1020146aad74SMarcel Moolenaar 1021146aad74SMarcel Moolenaar #ifdef DEBUG 102224593369SJonathan Lemon if (ldebug(pause)) 102324593369SJonathan Lemon printf(ARGS(pause, "")); 1024146aad74SMarcel Moolenaar #endif 1025146aad74SMarcel Moolenaar 1026fdfdfb78SJohn Baldwin PROC_LOCK(p); 10274093529dSJeff Roberson sigmask = td->td_sigmask; 1028fdfdfb78SJohn Baldwin PROC_UNLOCK(p); 1029206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 1030146aad74SMarcel Moolenaar } 1031146aad74SMarcel Moolenaar 1032146aad74SMarcel Moolenaar int 1033b40ce416SJulian Elischer linux_sigaltstack(struct thread *td, struct linux_sigaltstack_args *uap) 1034146aad74SMarcel Moolenaar { 1035206a5d3aSIan Dowse stack_t ss, oss; 10365002a60fSMarcel Moolenaar l_stack_t lss; 1037146aad74SMarcel Moolenaar int error; 1038146aad74SMarcel Moolenaar 1039146aad74SMarcel Moolenaar #ifdef DEBUG 104024593369SJonathan Lemon if (ldebug(sigaltstack)) 104124593369SJonathan Lemon printf(ARGS(sigaltstack, "%p, %p"), uap->uss, uap->uoss); 1042146aad74SMarcel Moolenaar #endif 1043146aad74SMarcel Moolenaar 1044206a5d3aSIan Dowse if (uap->uss != NULL) { 10455002a60fSMarcel Moolenaar error = copyin(uap->uss, &lss, sizeof(l_stack_t)); 1046146aad74SMarcel Moolenaar if (error) 1047146aad74SMarcel Moolenaar return (error); 1048146aad74SMarcel Moolenaar 1049206a5d3aSIan Dowse ss.ss_sp = lss.ss_sp; 1050206a5d3aSIan Dowse ss.ss_size = lss.ss_size; 1051206a5d3aSIan Dowse ss.ss_flags = linux_to_bsd_sigaltstack(lss.ss_flags); 1052931a7258SAndrew Gallatin } 1053ef36ad69SJohn Baldwin error = kern_sigaltstack(td, (uap->uss != NULL) ? &ss : NULL, 1054ef36ad69SJohn Baldwin (uap->uoss != NULL) ? &oss : NULL); 1055206a5d3aSIan Dowse if (!error && uap->uoss != NULL) { 1056206a5d3aSIan Dowse lss.ss_sp = oss.ss_sp; 1057206a5d3aSIan Dowse lss.ss_size = oss.ss_size; 1058206a5d3aSIan Dowse lss.ss_flags = bsd_to_linux_sigaltstack(oss.ss_flags); 10595002a60fSMarcel Moolenaar error = copyout(&lss, uap->uoss, sizeof(l_stack_t)); 1060146aad74SMarcel Moolenaar } 1061146aad74SMarcel Moolenaar 1062146aad74SMarcel Moolenaar return (error); 1063146aad74SMarcel Moolenaar } 10643ad9c842SMaxim Sobolev 10653ad9c842SMaxim Sobolev int 10663ad9c842SMaxim Sobolev linux_ftruncate64(struct thread *td, struct linux_ftruncate64_args *args) 10673ad9c842SMaxim Sobolev { 10683ad9c842SMaxim Sobolev struct ftruncate_args sa; 10693ad9c842SMaxim Sobolev 10703ad9c842SMaxim Sobolev #ifdef DEBUG 10713ad9c842SMaxim Sobolev if (ldebug(ftruncate64)) 1072b45bbfc3SBruce Evans printf(ARGS(ftruncate64, "%u, %jd"), args->fd, 1073b45bbfc3SBruce Evans (intmax_t)args->length); 10743ad9c842SMaxim Sobolev #endif 10753ad9c842SMaxim Sobolev 10763ad9c842SMaxim Sobolev sa.fd = args->fd; 10773ad9c842SMaxim Sobolev sa.pad = 0; 10783ad9c842SMaxim Sobolev sa.length = args->length; 10793ad9c842SMaxim Sobolev return ftruncate(td, &sa); 10803ad9c842SMaxim Sobolev } 10811bc85c0dSDoug Rabson 10821bc85c0dSDoug Rabson int 10831bc85c0dSDoug Rabson linux_set_thread_area(struct thread *td, struct linux_set_thread_area_args *args) 10841bc85c0dSDoug Rabson { 10859b44bfc5SAlexander Leidinger struct l_user_desc info; 10869b44bfc5SAlexander Leidinger int error; 10879b44bfc5SAlexander Leidinger int idx; 10889b44bfc5SAlexander Leidinger int a[2]; 10899b44bfc5SAlexander Leidinger struct segment_descriptor sd; 10909b44bfc5SAlexander Leidinger 10919b44bfc5SAlexander Leidinger error = copyin(args->desc, &info, sizeof(struct l_user_desc)); 10929b44bfc5SAlexander Leidinger if (error) 10939b44bfc5SAlexander Leidinger return (error); 10949b44bfc5SAlexander Leidinger 10959b44bfc5SAlexander Leidinger #ifdef DEBUG 10969b44bfc5SAlexander Leidinger if (ldebug(set_thread_area)) 10979b44bfc5SAlexander Leidinger printf(ARGS(set_thread_area, "%i, %x, %x, %i, %i, %i, %i, %i, %i\n"), 10989b44bfc5SAlexander Leidinger info.entry_number, 10999b44bfc5SAlexander Leidinger info.base_addr, 11009b44bfc5SAlexander Leidinger info.limit, 11019b44bfc5SAlexander Leidinger info.seg_32bit, 11029b44bfc5SAlexander Leidinger info.contents, 11039b44bfc5SAlexander Leidinger info.read_exec_only, 11049b44bfc5SAlexander Leidinger info.limit_in_pages, 11059b44bfc5SAlexander Leidinger info.seg_not_present, 11069b44bfc5SAlexander Leidinger info.useable); 11079b44bfc5SAlexander Leidinger #endif 11089b44bfc5SAlexander Leidinger 11099b44bfc5SAlexander Leidinger idx = info.entry_number; 11100eef2f8aSAlexander Leidinger /* 1111802e08a3SAlexander Leidinger * Semantics of linux version: every thread in the system has array of 1112802e08a3SAlexander Leidinger * 3 tls descriptors. 1st is GLIBC TLS, 2nd is WINE, 3rd unknown. This 1113802e08a3SAlexander Leidinger * syscall loads one of the selected tls decriptors with a value and 1114802e08a3SAlexander Leidinger * also loads GDT descriptors 6, 7 and 8 with the content of the 1115802e08a3SAlexander Leidinger * per-thread descriptors. 11169b44bfc5SAlexander Leidinger * 1117802e08a3SAlexander Leidinger * Semantics of fbsd version: I think we can ignore that linux has 3 1118802e08a3SAlexander Leidinger * per-thread descriptors and use just the 1st one. The tls_array[] 1119802e08a3SAlexander Leidinger * is used only in set/get-thread_area() syscalls and for loading the 1120802e08a3SAlexander Leidinger * GDT descriptors. In fbsd we use just one GDT descriptor for TLS so 1121802e08a3SAlexander Leidinger * we will load just one. 1122802e08a3SAlexander Leidinger * 1123802e08a3SAlexander Leidinger * XXX: this doesn't work when a user space process tries to use more 1124802e08a3SAlexander Leidinger * than 1 TLS segment. Comment in the linux sources says wine might do 1125802e08a3SAlexander Leidinger * this. 11261bc85c0dSDoug Rabson */ 11279b44bfc5SAlexander Leidinger 11280eef2f8aSAlexander Leidinger /* 11290eef2f8aSAlexander Leidinger * we support just GLIBC TLS now 11309b44bfc5SAlexander Leidinger * we should let 3 proceed as well because we use this segment so 11319b44bfc5SAlexander Leidinger * if code does two subsequent calls it should succeed 11329b44bfc5SAlexander Leidinger */ 11339b44bfc5SAlexander Leidinger if (idx != 6 && idx != -1 && idx != 3) 11349b44bfc5SAlexander Leidinger return (EINVAL); 11359b44bfc5SAlexander Leidinger 11360eef2f8aSAlexander Leidinger /* 11370eef2f8aSAlexander Leidinger * we have to copy out the GDT entry we use 11389b44bfc5SAlexander Leidinger * FreeBSD uses GDT entry #3 for storing %gs so load that 1139802e08a3SAlexander Leidinger * 1140802e08a3SAlexander Leidinger * XXX: what if a user space program doesn't check this value and tries 11419b44bfc5SAlexander Leidinger * to use 6, 7 or 8? 11429b44bfc5SAlexander Leidinger */ 11439b44bfc5SAlexander Leidinger idx = info.entry_number = 3; 11449b44bfc5SAlexander Leidinger error = copyout(&info, args->desc, sizeof(struct l_user_desc)); 11459b44bfc5SAlexander Leidinger if (error) 11469b44bfc5SAlexander Leidinger return (error); 11479b44bfc5SAlexander Leidinger 11489b44bfc5SAlexander Leidinger if (LDT_empty(&info)) { 11499b44bfc5SAlexander Leidinger a[0] = 0; 11509b44bfc5SAlexander Leidinger a[1] = 0; 11519b44bfc5SAlexander Leidinger } else { 11529b44bfc5SAlexander Leidinger a[0] = LDT_entry_a(&info); 11539b44bfc5SAlexander Leidinger a[1] = LDT_entry_b(&info); 11541bc85c0dSDoug Rabson } 11551bc85c0dSDoug Rabson 11569b44bfc5SAlexander Leidinger memcpy(&sd, &a, sizeof(a)); 11579b44bfc5SAlexander Leidinger #ifdef DEBUG 11589b44bfc5SAlexander Leidinger if (ldebug(set_thread_area)) 11599b44bfc5SAlexander Leidinger printf("Segment created in set_thread_area: lobase: %x, hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, def32: %i, gran: %i\n", sd.sd_lobase, 11609b44bfc5SAlexander Leidinger sd.sd_hibase, 11619b44bfc5SAlexander Leidinger sd.sd_lolimit, 11629b44bfc5SAlexander Leidinger sd.sd_hilimit, 11639b44bfc5SAlexander Leidinger sd.sd_type, 11649b44bfc5SAlexander Leidinger sd.sd_dpl, 11659b44bfc5SAlexander Leidinger sd.sd_p, 11669b44bfc5SAlexander Leidinger sd.sd_xx, 11679b44bfc5SAlexander Leidinger sd.sd_def32, 11689b44bfc5SAlexander Leidinger sd.sd_gran); 11699b44bfc5SAlexander Leidinger #endif 11701bc85c0dSDoug Rabson 11719b44bfc5SAlexander Leidinger /* this is taken from i386 version of cpu_set_user_tls() */ 11729b44bfc5SAlexander Leidinger critical_enter(); 11739b44bfc5SAlexander Leidinger /* set %gs */ 11749b44bfc5SAlexander Leidinger td->td_pcb->pcb_gsd = sd; 11759b44bfc5SAlexander Leidinger PCPU_GET(fsgs_gdt)[1] = sd; 11769b44bfc5SAlexander Leidinger load_gs(GSEL(GUGS_SEL, SEL_UPL)); 11779b44bfc5SAlexander Leidinger critical_exit(); 11789b44bfc5SAlexander Leidinger 11791bc85c0dSDoug Rabson return (0); 11801bc85c0dSDoug Rabson } 11811bc85c0dSDoug Rabson 11821bc85c0dSDoug Rabson int 11839b44bfc5SAlexander Leidinger linux_get_thread_area(struct thread *td, struct linux_get_thread_area_args *args) 11841bc85c0dSDoug Rabson { 11851bc85c0dSDoug Rabson 11869b44bfc5SAlexander Leidinger struct l_user_desc info; 11879b44bfc5SAlexander Leidinger int error; 11889b44bfc5SAlexander Leidinger int idx; 11899b44bfc5SAlexander Leidinger struct l_desc_struct desc; 11909b44bfc5SAlexander Leidinger struct segment_descriptor sd; 11919b44bfc5SAlexander Leidinger 11929b44bfc5SAlexander Leidinger #ifdef DEBUG 11939b44bfc5SAlexander Leidinger if (ldebug(get_thread_area)) 11949b44bfc5SAlexander Leidinger printf(ARGS(get_thread_area, "%p"), args->desc); 11959b44bfc5SAlexander Leidinger #endif 11969b44bfc5SAlexander Leidinger 11979b44bfc5SAlexander Leidinger error = copyin(args->desc, &info, sizeof(struct l_user_desc)); 11989b44bfc5SAlexander Leidinger if (error) 11999b44bfc5SAlexander Leidinger return (error); 12009b44bfc5SAlexander Leidinger 12019b44bfc5SAlexander Leidinger idx = info.entry_number; 12029b44bfc5SAlexander Leidinger /* XXX: I am not sure if we want 3 to be allowed too. */ 12039b44bfc5SAlexander Leidinger if (idx != 6 && idx != 3) 12049b44bfc5SAlexander Leidinger return (EINVAL); 12059b44bfc5SAlexander Leidinger 12069b44bfc5SAlexander Leidinger idx = 3; 12079b44bfc5SAlexander Leidinger 12089b44bfc5SAlexander Leidinger memset(&info, 0, sizeof(info)); 12099b44bfc5SAlexander Leidinger 12109b44bfc5SAlexander Leidinger sd = PCPU_GET(fsgs_gdt)[1]; 12119b44bfc5SAlexander Leidinger 12129b44bfc5SAlexander Leidinger memcpy(&desc, &sd, sizeof(desc)); 12139b44bfc5SAlexander Leidinger 12149b44bfc5SAlexander Leidinger info.entry_number = idx; 12159b44bfc5SAlexander Leidinger info.base_addr = GET_BASE(&desc); 12169b44bfc5SAlexander Leidinger info.limit = GET_LIMIT(&desc); 12179b44bfc5SAlexander Leidinger info.seg_32bit = GET_32BIT(&desc); 12189b44bfc5SAlexander Leidinger info.contents = GET_CONTENTS(&desc); 12199b44bfc5SAlexander Leidinger info.read_exec_only = !GET_WRITABLE(&desc); 12209b44bfc5SAlexander Leidinger info.limit_in_pages = GET_LIMIT_PAGES(&desc); 12219b44bfc5SAlexander Leidinger info.seg_not_present = !GET_PRESENT(&desc); 12229b44bfc5SAlexander Leidinger info.useable = GET_USEABLE(&desc); 12239b44bfc5SAlexander Leidinger 12249b44bfc5SAlexander Leidinger error = copyout(&info, args->desc, sizeof(struct l_user_desc)); 12259b44bfc5SAlexander Leidinger if (error) 12269b44bfc5SAlexander Leidinger return (EFAULT); 12279b44bfc5SAlexander Leidinger 12289b44bfc5SAlexander Leidinger return (0); 12299b44bfc5SAlexander Leidinger } 12309b44bfc5SAlexander Leidinger 12319b44bfc5SAlexander Leidinger /* copied from kern/kern_time.c */ 12329b44bfc5SAlexander Leidinger int 12339b44bfc5SAlexander Leidinger linux_timer_create(struct thread *td, struct linux_timer_create_args *args) 12349b44bfc5SAlexander Leidinger { 12359b44bfc5SAlexander Leidinger return ktimer_create(td, (struct ktimer_create_args *) args); 12369b44bfc5SAlexander Leidinger } 12379b44bfc5SAlexander Leidinger 12389b44bfc5SAlexander Leidinger int 12399b44bfc5SAlexander Leidinger linux_timer_settime(struct thread *td, struct linux_timer_settime_args *args) 12409b44bfc5SAlexander Leidinger { 12419b44bfc5SAlexander Leidinger return ktimer_settime(td, (struct ktimer_settime_args *) args); 12429b44bfc5SAlexander Leidinger } 12439b44bfc5SAlexander Leidinger 12449b44bfc5SAlexander Leidinger int 12459b44bfc5SAlexander Leidinger linux_timer_gettime(struct thread *td, struct linux_timer_gettime_args *args) 12469b44bfc5SAlexander Leidinger { 12479b44bfc5SAlexander Leidinger return ktimer_gettime(td, (struct ktimer_gettime_args *) args); 12489b44bfc5SAlexander Leidinger } 12499b44bfc5SAlexander Leidinger 12509b44bfc5SAlexander Leidinger int 12519b44bfc5SAlexander Leidinger linux_timer_getoverrun(struct thread *td, struct linux_timer_getoverrun_args *args) 12529b44bfc5SAlexander Leidinger { 12539b44bfc5SAlexander Leidinger return ktimer_getoverrun(td, (struct ktimer_getoverrun_args *) args); 12549b44bfc5SAlexander Leidinger } 12559b44bfc5SAlexander Leidinger 12569b44bfc5SAlexander Leidinger int 12579b44bfc5SAlexander Leidinger linux_timer_delete(struct thread *td, struct linux_timer_delete_args *args) 12589b44bfc5SAlexander Leidinger { 12599b44bfc5SAlexander Leidinger return ktimer_delete(td, (struct ktimer_delete_args *) args); 12609b44bfc5SAlexander Leidinger } 12619b44bfc5SAlexander Leidinger 12629b44bfc5SAlexander Leidinger /* XXX: this wont work with module - convert it */ 12639b44bfc5SAlexander Leidinger int 12649b44bfc5SAlexander Leidinger linux_mq_open(struct thread *td, struct linux_mq_open_args *args) 12659b44bfc5SAlexander Leidinger { 12669b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE 12679b44bfc5SAlexander Leidinger return kmq_open(td, (struct kmq_open_args *) args); 12689b44bfc5SAlexander Leidinger #else 12699b44bfc5SAlexander Leidinger return (ENOSYS); 12709b44bfc5SAlexander Leidinger #endif 12719b44bfc5SAlexander Leidinger } 12729b44bfc5SAlexander Leidinger 12739b44bfc5SAlexander Leidinger int 12749b44bfc5SAlexander Leidinger linux_mq_unlink(struct thread *td, struct linux_mq_unlink_args *args) 12759b44bfc5SAlexander Leidinger { 12769b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE 12779b44bfc5SAlexander Leidinger return kmq_unlink(td, (struct kmq_unlink_args *) args); 12789b44bfc5SAlexander Leidinger #else 12799b44bfc5SAlexander Leidinger return (ENOSYS); 12809b44bfc5SAlexander Leidinger #endif 12819b44bfc5SAlexander Leidinger } 12829b44bfc5SAlexander Leidinger 12839b44bfc5SAlexander Leidinger int 12849b44bfc5SAlexander Leidinger linux_mq_timedsend(struct thread *td, struct linux_mq_timedsend_args *args) 12859b44bfc5SAlexander Leidinger { 12869b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE 12879b44bfc5SAlexander Leidinger return kmq_timedsend(td, (struct kmq_timedsend_args *) args); 12889b44bfc5SAlexander Leidinger #else 12899b44bfc5SAlexander Leidinger return (ENOSYS); 12909b44bfc5SAlexander Leidinger #endif 12919b44bfc5SAlexander Leidinger } 12929b44bfc5SAlexander Leidinger 12939b44bfc5SAlexander Leidinger int 12949b44bfc5SAlexander Leidinger linux_mq_timedreceive(struct thread *td, struct linux_mq_timedreceive_args *args) 12959b44bfc5SAlexander Leidinger { 12969b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE 12979b44bfc5SAlexander Leidinger return kmq_timedreceive(td, (struct kmq_timedreceive_args *) args); 12989b44bfc5SAlexander Leidinger #else 12999b44bfc5SAlexander Leidinger return (ENOSYS); 13009b44bfc5SAlexander Leidinger #endif 13019b44bfc5SAlexander Leidinger } 13029b44bfc5SAlexander Leidinger 13039b44bfc5SAlexander Leidinger int 13049b44bfc5SAlexander Leidinger linux_mq_notify(struct thread *td, struct linux_mq_notify_args *args) 13059b44bfc5SAlexander Leidinger { 13069b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE 13079b44bfc5SAlexander Leidinger return kmq_notify(td, (struct kmq_notify_args *) args); 13089b44bfc5SAlexander Leidinger #else 13099b44bfc5SAlexander Leidinger return (ENOSYS); 13109b44bfc5SAlexander Leidinger #endif 13119b44bfc5SAlexander Leidinger } 13129b44bfc5SAlexander Leidinger 13139b44bfc5SAlexander Leidinger int 13149b44bfc5SAlexander Leidinger linux_mq_getsetattr(struct thread *td, struct linux_mq_getsetattr_args *args) 13159b44bfc5SAlexander Leidinger { 13169b44bfc5SAlexander Leidinger #ifdef P1003_1B_MQUEUE 13179b44bfc5SAlexander Leidinger return kmq_setattr(td, (struct kmq_setattr_args *) args); 13189b44bfc5SAlexander Leidinger #else 13199b44bfc5SAlexander Leidinger return (ENOSYS); 13209b44bfc5SAlexander Leidinger #endif 13211bc85c0dSDoug Rabson } 13221bc85c0dSDoug Rabson 1323