1146aad74SMarcel Moolenaar /*- 2146aad74SMarcel Moolenaar * Copyright (c) 2000 Marcel Moolenaar 3146aad74SMarcel Moolenaar * All rights reserved. 4146aad74SMarcel Moolenaar * 5146aad74SMarcel Moolenaar * Redistribution and use in source and binary forms, with or without 6146aad74SMarcel Moolenaar * modification, are permitted provided that the following conditions 7146aad74SMarcel Moolenaar * are met: 8146aad74SMarcel Moolenaar * 1. Redistributions of source code must retain the above copyright 9146aad74SMarcel Moolenaar * notice, this list of conditions and the following disclaimer 10146aad74SMarcel Moolenaar * in this position and unchanged. 11146aad74SMarcel Moolenaar * 2. Redistributions in binary form must reproduce the above copyright 12146aad74SMarcel Moolenaar * notice, this list of conditions and the following disclaimer in the 13146aad74SMarcel Moolenaar * documentation and/or other materials provided with the distribution. 14146aad74SMarcel Moolenaar * 3. The name of the author may not be used to endorse or promote products 15bc34729cSMarcel Moolenaar * derived from this software without specific prior written permission. 16146aad74SMarcel Moolenaar * 17146aad74SMarcel Moolenaar * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 18146aad74SMarcel Moolenaar * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 19146aad74SMarcel Moolenaar * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
20146aad74SMarcel Moolenaar * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 21146aad74SMarcel Moolenaar * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 22146aad74SMarcel Moolenaar * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 23146aad74SMarcel Moolenaar * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 24146aad74SMarcel Moolenaar * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 25146aad74SMarcel Moolenaar * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 26146aad74SMarcel Moolenaar * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 27146aad74SMarcel Moolenaar */ 28146aad74SMarcel Moolenaar 2927e0099cSDavid E. O'Brien #include <sys/cdefs.h> 3027e0099cSDavid E. O'Brien __FBSDID("$FreeBSD$"); 3127e0099cSDavid E. O'Brien 32146aad74SMarcel Moolenaar #include <sys/param.h> 33146aad74SMarcel Moolenaar #include <sys/systm.h> 34a312f6a3SAlexander Leidinger #include <sys/file.h> 35a312f6a3SAlexander Leidinger #include <sys/fcntl.h> 36610ecfe0SMaxim Sobolev #include <sys/imgact.h> 377106ca0dSJohn Baldwin #include <sys/lock.h> 38610ecfe0SMaxim Sobolev #include <sys/malloc.h> 39fb919e4dSMark Murray #include <sys/mman.h> 40fb919e4dSMark Murray #include <sys/mutex.h> 419b44bfc5SAlexander Leidinger #include <sys/sx.h> 42acd3428bSRobert Watson #include <sys/priv.h> 43fb919e4dSMark Murray #include <sys/proc.h> 449b44bfc5SAlexander Leidinger #include <sys/queue.h> 45242fae60SAndrew Gallatin #include <sys/resource.h> 46242fae60SAndrew Gallatin #include <sys/resourcevar.h> 471bc85c0dSDoug Rabson #include <sys/signalvar.h> 48206a5d3aSIan Dowse #include <sys/syscallsubr.h> 49fb919e4dSMark Murray #include <sys/sysproto.h> 50fb919e4dSMark Murray #include <sys/unistd.h> 519b44bfc5SAlexander Leidinger #include <sys/wait.h> 52f0393f06SJeff Roberson #include <sys/sched.h> 53146aad74SMarcel Moolenaar 54146aad74SMarcel Moolenaar #include 
<machine/frame.h> 55146aad74SMarcel Moolenaar #include <machine/psl.h> 56146aad74SMarcel Moolenaar #include <machine/segments.h> 57146aad74SMarcel Moolenaar #include <machine/sysarch.h> 58146aad74SMarcel Moolenaar 59242fae60SAndrew Gallatin #include <vm/vm.h> 60242fae60SAndrew Gallatin #include <vm/pmap.h> 61242fae60SAndrew Gallatin #include <vm/vm_map.h> 62242fae60SAndrew Gallatin 63146aad74SMarcel Moolenaar #include <i386/linux/linux.h> 64ebea8660SMarcel Moolenaar #include <i386/linux/linux_proto.h> 65146aad74SMarcel Moolenaar #include <compat/linux/linux_ipc.h> 66146aad74SMarcel Moolenaar #include <compat/linux/linux_signal.h> 67146aad74SMarcel Moolenaar #include <compat/linux/linux_util.h> 689b44bfc5SAlexander Leidinger #include <compat/linux/linux_emul.h> 699b44bfc5SAlexander Leidinger 709b44bfc5SAlexander Leidinger #include <i386/include/pcb.h> /* needed for pcb definition in linux_set_thread_area */ 719b44bfc5SAlexander Leidinger 729b44bfc5SAlexander Leidinger #include "opt_posix.h" 739b44bfc5SAlexander Leidinger 749b44bfc5SAlexander Leidinger extern struct sysentvec elf32_freebsd_sysvec; /* defined in i386/i386/elf_machdep.c */ 75146aad74SMarcel Moolenaar 765002a60fSMarcel Moolenaar struct l_descriptor { 775002a60fSMarcel Moolenaar l_uint entry_number; 785002a60fSMarcel Moolenaar l_ulong base_addr; 795002a60fSMarcel Moolenaar l_uint limit; 805002a60fSMarcel Moolenaar l_uint seg_32bit:1; 815002a60fSMarcel Moolenaar l_uint contents:2; 825002a60fSMarcel Moolenaar l_uint read_exec_only:1; 835002a60fSMarcel Moolenaar l_uint limit_in_pages:1; 845002a60fSMarcel Moolenaar l_uint seg_not_present:1; 855002a60fSMarcel Moolenaar l_uint useable:1; 86146aad74SMarcel Moolenaar }; 87146aad74SMarcel Moolenaar 885002a60fSMarcel Moolenaar struct l_old_select_argv { 895002a60fSMarcel Moolenaar l_int nfds; 905002a60fSMarcel Moolenaar l_fd_set *readfds; 915002a60fSMarcel Moolenaar l_fd_set *writefds; 925002a60fSMarcel Moolenaar l_fd_set *exceptfds; 935002a60fSMarcel Moolenaar 
struct l_timeval *timeout; 94146aad74SMarcel Moolenaar }; 95146aad74SMarcel Moolenaar 96146aad74SMarcel Moolenaar int 97931a7258SAndrew Gallatin linux_to_bsd_sigaltstack(int lsa) 98931a7258SAndrew Gallatin { 99931a7258SAndrew Gallatin int bsa = 0; 100931a7258SAndrew Gallatin 101931a7258SAndrew Gallatin if (lsa & LINUX_SS_DISABLE) 102931a7258SAndrew Gallatin bsa |= SS_DISABLE; 103931a7258SAndrew Gallatin if (lsa & LINUX_SS_ONSTACK) 104931a7258SAndrew Gallatin bsa |= SS_ONSTACK; 105931a7258SAndrew Gallatin return (bsa); 106931a7258SAndrew Gallatin } 107931a7258SAndrew Gallatin 108931a7258SAndrew Gallatin int 109931a7258SAndrew Gallatin bsd_to_linux_sigaltstack(int bsa) 110931a7258SAndrew Gallatin { 111931a7258SAndrew Gallatin int lsa = 0; 112931a7258SAndrew Gallatin 113931a7258SAndrew Gallatin if (bsa & SS_DISABLE) 114931a7258SAndrew Gallatin lsa |= LINUX_SS_DISABLE; 115931a7258SAndrew Gallatin if (bsa & SS_ONSTACK) 116931a7258SAndrew Gallatin lsa |= LINUX_SS_ONSTACK; 117931a7258SAndrew Gallatin return (lsa); 118931a7258SAndrew Gallatin } 119931a7258SAndrew Gallatin 120931a7258SAndrew Gallatin int 121b40ce416SJulian Elischer linux_execve(struct thread *td, struct linux_execve_args *args) 122146aad74SMarcel Moolenaar { 123610ecfe0SMaxim Sobolev int error; 124610ecfe0SMaxim Sobolev char *newpath; 125610ecfe0SMaxim Sobolev struct image_args eargs; 126146aad74SMarcel Moolenaar 127d9e97471SJohn Baldwin LCONVPATHEXIST(td, args->path, &newpath); 128146aad74SMarcel Moolenaar 129146aad74SMarcel Moolenaar #ifdef DEBUG 13024593369SJonathan Lemon if (ldebug(execve)) 131610ecfe0SMaxim Sobolev printf(ARGS(execve, "%s"), newpath); 132146aad74SMarcel Moolenaar #endif 133146aad74SMarcel Moolenaar 134610ecfe0SMaxim Sobolev error = exec_copyin_args(&eargs, newpath, UIO_SYSSPACE, 135610ecfe0SMaxim Sobolev args->argp, args->envp); 136610ecfe0SMaxim Sobolev free(newpath, M_TEMP); 137610ecfe0SMaxim Sobolev if (error == 0) 138c035ac04SMaxim Sobolev error = kern_execve(td, &eargs, NULL); 
1399b44bfc5SAlexander Leidinger if (error == 0) 1409b44bfc5SAlexander Leidinger /* linux process can exec fbsd one, dont attempt 1419b44bfc5SAlexander Leidinger * to create emuldata for such process using 1429b44bfc5SAlexander Leidinger * linux_proc_init, this leads to a panic on KASSERT 1439b44bfc5SAlexander Leidinger * because such process has p->p_emuldata == NULL 1449b44bfc5SAlexander Leidinger */ 1459b44bfc5SAlexander Leidinger if (td->td_proc->p_sysent == &elf_linux_sysvec) 1469b44bfc5SAlexander Leidinger error = linux_proc_init(td, 0, 0); 147610ecfe0SMaxim Sobolev return (error); 148146aad74SMarcel Moolenaar } 149146aad74SMarcel Moolenaar 1505002a60fSMarcel Moolenaar struct l_ipc_kludge { 1515002a60fSMarcel Moolenaar struct l_msgbuf *msgp; 1525002a60fSMarcel Moolenaar l_long msgtyp; 1535002a60fSMarcel Moolenaar }; 1545002a60fSMarcel Moolenaar 155146aad74SMarcel Moolenaar int 156b40ce416SJulian Elischer linux_ipc(struct thread *td, struct linux_ipc_args *args) 157146aad74SMarcel Moolenaar { 1585002a60fSMarcel Moolenaar 1595002a60fSMarcel Moolenaar switch (args->what & 0xFFFF) { 1605002a60fSMarcel Moolenaar case LINUX_SEMOP: { 1615002a60fSMarcel Moolenaar struct linux_semop_args a; 1625002a60fSMarcel Moolenaar 1635002a60fSMarcel Moolenaar a.semid = args->arg1; 1645002a60fSMarcel Moolenaar a.tsops = args->ptr; 1655002a60fSMarcel Moolenaar a.nsops = args->arg2; 166b40ce416SJulian Elischer return (linux_semop(td, &a)); 1675002a60fSMarcel Moolenaar } 1685002a60fSMarcel Moolenaar case LINUX_SEMGET: { 1695002a60fSMarcel Moolenaar struct linux_semget_args a; 1705002a60fSMarcel Moolenaar 1715002a60fSMarcel Moolenaar a.key = args->arg1; 1725002a60fSMarcel Moolenaar a.nsems = args->arg2; 1735002a60fSMarcel Moolenaar a.semflg = args->arg3; 174b40ce416SJulian Elischer return (linux_semget(td, &a)); 1755002a60fSMarcel Moolenaar } 1765002a60fSMarcel Moolenaar case LINUX_SEMCTL: { 1775002a60fSMarcel Moolenaar struct linux_semctl_args a; 1785002a60fSMarcel Moolenaar int 
error; 1795002a60fSMarcel Moolenaar 1805002a60fSMarcel Moolenaar a.semid = args->arg1; 1815002a60fSMarcel Moolenaar a.semnum = args->arg2; 1825002a60fSMarcel Moolenaar a.cmd = args->arg3; 1834b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &a.arg, sizeof(a.arg)); 1845002a60fSMarcel Moolenaar if (error) 1855002a60fSMarcel Moolenaar return (error); 186b40ce416SJulian Elischer return (linux_semctl(td, &a)); 1875002a60fSMarcel Moolenaar } 1885002a60fSMarcel Moolenaar case LINUX_MSGSND: { 1895002a60fSMarcel Moolenaar struct linux_msgsnd_args a; 1905002a60fSMarcel Moolenaar 1915002a60fSMarcel Moolenaar a.msqid = args->arg1; 1925002a60fSMarcel Moolenaar a.msgp = args->ptr; 1935002a60fSMarcel Moolenaar a.msgsz = args->arg2; 1945002a60fSMarcel Moolenaar a.msgflg = args->arg3; 195b40ce416SJulian Elischer return (linux_msgsnd(td, &a)); 1965002a60fSMarcel Moolenaar } 1975002a60fSMarcel Moolenaar case LINUX_MSGRCV: { 1985002a60fSMarcel Moolenaar struct linux_msgrcv_args a; 1995002a60fSMarcel Moolenaar 2005002a60fSMarcel Moolenaar a.msqid = args->arg1; 2015002a60fSMarcel Moolenaar a.msgsz = args->arg2; 2025002a60fSMarcel Moolenaar a.msgflg = args->arg3; 2035002a60fSMarcel Moolenaar if ((args->what >> 16) == 0) { 2045002a60fSMarcel Moolenaar struct l_ipc_kludge tmp; 2055002a60fSMarcel Moolenaar int error; 2065002a60fSMarcel Moolenaar 2075002a60fSMarcel Moolenaar if (args->ptr == NULL) 2085002a60fSMarcel Moolenaar return (EINVAL); 2094b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &tmp, sizeof(tmp)); 2105002a60fSMarcel Moolenaar if (error) 2115002a60fSMarcel Moolenaar return (error); 2125002a60fSMarcel Moolenaar a.msgp = tmp.msgp; 2135002a60fSMarcel Moolenaar a.msgtyp = tmp.msgtyp; 2145002a60fSMarcel Moolenaar } else { 2155002a60fSMarcel Moolenaar a.msgp = args->ptr; 2165002a60fSMarcel Moolenaar a.msgtyp = args->arg5; 2175002a60fSMarcel Moolenaar } 218b40ce416SJulian Elischer return (linux_msgrcv(td, &a)); 2195002a60fSMarcel Moolenaar } 2205002a60fSMarcel Moolenaar 
case LINUX_MSGGET: { 2215002a60fSMarcel Moolenaar struct linux_msgget_args a; 2225002a60fSMarcel Moolenaar 2235002a60fSMarcel Moolenaar a.key = args->arg1; 2245002a60fSMarcel Moolenaar a.msgflg = args->arg2; 225b40ce416SJulian Elischer return (linux_msgget(td, &a)); 2265002a60fSMarcel Moolenaar } 2275002a60fSMarcel Moolenaar case LINUX_MSGCTL: { 2285002a60fSMarcel Moolenaar struct linux_msgctl_args a; 2295002a60fSMarcel Moolenaar 2305002a60fSMarcel Moolenaar a.msqid = args->arg1; 2315002a60fSMarcel Moolenaar a.cmd = args->arg2; 2325002a60fSMarcel Moolenaar a.buf = args->ptr; 233b40ce416SJulian Elischer return (linux_msgctl(td, &a)); 2345002a60fSMarcel Moolenaar } 2355002a60fSMarcel Moolenaar case LINUX_SHMAT: { 2365002a60fSMarcel Moolenaar struct linux_shmat_args a; 2375002a60fSMarcel Moolenaar 2385002a60fSMarcel Moolenaar a.shmid = args->arg1; 2395002a60fSMarcel Moolenaar a.shmaddr = args->ptr; 2405002a60fSMarcel Moolenaar a.shmflg = args->arg2; 2415002a60fSMarcel Moolenaar a.raddr = (l_ulong *)args->arg3; 242b40ce416SJulian Elischer return (linux_shmat(td, &a)); 2435002a60fSMarcel Moolenaar } 2445002a60fSMarcel Moolenaar case LINUX_SHMDT: { 2455002a60fSMarcel Moolenaar struct linux_shmdt_args a; 2465002a60fSMarcel Moolenaar 2475002a60fSMarcel Moolenaar a.shmaddr = args->ptr; 248b40ce416SJulian Elischer return (linux_shmdt(td, &a)); 2495002a60fSMarcel Moolenaar } 2505002a60fSMarcel Moolenaar case LINUX_SHMGET: { 2515002a60fSMarcel Moolenaar struct linux_shmget_args a; 2525002a60fSMarcel Moolenaar 2535002a60fSMarcel Moolenaar a.key = args->arg1; 2545002a60fSMarcel Moolenaar a.size = args->arg2; 2555002a60fSMarcel Moolenaar a.shmflg = args->arg3; 256b40ce416SJulian Elischer return (linux_shmget(td, &a)); 2575002a60fSMarcel Moolenaar } 2585002a60fSMarcel Moolenaar case LINUX_SHMCTL: { 2595002a60fSMarcel Moolenaar struct linux_shmctl_args a; 2605002a60fSMarcel Moolenaar 2615002a60fSMarcel Moolenaar a.shmid = args->arg1; 2625002a60fSMarcel Moolenaar a.cmd = args->arg2; 
2635002a60fSMarcel Moolenaar a.buf = args->ptr; 264b40ce416SJulian Elischer return (linux_shmctl(td, &a)); 2655002a60fSMarcel Moolenaar } 2665002a60fSMarcel Moolenaar default: 2675002a60fSMarcel Moolenaar break; 268146aad74SMarcel Moolenaar } 269146aad74SMarcel Moolenaar 2705002a60fSMarcel Moolenaar return (EINVAL); 271146aad74SMarcel Moolenaar } 272146aad74SMarcel Moolenaar 273146aad74SMarcel Moolenaar int 274b40ce416SJulian Elischer linux_old_select(struct thread *td, struct linux_old_select_args *args) 275146aad74SMarcel Moolenaar { 2765002a60fSMarcel Moolenaar struct l_old_select_argv linux_args; 2775002a60fSMarcel Moolenaar struct linux_select_args newsel; 278146aad74SMarcel Moolenaar int error; 279146aad74SMarcel Moolenaar 2805002a60fSMarcel Moolenaar #ifdef DEBUG 2815002a60fSMarcel Moolenaar if (ldebug(old_select)) 2826aea6777SPeter Wemm printf(ARGS(old_select, "%p"), args->ptr); 283146aad74SMarcel Moolenaar #endif 284146aad74SMarcel Moolenaar 2854b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &linux_args, sizeof(linux_args)); 286146aad74SMarcel Moolenaar if (error) 287146aad74SMarcel Moolenaar return (error); 288146aad74SMarcel Moolenaar 289146aad74SMarcel Moolenaar newsel.nfds = linux_args.nfds; 290146aad74SMarcel Moolenaar newsel.readfds = linux_args.readfds; 291146aad74SMarcel Moolenaar newsel.writefds = linux_args.writefds; 292146aad74SMarcel Moolenaar newsel.exceptfds = linux_args.exceptfds; 293146aad74SMarcel Moolenaar newsel.timeout = linux_args.timeout; 294b40ce416SJulian Elischer return (linux_select(td, &newsel)); 295146aad74SMarcel Moolenaar } 296146aad74SMarcel Moolenaar 297146aad74SMarcel Moolenaar int 298b40ce416SJulian Elischer linux_fork(struct thread *td, struct linux_fork_args *args) 299146aad74SMarcel Moolenaar { 300146aad74SMarcel Moolenaar int error; 301d071f504SAlexander Leidinger struct proc *p2; 302d071f504SAlexander Leidinger struct thread *td2; 303146aad74SMarcel Moolenaar 304146aad74SMarcel Moolenaar #ifdef DEBUG 
30524593369SJonathan Lemon if (ldebug(fork)) 30624593369SJonathan Lemon printf(ARGS(fork, "")); 307146aad74SMarcel Moolenaar #endif 308146aad74SMarcel Moolenaar 309d071f504SAlexander Leidinger if ((error = fork1(td, RFFDG | RFPROC | RFSTOPPED, 0, &p2)) != 0) 310146aad74SMarcel Moolenaar return (error); 311146aad74SMarcel Moolenaar 312d071f504SAlexander Leidinger if (error == 0) { 313d071f504SAlexander Leidinger td->td_retval[0] = p2->p_pid; 314d071f504SAlexander Leidinger td->td_retval[1] = 0; 315d071f504SAlexander Leidinger } 316d071f504SAlexander Leidinger 317b40ce416SJulian Elischer if (td->td_retval[1] == 1) 318b40ce416SJulian Elischer td->td_retval[0] = 0; 3199b44bfc5SAlexander Leidinger error = linux_proc_init(td, td->td_retval[0], 0); 3209b44bfc5SAlexander Leidinger if (error) 3219b44bfc5SAlexander Leidinger return (error); 3229b44bfc5SAlexander Leidinger 323d071f504SAlexander Leidinger td2 = FIRST_THREAD_IN_PROC(p2); 324d071f504SAlexander Leidinger 325d071f504SAlexander Leidinger /* 326d071f504SAlexander Leidinger * Make this runnable after we are finished with it. 
327d071f504SAlexander Leidinger */ 328d071f504SAlexander Leidinger mtx_lock_spin(&sched_lock); 329d071f504SAlexander Leidinger TD_SET_CAN_RUN(td2); 330f0393f06SJeff Roberson sched_add(td2, SRQ_BORING); 331d071f504SAlexander Leidinger mtx_unlock_spin(&sched_lock); 332d071f504SAlexander Leidinger 333146aad74SMarcel Moolenaar return (0); 334146aad74SMarcel Moolenaar } 335146aad74SMarcel Moolenaar 336146aad74SMarcel Moolenaar int 337b40ce416SJulian Elischer linux_vfork(struct thread *td, struct linux_vfork_args *args) 338146aad74SMarcel Moolenaar { 339146aad74SMarcel Moolenaar int error; 34040f734ddSAlexander Leidinger struct proc *p2; 341d071f504SAlexander Leidinger struct thread *td2; 342146aad74SMarcel Moolenaar 343146aad74SMarcel Moolenaar #ifdef DEBUG 34424593369SJonathan Lemon if (ldebug(vfork)) 34524593369SJonathan Lemon printf(ARGS(vfork, "")); 346146aad74SMarcel Moolenaar #endif 347146aad74SMarcel Moolenaar 34840f734ddSAlexander Leidinger /* exclude RFPPWAIT */ 349d071f504SAlexander Leidinger if ((error = fork1(td, RFFDG | RFPROC | RFMEM | RFSTOPPED, 0, &p2)) != 0) 350146aad74SMarcel Moolenaar return (error); 35140f734ddSAlexander Leidinger if (error == 0) { 35240f734ddSAlexander Leidinger td->td_retval[0] = p2->p_pid; 35340f734ddSAlexander Leidinger td->td_retval[1] = 0; 35440f734ddSAlexander Leidinger } 355146aad74SMarcel Moolenaar /* Are we the child? 
*/ 356b40ce416SJulian Elischer if (td->td_retval[1] == 1) 357b40ce416SJulian Elischer td->td_retval[0] = 0; 3589b44bfc5SAlexander Leidinger error = linux_proc_init(td, td->td_retval[0], 0); 3599b44bfc5SAlexander Leidinger if (error) 3609b44bfc5SAlexander Leidinger return (error); 361d071f504SAlexander Leidinger 36240f734ddSAlexander Leidinger PROC_LOCK(p2); 363973ac082SAlexander Leidinger p2->p_flag |= P_PPWAIT; 364d071f504SAlexander Leidinger PROC_UNLOCK(p2); 365d071f504SAlexander Leidinger 366d071f504SAlexander Leidinger td2 = FIRST_THREAD_IN_PROC(p2); 367d071f504SAlexander Leidinger 368d071f504SAlexander Leidinger /* 369d071f504SAlexander Leidinger * Make this runnable after we are finished with it. 370d071f504SAlexander Leidinger */ 371d071f504SAlexander Leidinger mtx_lock_spin(&sched_lock); 372d071f504SAlexander Leidinger TD_SET_CAN_RUN(td2); 373f0393f06SJeff Roberson sched_add(td2, SRQ_BORING); 374d071f504SAlexander Leidinger mtx_unlock_spin(&sched_lock); 375d071f504SAlexander Leidinger 376d071f504SAlexander Leidinger /* wait for the children to exit, ie. 
emulate vfork */ 377d071f504SAlexander Leidinger PROC_LOCK(p2); 37840f734ddSAlexander Leidinger while (p2->p_flag & P_PPWAIT) 37940f734ddSAlexander Leidinger msleep(td->td_proc, &p2->p_mtx, PWAIT, "ppwait", 0); 38040f734ddSAlexander Leidinger PROC_UNLOCK(p2); 38140f734ddSAlexander Leidinger 382146aad74SMarcel Moolenaar return (0); 383146aad74SMarcel Moolenaar } 384146aad74SMarcel Moolenaar 385146aad74SMarcel Moolenaar int 386b40ce416SJulian Elischer linux_clone(struct thread *td, struct linux_clone_args *args) 387146aad74SMarcel Moolenaar { 3886ad0e7c5SJohn Baldwin int error, ff = RFPROC | RFSTOPPED; 389146aad74SMarcel Moolenaar struct proc *p2; 3909eb78fcfSJohn Baldwin struct thread *td2; 391146aad74SMarcel Moolenaar int exit_signal; 3929b44bfc5SAlexander Leidinger struct linux_emuldata *em; 393146aad74SMarcel Moolenaar 394146aad74SMarcel Moolenaar #ifdef DEBUG 39524593369SJonathan Lemon if (ldebug(clone)) { 3969b44bfc5SAlexander Leidinger printf(ARGS(clone, "flags %x, stack %x, parent tid: %x, child tid: %x"), 3979b44bfc5SAlexander Leidinger (unsigned int)args->flags, (unsigned int)args->stack, 3989b44bfc5SAlexander Leidinger (unsigned int)args->parent_tidptr, (unsigned int)args->child_tidptr); 39924593369SJonathan Lemon } 400146aad74SMarcel Moolenaar #endif 401146aad74SMarcel Moolenaar 402146aad74SMarcel Moolenaar exit_signal = args->flags & 0x000000ff; 4030f054958SAlexander Leidinger if (!LINUX_SIG_VALID(exit_signal) && exit_signal != 0) 404146aad74SMarcel Moolenaar return (EINVAL); 405146aad74SMarcel Moolenaar 406146aad74SMarcel Moolenaar if (exit_signal <= LINUX_SIGTBLSZ) 407146aad74SMarcel Moolenaar exit_signal = linux_to_bsd_signal[_SIG_IDX(exit_signal)]; 408146aad74SMarcel Moolenaar 409a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_VM) 410146aad74SMarcel Moolenaar ff |= RFMEM; 411a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_SIGHAND) 412146aad74SMarcel Moolenaar ff |= RFSIGSHARE; 4134b3583a3SAlexander Leidinger /* 4144b3583a3SAlexander Leidinger * 
XXX: in linux sharing of fs info (chroot/cwd/umask) 4154b3583a3SAlexander Leidinger * and open files is independant. in fbsd its in one 416802e08a3SAlexander Leidinger * structure but in reality it doesn't cause any problems 417802e08a3SAlexander Leidinger * because both of these flags are usually set together. 4184b3583a3SAlexander Leidinger */ 419a4e3bad7SJung-uk Kim if (!(args->flags & (LINUX_CLONE_FILES | LINUX_CLONE_FS))) 420146aad74SMarcel Moolenaar ff |= RFFDG; 421146aad74SMarcel Moolenaar 4224b178336SMaxim Sobolev /* 4234b178336SMaxim Sobolev * Attempt to detect when linux_clone(2) is used for creating 4244b178336SMaxim Sobolev * kernel threads. Unfortunately despite the existence of the 4254b178336SMaxim Sobolev * CLONE_THREAD flag, version of linuxthreads package used in 4264b178336SMaxim Sobolev * most popular distros as of beginning of 2005 doesn't make 427802e08a3SAlexander Leidinger * any use of it. Therefore, this detection relies on 4284b178336SMaxim Sobolev * empirical observation that linuxthreads sets certain 4294b178336SMaxim Sobolev * combination of flags, so that we can make more or less 4304b178336SMaxim Sobolev * precise detection and notify the FreeBSD kernel that several 4314b178336SMaxim Sobolev * processes are in fact part of the same threading group, so 4324b178336SMaxim Sobolev * that special treatment is necessary for signal delivery 4334b178336SMaxim Sobolev * between those processes and fd locking. 
4344b178336SMaxim Sobolev */ 435a4e3bad7SJung-uk Kim if ((args->flags & 0xffffff00) == LINUX_THREADING_FLAGS) 4364b178336SMaxim Sobolev ff |= RFTHREAD; 4374b178336SMaxim Sobolev 438a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_PARENT_SETTID) 4391a26db0aSAlexander Leidinger if (args->parent_tidptr == NULL) 4401a26db0aSAlexander Leidinger return (EINVAL); 4411a26db0aSAlexander Leidinger 442316ec49aSScott Long error = fork1(td, ff, 0, &p2); 4439eb78fcfSJohn Baldwin if (error) 4449eb78fcfSJohn Baldwin return (error); 4459eb78fcfSJohn Baldwin 446a4e3bad7SJung-uk Kim if (args->flags & (LINUX_CLONE_PARENT | LINUX_CLONE_THREAD)) { 447a9ccaccfSKonstantin Belousov sx_xlock(&proctree_lock); 448a9ccaccfSKonstantin Belousov PROC_LOCK(p2); 449a9ccaccfSKonstantin Belousov proc_reparent(p2, td->td_proc->p_pptr); 450a9ccaccfSKonstantin Belousov PROC_UNLOCK(p2); 451a9ccaccfSKonstantin Belousov sx_xunlock(&proctree_lock); 452a9ccaccfSKonstantin Belousov } 453a9ccaccfSKonstantin Belousov 4549b44bfc5SAlexander Leidinger /* create the emuldata */ 4559b44bfc5SAlexander Leidinger error = linux_proc_init(td, p2->p_pid, args->flags); 4569b44bfc5SAlexander Leidinger /* reference it - no need to check this */ 4571c65504cSAlexander Leidinger em = em_find(p2, EMUL_DOLOCK); 4589b44bfc5SAlexander Leidinger KASSERT(em != NULL, ("clone: emuldata not found.\n")); 4599b44bfc5SAlexander Leidinger /* and adjust it */ 4609b44bfc5SAlexander Leidinger 461a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_THREAD) { 4629b44bfc5SAlexander Leidinger /* XXX: linux mangles pgrp and pptr somehow 4639b44bfc5SAlexander Leidinger * I think it might be this but I am not sure. 
4649b44bfc5SAlexander Leidinger */ 4659b44bfc5SAlexander Leidinger #ifdef notyet 466a6c5f813SAlexander Leidinger PROC_LOCK(p2); 4679b44bfc5SAlexander Leidinger p2->p_pgrp = td->td_proc->p_pgrp; 468a6c5f813SAlexander Leidinger PROC_UNLOCK(p2); 4699b44bfc5SAlexander Leidinger #endif 4709b44bfc5SAlexander Leidinger exit_signal = 0; 4719b44bfc5SAlexander Leidinger } 4729b44bfc5SAlexander Leidinger 473a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_CHILD_SETTID) 4749b44bfc5SAlexander Leidinger em->child_set_tid = args->child_tidptr; 4759b44bfc5SAlexander Leidinger else 4769b44bfc5SAlexander Leidinger em->child_set_tid = NULL; 4779b44bfc5SAlexander Leidinger 478a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_CHILD_CLEARTID) 4799b44bfc5SAlexander Leidinger em->child_clear_tid = args->child_tidptr; 4809b44bfc5SAlexander Leidinger else 4819b44bfc5SAlexander Leidinger em->child_clear_tid = NULL; 482a6c5f813SAlexander Leidinger 4839b44bfc5SAlexander Leidinger EMUL_UNLOCK(&emul_lock); 484146aad74SMarcel Moolenaar 485a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_PARENT_SETTID) { 4861a26db0aSAlexander Leidinger error = copyout(&p2->p_pid, args->parent_tidptr, sizeof(p2->p_pid)); 4871a26db0aSAlexander Leidinger if (error) 4881a26db0aSAlexander Leidinger printf(LMSG("copyout failed!")); 4891a26db0aSAlexander Leidinger } 4901a26db0aSAlexander Leidinger 491fdfdfb78SJohn Baldwin PROC_LOCK(p2); 492146aad74SMarcel Moolenaar p2->p_sigparent = exit_signal; 4939eb78fcfSJohn Baldwin PROC_UNLOCK(p2); 4949eb78fcfSJohn Baldwin td2 = FIRST_THREAD_IN_PROC(p2); 4950eef2f8aSAlexander Leidinger /* 4960eef2f8aSAlexander Leidinger * in a case of stack = NULL we are supposed to COW calling process stack 4979b44bfc5SAlexander Leidinger * this is what normal fork() does so we just keep the tf_esp arg intact 4989b44bfc5SAlexander Leidinger */ 4999b44bfc5SAlexander Leidinger if (args->stack) 5009eb78fcfSJohn Baldwin td2->td_frame->tf_esp = (unsigned int)args->stack; 501146aad74SMarcel 
Moolenaar 502a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_SETTLS) { 5039b44bfc5SAlexander Leidinger struct l_user_desc info; 5049b44bfc5SAlexander Leidinger int idx; 5059b44bfc5SAlexander Leidinger int a[2]; 5069b44bfc5SAlexander Leidinger struct segment_descriptor sd; 5079b44bfc5SAlexander Leidinger 5089b44bfc5SAlexander Leidinger error = copyin((void *)td->td_frame->tf_esi, &info, sizeof(struct l_user_desc)); 5091a26db0aSAlexander Leidinger if (error) { 5101a26db0aSAlexander Leidinger printf(LMSG("copyin failed!")); 5111a26db0aSAlexander Leidinger } else { 5129b44bfc5SAlexander Leidinger 5139b44bfc5SAlexander Leidinger idx = info.entry_number; 5149b44bfc5SAlexander Leidinger 5150eef2f8aSAlexander Leidinger /* 5160eef2f8aSAlexander Leidinger * looks like we're getting the idx we returned 5179b44bfc5SAlexander Leidinger * in the set_thread_area() syscall 5189b44bfc5SAlexander Leidinger */ 5191a26db0aSAlexander Leidinger if (idx != 6 && idx != 3) { 5201a26db0aSAlexander Leidinger printf(LMSG("resetting idx!")); 5211a26db0aSAlexander Leidinger idx = 3; 5221a26db0aSAlexander Leidinger } 5239b44bfc5SAlexander Leidinger 5249b44bfc5SAlexander Leidinger /* this doesnt happen in practice */ 5259b44bfc5SAlexander Leidinger if (idx == 6) { 5269b44bfc5SAlexander Leidinger /* we might copy out the entry_number as 3 */ 5279b44bfc5SAlexander Leidinger info.entry_number = 3; 5289b44bfc5SAlexander Leidinger error = copyout(&info, (void *) td->td_frame->tf_esi, sizeof(struct l_user_desc)); 5299b44bfc5SAlexander Leidinger if (error) 5301a26db0aSAlexander Leidinger printf(LMSG("copyout failed!")); 5319b44bfc5SAlexander Leidinger } 5329b44bfc5SAlexander Leidinger 533a4e3bad7SJung-uk Kim a[0] = LINUX_LDT_entry_a(&info); 534a4e3bad7SJung-uk Kim a[1] = LINUX_LDT_entry_b(&info); 5359b44bfc5SAlexander Leidinger 5369b44bfc5SAlexander Leidinger memcpy(&sd, &a, sizeof(a)); 5379b44bfc5SAlexander Leidinger #ifdef DEBUG 5389b44bfc5SAlexander Leidinger if (ldebug(clone)) 
5399b44bfc5SAlexander Leidinger printf("Segment created in clone with CLONE_SETTLS: lobase: %x, hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, def32: %i, gran: %i\n", sd.sd_lobase, 5409b44bfc5SAlexander Leidinger sd.sd_hibase, 5419b44bfc5SAlexander Leidinger sd.sd_lolimit, 5429b44bfc5SAlexander Leidinger sd.sd_hilimit, 5439b44bfc5SAlexander Leidinger sd.sd_type, 5449b44bfc5SAlexander Leidinger sd.sd_dpl, 5459b44bfc5SAlexander Leidinger sd.sd_p, 5469b44bfc5SAlexander Leidinger sd.sd_xx, 5479b44bfc5SAlexander Leidinger sd.sd_def32, 5489b44bfc5SAlexander Leidinger sd.sd_gran); 5499b44bfc5SAlexander Leidinger #endif 5509b44bfc5SAlexander Leidinger 5519b44bfc5SAlexander Leidinger /* set %gs */ 5529b44bfc5SAlexander Leidinger td2->td_pcb->pcb_gsd = sd; 553a6c5f813SAlexander Leidinger td2->td_pcb->pcb_gs = GSEL(GUGS_SEL, SEL_UPL); 5549b44bfc5SAlexander Leidinger } 5551a26db0aSAlexander Leidinger } 5569b44bfc5SAlexander Leidinger 557146aad74SMarcel Moolenaar #ifdef DEBUG 55824593369SJonathan Lemon if (ldebug(clone)) 5599eb78fcfSJohn Baldwin printf(LMSG("clone: successful rfork to %ld, stack %p sig = %d"), 5609eb78fcfSJohn Baldwin (long)p2->p_pid, args->stack, exit_signal); 561146aad74SMarcel Moolenaar #endif 562a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_VFORK) { 563d071f504SAlexander Leidinger PROC_LOCK(p2); 564d071f504SAlexander Leidinger p2->p_flag |= P_PPWAIT; 565d071f504SAlexander Leidinger PROC_UNLOCK(p2); 566d071f504SAlexander Leidinger } 567146aad74SMarcel Moolenaar 5686ad0e7c5SJohn Baldwin /* 5696ad0e7c5SJohn Baldwin * Make this runnable after we are finished with it. 
5706ad0e7c5SJohn Baldwin */ 5716ad0e7c5SJohn Baldwin mtx_lock_spin(&sched_lock); 5729eb78fcfSJohn Baldwin TD_SET_CAN_RUN(td2); 573f0393f06SJeff Roberson sched_add(td2, SRQ_BORING); 5746ad0e7c5SJohn Baldwin mtx_unlock_spin(&sched_lock); 5756ad0e7c5SJohn Baldwin 5769eb78fcfSJohn Baldwin td->td_retval[0] = p2->p_pid; 5779eb78fcfSJohn Baldwin td->td_retval[1] = 0; 5780a62e035SAlexander Leidinger 579a4e3bad7SJung-uk Kim if (args->flags & LINUX_CLONE_VFORK) { 5800a62e035SAlexander Leidinger /* wait for the children to exit, ie. emulate vfork */ 5810a62e035SAlexander Leidinger PROC_LOCK(p2); 5820a62e035SAlexander Leidinger while (p2->p_flag & P_PPWAIT) 5830a62e035SAlexander Leidinger msleep(td->td_proc, &p2->p_mtx, PWAIT, "ppwait", 0); 5840a62e035SAlexander Leidinger PROC_UNLOCK(p2); 5850a62e035SAlexander Leidinger } 5860a62e035SAlexander Leidinger 5879eb78fcfSJohn Baldwin return (0); 588146aad74SMarcel Moolenaar } 589146aad74SMarcel Moolenaar 590146aad74SMarcel Moolenaar #define STACK_SIZE (2 * 1024 * 1024) 591146aad74SMarcel Moolenaar #define GUARD_SIZE (4 * PAGE_SIZE) 592146aad74SMarcel Moolenaar 5933ad9c842SMaxim Sobolev static int linux_mmap_common(struct thread *, struct l_mmap_argv *); 5943ad9c842SMaxim Sobolev 5953ad9c842SMaxim Sobolev int 5963ad9c842SMaxim Sobolev linux_mmap2(struct thread *td, struct linux_mmap2_args *args) 5973ad9c842SMaxim Sobolev { 5983ad9c842SMaxim Sobolev struct l_mmap_argv linux_args; 5993ad9c842SMaxim Sobolev 6003ad9c842SMaxim Sobolev #ifdef DEBUG 6013ad9c842SMaxim Sobolev if (ldebug(mmap2)) 6023ad9c842SMaxim Sobolev printf(ARGS(mmap2, "%p, %d, %d, 0x%08x, %d, %d"), 6033ad9c842SMaxim Sobolev (void *)args->addr, args->len, args->prot, 6043ad9c842SMaxim Sobolev args->flags, args->fd, args->pgoff); 6053ad9c842SMaxim Sobolev #endif 6063ad9c842SMaxim Sobolev 60710931a46SJung-uk Kim linux_args.addr = args->addr; 6083ad9c842SMaxim Sobolev linux_args.len = args->len; 6093ad9c842SMaxim Sobolev linux_args.prot = args->prot; 6103ad9c842SMaxim 
Sobolev linux_args.flags = args->flags; 6113ad9c842SMaxim Sobolev linux_args.fd = args->fd; 61210931a46SJung-uk Kim linux_args.pgoff = args->pgoff * PAGE_SIZE; 6133ad9c842SMaxim Sobolev 6143ad9c842SMaxim Sobolev return (linux_mmap_common(td, &linux_args)); 6153ad9c842SMaxim Sobolev } 6163ad9c842SMaxim Sobolev 617146aad74SMarcel Moolenaar int 618b40ce416SJulian Elischer linux_mmap(struct thread *td, struct linux_mmap_args *args) 619146aad74SMarcel Moolenaar { 6203ad9c842SMaxim Sobolev int error; 6213ad9c842SMaxim Sobolev struct l_mmap_argv linux_args; 6223ad9c842SMaxim Sobolev 6234b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &linux_args, sizeof(linux_args)); 6243ad9c842SMaxim Sobolev if (error) 6253ad9c842SMaxim Sobolev return (error); 6263ad9c842SMaxim Sobolev 6273ad9c842SMaxim Sobolev #ifdef DEBUG 6283ad9c842SMaxim Sobolev if (ldebug(mmap)) 6293ad9c842SMaxim Sobolev printf(ARGS(mmap, "%p, %d, %d, 0x%08x, %d, %d"), 630b45bbfc3SBruce Evans (void *)linux_args.addr, linux_args.len, linux_args.prot, 63110931a46SJung-uk Kim linux_args.flags, linux_args.fd, linux_args.pgoff); 6323ad9c842SMaxim Sobolev #endif 6333ad9c842SMaxim Sobolev 6343ad9c842SMaxim Sobolev return (linux_mmap_common(td, &linux_args)); 6353ad9c842SMaxim Sobolev } 6363ad9c842SMaxim Sobolev 6373ad9c842SMaxim Sobolev static int 6383ad9c842SMaxim Sobolev linux_mmap_common(struct thread *td, struct l_mmap_argv *linux_args) 6393ad9c842SMaxim Sobolev { 640b40ce416SJulian Elischer struct proc *p = td->td_proc; 641146aad74SMarcel Moolenaar struct mmap_args /* { 642146aad74SMarcel Moolenaar caddr_t addr; 643146aad74SMarcel Moolenaar size_t len; 644146aad74SMarcel Moolenaar int prot; 645146aad74SMarcel Moolenaar int flags; 646146aad74SMarcel Moolenaar int fd; 647146aad74SMarcel Moolenaar long pad; 648146aad74SMarcel Moolenaar off_t pos; 649146aad74SMarcel Moolenaar } */ bsd_args; 65091d631e5SMatthew N. 
Dodd int error; 651a312f6a3SAlexander Leidinger struct file *fp; 652146aad74SMarcel Moolenaar 65391d631e5SMatthew N. Dodd error = 0; 654146aad74SMarcel Moolenaar bsd_args.flags = 0; 655a312f6a3SAlexander Leidinger fp = NULL; 656a312f6a3SAlexander Leidinger 657a312f6a3SAlexander Leidinger /* 658a312f6a3SAlexander Leidinger * Linux mmap(2): 659a312f6a3SAlexander Leidinger * You must specify exactly one of MAP_SHARED and MAP_PRIVATE 660a312f6a3SAlexander Leidinger */ 661a312f6a3SAlexander Leidinger if (! ((linux_args->flags & LINUX_MAP_SHARED) ^ 662a312f6a3SAlexander Leidinger (linux_args->flags & LINUX_MAP_PRIVATE))) 6636dc4e810SAlexander Leidinger return (EINVAL); 664a312f6a3SAlexander Leidinger 6653ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_SHARED) 666146aad74SMarcel Moolenaar bsd_args.flags |= MAP_SHARED; 6673ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_PRIVATE) 668146aad74SMarcel Moolenaar bsd_args.flags |= MAP_PRIVATE; 6693ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_FIXED) 670146aad74SMarcel Moolenaar bsd_args.flags |= MAP_FIXED; 6713ad9c842SMaxim Sobolev if (linux_args->flags & LINUX_MAP_ANON) 672146aad74SMarcel Moolenaar bsd_args.flags |= MAP_ANON; 6730cc3ac8bSMatthew Dillon else 6740cc3ac8bSMatthew Dillon bsd_args.flags |= MAP_NOSYNC; 67510931a46SJung-uk Kim if (linux_args->flags & LINUX_MAP_GROWSDOWN) 676146aad74SMarcel Moolenaar bsd_args.flags |= MAP_STACK; 677146aad74SMarcel Moolenaar 6780eef2f8aSAlexander Leidinger /* 67910931a46SJung-uk Kim * PROT_READ, PROT_WRITE, or PROT_EXEC implies PROT_READ and PROT_EXEC 68010931a46SJung-uk Kim * on Linux/i386. We do this to ensure maximum compatibility. 68110931a46SJung-uk Kim * Linux/ia64 does the same in i386 emulation mode. 
68210931a46SJung-uk Kim */ 68310931a46SJung-uk Kim bsd_args.prot = linux_args->prot; 68410931a46SJung-uk Kim if (bsd_args.prot & (PROT_READ | PROT_WRITE | PROT_EXEC)) 68510931a46SJung-uk Kim bsd_args.prot |= PROT_READ | PROT_EXEC; 68610931a46SJung-uk Kim 6876a5964d3SJung-uk Kim /* Linux does not check file descriptor when MAP_ANONYMOUS is set. */ 6886a5964d3SJung-uk Kim bsd_args.fd = (bsd_args.flags & MAP_ANON) ? -1 : linux_args->fd; 6896a5964d3SJung-uk Kim if (bsd_args.fd != -1) { 69010931a46SJung-uk Kim /* 69110931a46SJung-uk Kim * Linux follows Solaris mmap(2) description: 69210931a46SJung-uk Kim * The file descriptor fildes is opened with 69310931a46SJung-uk Kim * read permission, regardless of the 69410931a46SJung-uk Kim * protection options specified. 69510931a46SJung-uk Kim */ 69610931a46SJung-uk Kim 6976a5964d3SJung-uk Kim if ((error = fget(td, bsd_args.fd, &fp)) != 0) 69810931a46SJung-uk Kim return (error); 69910931a46SJung-uk Kim if (fp->f_type != DTYPE_VNODE) { 70010931a46SJung-uk Kim fdrop(fp, td); 70110931a46SJung-uk Kim return (EINVAL); 70210931a46SJung-uk Kim } 70310931a46SJung-uk Kim 70410931a46SJung-uk Kim /* Linux mmap() just fails for O_WRONLY files */ 70510931a46SJung-uk Kim if (!(fp->f_flag & FREAD)) { 70610931a46SJung-uk Kim fdrop(fp, td); 70710931a46SJung-uk Kim return (EACCES); 70810931a46SJung-uk Kim } 70910931a46SJung-uk Kim 71010931a46SJung-uk Kim fdrop(fp, td); 71110931a46SJung-uk Kim } 71210931a46SJung-uk Kim 71310931a46SJung-uk Kim if (linux_args->flags & LINUX_MAP_GROWSDOWN) { 71410931a46SJung-uk Kim /* 7150eef2f8aSAlexander Leidinger * The linux MAP_GROWSDOWN option does not limit auto 716146aad74SMarcel Moolenaar * growth of the region. Linux mmap with this option 717146aad74SMarcel Moolenaar * takes as addr the inital BOS, and as len, the initial 718146aad74SMarcel Moolenaar * region size. It can then grow down from addr without 719146aad74SMarcel Moolenaar * limit. 
However, linux threads has an implicit internal 720146aad74SMarcel Moolenaar * limit to stack size of STACK_SIZE. Its just not 721146aad74SMarcel Moolenaar * enforced explicitly in linux. But, here we impose 722146aad74SMarcel Moolenaar * a limit of (STACK_SIZE - GUARD_SIZE) on the stack 723146aad74SMarcel Moolenaar * region, since we can do this with our mmap. 724146aad74SMarcel Moolenaar * 725146aad74SMarcel Moolenaar * Our mmap with MAP_STACK takes addr as the maximum 726146aad74SMarcel Moolenaar * downsize limit on BOS, and as len the max size of 727146aad74SMarcel Moolenaar * the region. It them maps the top SGROWSIZ bytes, 728802e08a3SAlexander Leidinger * and auto grows the region down, up to the limit 729146aad74SMarcel Moolenaar * in addr. 730146aad74SMarcel Moolenaar * 731146aad74SMarcel Moolenaar * If we don't use the MAP_STACK option, the effect 732146aad74SMarcel Moolenaar * of this code is to allocate a stack region of a 733146aad74SMarcel Moolenaar * fixed size of (STACK_SIZE - GUARD_SIZE). 734146aad74SMarcel Moolenaar */ 735146aad74SMarcel Moolenaar 73610931a46SJung-uk Kim if ((caddr_t)PTRIN(linux_args->addr) + linux_args->len > 73710931a46SJung-uk Kim p->p_vmspace->vm_maxsaddr) { 7380eef2f8aSAlexander Leidinger /* 7390eef2f8aSAlexander Leidinger * Some linux apps will attempt to mmap 740242fae60SAndrew Gallatin * thread stacks near the top of their 741242fae60SAndrew Gallatin * address space. If their TOS is greater 742242fae60SAndrew Gallatin * than vm_maxsaddr, vm_map_growstack() 743242fae60SAndrew Gallatin * will confuse the thread stack with the 744242fae60SAndrew Gallatin * process stack and deliver a SEGV if they 745242fae60SAndrew Gallatin * attempt to grow the thread stack past their 746242fae60SAndrew Gallatin * current stacksize rlimit. 
To avoid this, 747242fae60SAndrew Gallatin * adjust vm_maxsaddr upwards to reflect 748242fae60SAndrew Gallatin * the current stacksize rlimit rather 749242fae60SAndrew Gallatin * than the maximum possible stacksize. 750242fae60SAndrew Gallatin * It would be better to adjust the 751242fae60SAndrew Gallatin * mmap'ed region, but some apps do not check 752242fae60SAndrew Gallatin * mmap's return value. 753242fae60SAndrew Gallatin */ 75491d5354aSJohn Baldwin PROC_LOCK(p); 755242fae60SAndrew Gallatin p->p_vmspace->vm_maxsaddr = (char *)USRSTACK - 75691d5354aSJohn Baldwin lim_cur(p, RLIMIT_STACK); 75791d5354aSJohn Baldwin PROC_UNLOCK(p); 758242fae60SAndrew Gallatin } 759242fae60SAndrew Gallatin 760146aad74SMarcel Moolenaar /* This gives us our maximum stack size */ 7613ad9c842SMaxim Sobolev if (linux_args->len > STACK_SIZE - GUARD_SIZE) 7623ad9c842SMaxim Sobolev bsd_args.len = linux_args->len; 763146aad74SMarcel Moolenaar else 764146aad74SMarcel Moolenaar bsd_args.len = STACK_SIZE - GUARD_SIZE; 765146aad74SMarcel Moolenaar 7660eef2f8aSAlexander Leidinger /* 7670eef2f8aSAlexander Leidinger * This gives us a new BOS. If we're using VM_STACK, then 768146aad74SMarcel Moolenaar * mmap will just map the top SGROWSIZ bytes, and let 769146aad74SMarcel Moolenaar * the stack grow down to the limit at BOS. If we're 770146aad74SMarcel Moolenaar * not using VM_STACK we map the full stack, since we 771146aad74SMarcel Moolenaar * don't have a way to autogrow it. 
772146aad74SMarcel Moolenaar */ 77310931a46SJung-uk Kim bsd_args.addr = (caddr_t)PTRIN(linux_args->addr) - 77410931a46SJung-uk Kim bsd_args.len; 775146aad74SMarcel Moolenaar } else { 77610931a46SJung-uk Kim bsd_args.addr = (caddr_t)PTRIN(linux_args->addr); 7773ad9c842SMaxim Sobolev bsd_args.len = linux_args->len; 778146aad74SMarcel Moolenaar } 77910931a46SJung-uk Kim bsd_args.pos = linux_args->pgoff; 780146aad74SMarcel Moolenaar bsd_args.pad = 0; 781146aad74SMarcel Moolenaar 782146aad74SMarcel Moolenaar #ifdef DEBUG 78324593369SJonathan Lemon if (ldebug(mmap)) 78491d631e5SMatthew N. Dodd printf("-> %s(%p, %d, %d, 0x%08x, %d, 0x%x)\n", 78591d631e5SMatthew N. Dodd __func__, 78624593369SJonathan Lemon (void *)bsd_args.addr, bsd_args.len, bsd_args.prot, 78724593369SJonathan Lemon bsd_args.flags, bsd_args.fd, (int)bsd_args.pos); 788146aad74SMarcel Moolenaar #endif 78991d631e5SMatthew N. Dodd error = mmap(td, &bsd_args); 79091d631e5SMatthew N. Dodd #ifdef DEBUG 79191d631e5SMatthew N. Dodd if (ldebug(mmap)) 79291d631e5SMatthew N. Dodd printf("-> %s() return: 0x%x (0x%08x)\n", 79391d631e5SMatthew N. Dodd __func__, error, (u_int)td->td_retval[0]); 79491d631e5SMatthew N. Dodd #endif 79591d631e5SMatthew N. 
Dodd return (error); 796146aad74SMarcel Moolenaar } 797146aad74SMarcel Moolenaar 798146aad74SMarcel Moolenaar int 79910931a46SJung-uk Kim linux_mprotect(struct thread *td, struct linux_mprotect_args *uap) 80010931a46SJung-uk Kim { 80110931a46SJung-uk Kim struct mprotect_args bsd_args; 80210931a46SJung-uk Kim 80310931a46SJung-uk Kim bsd_args.addr = uap->addr; 80410931a46SJung-uk Kim bsd_args.len = uap->len; 80510931a46SJung-uk Kim bsd_args.prot = uap->prot; 80610931a46SJung-uk Kim if (bsd_args.prot & (PROT_READ | PROT_WRITE | PROT_EXEC)) 80710931a46SJung-uk Kim bsd_args.prot |= PROT_READ | PROT_EXEC; 80810931a46SJung-uk Kim return (mprotect(td, &bsd_args)); 80910931a46SJung-uk Kim } 81010931a46SJung-uk Kim 81110931a46SJung-uk Kim int 812b40ce416SJulian Elischer linux_pipe(struct thread *td, struct linux_pipe_args *args) 813146aad74SMarcel Moolenaar { 814146aad74SMarcel Moolenaar int error; 815146aad74SMarcel Moolenaar int reg_edx; 816146aad74SMarcel Moolenaar 817146aad74SMarcel Moolenaar #ifdef DEBUG 81824593369SJonathan Lemon if (ldebug(pipe)) 81924593369SJonathan Lemon printf(ARGS(pipe, "*")); 820146aad74SMarcel Moolenaar #endif 821146aad74SMarcel Moolenaar 822b40ce416SJulian Elischer reg_edx = td->td_retval[1]; 823b40ce416SJulian Elischer error = pipe(td, 0); 824146aad74SMarcel Moolenaar if (error) { 825b40ce416SJulian Elischer td->td_retval[1] = reg_edx; 826146aad74SMarcel Moolenaar return (error); 827146aad74SMarcel Moolenaar } 828146aad74SMarcel Moolenaar 829b40ce416SJulian Elischer error = copyout(td->td_retval, args->pipefds, 2*sizeof(int)); 830146aad74SMarcel Moolenaar if (error) { 831b40ce416SJulian Elischer td->td_retval[1] = reg_edx; 832146aad74SMarcel Moolenaar return (error); 833146aad74SMarcel Moolenaar } 834146aad74SMarcel Moolenaar 835b40ce416SJulian Elischer td->td_retval[1] = reg_edx; 836b40ce416SJulian Elischer td->td_retval[0] = 0; 837146aad74SMarcel Moolenaar return (0); 838146aad74SMarcel Moolenaar } 839146aad74SMarcel Moolenaar 
840146aad74SMarcel Moolenaar int 841b40ce416SJulian Elischer linux_ioperm(struct thread *td, struct linux_ioperm_args *args) 842146aad74SMarcel Moolenaar { 84384569dffSMaxim Sobolev int error; 84484569dffSMaxim Sobolev struct i386_ioperm_args iia; 845146aad74SMarcel Moolenaar 84684569dffSMaxim Sobolev iia.start = args->start; 84784569dffSMaxim Sobolev iia.length = args->length; 84884569dffSMaxim Sobolev iia.enable = args->enable; 84984569dffSMaxim Sobolev mtx_lock(&Giant); 85084569dffSMaxim Sobolev error = i386_set_ioperm(td, &iia); 85184569dffSMaxim Sobolev mtx_unlock(&Giant); 85284569dffSMaxim Sobolev return (error); 853146aad74SMarcel Moolenaar } 854146aad74SMarcel Moolenaar 855146aad74SMarcel Moolenaar int 856b40ce416SJulian Elischer linux_iopl(struct thread *td, struct linux_iopl_args *args) 857146aad74SMarcel Moolenaar { 858146aad74SMarcel Moolenaar int error; 859146aad74SMarcel Moolenaar 860146aad74SMarcel Moolenaar if (args->level < 0 || args->level > 3) 861146aad74SMarcel Moolenaar return (EINVAL); 862acd3428bSRobert Watson if ((error = priv_check(td, PRIV_IO)) != 0) 863146aad74SMarcel Moolenaar return (error); 864a854ed98SJohn Baldwin if ((error = securelevel_gt(td->td_ucred, 0)) != 0) 86541c42188SRobert Watson return (error); 866b40ce416SJulian Elischer td->td_frame->tf_eflags = (td->td_frame->tf_eflags & ~PSL_IOPL) | 867146aad74SMarcel Moolenaar (args->level * (PSL_IOPL / 3)); 868146aad74SMarcel Moolenaar return (0); 869146aad74SMarcel Moolenaar } 870146aad74SMarcel Moolenaar 871146aad74SMarcel Moolenaar int 872b07cd97eSMark Murray linux_modify_ldt(struct thread *td, struct linux_modify_ldt_args *uap) 873146aad74SMarcel Moolenaar { 874146aad74SMarcel Moolenaar int error; 87584569dffSMaxim Sobolev struct i386_ldt_args ldt; 8765002a60fSMarcel Moolenaar struct l_descriptor ld; 87784569dffSMaxim Sobolev union descriptor desc; 878146aad74SMarcel Moolenaar 879146aad74SMarcel Moolenaar if (uap->ptr == NULL) 880146aad74SMarcel Moolenaar return (EINVAL); 
881146aad74SMarcel Moolenaar 882146aad74SMarcel Moolenaar switch (uap->func) { 883146aad74SMarcel Moolenaar case 0x00: /* read_ldt */ 88484569dffSMaxim Sobolev ldt.start = 0; 88584569dffSMaxim Sobolev ldt.descs = uap->ptr; 88684569dffSMaxim Sobolev ldt.num = uap->bytecount / sizeof(union descriptor); 88784569dffSMaxim Sobolev mtx_lock(&Giant); 88884569dffSMaxim Sobolev error = i386_get_ldt(td, &ldt); 889b40ce416SJulian Elischer td->td_retval[0] *= sizeof(union descriptor); 89084569dffSMaxim Sobolev mtx_unlock(&Giant); 891146aad74SMarcel Moolenaar break; 892146aad74SMarcel Moolenaar case 0x01: /* write_ldt */ 893146aad74SMarcel Moolenaar case 0x11: /* write_ldt */ 894146aad74SMarcel Moolenaar if (uap->bytecount != sizeof(ld)) 895146aad74SMarcel Moolenaar return (EINVAL); 896146aad74SMarcel Moolenaar 897146aad74SMarcel Moolenaar error = copyin(uap->ptr, &ld, sizeof(ld)); 898146aad74SMarcel Moolenaar if (error) 899146aad74SMarcel Moolenaar return (error); 900146aad74SMarcel Moolenaar 90184569dffSMaxim Sobolev ldt.start = ld.entry_number; 90284569dffSMaxim Sobolev ldt.descs = &desc; 90384569dffSMaxim Sobolev ldt.num = 1; 90484569dffSMaxim Sobolev desc.sd.sd_lolimit = (ld.limit & 0x0000ffff); 90584569dffSMaxim Sobolev desc.sd.sd_hilimit = (ld.limit & 0x000f0000) >> 16; 90684569dffSMaxim Sobolev desc.sd.sd_lobase = (ld.base_addr & 0x00ffffff); 90784569dffSMaxim Sobolev desc.sd.sd_hibase = (ld.base_addr & 0xff000000) >> 24; 90884569dffSMaxim Sobolev desc.sd.sd_type = SDT_MEMRO | ((ld.read_exec_only ^ 1) << 1) | 909146aad74SMarcel Moolenaar (ld.contents << 2); 91084569dffSMaxim Sobolev desc.sd.sd_dpl = 3; 91184569dffSMaxim Sobolev desc.sd.sd_p = (ld.seg_not_present ^ 1); 91284569dffSMaxim Sobolev desc.sd.sd_xx = 0; 91384569dffSMaxim Sobolev desc.sd.sd_def32 = ld.seg_32bit; 91484569dffSMaxim Sobolev desc.sd.sd_gran = ld.limit_in_pages; 91584569dffSMaxim Sobolev mtx_lock(&Giant); 91684569dffSMaxim Sobolev error = i386_set_ldt(td, &ldt, &desc); 91784569dffSMaxim Sobolev 
mtx_unlock(&Giant); 918146aad74SMarcel Moolenaar break; 919146aad74SMarcel Moolenaar default: 920146aad74SMarcel Moolenaar error = EINVAL; 921146aad74SMarcel Moolenaar break; 922146aad74SMarcel Moolenaar } 923146aad74SMarcel Moolenaar 924146aad74SMarcel Moolenaar if (error == EOPNOTSUPP) { 925146aad74SMarcel Moolenaar printf("linux: modify_ldt needs kernel option USER_LDT\n"); 926146aad74SMarcel Moolenaar error = ENOSYS; 927146aad74SMarcel Moolenaar } 928146aad74SMarcel Moolenaar 929146aad74SMarcel Moolenaar return (error); 930146aad74SMarcel Moolenaar } 931146aad74SMarcel Moolenaar 932146aad74SMarcel Moolenaar int 933b40ce416SJulian Elischer linux_sigaction(struct thread *td, struct linux_sigaction_args *args) 934146aad74SMarcel Moolenaar { 9355002a60fSMarcel Moolenaar l_osigaction_t osa; 9365002a60fSMarcel Moolenaar l_sigaction_t act, oact; 937146aad74SMarcel Moolenaar int error; 938146aad74SMarcel Moolenaar 939146aad74SMarcel Moolenaar #ifdef DEBUG 94024593369SJonathan Lemon if (ldebug(sigaction)) 94124593369SJonathan Lemon printf(ARGS(sigaction, "%d, %p, %p"), 942146aad74SMarcel Moolenaar args->sig, (void *)args->nsa, (void *)args->osa); 943146aad74SMarcel Moolenaar #endif 944146aad74SMarcel Moolenaar 945146aad74SMarcel Moolenaar if (args->nsa != NULL) { 9464b7ef73dSDag-Erling Smørgrav error = copyin(args->nsa, &osa, sizeof(l_osigaction_t)); 947146aad74SMarcel Moolenaar if (error) 948146aad74SMarcel Moolenaar return (error); 949146aad74SMarcel Moolenaar act.lsa_handler = osa.lsa_handler; 950146aad74SMarcel Moolenaar act.lsa_flags = osa.lsa_flags; 951146aad74SMarcel Moolenaar act.lsa_restorer = osa.lsa_restorer; 952146aad74SMarcel Moolenaar LINUX_SIGEMPTYSET(act.lsa_mask); 953146aad74SMarcel Moolenaar act.lsa_mask.__bits[0] = osa.lsa_mask; 954146aad74SMarcel Moolenaar } 955146aad74SMarcel Moolenaar 956b40ce416SJulian Elischer error = linux_do_sigaction(td, args->sig, args->nsa ? &act : NULL, 957146aad74SMarcel Moolenaar args->osa ? 
&oact : NULL); 958146aad74SMarcel Moolenaar 959146aad74SMarcel Moolenaar if (args->osa != NULL && !error) { 960146aad74SMarcel Moolenaar osa.lsa_handler = oact.lsa_handler; 961146aad74SMarcel Moolenaar osa.lsa_flags = oact.lsa_flags; 962146aad74SMarcel Moolenaar osa.lsa_restorer = oact.lsa_restorer; 963146aad74SMarcel Moolenaar osa.lsa_mask = oact.lsa_mask.__bits[0]; 9644b7ef73dSDag-Erling Smørgrav error = copyout(&osa, args->osa, sizeof(l_osigaction_t)); 965146aad74SMarcel Moolenaar } 966146aad74SMarcel Moolenaar 967146aad74SMarcel Moolenaar return (error); 968146aad74SMarcel Moolenaar } 969146aad74SMarcel Moolenaar 970146aad74SMarcel Moolenaar /* 971146aad74SMarcel Moolenaar * Linux has two extra args, restart and oldmask. We dont use these, 972146aad74SMarcel Moolenaar * but it seems that "restart" is actually a context pointer that 973146aad74SMarcel Moolenaar * enables the signal to happen with a different register set. 974146aad74SMarcel Moolenaar */ 975146aad74SMarcel Moolenaar int 976b40ce416SJulian Elischer linux_sigsuspend(struct thread *td, struct linux_sigsuspend_args *args) 977146aad74SMarcel Moolenaar { 978206a5d3aSIan Dowse sigset_t sigmask; 9795002a60fSMarcel Moolenaar l_sigset_t mask; 980146aad74SMarcel Moolenaar 981146aad74SMarcel Moolenaar #ifdef DEBUG 98224593369SJonathan Lemon if (ldebug(sigsuspend)) 98324593369SJonathan Lemon printf(ARGS(sigsuspend, "%08lx"), (unsigned long)args->mask); 984146aad74SMarcel Moolenaar #endif 985146aad74SMarcel Moolenaar 986146aad74SMarcel Moolenaar LINUX_SIGEMPTYSET(mask); 987146aad74SMarcel Moolenaar mask.__bits[0] = args->mask; 988206a5d3aSIan Dowse linux_to_bsd_sigset(&mask, &sigmask); 989206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 990146aad74SMarcel Moolenaar } 991146aad74SMarcel Moolenaar 992146aad74SMarcel Moolenaar int 993b07cd97eSMark Murray linux_rt_sigsuspend(struct thread *td, struct linux_rt_sigsuspend_args *uap) 994146aad74SMarcel Moolenaar { 9955002a60fSMarcel Moolenaar l_sigset_t 
lmask; 996206a5d3aSIan Dowse sigset_t sigmask; 997146aad74SMarcel Moolenaar int error; 998146aad74SMarcel Moolenaar 999146aad74SMarcel Moolenaar #ifdef DEBUG 100024593369SJonathan Lemon if (ldebug(rt_sigsuspend)) 100124593369SJonathan Lemon printf(ARGS(rt_sigsuspend, "%p, %d"), 1002146aad74SMarcel Moolenaar (void *)uap->newset, uap->sigsetsize); 1003146aad74SMarcel Moolenaar #endif 1004146aad74SMarcel Moolenaar 10055002a60fSMarcel Moolenaar if (uap->sigsetsize != sizeof(l_sigset_t)) 1006146aad74SMarcel Moolenaar return (EINVAL); 1007146aad74SMarcel Moolenaar 10085002a60fSMarcel Moolenaar error = copyin(uap->newset, &lmask, sizeof(l_sigset_t)); 1009146aad74SMarcel Moolenaar if (error) 1010146aad74SMarcel Moolenaar return (error); 1011146aad74SMarcel Moolenaar 1012206a5d3aSIan Dowse linux_to_bsd_sigset(&lmask, &sigmask); 1013206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 1014146aad74SMarcel Moolenaar } 1015146aad74SMarcel Moolenaar 1016146aad74SMarcel Moolenaar int 1017b40ce416SJulian Elischer linux_pause(struct thread *td, struct linux_pause_args *args) 1018146aad74SMarcel Moolenaar { 1019b40ce416SJulian Elischer struct proc *p = td->td_proc; 1020206a5d3aSIan Dowse sigset_t sigmask; 1021146aad74SMarcel Moolenaar 1022146aad74SMarcel Moolenaar #ifdef DEBUG 102324593369SJonathan Lemon if (ldebug(pause)) 102424593369SJonathan Lemon printf(ARGS(pause, "")); 1025146aad74SMarcel Moolenaar #endif 1026146aad74SMarcel Moolenaar 1027fdfdfb78SJohn Baldwin PROC_LOCK(p); 10284093529dSJeff Roberson sigmask = td->td_sigmask; 1029fdfdfb78SJohn Baldwin PROC_UNLOCK(p); 1030206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 1031146aad74SMarcel Moolenaar } 1032146aad74SMarcel Moolenaar 1033146aad74SMarcel Moolenaar int 1034b40ce416SJulian Elischer linux_sigaltstack(struct thread *td, struct linux_sigaltstack_args *uap) 1035146aad74SMarcel Moolenaar { 1036206a5d3aSIan Dowse stack_t ss, oss; 10375002a60fSMarcel Moolenaar l_stack_t lss; 1038146aad74SMarcel Moolenaar int 
error; 1039146aad74SMarcel Moolenaar 1040146aad74SMarcel Moolenaar #ifdef DEBUG 104124593369SJonathan Lemon if (ldebug(sigaltstack)) 104224593369SJonathan Lemon printf(ARGS(sigaltstack, "%p, %p"), uap->uss, uap->uoss); 1043146aad74SMarcel Moolenaar #endif 1044146aad74SMarcel Moolenaar 1045206a5d3aSIan Dowse if (uap->uss != NULL) { 10465002a60fSMarcel Moolenaar error = copyin(uap->uss, &lss, sizeof(l_stack_t)); 1047146aad74SMarcel Moolenaar if (error) 1048146aad74SMarcel Moolenaar return (error); 1049146aad74SMarcel Moolenaar 1050206a5d3aSIan Dowse ss.ss_sp = lss.ss_sp; 1051206a5d3aSIan Dowse ss.ss_size = lss.ss_size; 1052206a5d3aSIan Dowse ss.ss_flags = linux_to_bsd_sigaltstack(lss.ss_flags); 1053931a7258SAndrew Gallatin } 1054ef36ad69SJohn Baldwin error = kern_sigaltstack(td, (uap->uss != NULL) ? &ss : NULL, 1055ef36ad69SJohn Baldwin (uap->uoss != NULL) ? &oss : NULL); 1056206a5d3aSIan Dowse if (!error && uap->uoss != NULL) { 1057206a5d3aSIan Dowse lss.ss_sp = oss.ss_sp; 1058206a5d3aSIan Dowse lss.ss_size = oss.ss_size; 1059206a5d3aSIan Dowse lss.ss_flags = bsd_to_linux_sigaltstack(oss.ss_flags); 10605002a60fSMarcel Moolenaar error = copyout(&lss, uap->uoss, sizeof(l_stack_t)); 1061146aad74SMarcel Moolenaar } 1062146aad74SMarcel Moolenaar 1063146aad74SMarcel Moolenaar return (error); 1064146aad74SMarcel Moolenaar } 10653ad9c842SMaxim Sobolev 10663ad9c842SMaxim Sobolev int 10673ad9c842SMaxim Sobolev linux_ftruncate64(struct thread *td, struct linux_ftruncate64_args *args) 10683ad9c842SMaxim Sobolev { 10693ad9c842SMaxim Sobolev struct ftruncate_args sa; 10703ad9c842SMaxim Sobolev 10713ad9c842SMaxim Sobolev #ifdef DEBUG 10723ad9c842SMaxim Sobolev if (ldebug(ftruncate64)) 1073b45bbfc3SBruce Evans printf(ARGS(ftruncate64, "%u, %jd"), args->fd, 1074b45bbfc3SBruce Evans (intmax_t)args->length); 10753ad9c842SMaxim Sobolev #endif 10763ad9c842SMaxim Sobolev 10773ad9c842SMaxim Sobolev sa.fd = args->fd; 10783ad9c842SMaxim Sobolev sa.pad = 0; 10793ad9c842SMaxim Sobolev 
sa.length = args->length; 10803ad9c842SMaxim Sobolev return ftruncate(td, &sa); 10813ad9c842SMaxim Sobolev } 10821bc85c0dSDoug Rabson 10831bc85c0dSDoug Rabson int 10841bc85c0dSDoug Rabson linux_set_thread_area(struct thread *td, struct linux_set_thread_area_args *args) 10851bc85c0dSDoug Rabson { 10869b44bfc5SAlexander Leidinger struct l_user_desc info; 10879b44bfc5SAlexander Leidinger int error; 10889b44bfc5SAlexander Leidinger int idx; 10899b44bfc5SAlexander Leidinger int a[2]; 10909b44bfc5SAlexander Leidinger struct segment_descriptor sd; 10919b44bfc5SAlexander Leidinger 10929b44bfc5SAlexander Leidinger error = copyin(args->desc, &info, sizeof(struct l_user_desc)); 10939b44bfc5SAlexander Leidinger if (error) 10949b44bfc5SAlexander Leidinger return (error); 10959b44bfc5SAlexander Leidinger 10969b44bfc5SAlexander Leidinger #ifdef DEBUG 10979b44bfc5SAlexander Leidinger if (ldebug(set_thread_area)) 10989b44bfc5SAlexander Leidinger printf(ARGS(set_thread_area, "%i, %x, %x, %i, %i, %i, %i, %i, %i\n"), 10999b44bfc5SAlexander Leidinger info.entry_number, 11009b44bfc5SAlexander Leidinger info.base_addr, 11019b44bfc5SAlexander Leidinger info.limit, 11029b44bfc5SAlexander Leidinger info.seg_32bit, 11039b44bfc5SAlexander Leidinger info.contents, 11049b44bfc5SAlexander Leidinger info.read_exec_only, 11059b44bfc5SAlexander Leidinger info.limit_in_pages, 11069b44bfc5SAlexander Leidinger info.seg_not_present, 11079b44bfc5SAlexander Leidinger info.useable); 11089b44bfc5SAlexander Leidinger #endif 11099b44bfc5SAlexander Leidinger 11109b44bfc5SAlexander Leidinger idx = info.entry_number; 11110eef2f8aSAlexander Leidinger /* 1112802e08a3SAlexander Leidinger * Semantics of linux version: every thread in the system has array of 1113802e08a3SAlexander Leidinger * 3 tls descriptors. 1st is GLIBC TLS, 2nd is WINE, 3rd unknown. 
This 1114802e08a3SAlexander Leidinger * syscall loads one of the selected tls decriptors with a value and 1115802e08a3SAlexander Leidinger * also loads GDT descriptors 6, 7 and 8 with the content of the 1116802e08a3SAlexander Leidinger * per-thread descriptors. 11179b44bfc5SAlexander Leidinger * 1118802e08a3SAlexander Leidinger * Semantics of fbsd version: I think we can ignore that linux has 3 1119802e08a3SAlexander Leidinger * per-thread descriptors and use just the 1st one. The tls_array[] 1120802e08a3SAlexander Leidinger * is used only in set/get-thread_area() syscalls and for loading the 1121802e08a3SAlexander Leidinger * GDT descriptors. In fbsd we use just one GDT descriptor for TLS so 1122802e08a3SAlexander Leidinger * we will load just one. 1123802e08a3SAlexander Leidinger * 1124802e08a3SAlexander Leidinger * XXX: this doesn't work when a user space process tries to use more 1125802e08a3SAlexander Leidinger * than 1 TLS segment. Comment in the linux sources says wine might do 1126802e08a3SAlexander Leidinger * this. 11271bc85c0dSDoug Rabson */ 11289b44bfc5SAlexander Leidinger 11290eef2f8aSAlexander Leidinger /* 11300eef2f8aSAlexander Leidinger * we support just GLIBC TLS now 11319b44bfc5SAlexander Leidinger * we should let 3 proceed as well because we use this segment so 11329b44bfc5SAlexander Leidinger * if code does two subsequent calls it should succeed 11339b44bfc5SAlexander Leidinger */ 11349b44bfc5SAlexander Leidinger if (idx != 6 && idx != -1 && idx != 3) 11359b44bfc5SAlexander Leidinger return (EINVAL); 11369b44bfc5SAlexander Leidinger 11370eef2f8aSAlexander Leidinger /* 11380eef2f8aSAlexander Leidinger * we have to copy out the GDT entry we use 11399b44bfc5SAlexander Leidinger * FreeBSD uses GDT entry #3 for storing %gs so load that 1140802e08a3SAlexander Leidinger * 1141802e08a3SAlexander Leidinger * XXX: what if a user space program doesn't check this value and tries 11429b44bfc5SAlexander Leidinger * to use 6, 7 or 8? 
11439b44bfc5SAlexander Leidinger */ 11449b44bfc5SAlexander Leidinger idx = info.entry_number = 3; 11459b44bfc5SAlexander Leidinger error = copyout(&info, args->desc, sizeof(struct l_user_desc)); 11469b44bfc5SAlexander Leidinger if (error) 11479b44bfc5SAlexander Leidinger return (error); 11489b44bfc5SAlexander Leidinger 1149a4e3bad7SJung-uk Kim if (LINUX_LDT_empty(&info)) { 11509b44bfc5SAlexander Leidinger a[0] = 0; 11519b44bfc5SAlexander Leidinger a[1] = 0; 11529b44bfc5SAlexander Leidinger } else { 1153a4e3bad7SJung-uk Kim a[0] = LINUX_LDT_entry_a(&info); 1154a4e3bad7SJung-uk Kim a[1] = LINUX_LDT_entry_b(&info); 11551bc85c0dSDoug Rabson } 11561bc85c0dSDoug Rabson 11579b44bfc5SAlexander Leidinger memcpy(&sd, &a, sizeof(a)); 11589b44bfc5SAlexander Leidinger #ifdef DEBUG 11599b44bfc5SAlexander Leidinger if (ldebug(set_thread_area)) 11609b44bfc5SAlexander Leidinger printf("Segment created in set_thread_area: lobase: %x, hibase: %x, lolimit: %x, hilimit: %x, type: %i, dpl: %i, p: %i, xx: %i, def32: %i, gran: %i\n", sd.sd_lobase, 11619b44bfc5SAlexander Leidinger sd.sd_hibase, 11629b44bfc5SAlexander Leidinger sd.sd_lolimit, 11639b44bfc5SAlexander Leidinger sd.sd_hilimit, 11649b44bfc5SAlexander Leidinger sd.sd_type, 11659b44bfc5SAlexander Leidinger sd.sd_dpl, 11669b44bfc5SAlexander Leidinger sd.sd_p, 11679b44bfc5SAlexander Leidinger sd.sd_xx, 11689b44bfc5SAlexander Leidinger sd.sd_def32, 11699b44bfc5SAlexander Leidinger sd.sd_gran); 11709b44bfc5SAlexander Leidinger #endif 11711bc85c0dSDoug Rabson 11729b44bfc5SAlexander Leidinger /* this is taken from i386 version of cpu_set_user_tls() */ 11739b44bfc5SAlexander Leidinger critical_enter(); 11749b44bfc5SAlexander Leidinger /* set %gs */ 11759b44bfc5SAlexander Leidinger td->td_pcb->pcb_gsd = sd; 11769b44bfc5SAlexander Leidinger PCPU_GET(fsgs_gdt)[1] = sd; 11779b44bfc5SAlexander Leidinger load_gs(GSEL(GUGS_SEL, SEL_UPL)); 11789b44bfc5SAlexander Leidinger critical_exit(); 11799b44bfc5SAlexander Leidinger 11801bc85c0dSDoug Rabson 
return (0); 11811bc85c0dSDoug Rabson } 11821bc85c0dSDoug Rabson 11831bc85c0dSDoug Rabson int 11849b44bfc5SAlexander Leidinger linux_get_thread_area(struct thread *td, struct linux_get_thread_area_args *args) 11851bc85c0dSDoug Rabson { 11861bc85c0dSDoug Rabson 11879b44bfc5SAlexander Leidinger struct l_user_desc info; 11889b44bfc5SAlexander Leidinger int error; 11899b44bfc5SAlexander Leidinger int idx; 11909b44bfc5SAlexander Leidinger struct l_desc_struct desc; 11919b44bfc5SAlexander Leidinger struct segment_descriptor sd; 11929b44bfc5SAlexander Leidinger 11939b44bfc5SAlexander Leidinger #ifdef DEBUG 11949b44bfc5SAlexander Leidinger if (ldebug(get_thread_area)) 11959b44bfc5SAlexander Leidinger printf(ARGS(get_thread_area, "%p"), args->desc); 11969b44bfc5SAlexander Leidinger #endif 11979b44bfc5SAlexander Leidinger 11989b44bfc5SAlexander Leidinger error = copyin(args->desc, &info, sizeof(struct l_user_desc)); 11999b44bfc5SAlexander Leidinger if (error) 12009b44bfc5SAlexander Leidinger return (error); 12019b44bfc5SAlexander Leidinger 12029b44bfc5SAlexander Leidinger idx = info.entry_number; 12039b44bfc5SAlexander Leidinger /* XXX: I am not sure if we want 3 to be allowed too. 
*/ 12049b44bfc5SAlexander Leidinger if (idx != 6 && idx != 3) 12059b44bfc5SAlexander Leidinger return (EINVAL); 12069b44bfc5SAlexander Leidinger 12079b44bfc5SAlexander Leidinger idx = 3; 12089b44bfc5SAlexander Leidinger 12099b44bfc5SAlexander Leidinger memset(&info, 0, sizeof(info)); 12109b44bfc5SAlexander Leidinger 12119b44bfc5SAlexander Leidinger sd = PCPU_GET(fsgs_gdt)[1]; 12129b44bfc5SAlexander Leidinger 12139b44bfc5SAlexander Leidinger memcpy(&desc, &sd, sizeof(desc)); 12149b44bfc5SAlexander Leidinger 12159b44bfc5SAlexander Leidinger info.entry_number = idx; 1216a4e3bad7SJung-uk Kim info.base_addr = LINUX_GET_BASE(&desc); 1217a4e3bad7SJung-uk Kim info.limit = LINUX_GET_LIMIT(&desc); 1218a4e3bad7SJung-uk Kim info.seg_32bit = LINUX_GET_32BIT(&desc); 1219a4e3bad7SJung-uk Kim info.contents = LINUX_GET_CONTENTS(&desc); 1220a4e3bad7SJung-uk Kim info.read_exec_only = !LINUX_GET_WRITABLE(&desc); 1221a4e3bad7SJung-uk Kim info.limit_in_pages = LINUX_GET_LIMIT_PAGES(&desc); 1222a4e3bad7SJung-uk Kim info.seg_not_present = !LINUX_GET_PRESENT(&desc); 1223a4e3bad7SJung-uk Kim info.useable = LINUX_GET_USEABLE(&desc); 12249b44bfc5SAlexander Leidinger 12259b44bfc5SAlexander Leidinger error = copyout(&info, args->desc, sizeof(struct l_user_desc)); 12269b44bfc5SAlexander Leidinger if (error) 12279b44bfc5SAlexander Leidinger return (EFAULT); 12289b44bfc5SAlexander Leidinger 12299b44bfc5SAlexander Leidinger return (0); 12309b44bfc5SAlexander Leidinger } 12319b44bfc5SAlexander Leidinger 12329b44bfc5SAlexander Leidinger /* copied from kern/kern_time.c */ 12339b44bfc5SAlexander Leidinger int 12349b44bfc5SAlexander Leidinger linux_timer_create(struct thread *td, struct linux_timer_create_args *args) 12359b44bfc5SAlexander Leidinger { 12369b44bfc5SAlexander Leidinger return ktimer_create(td, (struct ktimer_create_args *) args); 12379b44bfc5SAlexander Leidinger } 12389b44bfc5SAlexander Leidinger 12399b44bfc5SAlexander Leidinger int 12409b44bfc5SAlexander Leidinger 
linux_timer_settime(struct thread *td, struct linux_timer_settime_args *args)
{
	/*
	 * Hand the request to ktimer_settime(), viewing the Linux argument
	 * block as the native one.
	 * NOTE(review): the cast presumes both structures share a layout -
	 * confirm against the syscall argument definitions.
	 */
	struct ktimer_settime_args *kargs = (struct ktimer_settime_args *)args;

	return (ktimer_settime(td, kargs));
}

/*
 * Forward to ktimer_gettime() and return its result unchanged.
 * NOTE(review): relies on the Linux and native argument structures being
 * layout-compatible - confirm.
 */
int
linux_timer_gettime(struct thread *td, struct linux_timer_gettime_args *args)
{
	struct ktimer_gettime_args *kargs = (struct ktimer_gettime_args *)args;

	return (ktimer_gettime(td, kargs));
}

/*
 * Forward to ktimer_getoverrun() and return its result unchanged.
 * NOTE(review): relies on the Linux and native argument structures being
 * layout-compatible - confirm.
 */
int
linux_timer_getoverrun(struct thread *td,
    struct linux_timer_getoverrun_args *args)
{
	struct ktimer_getoverrun_args *kargs =
	    (struct ktimer_getoverrun_args *)args;

	return (ktimer_getoverrun(td, kargs));
}

/*
 * Forward to ktimer_delete() and return its result unchanged.
 * NOTE(review): relies on the Linux and native argument structures being
 * layout-compatible - confirm.
 */
int
linux_timer_delete(struct thread *td, struct linux_timer_delete_args *args)
{
	struct ktimer_delete_args *kargs = (struct ktimer_delete_args *)args;

	return (ktimer_delete(td, kargs));
}

/*
 * Message queue wrappers.  Each one forwards to the matching kmq_*() call
 * when P1003_1B_MQUEUE is defined at compile time and returns ENOSYS
 * otherwise.
 *
 * XXX: this won't work with a module - convert it
 */
int
linux_mq_open(struct thread *td, struct linux_mq_open_args *args)
{
#ifndef P1003_1B_MQUEUE
	return (ENOSYS);
#else
	/* NOTE(review): cast presumes identical argument layout - confirm. */
	struct kmq_open_args *kargs = (struct kmq_open_args *)args;

	return (kmq_open(td, kargs));
#endif
}

/*
 * Forward to kmq_unlink(); ENOSYS when P1003_1B_MQUEUE is not defined.
 */
int
linux_mq_unlink(struct thread *td, struct linux_mq_unlink_args *args)
{
#ifndef P1003_1B_MQUEUE
	return (ENOSYS);
#else
	/* NOTE(review): cast presumes identical argument layout - confirm. */
	struct kmq_unlink_args *kargs = (struct kmq_unlink_args *)args;

	return (kmq_unlink(td, kargs));
#endif
}

/*
 * Forward to kmq_timedsend(); ENOSYS when P1003_1B_MQUEUE is not defined.
 */
int
linux_mq_timedsend(struct thread *td, struct linux_mq_timedsend_args *args)
{
#ifndef P1003_1B_MQUEUE
	return (ENOSYS);
#else
	/* NOTE(review): cast presumes identical argument layout - confirm. */
	struct kmq_timedsend_args *kargs = (struct kmq_timedsend_args *)args;

	return (kmq_timedsend(td, kargs));
#endif
}

/*
 * Forward to kmq_timedreceive(); ENOSYS when P1003_1B_MQUEUE is not
 * defined.
 */
int
linux_mq_timedreceive(struct thread *td,
    struct linux_mq_timedreceive_args *args)
{
#ifndef P1003_1B_MQUEUE
	return (ENOSYS);
#else
	/* NOTE(review): cast presumes identical argument layout - confirm. */
	struct kmq_timedreceive_args *kargs =
	    (struct kmq_timedreceive_args *)args;

	return (kmq_timedreceive(td, kargs));
#endif
}

/*
 * Forward to kmq_notify(); ENOSYS when P1003_1B_MQUEUE is not defined.
 */
int
linux_mq_notify(struct thread *td, struct linux_mq_notify_args *args)
{
#ifndef P1003_1B_MQUEUE
	return (ENOSYS);
#else
	/* NOTE(review): cast presumes identical argument layout - confirm. */
	struct kmq_notify_args *kargs = (struct kmq_notify_args *)args;

	return (kmq_notify(td, kargs));
#endif
}

/*
 * Forward to kmq_setattr(); ENOSYS when P1003_1B_MQUEUE is not defined.
 */
int
linux_mq_getsetattr(struct thread *td, struct linux_mq_getsetattr_args *args)
{
#ifndef P1003_1B_MQUEUE
	return (ENOSYS);
#else
	/* NOTE(review): cast presumes identical argument layout - confirm. */
	struct kmq_setattr_args *kargs = (struct kmq_setattr_args *)args;

	return (kmq_setattr(td, kargs));
#endif
}