1146aad74SMarcel Moolenaar /*- 24d846d26SWarner Losh * SPDX-License-Identifier: BSD-2-Clause 383ef78beSPedro F. Giffuni * 4146aad74SMarcel Moolenaar * Copyright (c) 2000 Marcel Moolenaar 5146aad74SMarcel Moolenaar * All rights reserved. 6146aad74SMarcel Moolenaar * 7146aad74SMarcel Moolenaar * Redistribution and use in source and binary forms, with or without 8146aad74SMarcel Moolenaar * modification, are permitted provided that the following conditions 9146aad74SMarcel Moolenaar * are met: 10146aad74SMarcel Moolenaar * 1. Redistributions of source code must retain the above copyright 110ba1b365SEd Maste * notice, this list of conditions and the following disclaimer. 12146aad74SMarcel Moolenaar * 2. Redistributions in binary form must reproduce the above copyright 13146aad74SMarcel Moolenaar * notice, this list of conditions and the following disclaimer in the 14146aad74SMarcel Moolenaar * documentation and/or other materials provided with the distribution. 15146aad74SMarcel Moolenaar * 160ba1b365SEd Maste * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 170ba1b365SEd Maste * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 180ba1b365SEd Maste * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 190ba1b365SEd Maste * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 200ba1b365SEd Maste * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 210ba1b365SEd Maste * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 220ba1b365SEd Maste * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 230ba1b365SEd Maste * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 240ba1b365SEd Maste * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 250ba1b365SEd Maste * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 260ba1b365SEd Maste * SUCH DAMAGE. 27146aad74SMarcel Moolenaar */ 28146aad74SMarcel Moolenaar 29f4a512a5SDmitry Chagin #include "opt_posix.h" 30f4a512a5SDmitry Chagin 31146aad74SMarcel Moolenaar #include <sys/param.h> 3250c85a32SDmitry Chagin #include <sys/imgact_aout.h> 33a312f6a3SAlexander Leidinger #include <sys/fcntl.h> 347106ca0dSJohn Baldwin #include <sys/lock.h> 35610ecfe0SMaxim Sobolev #include <sys/malloc.h> 36fb919e4dSMark Murray #include <sys/mman.h> 37fb919e4dSMark Murray #include <sys/mutex.h> 3850c85a32SDmitry Chagin #include <sys/namei.h> 39acd3428bSRobert Watson #include <sys/priv.h> 40fb919e4dSMark Murray #include <sys/proc.h> 4150c85a32SDmitry Chagin #include <sys/racct.h> 42242fae60SAndrew Gallatin #include <sys/resource.h> 43242fae60SAndrew Gallatin #include <sys/resourcevar.h> 44206a5d3aSIan Dowse #include <sys/syscallsubr.h> 45fb919e4dSMark Murray #include <sys/sysproto.h> 4650c85a32SDmitry Chagin #include <sys/vnode.h> 47146aad74SMarcel Moolenaar 4850c85a32SDmitry Chagin #include <security/audit/audit.h> 4950c85a32SDmitry Chagin #include <security/mac/mac_framework.h> 5050c85a32SDmitry Chagin 51146aad74SMarcel Moolenaar #include <machine/frame.h> 52f4a512a5SDmitry Chagin #include <machine/pcb.h> /* needed for pcb definition in linux_set_thread_area */ 53146aad74SMarcel Moolenaar #include <machine/psl.h> 54146aad74SMarcel Moolenaar #include <machine/segments.h> 55146aad74SMarcel Moolenaar #include <machine/sysarch.h> 56146aad74SMarcel Moolenaar 57242fae60SAndrew Gallatin #include <vm/pmap.h> 58c0aa0e2cSEd Maste #include <vm/vm.h> 5950c85a32SDmitry Chagin #include <vm/vm_extern.h> 60f4a512a5SDmitry Chagin #include <vm/vm_kern.h> 61242fae60SAndrew Gallatin #include <vm/vm_map.h> 6250c85a32SDmitry Chagin #include <vm/vm_param.h> 63242fae60SAndrew Gallatin 64cc1b0f7dSDmitry Chagin #include <x86/reg.h> 65cc1b0f7dSDmitry Chagin 66146aad74SMarcel Moolenaar #include <i386/linux/linux.h> 67ebea8660SMarcel Moolenaar #include <i386/linux/linux_proto.h> 68c0aa0e2cSEd Maste #include <compat/linux/linux_emul.h> 690a4b664aSDmitry Chagin #include <compat/linux/linux_fork.h> 70146aad74SMarcel Moolenaar #include <compat/linux/linux_ipc.h> 71adc7ece0SDmitry Chagin #include <compat/linux/linux_misc.h> 7297d06da6SDmitry Chagin #include <compat/linux/linux_mmap.h> 73146aad74SMarcel Moolenaar #include <compat/linux/linux_signal.h> 74146aad74SMarcel Moolenaar #include <compat/linux/linux_util.h> 759b44bfc5SAlexander Leidinger 769b44bfc5SAlexander Leidinger 775002a60fSMarcel Moolenaar struct l_descriptor { 785002a60fSMarcel Moolenaar l_uint entry_number; 795002a60fSMarcel Moolenaar l_ulong base_addr; 805002a60fSMarcel Moolenaar l_uint limit; 815002a60fSMarcel Moolenaar l_uint seg_32bit:1; 825002a60fSMarcel Moolenaar l_uint contents:2; 835002a60fSMarcel Moolenaar l_uint read_exec_only:1; 845002a60fSMarcel Moolenaar l_uint limit_in_pages:1; 855002a60fSMarcel Moolenaar l_uint seg_not_present:1; 865002a60fSMarcel Moolenaar l_uint useable:1; 87146aad74SMarcel Moolenaar }; 88146aad74SMarcel Moolenaar 895002a60fSMarcel Moolenaar struct l_old_select_argv { 905002a60fSMarcel Moolenaar l_int nfds; 915002a60fSMarcel Moolenaar l_fd_set *readfds; 925002a60fSMarcel Moolenaar l_fd_set *writefds; 935002a60fSMarcel Moolenaar l_fd_set *exceptfds; 945002a60fSMarcel Moolenaar struct l_timeval *timeout; 95146aad74SMarcel Moolenaar }; 96146aad74SMarcel Moolenaar 975002a60fSMarcel Moolenaar struct l_ipc_kludge { 985002a60fSMarcel Moolenaar struct l_msgbuf *msgp; 995002a60fSMarcel Moolenaar l_long msgtyp; 1005002a60fSMarcel Moolenaar }; 1015002a60fSMarcel Moolenaar 102146aad74SMarcel Moolenaar int 103b40ce416SJulian Elischer linux_ipc(struct thread *td, struct linux_ipc_args *args) 104146aad74SMarcel Moolenaar { 1055002a60fSMarcel Moolenaar 1065002a60fSMarcel Moolenaar switch (args->what & 0xFFFF) { 1075002a60fSMarcel Moolenaar case LINUX_SEMOP: { 1085002a60fSMarcel Moolenaar 109f48a6887SDmitry Chagin return (kern_semop(td, args->arg1, PTRIN(args->ptr), 110f48a6887SDmitry Chagin args->arg2, NULL)); 1115002a60fSMarcel Moolenaar } 1125002a60fSMarcel Moolenaar case LINUX_SEMGET: { 1135002a60fSMarcel Moolenaar struct linux_semget_args a; 1145002a60fSMarcel Moolenaar 1155002a60fSMarcel Moolenaar a.key = args->arg1; 1165002a60fSMarcel Moolenaar a.nsems = args->arg2; 1175002a60fSMarcel Moolenaar a.semflg = args->arg3; 118b40ce416SJulian Elischer return (linux_semget(td, &a)); 1195002a60fSMarcel Moolenaar } 1205002a60fSMarcel Moolenaar case LINUX_SEMCTL: { 1215002a60fSMarcel Moolenaar struct linux_semctl_args a; 1225002a60fSMarcel Moolenaar int error; 1235002a60fSMarcel Moolenaar 1245002a60fSMarcel Moolenaar a.semid = args->arg1; 1255002a60fSMarcel Moolenaar a.semnum = args->arg2; 1265002a60fSMarcel Moolenaar a.cmd = args->arg3; 1277dabf89bSDmitry Chagin error = copyin(PTRIN(args->ptr), &a.arg, sizeof(a.arg)); 1285002a60fSMarcel Moolenaar if (error) 1295002a60fSMarcel Moolenaar return (error); 130b40ce416SJulian Elischer return (linux_semctl(td, &a)); 1315002a60fSMarcel Moolenaar } 1323245a2ecSDmitry Chagin case LINUX_SEMTIMEDOP: { 1333245a2ecSDmitry Chagin struct linux_semtimedop_args a; 1343245a2ecSDmitry Chagin 1353245a2ecSDmitry Chagin a.semid = args->arg1; 1363245a2ecSDmitry Chagin a.tsops = PTRIN(args->ptr); 1373245a2ecSDmitry Chagin a.nsops = args->arg2; 1383245a2ecSDmitry Chagin a.timeout = PTRIN(args->arg5); 1393245a2ecSDmitry Chagin return (linux_semtimedop(td, &a)); 1403245a2ecSDmitry Chagin } 1415002a60fSMarcel Moolenaar case LINUX_MSGSND: { 1425002a60fSMarcel Moolenaar struct linux_msgsnd_args a; 1435002a60fSMarcel Moolenaar 1445002a60fSMarcel Moolenaar a.msqid = args->arg1; 1457dabf89bSDmitry Chagin a.msgp = PTRIN(args->ptr); 1465002a60fSMarcel Moolenaar a.msgsz = args->arg2; 1475002a60fSMarcel Moolenaar a.msgflg = args->arg3; 148b40ce416SJulian Elischer return (linux_msgsnd(td, &a)); 1495002a60fSMarcel Moolenaar } 1505002a60fSMarcel Moolenaar case LINUX_MSGRCV: { 1515002a60fSMarcel Moolenaar struct linux_msgrcv_args a; 1525002a60fSMarcel Moolenaar 1535002a60fSMarcel Moolenaar a.msqid = args->arg1; 1545002a60fSMarcel Moolenaar a.msgsz = args->arg2; 1555002a60fSMarcel Moolenaar a.msgflg = args->arg3; 1565002a60fSMarcel Moolenaar if ((args->what >> 16) == 0) { 1575002a60fSMarcel Moolenaar struct l_ipc_kludge tmp; 1585002a60fSMarcel Moolenaar int error; 1595002a60fSMarcel Moolenaar 1607dabf89bSDmitry Chagin if (args->ptr == 0) 1615002a60fSMarcel Moolenaar return (EINVAL); 1627dabf89bSDmitry Chagin error = copyin(PTRIN(args->ptr), &tmp, sizeof(tmp)); 1635002a60fSMarcel Moolenaar if (error) 1645002a60fSMarcel Moolenaar return (error); 1657dabf89bSDmitry Chagin a.msgp = PTRIN(tmp.msgp); 1665002a60fSMarcel Moolenaar a.msgtyp = tmp.msgtyp; 1675002a60fSMarcel Moolenaar } else { 1687dabf89bSDmitry Chagin a.msgp = PTRIN(args->ptr); 1695002a60fSMarcel Moolenaar a.msgtyp = args->arg5; 1705002a60fSMarcel Moolenaar } 171b40ce416SJulian Elischer return (linux_msgrcv(td, &a)); 1725002a60fSMarcel Moolenaar } 1735002a60fSMarcel Moolenaar case LINUX_MSGGET: { 1745002a60fSMarcel Moolenaar struct linux_msgget_args a; 1755002a60fSMarcel Moolenaar 1765002a60fSMarcel Moolenaar a.key = args->arg1; 1775002a60fSMarcel Moolenaar a.msgflg = args->arg2; 178b40ce416SJulian Elischer return (linux_msgget(td, &a)); 1795002a60fSMarcel Moolenaar } 1805002a60fSMarcel Moolenaar case LINUX_MSGCTL: { 1815002a60fSMarcel Moolenaar struct linux_msgctl_args a; 1825002a60fSMarcel Moolenaar 1835002a60fSMarcel Moolenaar a.msqid = args->arg1; 1845002a60fSMarcel Moolenaar a.cmd = args->arg2; 1857dabf89bSDmitry Chagin a.buf = PTRIN(args->ptr); 186b40ce416SJulian Elischer return (linux_msgctl(td, &a)); 1875002a60fSMarcel Moolenaar } 1885002a60fSMarcel Moolenaar case LINUX_SHMAT: { 1895002a60fSMarcel Moolenaar struct linux_shmat_args a; 1907dabf89bSDmitry Chagin l_uintptr_t addr; 1917dabf89bSDmitry Chagin int error; 1925002a60fSMarcel Moolenaar 1935002a60fSMarcel Moolenaar a.shmid = args->arg1; 1947dabf89bSDmitry Chagin a.shmaddr = PTRIN(args->ptr); 1955002a60fSMarcel Moolenaar a.shmflg = args->arg2; 1967dabf89bSDmitry Chagin error = linux_shmat(td, &a); 1977dabf89bSDmitry Chagin if (error != 0) 1987dabf89bSDmitry Chagin return (error); 1997dabf89bSDmitry Chagin addr = td->td_retval[0]; 2007dabf89bSDmitry Chagin error = copyout(&addr, PTRIN(args->arg3), sizeof(addr)); 2017dabf89bSDmitry Chagin td->td_retval[0] = 0; 2027dabf89bSDmitry Chagin return (error); 2035002a60fSMarcel Moolenaar } 2045002a60fSMarcel Moolenaar case LINUX_SHMDT: { 2055002a60fSMarcel Moolenaar struct linux_shmdt_args a; 2065002a60fSMarcel Moolenaar 2077dabf89bSDmitry Chagin a.shmaddr = PTRIN(args->ptr); 208b40ce416SJulian Elischer return (linux_shmdt(td, &a)); 2095002a60fSMarcel Moolenaar } 2105002a60fSMarcel Moolenaar case LINUX_SHMGET: { 2115002a60fSMarcel Moolenaar struct linux_shmget_args a; 2125002a60fSMarcel Moolenaar 2135002a60fSMarcel Moolenaar a.key = args->arg1; 2145002a60fSMarcel Moolenaar a.size = args->arg2; 2155002a60fSMarcel Moolenaar a.shmflg = args->arg3; 216b40ce416SJulian Elischer return (linux_shmget(td, &a)); 2175002a60fSMarcel Moolenaar } 2185002a60fSMarcel Moolenaar case LINUX_SHMCTL: { 2195002a60fSMarcel Moolenaar struct linux_shmctl_args a; 2205002a60fSMarcel Moolenaar 2215002a60fSMarcel Moolenaar a.shmid = args->arg1; 2225002a60fSMarcel Moolenaar a.cmd = args->arg2; 2237dabf89bSDmitry Chagin a.buf = PTRIN(args->ptr); 224b40ce416SJulian Elischer return (linux_shmctl(td, &a)); 2255002a60fSMarcel Moolenaar } 2265002a60fSMarcel Moolenaar default: 2275002a60fSMarcel Moolenaar break; 228146aad74SMarcel Moolenaar } 229146aad74SMarcel Moolenaar 2305002a60fSMarcel Moolenaar return (EINVAL); 231146aad74SMarcel Moolenaar } 232146aad74SMarcel Moolenaar 233146aad74SMarcel Moolenaar int 234b40ce416SJulian Elischer linux_old_select(struct thread *td, struct linux_old_select_args *args) 235146aad74SMarcel Moolenaar { 2365002a60fSMarcel Moolenaar struct l_old_select_argv linux_args; 2375002a60fSMarcel Moolenaar struct linux_select_args newsel; 238146aad74SMarcel Moolenaar int error; 239146aad74SMarcel Moolenaar 2404b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &linux_args, sizeof(linux_args)); 241146aad74SMarcel Moolenaar if (error) 242146aad74SMarcel Moolenaar return (error); 243146aad74SMarcel Moolenaar 244146aad74SMarcel Moolenaar newsel.nfds = linux_args.nfds; 245146aad74SMarcel Moolenaar newsel.readfds = linux_args.readfds; 246146aad74SMarcel Moolenaar newsel.writefds = linux_args.writefds; 247146aad74SMarcel Moolenaar newsel.exceptfds = linux_args.exceptfds; 248146aad74SMarcel Moolenaar newsel.timeout = linux_args.timeout; 249b40ce416SJulian Elischer return (linux_select(td, &newsel)); 250146aad74SMarcel Moolenaar } 251146aad74SMarcel Moolenaar 252146aad74SMarcel Moolenaar int 2532c7660baSDmitry Chagin linux_set_cloned_tls(struct thread *td, void *desc) 2542c7660baSDmitry Chagin { 2552c7660baSDmitry Chagin struct segment_descriptor sd; 2562c7660baSDmitry Chagin struct l_user_desc info; 2572c7660baSDmitry Chagin int idx, error; 2582c7660baSDmitry Chagin int a[2]; 2592c7660baSDmitry Chagin 2602c7660baSDmitry Chagin error = copyin(desc, &info, sizeof(struct l_user_desc)); 2612c7660baSDmitry Chagin if (error) { 262c5156c77SDmitry Chagin linux_msg(td, "set_cloned_tls copyin failed!"); 2632c7660baSDmitry Chagin } else { 2642c7660baSDmitry Chagin idx = info.entry_number; 2652c7660baSDmitry Chagin 2662c7660baSDmitry Chagin /* 2672c7660baSDmitry Chagin * looks like we're getting the idx we returned 2682c7660baSDmitry Chagin * in the set_thread_area() syscall 2692c7660baSDmitry Chagin */ 2702c7660baSDmitry Chagin if (idx != 6 && idx != 3) { 271c5156c77SDmitry Chagin linux_msg(td, "set_cloned_tls resetting idx!"); 2722c7660baSDmitry Chagin idx = 3; 2732c7660baSDmitry Chagin } 2742c7660baSDmitry Chagin 2752c7660baSDmitry Chagin /* this doesnt happen in practice */ 2762c7660baSDmitry Chagin if (idx == 6) { 2772c7660baSDmitry Chagin /* we might copy out the entry_number as 3 */ 2782c7660baSDmitry Chagin info.entry_number = 3; 2792c7660baSDmitry Chagin error = copyout(&info, desc, sizeof(struct l_user_desc)); 2802c7660baSDmitry Chagin if (error) 281c5156c77SDmitry Chagin linux_msg(td, "set_cloned_tls copyout failed!"); 2822c7660baSDmitry Chagin } 2832c7660baSDmitry Chagin 2842c7660baSDmitry Chagin a[0] = LINUX_LDT_entry_a(&info); 2852c7660baSDmitry Chagin a[1] = LINUX_LDT_entry_b(&info); 2862c7660baSDmitry Chagin 2872c7660baSDmitry Chagin memcpy(&sd, &a, sizeof(a)); 2882c7660baSDmitry Chagin /* set %gs */ 2892c7660baSDmitry Chagin td->td_pcb->pcb_gsd = sd; 2902c7660baSDmitry Chagin td->td_pcb->pcb_gs = GSEL(GUGS_SEL, SEL_UPL); 2912c7660baSDmitry Chagin } 2922c7660baSDmitry Chagin 2932c7660baSDmitry Chagin return (error); 2942c7660baSDmitry Chagin } 2952c7660baSDmitry Chagin 296146aad74SMarcel Moolenaar int 2973b57ddb0SJohn Baldwin linux_set_upcall(struct thread *td, register_t stack) 298c8d6845eSDmitry Chagin { 299c8d6845eSDmitry Chagin 30081338031SDmitry Chagin if (stack) 301c8d6845eSDmitry Chagin td->td_frame->tf_esp = stack; 302c8d6845eSDmitry Chagin 30381338031SDmitry Chagin /* 30481338031SDmitry Chagin * The newly created Linux thread returns 30581338031SDmitry Chagin * to the user space by the same path that a parent do. 30681338031SDmitry Chagin */ 30781338031SDmitry Chagin td->td_frame->tf_eax = 0; 308c8d6845eSDmitry Chagin return (0); 309c8d6845eSDmitry Chagin } 310c8d6845eSDmitry Chagin 3113ad9c842SMaxim Sobolev int 312b40ce416SJulian Elischer linux_mmap(struct thread *td, struct linux_mmap_args *args) 313146aad74SMarcel Moolenaar { 3143ad9c842SMaxim Sobolev int error; 3153ad9c842SMaxim Sobolev struct l_mmap_argv linux_args; 3163ad9c842SMaxim Sobolev 3174b7ef73dSDag-Erling Smørgrav error = copyin(args->ptr, &linux_args, sizeof(linux_args)); 3183ad9c842SMaxim Sobolev if (error) 3193ad9c842SMaxim Sobolev return (error); 3203ad9c842SMaxim Sobolev 321f12c0348SJohn Baldwin return (linux_mmap_common(td, linux_args.addr, linux_args.len, 322f12c0348SJohn Baldwin linux_args.prot, linux_args.flags, linux_args.fd, 323f12c0348SJohn Baldwin (uint32_t)linux_args.pgoff)); 3243ad9c842SMaxim Sobolev } 3253ad9c842SMaxim Sobolev 326146aad74SMarcel Moolenaar int 327b40ce416SJulian Elischer linux_ioperm(struct thread *td, struct linux_ioperm_args *args) 328146aad74SMarcel Moolenaar { 32984569dffSMaxim Sobolev int error; 33084569dffSMaxim Sobolev struct i386_ioperm_args iia; 331146aad74SMarcel Moolenaar 33284569dffSMaxim Sobolev iia.start = args->start; 33384569dffSMaxim Sobolev iia.length = args->length; 33484569dffSMaxim Sobolev iia.enable = args->enable; 33584569dffSMaxim Sobolev error = i386_set_ioperm(td, &iia); 33684569dffSMaxim Sobolev return (error); 337146aad74SMarcel Moolenaar } 338146aad74SMarcel Moolenaar 339146aad74SMarcel Moolenaar int 340b40ce416SJulian Elischer linux_iopl(struct thread *td, struct linux_iopl_args *args) 341146aad74SMarcel Moolenaar { 342146aad74SMarcel Moolenaar int error; 343146aad74SMarcel Moolenaar 344146aad74SMarcel Moolenaar if (args->level < 0 || args->level > 3) 345146aad74SMarcel Moolenaar return (EINVAL); 346acd3428bSRobert Watson if ((error = priv_check(td, PRIV_IO)) != 0) 347146aad74SMarcel Moolenaar return (error); 348a854ed98SJohn Baldwin if ((error = securelevel_gt(td->td_ucred, 0)) != 0) 34941c42188SRobert Watson return (error); 350b40ce416SJulian Elischer td->td_frame->tf_eflags = (td->td_frame->tf_eflags & ~PSL_IOPL) | 351146aad74SMarcel Moolenaar (args->level * (PSL_IOPL / 3)); 352146aad74SMarcel Moolenaar return (0); 353146aad74SMarcel Moolenaar } 354146aad74SMarcel Moolenaar 355146aad74SMarcel Moolenaar int 356b07cd97eSMark Murray linux_modify_ldt(struct thread *td, struct linux_modify_ldt_args *uap) 357146aad74SMarcel Moolenaar { 358146aad74SMarcel Moolenaar int error; 35984569dffSMaxim Sobolev struct i386_ldt_args ldt; 3605002a60fSMarcel Moolenaar struct l_descriptor ld; 36184569dffSMaxim Sobolev union descriptor desc; 3626259969dSKonstantin Belousov int size, written; 363146aad74SMarcel Moolenaar 364146aad74SMarcel Moolenaar switch (uap->func) { 365146aad74SMarcel Moolenaar case 0x00: /* read_ldt */ 36684569dffSMaxim Sobolev ldt.start = 0; 36784569dffSMaxim Sobolev ldt.descs = uap->ptr; 36884569dffSMaxim Sobolev ldt.num = uap->bytecount / sizeof(union descriptor); 36984569dffSMaxim Sobolev error = i386_get_ldt(td, &ldt); 370b40ce416SJulian Elischer td->td_retval[0] *= sizeof(union descriptor); 371146aad74SMarcel Moolenaar break; 3726259969dSKonstantin Belousov case 0x02: /* read_default_ldt = 0 */ 3736259969dSKonstantin Belousov size = 5*sizeof(struct l_desc_struct); 3746259969dSKonstantin Belousov if (size > uap->bytecount) 3756259969dSKonstantin Belousov size = uap->bytecount; 3766259969dSKonstantin Belousov for (written = error = 0; written < size && error == 0; written++) 3776259969dSKonstantin Belousov error = subyte((char *)uap->ptr + written, 0); 3786259969dSKonstantin Belousov td->td_retval[0] = written; 3796259969dSKonstantin Belousov break; 380146aad74SMarcel Moolenaar case 0x01: /* write_ldt */ 381146aad74SMarcel Moolenaar case 0x11: /* write_ldt */ 382146aad74SMarcel Moolenaar if (uap->bytecount != sizeof(ld)) 383146aad74SMarcel Moolenaar return (EINVAL); 384146aad74SMarcel Moolenaar 385146aad74SMarcel Moolenaar error = copyin(uap->ptr, &ld, sizeof(ld)); 386146aad74SMarcel Moolenaar if (error) 387146aad74SMarcel Moolenaar return (error); 388146aad74SMarcel Moolenaar 38984569dffSMaxim Sobolev ldt.start = ld.entry_number; 39084569dffSMaxim Sobolev ldt.descs = &desc; 39184569dffSMaxim Sobolev ldt.num = 1; 39284569dffSMaxim Sobolev desc.sd.sd_lolimit = (ld.limit & 0x0000ffff); 39384569dffSMaxim Sobolev desc.sd.sd_hilimit = (ld.limit & 0x000f0000) >> 16; 39484569dffSMaxim Sobolev desc.sd.sd_lobase = (ld.base_addr & 0x00ffffff); 39584569dffSMaxim Sobolev desc.sd.sd_hibase = (ld.base_addr & 0xff000000) >> 24; 39684569dffSMaxim Sobolev desc.sd.sd_type = SDT_MEMRO | ((ld.read_exec_only ^ 1) << 1) | 397146aad74SMarcel Moolenaar (ld.contents << 2); 39884569dffSMaxim Sobolev desc.sd.sd_dpl = 3; 39984569dffSMaxim Sobolev desc.sd.sd_p = (ld.seg_not_present ^ 1); 40084569dffSMaxim Sobolev desc.sd.sd_xx = 0; 40184569dffSMaxim Sobolev desc.sd.sd_def32 = ld.seg_32bit; 40284569dffSMaxim Sobolev desc.sd.sd_gran = ld.limit_in_pages; 40384569dffSMaxim Sobolev error = i386_set_ldt(td, &ldt, &desc); 404146aad74SMarcel Moolenaar break; 405146aad74SMarcel Moolenaar default: 4067c020cbbSJohn Baldwin error = ENOSYS; 407146aad74SMarcel Moolenaar break; 408146aad74SMarcel Moolenaar } 409146aad74SMarcel Moolenaar 410146aad74SMarcel Moolenaar if (error == EOPNOTSUPP) { 411c5156c77SDmitry Chagin linux_msg(td, "modify_ldt needs kernel option USER_LDT"); 412146aad74SMarcel Moolenaar error = ENOSYS; 413146aad74SMarcel Moolenaar } 414146aad74SMarcel Moolenaar 415146aad74SMarcel Moolenaar return (error); 416146aad74SMarcel Moolenaar } 417146aad74SMarcel Moolenaar 418146aad74SMarcel Moolenaar int 419b40ce416SJulian Elischer linux_sigaction(struct thread *td, struct linux_sigaction_args *args) 420146aad74SMarcel Moolenaar { 4215002a60fSMarcel Moolenaar l_osigaction_t osa; 4225002a60fSMarcel Moolenaar l_sigaction_t act, oact; 423146aad74SMarcel Moolenaar int error; 424146aad74SMarcel Moolenaar 425146aad74SMarcel Moolenaar if (args->nsa != NULL) { 4264b7ef73dSDag-Erling Smørgrav error = copyin(args->nsa, &osa, sizeof(l_osigaction_t)); 427146aad74SMarcel Moolenaar if (error) 428146aad74SMarcel Moolenaar return (error); 429146aad74SMarcel Moolenaar act.lsa_handler = osa.lsa_handler; 430146aad74SMarcel Moolenaar act.lsa_flags = osa.lsa_flags; 431146aad74SMarcel Moolenaar act.lsa_restorer = osa.lsa_restorer; 432146aad74SMarcel Moolenaar LINUX_SIGEMPTYSET(act.lsa_mask); 4334ab7403bSDmitry Chagin act.lsa_mask.__mask = osa.lsa_mask; 434146aad74SMarcel Moolenaar } 435146aad74SMarcel Moolenaar 436b40ce416SJulian Elischer error = linux_do_sigaction(td, args->sig, args->nsa ? &act : NULL, 437146aad74SMarcel Moolenaar args->osa ? &oact : NULL); 438146aad74SMarcel Moolenaar 439146aad74SMarcel Moolenaar if (args->osa != NULL && !error) { 440146aad74SMarcel Moolenaar osa.lsa_handler = oact.lsa_handler; 441146aad74SMarcel Moolenaar osa.lsa_flags = oact.lsa_flags; 442146aad74SMarcel Moolenaar osa.lsa_restorer = oact.lsa_restorer; 4434ab7403bSDmitry Chagin osa.lsa_mask = oact.lsa_mask.__mask; 4444b7ef73dSDag-Erling Smørgrav error = copyout(&osa, args->osa, sizeof(l_osigaction_t)); 445146aad74SMarcel Moolenaar } 446146aad74SMarcel Moolenaar 447146aad74SMarcel Moolenaar return (error); 448146aad74SMarcel Moolenaar } 449146aad74SMarcel Moolenaar 450146aad74SMarcel Moolenaar /* 451146aad74SMarcel Moolenaar * Linux has two extra args, restart and oldmask. We dont use these, 452146aad74SMarcel Moolenaar * but it seems that "restart" is actually a context pointer that 453146aad74SMarcel Moolenaar * enables the signal to happen with a different register set. 454146aad74SMarcel Moolenaar */ 455146aad74SMarcel Moolenaar int 456b40ce416SJulian Elischer linux_sigsuspend(struct thread *td, struct linux_sigsuspend_args *args) 457146aad74SMarcel Moolenaar { 458206a5d3aSIan Dowse sigset_t sigmask; 4595002a60fSMarcel Moolenaar l_sigset_t mask; 460146aad74SMarcel Moolenaar 461146aad74SMarcel Moolenaar LINUX_SIGEMPTYSET(mask); 4624ab7403bSDmitry Chagin mask.__mask = args->mask; 463206a5d3aSIan Dowse linux_to_bsd_sigset(&mask, &sigmask); 464206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 465146aad74SMarcel Moolenaar } 466146aad74SMarcel Moolenaar 467146aad74SMarcel Moolenaar int 468b40ce416SJulian Elischer linux_pause(struct thread *td, struct linux_pause_args *args) 469146aad74SMarcel Moolenaar { 470b40ce416SJulian Elischer struct proc *p = td->td_proc; 471206a5d3aSIan Dowse sigset_t sigmask; 472146aad74SMarcel Moolenaar 473fdfdfb78SJohn Baldwin PROC_LOCK(p); 4744093529dSJeff Roberson sigmask = td->td_sigmask; 475fdfdfb78SJohn Baldwin PROC_UNLOCK(p); 476206a5d3aSIan Dowse return (kern_sigsuspend(td, sigmask)); 477146aad74SMarcel Moolenaar } 478146aad74SMarcel Moolenaar 479146aad74SMarcel Moolenaar int 4801bc85c0dSDoug Rabson linux_set_thread_area(struct thread *td, struct linux_set_thread_area_args *args) 4811bc85c0dSDoug Rabson { 4829b44bfc5SAlexander Leidinger struct l_user_desc info; 4839b44bfc5SAlexander Leidinger int error; 4849b44bfc5SAlexander Leidinger int idx; 4859b44bfc5SAlexander Leidinger int a[2]; 4869b44bfc5SAlexander Leidinger struct segment_descriptor sd; 4879b44bfc5SAlexander Leidinger 4889b44bfc5SAlexander Leidinger error = copyin(args->desc, &info, sizeof(struct l_user_desc)); 4899b44bfc5SAlexander Leidinger if (error) 4909b44bfc5SAlexander Leidinger return (error); 4919b44bfc5SAlexander Leidinger 4929b44bfc5SAlexander Leidinger idx = info.entry_number; 4930eef2f8aSAlexander Leidinger /* 494eae594f7SEd Maste * Semantics of Linux version: every thread in the system has array of 495802e08a3SAlexander Leidinger * 3 tls descriptors. 1st is GLIBC TLS, 2nd is WINE, 3rd unknown. This 496*29eab3e4SGordon Bergling * syscall loads one of the selected tls descriptors with a value and 497802e08a3SAlexander Leidinger * also loads GDT descriptors 6, 7 and 8 with the content of the 498802e08a3SAlexander Leidinger * per-thread descriptors. 4999b44bfc5SAlexander Leidinger * 500eae594f7SEd Maste * Semantics of FreeBSD version: I think we can ignore that Linux has 3 501802e08a3SAlexander Leidinger * per-thread descriptors and use just the 1st one. The tls_array[] 502802e08a3SAlexander Leidinger * is used only in set/get-thread_area() syscalls and for loading the 503eae594f7SEd Maste * GDT descriptors. In FreeBSD we use just one GDT descriptor for TLS 504eae594f7SEd Maste * so we will load just one. 505802e08a3SAlexander Leidinger * 506802e08a3SAlexander Leidinger * XXX: this doesn't work when a user space process tries to use more 507eae594f7SEd Maste * than 1 TLS segment. Comment in the Linux sources says wine might do 508802e08a3SAlexander Leidinger * this. 5091bc85c0dSDoug Rabson */ 5109b44bfc5SAlexander Leidinger 5110eef2f8aSAlexander Leidinger /* 5120eef2f8aSAlexander Leidinger * we support just GLIBC TLS now 5139b44bfc5SAlexander Leidinger * we should let 3 proceed as well because we use this segment so 5149b44bfc5SAlexander Leidinger * if code does two subsequent calls it should succeed 5159b44bfc5SAlexander Leidinger */ 5169b44bfc5SAlexander Leidinger if (idx != 6 && idx != -1 && idx != 3) 5179b44bfc5SAlexander Leidinger return (EINVAL); 5189b44bfc5SAlexander Leidinger 5190eef2f8aSAlexander Leidinger /* 5200eef2f8aSAlexander Leidinger * we have to copy out the GDT entry we use 5219b44bfc5SAlexander Leidinger * FreeBSD uses GDT entry #3 for storing %gs so load that 522802e08a3SAlexander Leidinger * 523802e08a3SAlexander Leidinger * XXX: what if a user space program doesn't check this value and tries 5249b44bfc5SAlexander Leidinger * to use 6, 7 or 8? 5259b44bfc5SAlexander Leidinger */ 5269b44bfc5SAlexander Leidinger idx = info.entry_number = 3; 5279b44bfc5SAlexander Leidinger error = copyout(&info, args->desc, sizeof(struct l_user_desc)); 5289b44bfc5SAlexander Leidinger if (error) 5299b44bfc5SAlexander Leidinger return (error); 5309b44bfc5SAlexander Leidinger 531a4e3bad7SJung-uk Kim if (LINUX_LDT_empty(&info)) { 5329b44bfc5SAlexander Leidinger a[0] = 0; 5339b44bfc5SAlexander Leidinger a[1] = 0; 5349b44bfc5SAlexander Leidinger } else { 535a4e3bad7SJung-uk Kim a[0] = LINUX_LDT_entry_a(&info); 536a4e3bad7SJung-uk Kim a[1] = LINUX_LDT_entry_b(&info); 5371bc85c0dSDoug Rabson } 5381bc85c0dSDoug Rabson 5399b44bfc5SAlexander Leidinger memcpy(&sd, &a, sizeof(a)); 5409b44bfc5SAlexander Leidinger /* this is taken from i386 version of cpu_set_user_tls() */ 5419b44bfc5SAlexander Leidinger critical_enter(); 5429b44bfc5SAlexander Leidinger /* set %gs */ 5439b44bfc5SAlexander Leidinger td->td_pcb->pcb_gsd = sd; 5449b44bfc5SAlexander Leidinger PCPU_GET(fsgs_gdt)[1] = sd; 5459b44bfc5SAlexander Leidinger load_gs(GSEL(GUGS_SEL, SEL_UPL)); 5469b44bfc5SAlexander Leidinger critical_exit(); 5479b44bfc5SAlexander Leidinger 5481bc85c0dSDoug Rabson return (0); 5491bc85c0dSDoug Rabson } 5501bc85c0dSDoug Rabson 5511bc85c0dSDoug Rabson int 5529b44bfc5SAlexander Leidinger linux_get_thread_area(struct thread *td, struct linux_get_thread_area_args *args) 5531bc85c0dSDoug Rabson { 5541bc85c0dSDoug Rabson 5559b44bfc5SAlexander Leidinger struct l_user_desc info; 5569b44bfc5SAlexander Leidinger int error; 5579b44bfc5SAlexander Leidinger int idx; 5589b44bfc5SAlexander Leidinger struct l_desc_struct desc; 5599b44bfc5SAlexander Leidinger struct segment_descriptor sd; 5609b44bfc5SAlexander Leidinger 5619b44bfc5SAlexander Leidinger error = copyin(args->desc, &info, sizeof(struct l_user_desc)); 5629b44bfc5SAlexander Leidinger if (error) 5639b44bfc5SAlexander Leidinger return (error); 5649b44bfc5SAlexander Leidinger 5659b44bfc5SAlexander Leidinger idx = info.entry_number; 5669b44bfc5SAlexander Leidinger /* XXX: I am not sure if we want 3 to be allowed too. */ 5679b44bfc5SAlexander Leidinger if (idx != 6 && idx != 3) 5689b44bfc5SAlexander Leidinger return (EINVAL); 5699b44bfc5SAlexander Leidinger 5709b44bfc5SAlexander Leidinger idx = 3; 5719b44bfc5SAlexander Leidinger 5729b44bfc5SAlexander Leidinger memset(&info, 0, sizeof(info)); 5739b44bfc5SAlexander Leidinger 5749b44bfc5SAlexander Leidinger sd = PCPU_GET(fsgs_gdt)[1]; 5759b44bfc5SAlexander Leidinger 5769b44bfc5SAlexander Leidinger memcpy(&desc, &sd, sizeof(desc)); 5779b44bfc5SAlexander Leidinger 5789b44bfc5SAlexander Leidinger info.entry_number = idx; 579a4e3bad7SJung-uk Kim info.base_addr = LINUX_GET_BASE(&desc); 580a4e3bad7SJung-uk Kim info.limit = LINUX_GET_LIMIT(&desc); 581a4e3bad7SJung-uk Kim info.seg_32bit = LINUX_GET_32BIT(&desc); 582a4e3bad7SJung-uk Kim info.contents = LINUX_GET_CONTENTS(&desc); 583a4e3bad7SJung-uk Kim info.read_exec_only = !LINUX_GET_WRITABLE(&desc); 584a4e3bad7SJung-uk Kim info.limit_in_pages = LINUX_GET_LIMIT_PAGES(&desc); 585a4e3bad7SJung-uk Kim info.seg_not_present = !LINUX_GET_PRESENT(&desc); 586a4e3bad7SJung-uk Kim info.useable = LINUX_GET_USEABLE(&desc); 5879b44bfc5SAlexander Leidinger 5889b44bfc5SAlexander Leidinger error = copyout(&info, args->desc, sizeof(struct l_user_desc)); 5899b44bfc5SAlexander Leidinger if (error) 5909b44bfc5SAlexander Leidinger return (EFAULT); 5919b44bfc5SAlexander Leidinger 5929b44bfc5SAlexander Leidinger return (0); 5939b44bfc5SAlexander Leidinger } 5949b44bfc5SAlexander Leidinger 595cc1b0f7dSDmitry Chagin void 596cc1b0f7dSDmitry Chagin bsd_to_linux_regset(const struct reg *b_reg, 597cc1b0f7dSDmitry Chagin struct linux_pt_regset *l_regset) 598cc1b0f7dSDmitry Chagin { 599cc1b0f7dSDmitry Chagin 600cc1b0f7dSDmitry Chagin l_regset->ebx = b_reg->r_ebx; 601cc1b0f7dSDmitry Chagin l_regset->ecx = b_reg->r_ecx; 602cc1b0f7dSDmitry Chagin l_regset->edx = b_reg->r_edx; 603cc1b0f7dSDmitry Chagin l_regset->esi = b_reg->r_esi; 604cc1b0f7dSDmitry Chagin l_regset->edi = b_reg->r_edi; 605cc1b0f7dSDmitry Chagin l_regset->ebp = b_reg->r_ebp; 606cc1b0f7dSDmitry Chagin l_regset->eax = b_reg->r_eax; 607cc1b0f7dSDmitry Chagin l_regset->ds = b_reg->r_ds; 608cc1b0f7dSDmitry Chagin l_regset->es = b_reg->r_es; 609cc1b0f7dSDmitry Chagin l_regset->fs = b_reg->r_fs; 610cc1b0f7dSDmitry Chagin l_regset->gs = b_reg->r_gs; 611cc1b0f7dSDmitry Chagin l_regset->orig_eax = b_reg->r_eax; 612cc1b0f7dSDmitry Chagin l_regset->eip = b_reg->r_eip; 613cc1b0f7dSDmitry Chagin l_regset->cs = b_reg->r_cs; 614cc1b0f7dSDmitry Chagin l_regset->eflags = b_reg->r_eflags; 615cc1b0f7dSDmitry Chagin l_regset->esp = b_reg->r_esp; 616cc1b0f7dSDmitry Chagin l_regset->ss = b_reg->r_ss; 617cc1b0f7dSDmitry Chagin } 61850c85a32SDmitry Chagin 61950c85a32SDmitry Chagin int 62050c85a32SDmitry Chagin linux_uselib(struct thread *td, struct linux_uselib_args *args) 62150c85a32SDmitry Chagin { 62250c85a32SDmitry Chagin struct nameidata ni; 62350c85a32SDmitry Chagin struct vnode *vp; 62450c85a32SDmitry Chagin struct exec *a_out; 62550c85a32SDmitry Chagin vm_map_t map; 62650c85a32SDmitry Chagin vm_map_entry_t entry; 62750c85a32SDmitry Chagin struct vattr attr; 62850c85a32SDmitry Chagin vm_offset_t vmaddr; 62950c85a32SDmitry Chagin unsigned long file_offset; 63050c85a32SDmitry Chagin unsigned long bss_size; 63150c85a32SDmitry Chagin ssize_t aresid; 63250c85a32SDmitry Chagin int error; 63350c85a32SDmitry Chagin bool locked, opened, textset; 63450c85a32SDmitry Chagin 63550c85a32SDmitry Chagin a_out = NULL; 63650c85a32SDmitry Chagin vp = NULL; 63750c85a32SDmitry Chagin locked = false; 63850c85a32SDmitry Chagin textset = false; 63950c85a32SDmitry Chagin opened = false; 64050c85a32SDmitry Chagin 64150c85a32SDmitry Chagin NDINIT(&ni, LOOKUP, ISOPEN | FOLLOW | LOCKLEAF | AUDITVNODE1, 64250c85a32SDmitry Chagin UIO_USERSPACE, args->library); 64350c85a32SDmitry Chagin error = namei(&ni); 64450c85a32SDmitry Chagin if (error) 64550c85a32SDmitry Chagin goto cleanup; 64650c85a32SDmitry Chagin 64750c85a32SDmitry Chagin vp = ni.ni_vp; 64850c85a32SDmitry Chagin NDFREE_PNBUF(&ni); 64950c85a32SDmitry Chagin 65050c85a32SDmitry Chagin /* 65150c85a32SDmitry Chagin * From here on down, we have a locked vnode that must be unlocked. 65250c85a32SDmitry Chagin * XXX: The code below largely duplicates exec_check_permissions(). 65350c85a32SDmitry Chagin */ 65450c85a32SDmitry Chagin locked = true; 65550c85a32SDmitry Chagin 65650c85a32SDmitry Chagin /* Executable? */ 65750c85a32SDmitry Chagin error = VOP_GETATTR(vp, &attr, td->td_ucred); 65850c85a32SDmitry Chagin if (error) 65950c85a32SDmitry Chagin goto cleanup; 66050c85a32SDmitry Chagin 66150c85a32SDmitry Chagin if ((vp->v_mount->mnt_flag & MNT_NOEXEC) || 66250c85a32SDmitry Chagin ((attr.va_mode & 0111) == 0) || (attr.va_type != VREG)) { 66350c85a32SDmitry Chagin /* EACCESS is what exec(2) returns. */ 66450c85a32SDmitry Chagin error = ENOEXEC; 66550c85a32SDmitry Chagin goto cleanup; 66650c85a32SDmitry Chagin } 66750c85a32SDmitry Chagin 66850c85a32SDmitry Chagin /* Sensible size? */ 66950c85a32SDmitry Chagin if (attr.va_size == 0) { 67050c85a32SDmitry Chagin error = ENOEXEC; 67150c85a32SDmitry Chagin goto cleanup; 67250c85a32SDmitry Chagin } 67350c85a32SDmitry Chagin 67450c85a32SDmitry Chagin /* Can we access it? */ 67550c85a32SDmitry Chagin error = VOP_ACCESS(vp, VEXEC, td->td_ucred, td); 67650c85a32SDmitry Chagin if (error) 67750c85a32SDmitry Chagin goto cleanup; 67850c85a32SDmitry Chagin 67950c85a32SDmitry Chagin /* 68050c85a32SDmitry Chagin * XXX: This should use vn_open() so that it is properly authorized, 68150c85a32SDmitry Chagin * and to reduce code redundancy all over the place here. 68250c85a32SDmitry Chagin * XXX: Not really, it duplicates far more of exec_check_permissions() 68350c85a32SDmitry Chagin * than vn_open(). 68450c85a32SDmitry Chagin */ 68550c85a32SDmitry Chagin #ifdef MAC 68650c85a32SDmitry Chagin error = mac_vnode_check_open(td->td_ucred, vp, VREAD); 68750c85a32SDmitry Chagin if (error) 68850c85a32SDmitry Chagin goto cleanup; 68950c85a32SDmitry Chagin #endif 69050c85a32SDmitry Chagin error = VOP_OPEN(vp, FREAD, td->td_ucred, td, NULL); 69150c85a32SDmitry Chagin if (error) 69250c85a32SDmitry Chagin goto cleanup; 69350c85a32SDmitry Chagin opened = true; 69450c85a32SDmitry Chagin 69550c85a32SDmitry Chagin /* Pull in executable header into exec_map */ 69650c85a32SDmitry Chagin error = vm_mmap(exec_map, (vm_offset_t *)&a_out, PAGE_SIZE, 69750c85a32SDmitry Chagin VM_PROT_READ, VM_PROT_READ, 0, OBJT_VNODE, vp, 0); 69850c85a32SDmitry Chagin if (error) 69950c85a32SDmitry Chagin goto cleanup; 70050c85a32SDmitry Chagin 70150c85a32SDmitry Chagin /* Is it a Linux binary ? */ 70250c85a32SDmitry Chagin if (((a_out->a_magic >> 16) & 0xff) != 0x64) { 70350c85a32SDmitry Chagin error = ENOEXEC; 70450c85a32SDmitry Chagin goto cleanup; 70550c85a32SDmitry Chagin } 70650c85a32SDmitry Chagin 70750c85a32SDmitry Chagin /* 70850c85a32SDmitry Chagin * While we are here, we should REALLY do some more checks 70950c85a32SDmitry Chagin */ 71050c85a32SDmitry Chagin 71150c85a32SDmitry Chagin /* Set file/virtual offset based on a.out variant. */ 71250c85a32SDmitry Chagin switch ((int)(a_out->a_magic & 0xffff)) { 71350c85a32SDmitry Chagin case 0413: /* ZMAGIC */ 71450c85a32SDmitry Chagin file_offset = 1024; 71550c85a32SDmitry Chagin break; 71650c85a32SDmitry Chagin case 0314: /* QMAGIC */ 71750c85a32SDmitry Chagin file_offset = 0; 71850c85a32SDmitry Chagin break; 71950c85a32SDmitry Chagin default: 72050c85a32SDmitry Chagin error = ENOEXEC; 72150c85a32SDmitry Chagin goto cleanup; 72250c85a32SDmitry Chagin } 72350c85a32SDmitry Chagin 72450c85a32SDmitry Chagin bss_size = round_page(a_out->a_bss); 72550c85a32SDmitry Chagin 72650c85a32SDmitry Chagin /* Check various fields in header for validity/bounds. */ 72750c85a32SDmitry Chagin if (a_out->a_text & PAGE_MASK || a_out->a_data & PAGE_MASK) { 72850c85a32SDmitry Chagin error = ENOEXEC; 72950c85a32SDmitry Chagin goto cleanup; 73050c85a32SDmitry Chagin } 73150c85a32SDmitry Chagin 73250c85a32SDmitry Chagin /* text + data can't exceed file size */ 73350c85a32SDmitry Chagin if (a_out->a_data + a_out->a_text > attr.va_size) { 73450c85a32SDmitry Chagin error = EFAULT; 73550c85a32SDmitry Chagin goto cleanup; 73650c85a32SDmitry Chagin } 73750c85a32SDmitry Chagin 73850c85a32SDmitry Chagin /* 73950c85a32SDmitry Chagin * text/data/bss must not exceed limits 74050c85a32SDmitry Chagin * XXX - this is not complete. it should check current usage PLUS 74150c85a32SDmitry Chagin * the resources needed by this library. 74250c85a32SDmitry Chagin */ 74350c85a32SDmitry Chagin PROC_LOCK(td->td_proc); 74450c85a32SDmitry Chagin if (a_out->a_text > maxtsiz || 74550c85a32SDmitry Chagin a_out->a_data + bss_size > lim_cur_proc(td->td_proc, RLIMIT_DATA) || 74650c85a32SDmitry Chagin racct_set(td->td_proc, RACCT_DATA, a_out->a_data + 74750c85a32SDmitry Chagin bss_size) != 0) { 74850c85a32SDmitry Chagin PROC_UNLOCK(td->td_proc); 74950c85a32SDmitry Chagin error = ENOMEM; 75050c85a32SDmitry Chagin goto cleanup; 75150c85a32SDmitry Chagin } 75250c85a32SDmitry Chagin PROC_UNLOCK(td->td_proc); 75350c85a32SDmitry Chagin 75450c85a32SDmitry Chagin /* 75550c85a32SDmitry Chagin * Prevent more writers. 75650c85a32SDmitry Chagin */ 75750c85a32SDmitry Chagin error = VOP_SET_TEXT(vp); 75850c85a32SDmitry Chagin if (error != 0) 75950c85a32SDmitry Chagin goto cleanup; 76050c85a32SDmitry Chagin textset = true; 76150c85a32SDmitry Chagin 76250c85a32SDmitry Chagin /* 76350c85a32SDmitry Chagin * Lock no longer needed 76450c85a32SDmitry Chagin */ 76550c85a32SDmitry Chagin locked = false; 76650c85a32SDmitry Chagin VOP_UNLOCK(vp); 76750c85a32SDmitry Chagin 76850c85a32SDmitry Chagin /* 76950c85a32SDmitry Chagin * Check if file_offset page aligned. Currently we cannot handle 77050c85a32SDmitry Chagin * misalinged file offsets, and so we read in the entire image 77150c85a32SDmitry Chagin * (what a waste). 77250c85a32SDmitry Chagin */ 77350c85a32SDmitry Chagin if (file_offset & PAGE_MASK) { 77450c85a32SDmitry Chagin /* Map text+data read/write/execute */ 77550c85a32SDmitry Chagin 77650c85a32SDmitry Chagin /* a_entry is the load address and is page aligned */ 77750c85a32SDmitry Chagin vmaddr = trunc_page(a_out->a_entry); 77850c85a32SDmitry Chagin 77950c85a32SDmitry Chagin /* get anon user mapping, read+write+execute */ 78050c85a32SDmitry Chagin error = vm_map_find(&td->td_proc->p_vmspace->vm_map, NULL, 0, 78150c85a32SDmitry Chagin &vmaddr, a_out->a_text + a_out->a_data, 0, VMFS_NO_SPACE, 78250c85a32SDmitry Chagin VM_PROT_ALL, VM_PROT_ALL, 0); 78350c85a32SDmitry Chagin if (error) 78450c85a32SDmitry Chagin goto cleanup; 78550c85a32SDmitry Chagin 78650c85a32SDmitry Chagin error = vn_rdwr(UIO_READ, vp, (void *)vmaddr, file_offset, 78750c85a32SDmitry Chagin a_out->a_text + a_out->a_data, UIO_USERSPACE, 0, 78850c85a32SDmitry Chagin td->td_ucred, NOCRED, &aresid, td); 78950c85a32SDmitry Chagin if (error != 0) 79050c85a32SDmitry Chagin goto cleanup; 79150c85a32SDmitry Chagin if (aresid != 0) { 79250c85a32SDmitry Chagin error = ENOEXEC; 79350c85a32SDmitry Chagin goto cleanup; 79450c85a32SDmitry Chagin } 79550c85a32SDmitry Chagin } else { 79650c85a32SDmitry Chagin /* 79750c85a32SDmitry Chagin * for QMAGIC, a_entry is 20 bytes beyond the load address 79850c85a32SDmitry Chagin * to skip the executable header 79950c85a32SDmitry Chagin */ 80050c85a32SDmitry Chagin vmaddr = trunc_page(a_out->a_entry); 80150c85a32SDmitry Chagin 80250c85a32SDmitry Chagin /* 80350c85a32SDmitry Chagin * Map it all into the process's space as a single 80450c85a32SDmitry Chagin * copy-on-write "data" segment. 80550c85a32SDmitry Chagin */ 80650c85a32SDmitry Chagin map = &td->td_proc->p_vmspace->vm_map; 80750c85a32SDmitry Chagin error = vm_mmap(map, &vmaddr, 80850c85a32SDmitry Chagin a_out->a_text + a_out->a_data, VM_PROT_ALL, VM_PROT_ALL, 80950c85a32SDmitry Chagin MAP_PRIVATE | MAP_FIXED, OBJT_VNODE, vp, file_offset); 81050c85a32SDmitry Chagin if (error) 81150c85a32SDmitry Chagin goto cleanup; 81250c85a32SDmitry Chagin vm_map_lock(map); 81350c85a32SDmitry Chagin if (!vm_map_lookup_entry(map, vmaddr, &entry)) { 81450c85a32SDmitry Chagin vm_map_unlock(map); 81550c85a32SDmitry Chagin error = EDOOFUS; 81650c85a32SDmitry Chagin goto cleanup; 81750c85a32SDmitry Chagin } 81850c85a32SDmitry Chagin entry->eflags |= MAP_ENTRY_VN_EXEC; 81950c85a32SDmitry Chagin vm_map_unlock(map); 82050c85a32SDmitry Chagin textset = false; 82150c85a32SDmitry Chagin } 82250c85a32SDmitry Chagin 82350c85a32SDmitry Chagin if (bss_size != 0) { 82450c85a32SDmitry Chagin /* Calculate BSS start address */ 82550c85a32SDmitry Chagin vmaddr = trunc_page(a_out->a_entry) + a_out->a_text + 82650c85a32SDmitry Chagin a_out->a_data; 82750c85a32SDmitry Chagin 82850c85a32SDmitry Chagin /* allocate some 'anon' space */ 82950c85a32SDmitry Chagin error = vm_map_find(&td->td_proc->p_vmspace->vm_map, NULL, 0, 83050c85a32SDmitry Chagin &vmaddr, bss_size, 0, VMFS_NO_SPACE, VM_PROT_ALL, 83150c85a32SDmitry Chagin VM_PROT_ALL, 0); 83250c85a32SDmitry Chagin if (error) 83350c85a32SDmitry Chagin goto cleanup; 83450c85a32SDmitry Chagin } 83550c85a32SDmitry Chagin 83650c85a32SDmitry Chagin cleanup: 83750c85a32SDmitry Chagin if (opened) { 83850c85a32SDmitry Chagin if (locked) 83950c85a32SDmitry Chagin VOP_UNLOCK(vp); 84050c85a32SDmitry Chagin locked = false; 84150c85a32SDmitry Chagin VOP_CLOSE(vp, FREAD, td->td_ucred, td); 84250c85a32SDmitry Chagin } 84350c85a32SDmitry Chagin if (textset) { 84450c85a32SDmitry Chagin if (!locked) { 84550c85a32SDmitry Chagin locked = true; 84650c85a32SDmitry Chagin VOP_LOCK(vp, LK_SHARED | LK_RETRY); 84750c85a32SDmitry Chagin } 84850c85a32SDmitry Chagin VOP_UNSET_TEXT_CHECKED(vp); 84950c85a32SDmitry Chagin } 85050c85a32SDmitry Chagin if (locked) 85150c85a32SDmitry Chagin VOP_UNLOCK(vp); 85250c85a32SDmitry Chagin 85350c85a32SDmitry Chagin /* Release the temporary mapping. */ 85450c85a32SDmitry Chagin if (a_out) 85550c85a32SDmitry Chagin kmap_free_wakeup(exec_map, (vm_offset_t)a_out, PAGE_SIZE); 85650c85a32SDmitry Chagin 85750c85a32SDmitry Chagin return (error); 85850c85a32SDmitry Chagin } 859