17c478bd9Sstevel@tonic-gate /* 2ae115bc7Smrj * CDDL HEADER START 3ae115bc7Smrj * 4ae115bc7Smrj * The contents of this file are subject to the terms of the 5ae115bc7Smrj * Common Development and Distribution License (the "License"). 6ae115bc7Smrj * You may not use this file except in compliance with the License. 7ae115bc7Smrj * 8ae115bc7Smrj * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9ae115bc7Smrj * or http://www.opensolaris.org/os/licensing. 10ae115bc7Smrj * See the License for the specific language governing permissions 11ae115bc7Smrj * and limitations under the License. 12ae115bc7Smrj * 13ae115bc7Smrj * When distributing Covered Code, include this CDDL HEADER in each 14ae115bc7Smrj * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15ae115bc7Smrj * If applicable, add the following below this CDDL HEADER, with the 16ae115bc7Smrj * fields enclosed by brackets "[]" replaced with your own identifying 17ae115bc7Smrj * information: Portions Copyright [yyyy] [name of copyright owner] 18ae115bc7Smrj * 19ae115bc7Smrj * CDDL HEADER END 20ae115bc7Smrj */ 21ae115bc7Smrj 22ae115bc7Smrj /* 23eb5a5c78SSurya Prakki * Copyright (c) 2004, 2010, Oracle and/or its affiliates. All rights reserved. 247c478bd9Sstevel@tonic-gate */ 257c478bd9Sstevel@tonic-gate 267c478bd9Sstevel@tonic-gate /* 27*f16a0f4cSRobert Mustacchi * Copyright 2011 Joyent, Inc. All rights reserved. 28*f16a0f4cSRobert Mustacchi */ 29*f16a0f4cSRobert Mustacchi 30*f16a0f4cSRobert Mustacchi /* 317c478bd9Sstevel@tonic-gate * Copyright (c) 1992 Terrence R. Lambert. 327c478bd9Sstevel@tonic-gate * Copyright (c) 1990 The Regents of the University of California. 337c478bd9Sstevel@tonic-gate * All rights reserved. 347c478bd9Sstevel@tonic-gate * 357c478bd9Sstevel@tonic-gate * This code is derived from software contributed to Berkeley by 367c478bd9Sstevel@tonic-gate * William Jolitz. 377c478bd9Sstevel@tonic-gate * 387c478bd9Sstevel@tonic-gate * Redistribution and use in source and binary forms, with or without 397c478bd9Sstevel@tonic-gate * modification, are permitted provided that the following conditions 407c478bd9Sstevel@tonic-gate * are met: 417c478bd9Sstevel@tonic-gate * 1. Redistributions of source code must retain the above copyright 427c478bd9Sstevel@tonic-gate * notice, this list of conditions and the following disclaimer. 437c478bd9Sstevel@tonic-gate * 2. Redistributions in binary form must reproduce the above copyright 447c478bd9Sstevel@tonic-gate * notice, this list of conditions and the following disclaimer in the 457c478bd9Sstevel@tonic-gate * documentation and/or other materials provided with the distribution. 467c478bd9Sstevel@tonic-gate * 3. All advertising materials mentioning features or use of this software 477c478bd9Sstevel@tonic-gate * must display the following acknowledgement: 487c478bd9Sstevel@tonic-gate * This product includes software developed by the University of 497c478bd9Sstevel@tonic-gate * California, Berkeley and its contributors. 507c478bd9Sstevel@tonic-gate * 4. Neither the name of the University nor the names of its contributors 517c478bd9Sstevel@tonic-gate * may be used to endorse or promote products derived from this software 527c478bd9Sstevel@tonic-gate * without specific prior written permission. 537c478bd9Sstevel@tonic-gate * 547c478bd9Sstevel@tonic-gate * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 557c478bd9Sstevel@tonic-gate * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 567c478bd9Sstevel@tonic-gate * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 577c478bd9Sstevel@tonic-gate * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 587c478bd9Sstevel@tonic-gate * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 597c478bd9Sstevel@tonic-gate * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 607c478bd9Sstevel@tonic-gate * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 617c478bd9Sstevel@tonic-gate * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 627c478bd9Sstevel@tonic-gate * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 637c478bd9Sstevel@tonic-gate * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 647c478bd9Sstevel@tonic-gate * SUCH DAMAGE. 657c478bd9Sstevel@tonic-gate * 667c478bd9Sstevel@tonic-gate * from: @(#)machdep.c 7.4 (Berkeley) 6/3/91 677c478bd9Sstevel@tonic-gate */ 687c478bd9Sstevel@tonic-gate 697c478bd9Sstevel@tonic-gate #include <sys/types.h> 70ae115bc7Smrj #include <sys/sysmacros.h> 717c478bd9Sstevel@tonic-gate #include <sys/tss.h> 727c478bd9Sstevel@tonic-gate #include <sys/segments.h> 737c478bd9Sstevel@tonic-gate #include <sys/trap.h> 747c478bd9Sstevel@tonic-gate #include <sys/cpuvar.h> 75ae115bc7Smrj #include <sys/bootconf.h> 767c478bd9Sstevel@tonic-gate #include <sys/x86_archext.h> 77ae115bc7Smrj #include <sys/controlregs.h> 787c478bd9Sstevel@tonic-gate #include <sys/archsystm.h> 797c478bd9Sstevel@tonic-gate #include <sys/machsystm.h> 807c478bd9Sstevel@tonic-gate #include <sys/kobj.h> 817c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h> 827c478bd9Sstevel@tonic-gate #include <sys/reboot.h> 837c478bd9Sstevel@tonic-gate #include <sys/kdi.h> 84ae115bc7Smrj #include <sys/mach_mmu.h> 850baeff3dSrab #include <sys/systm.h> 86843e1988Sjohnlev 87843e1988Sjohnlev #ifdef __xpv 88843e1988Sjohnlev #include <sys/hypervisor.h> 89843e1988Sjohnlev #include <vm/as.h> 90843e1988Sjohnlev #endif 91843e1988Sjohnlev 92ae115bc7Smrj #include <sys/promif.h> 93ae115bc7Smrj #include <sys/bootinfo.h> 94ae115bc7Smrj #include <vm/kboot_mmu.h> 95843e1988Sjohnlev #include <vm/hat_pte.h> 967c478bd9Sstevel@tonic-gate 977c478bd9Sstevel@tonic-gate /* 987c478bd9Sstevel@tonic-gate * cpu0 and default tables and structures. 997c478bd9Sstevel@tonic-gate */ 100ae115bc7Smrj user_desc_t *gdt0; 101843e1988Sjohnlev #if !defined(__xpv) 1027c478bd9Sstevel@tonic-gate desctbr_t gdt0_default_r; 103843e1988Sjohnlev #endif 1047c478bd9Sstevel@tonic-gate 1050cfdb603Sjosephb gate_desc_t *idt0; /* interrupt descriptor table */ 106ae115bc7Smrj #if defined(__i386) 1077c478bd9Sstevel@tonic-gate desctbr_t idt0_default_r; /* describes idt0 in IDTR format */ 108ae115bc7Smrj #endif 1097c478bd9Sstevel@tonic-gate 110*f16a0f4cSRobert Mustacchi tss_t *ktss0; /* kernel task state structure */ 1117c478bd9Sstevel@tonic-gate 1127c478bd9Sstevel@tonic-gate #if defined(__i386) 113*f16a0f4cSRobert Mustacchi tss_t *dftss0; /* #DF double-fault exception */ 1147c478bd9Sstevel@tonic-gate #endif /* __i386 */ 1157c478bd9Sstevel@tonic-gate 1167c478bd9Sstevel@tonic-gate user_desc_t zero_udesc; /* base zero user desc native procs */ 117843e1988Sjohnlev user_desc_t null_udesc; /* null user descriptor */ 118843e1988Sjohnlev system_desc_t null_sdesc; /* null system descriptor */ 1197c478bd9Sstevel@tonic-gate 1207c478bd9Sstevel@tonic-gate #if defined(__amd64) 1217c478bd9Sstevel@tonic-gate user_desc_t zero_u32desc; /* 32-bit compatibility procs */ 1227c478bd9Sstevel@tonic-gate #endif /* __amd64 */ 1237c478bd9Sstevel@tonic-gate 124843e1988Sjohnlev #if defined(__amd64) 125843e1988Sjohnlev user_desc_t ucs_on; 126843e1988Sjohnlev user_desc_t ucs_off; 127843e1988Sjohnlev user_desc_t ucs32_on; 128843e1988Sjohnlev user_desc_t ucs32_off; 129843e1988Sjohnlev #endif /* __amd64 */ 130843e1988Sjohnlev 1317c478bd9Sstevel@tonic-gate #pragma align 16(dblfault_stack0) 1327c478bd9Sstevel@tonic-gate char dblfault_stack0[DEFAULTSTKSZ]; 1337c478bd9Sstevel@tonic-gate 1347c478bd9Sstevel@tonic-gate extern void fast_null(void); 1357c478bd9Sstevel@tonic-gate extern hrtime_t get_hrtime(void); 1367c478bd9Sstevel@tonic-gate extern hrtime_t gethrvtime(void); 1377c478bd9Sstevel@tonic-gate extern hrtime_t get_hrestime(void); 1387c478bd9Sstevel@tonic-gate extern uint64_t getlgrp(void); 1397c478bd9Sstevel@tonic-gate 1407c478bd9Sstevel@tonic-gate void (*(fasttable[]))(void) = { 1417c478bd9Sstevel@tonic-gate fast_null, /* T_FNULL routine */ 1427c478bd9Sstevel@tonic-gate fast_null, /* T_FGETFP routine (initially null) */ 1437c478bd9Sstevel@tonic-gate fast_null, /* T_FSETFP routine (initially null) */ 1447c478bd9Sstevel@tonic-gate (void (*)())get_hrtime, /* T_GETHRTIME */ 1457c478bd9Sstevel@tonic-gate (void (*)())gethrvtime, /* T_GETHRVTIME */ 1467c478bd9Sstevel@tonic-gate (void (*)())get_hrestime, /* T_GETHRESTIME */ 1477c478bd9Sstevel@tonic-gate (void (*)())getlgrp /* T_GETLGRP */ 1487c478bd9Sstevel@tonic-gate }; 1497c478bd9Sstevel@tonic-gate 1507c478bd9Sstevel@tonic-gate /* 1519acbbeafSnn35248 * Structure containing pre-computed descriptors to allow us to temporarily 1529acbbeafSnn35248 * interpose on a standard handler. 1539acbbeafSnn35248 */ 1549acbbeafSnn35248 struct interposing_handler { 1559acbbeafSnn35248 int ih_inum; 1569acbbeafSnn35248 gate_desc_t ih_interp_desc; 1579acbbeafSnn35248 gate_desc_t ih_default_desc; 1589acbbeafSnn35248 }; 1599acbbeafSnn35248 1609acbbeafSnn35248 /* 1619acbbeafSnn35248 * The brand infrastructure interposes on two handlers, and we use one as a 1629acbbeafSnn35248 * NULL signpost. 1639acbbeafSnn35248 */ 164eb5a5c78SSurya Prakki static struct interposing_handler brand_tbl[2]; 1659acbbeafSnn35248 1669acbbeafSnn35248 /* 1677c478bd9Sstevel@tonic-gate * software prototypes for default local descriptor table 1687c478bd9Sstevel@tonic-gate */ 1697c478bd9Sstevel@tonic-gate 1707c478bd9Sstevel@tonic-gate /* 1717c478bd9Sstevel@tonic-gate * Routines for loading segment descriptors in format the hardware 1727c478bd9Sstevel@tonic-gate * can understand. 1737c478bd9Sstevel@tonic-gate */ 1747c478bd9Sstevel@tonic-gate 1757c478bd9Sstevel@tonic-gate #if defined(__amd64) 1767c478bd9Sstevel@tonic-gate 1777c478bd9Sstevel@tonic-gate /* 1787c478bd9Sstevel@tonic-gate * In long mode we have the new L or long mode attribute bit 1797c478bd9Sstevel@tonic-gate * for code segments. Only the conforming bit in type is used along 1807c478bd9Sstevel@tonic-gate * with descriptor priority and present bits. Default operand size must 1817c478bd9Sstevel@tonic-gate * be zero when in long mode. In 32-bit compatibility mode all fields 1827c478bd9Sstevel@tonic-gate * are treated as in legacy mode. For data segments while in long mode 1837c478bd9Sstevel@tonic-gate * only the present bit is loaded. 1847c478bd9Sstevel@tonic-gate */ 1857c478bd9Sstevel@tonic-gate void 1867c478bd9Sstevel@tonic-gate set_usegd(user_desc_t *dp, uint_t lmode, void *base, size_t size, 1877c478bd9Sstevel@tonic-gate uint_t type, uint_t dpl, uint_t gran, uint_t defopsz) 1887c478bd9Sstevel@tonic-gate { 1897c478bd9Sstevel@tonic-gate ASSERT(lmode == SDP_SHORT || lmode == SDP_LONG); 1907c478bd9Sstevel@tonic-gate 1917c478bd9Sstevel@tonic-gate /* 1927c478bd9Sstevel@tonic-gate * 64-bit long mode. 1937c478bd9Sstevel@tonic-gate */ 1947c478bd9Sstevel@tonic-gate if (lmode == SDP_LONG) 1957c478bd9Sstevel@tonic-gate dp->usd_def32 = 0; /* 32-bit operands only */ 1967c478bd9Sstevel@tonic-gate else 1977c478bd9Sstevel@tonic-gate /* 1987c478bd9Sstevel@tonic-gate * 32-bit compatibility mode. 1997c478bd9Sstevel@tonic-gate */ 2007c478bd9Sstevel@tonic-gate dp->usd_def32 = defopsz; /* 0 = 16, 1 = 32-bit ops */ 2017c478bd9Sstevel@tonic-gate 2027c478bd9Sstevel@tonic-gate dp->usd_long = lmode; /* 64-bit mode */ 2037c478bd9Sstevel@tonic-gate dp->usd_type = type; 2047c478bd9Sstevel@tonic-gate dp->usd_dpl = dpl; 2057c478bd9Sstevel@tonic-gate dp->usd_p = 1; 2067c478bd9Sstevel@tonic-gate dp->usd_gran = gran; /* 0 = bytes, 1 = pages */ 2077c478bd9Sstevel@tonic-gate 2087c478bd9Sstevel@tonic-gate dp->usd_lobase = (uintptr_t)base; 2097c478bd9Sstevel@tonic-gate dp->usd_midbase = (uintptr_t)base >> 16; 2107c478bd9Sstevel@tonic-gate dp->usd_hibase = (uintptr_t)base >> (16 + 8); 2117c478bd9Sstevel@tonic-gate dp->usd_lolimit = size; 2127c478bd9Sstevel@tonic-gate dp->usd_hilimit = (uintptr_t)size >> 16; 2137c478bd9Sstevel@tonic-gate } 2147c478bd9Sstevel@tonic-gate 2157c478bd9Sstevel@tonic-gate #elif defined(__i386) 2167c478bd9Sstevel@tonic-gate 2177c478bd9Sstevel@tonic-gate /* 2187c478bd9Sstevel@tonic-gate * Install user segment descriptor for code and data. 2197c478bd9Sstevel@tonic-gate */ 2207c478bd9Sstevel@tonic-gate void 2217c478bd9Sstevel@tonic-gate set_usegd(user_desc_t *dp, void *base, size_t size, uint_t type, 2227c478bd9Sstevel@tonic-gate uint_t dpl, uint_t gran, uint_t defopsz) 2237c478bd9Sstevel@tonic-gate { 2247c478bd9Sstevel@tonic-gate dp->usd_lolimit = size; 2257c478bd9Sstevel@tonic-gate dp->usd_hilimit = (uintptr_t)size >> 16; 2267c478bd9Sstevel@tonic-gate 2277c478bd9Sstevel@tonic-gate dp->usd_lobase = (uintptr_t)base; 2287c478bd9Sstevel@tonic-gate dp->usd_midbase = (uintptr_t)base >> 16; 2297c478bd9Sstevel@tonic-gate dp->usd_hibase = (uintptr_t)base >> (16 + 8); 2307c478bd9Sstevel@tonic-gate 2317c478bd9Sstevel@tonic-gate dp->usd_type = type; 2327c478bd9Sstevel@tonic-gate dp->usd_dpl = dpl; 2337c478bd9Sstevel@tonic-gate dp->usd_p = 1; 2347c478bd9Sstevel@tonic-gate dp->usd_def32 = defopsz; /* 0 = 16, 1 = 32 bit operands */ 2357c478bd9Sstevel@tonic-gate dp->usd_gran = gran; /* 0 = bytes, 1 = pages */ 2367c478bd9Sstevel@tonic-gate } 2377c478bd9Sstevel@tonic-gate 2387c478bd9Sstevel@tonic-gate #endif /* __i386 */ 2397c478bd9Sstevel@tonic-gate 2407c478bd9Sstevel@tonic-gate /* 2417c478bd9Sstevel@tonic-gate * Install system segment descriptor for LDT and TSS segments. 2427c478bd9Sstevel@tonic-gate */ 2437c478bd9Sstevel@tonic-gate 2447c478bd9Sstevel@tonic-gate #if defined(__amd64) 2457c478bd9Sstevel@tonic-gate 2467c478bd9Sstevel@tonic-gate void 2477c478bd9Sstevel@tonic-gate set_syssegd(system_desc_t *dp, void *base, size_t size, uint_t type, 2487c478bd9Sstevel@tonic-gate uint_t dpl) 2497c478bd9Sstevel@tonic-gate { 2507c478bd9Sstevel@tonic-gate dp->ssd_lolimit = size; 2517c478bd9Sstevel@tonic-gate dp->ssd_hilimit = (uintptr_t)size >> 16; 2527c478bd9Sstevel@tonic-gate 2537c478bd9Sstevel@tonic-gate dp->ssd_lobase = (uintptr_t)base; 2547c478bd9Sstevel@tonic-gate dp->ssd_midbase = (uintptr_t)base >> 16; 2557c478bd9Sstevel@tonic-gate dp->ssd_hibase = (uintptr_t)base >> (16 + 8); 2567c478bd9Sstevel@tonic-gate dp->ssd_hi64base = (uintptr_t)base >> (16 + 8 + 8); 2577c478bd9Sstevel@tonic-gate 2587c478bd9Sstevel@tonic-gate dp->ssd_type = type; 2597c478bd9Sstevel@tonic-gate dp->ssd_zero1 = 0; /* must be zero */ 2607c478bd9Sstevel@tonic-gate dp->ssd_zero2 = 0; 2617c478bd9Sstevel@tonic-gate dp->ssd_dpl = dpl; 2627c478bd9Sstevel@tonic-gate dp->ssd_p = 1; 2637c478bd9Sstevel@tonic-gate dp->ssd_gran = 0; /* force byte units */ 2647c478bd9Sstevel@tonic-gate } 2657c478bd9Sstevel@tonic-gate 266843e1988Sjohnlev void * 267843e1988Sjohnlev get_ssd_base(system_desc_t *dp) 268843e1988Sjohnlev { 269843e1988Sjohnlev uintptr_t base; 270843e1988Sjohnlev 271843e1988Sjohnlev base = (uintptr_t)dp->ssd_lobase | 272843e1988Sjohnlev (uintptr_t)dp->ssd_midbase << 16 | 273843e1988Sjohnlev (uintptr_t)dp->ssd_hibase << (16 + 8) | 274843e1988Sjohnlev (uintptr_t)dp->ssd_hi64base << (16 + 8 + 8); 275843e1988Sjohnlev return ((void *)base); 276843e1988Sjohnlev } 277843e1988Sjohnlev 2787c478bd9Sstevel@tonic-gate #elif defined(__i386) 2797c478bd9Sstevel@tonic-gate 2807c478bd9Sstevel@tonic-gate void 2817c478bd9Sstevel@tonic-gate set_syssegd(system_desc_t *dp, void *base, size_t size, uint_t type, 2827c478bd9Sstevel@tonic-gate uint_t dpl) 2837c478bd9Sstevel@tonic-gate { 2847c478bd9Sstevel@tonic-gate dp->ssd_lolimit = size; 2857c478bd9Sstevel@tonic-gate dp->ssd_hilimit = (uintptr_t)size >> 16; 2867c478bd9Sstevel@tonic-gate 2877c478bd9Sstevel@tonic-gate dp->ssd_lobase = (uintptr_t)base; 2887c478bd9Sstevel@tonic-gate dp->ssd_midbase = (uintptr_t)base >> 16; 2897c478bd9Sstevel@tonic-gate dp->ssd_hibase = (uintptr_t)base >> (16 + 8); 2907c478bd9Sstevel@tonic-gate 2917c478bd9Sstevel@tonic-gate dp->ssd_type = type; 2927c478bd9Sstevel@tonic-gate dp->ssd_zero = 0; /* must be zero */ 2937c478bd9Sstevel@tonic-gate dp->ssd_dpl = dpl; 2947c478bd9Sstevel@tonic-gate dp->ssd_p = 1; 2957c478bd9Sstevel@tonic-gate dp->ssd_gran = 0; /* force byte units */ 2967c478bd9Sstevel@tonic-gate } 2977c478bd9Sstevel@tonic-gate 298843e1988Sjohnlev void * 299843e1988Sjohnlev get_ssd_base(system_desc_t *dp) 300843e1988Sjohnlev { 301843e1988Sjohnlev uintptr_t base; 302843e1988Sjohnlev 303843e1988Sjohnlev base = (uintptr_t)dp->ssd_lobase | 304843e1988Sjohnlev (uintptr_t)dp->ssd_midbase << 16 | 305843e1988Sjohnlev (uintptr_t)dp->ssd_hibase << (16 + 8); 306843e1988Sjohnlev return ((void *)base); 307843e1988Sjohnlev } 308843e1988Sjohnlev 3097c478bd9Sstevel@tonic-gate #endif /* __i386 */ 3107c478bd9Sstevel@tonic-gate 3117c478bd9Sstevel@tonic-gate /* 3127c478bd9Sstevel@tonic-gate * Install gate segment descriptor for interrupt, trap, call and task gates. 3137c478bd9Sstevel@tonic-gate */ 3147c478bd9Sstevel@tonic-gate 3157c478bd9Sstevel@tonic-gate #if defined(__amd64) 3167c478bd9Sstevel@tonic-gate 3179844da31SSeth Goldberg /*ARGSUSED*/ 3187c478bd9Sstevel@tonic-gate void 319ae115bc7Smrj set_gatesegd(gate_desc_t *dp, void (*func)(void), selector_t sel, 3209844da31SSeth Goldberg uint_t type, uint_t dpl, uint_t vector) 3217c478bd9Sstevel@tonic-gate { 3227c478bd9Sstevel@tonic-gate dp->sgd_looffset = (uintptr_t)func; 3237c478bd9Sstevel@tonic-gate dp->sgd_hioffset = (uintptr_t)func >> 16; 3247c478bd9Sstevel@tonic-gate dp->sgd_hi64offset = (uintptr_t)func >> (16 + 16); 3257c478bd9Sstevel@tonic-gate 3267c478bd9Sstevel@tonic-gate dp->sgd_selector = (uint16_t)sel; 327ae115bc7Smrj 328ae115bc7Smrj /* 329ae115bc7Smrj * For 64 bit native we use the IST stack mechanism 330ae115bc7Smrj * for double faults. All other traps use the CPL = 0 331ae115bc7Smrj * (tss_rsp0) stack. 332ae115bc7Smrj */ 333843e1988Sjohnlev #if !defined(__xpv) 3349844da31SSeth Goldberg if (vector == T_DBLFLT) 335ae115bc7Smrj dp->sgd_ist = 1; 336ae115bc7Smrj else 337843e1988Sjohnlev #endif 338ae115bc7Smrj dp->sgd_ist = 0; 339ae115bc7Smrj 3407c478bd9Sstevel@tonic-gate dp->sgd_type = type; 3417c478bd9Sstevel@tonic-gate dp->sgd_dpl = dpl; 3427c478bd9Sstevel@tonic-gate dp->sgd_p = 1; 3437c478bd9Sstevel@tonic-gate } 3447c478bd9Sstevel@tonic-gate 3457c478bd9Sstevel@tonic-gate #elif defined(__i386) 3467c478bd9Sstevel@tonic-gate 3479844da31SSeth Goldberg /*ARGSUSED*/ 3487c478bd9Sstevel@tonic-gate void 3497c478bd9Sstevel@tonic-gate set_gatesegd(gate_desc_t *dp, void (*func)(void), selector_t sel, 3509844da31SSeth Goldberg uint_t type, uint_t dpl, uint_t unused) 3517c478bd9Sstevel@tonic-gate { 3527c478bd9Sstevel@tonic-gate dp->sgd_looffset = (uintptr_t)func; 3537c478bd9Sstevel@tonic-gate dp->sgd_hioffset = (uintptr_t)func >> 16; 3547c478bd9Sstevel@tonic-gate 3557c478bd9Sstevel@tonic-gate dp->sgd_selector = (uint16_t)sel; 356ae115bc7Smrj dp->sgd_stkcpy = 0; /* always zero bytes */ 3577c478bd9Sstevel@tonic-gate dp->sgd_type = type; 3587c478bd9Sstevel@tonic-gate dp->sgd_dpl = dpl; 3597c478bd9Sstevel@tonic-gate dp->sgd_p = 1; 3607c478bd9Sstevel@tonic-gate } 3617c478bd9Sstevel@tonic-gate 3627c478bd9Sstevel@tonic-gate #endif /* __i386 */ 3637c478bd9Sstevel@tonic-gate 364843e1988Sjohnlev /* 365843e1988Sjohnlev * Updates a single user descriptor in the the GDT of the current cpu. 366843e1988Sjohnlev * Caller is responsible for preventing cpu migration. 367843e1988Sjohnlev */ 368843e1988Sjohnlev 369843e1988Sjohnlev void 370843e1988Sjohnlev gdt_update_usegd(uint_t sidx, user_desc_t *udp) 371843e1988Sjohnlev { 372843e1988Sjohnlev #if defined(__xpv) 373843e1988Sjohnlev 374843e1988Sjohnlev uint64_t dpa = CPU->cpu_m.mcpu_gdtpa + sizeof (*udp) * sidx; 375843e1988Sjohnlev 376843e1988Sjohnlev if (HYPERVISOR_update_descriptor(pa_to_ma(dpa), *(uint64_t *)udp)) 377843e1988Sjohnlev panic("gdt_update_usegd: HYPERVISOR_update_descriptor"); 378843e1988Sjohnlev 379843e1988Sjohnlev #else /* __xpv */ 380843e1988Sjohnlev 381843e1988Sjohnlev CPU->cpu_gdt[sidx] = *udp; 382843e1988Sjohnlev 383843e1988Sjohnlev #endif /* __xpv */ 384843e1988Sjohnlev } 385843e1988Sjohnlev 386843e1988Sjohnlev /* 387843e1988Sjohnlev * Writes single descriptor pointed to by udp into a processes 388843e1988Sjohnlev * LDT entry pointed to by ldp. 389843e1988Sjohnlev */ 390843e1988Sjohnlev int 391843e1988Sjohnlev ldt_update_segd(user_desc_t *ldp, user_desc_t *udp) 392843e1988Sjohnlev { 393843e1988Sjohnlev #if defined(__xpv) 394843e1988Sjohnlev 395843e1988Sjohnlev uint64_t dpa; 396843e1988Sjohnlev 397843e1988Sjohnlev dpa = mmu_ptob(hat_getpfnum(kas.a_hat, (caddr_t)ldp)) | 398843e1988Sjohnlev ((uintptr_t)ldp & PAGEOFFSET); 399843e1988Sjohnlev 400843e1988Sjohnlev /* 401843e1988Sjohnlev * The hypervisor is a little more restrictive about what it 402843e1988Sjohnlev * supports in the LDT. 403843e1988Sjohnlev */ 404843e1988Sjohnlev if (HYPERVISOR_update_descriptor(pa_to_ma(dpa), *(uint64_t *)udp) != 0) 405843e1988Sjohnlev return (EINVAL); 406843e1988Sjohnlev 407843e1988Sjohnlev #else /* __xpv */ 408843e1988Sjohnlev 409843e1988Sjohnlev *ldp = *udp; 410843e1988Sjohnlev 411843e1988Sjohnlev #endif /* __xpv */ 412843e1988Sjohnlev return (0); 413843e1988Sjohnlev } 414843e1988Sjohnlev 415843e1988Sjohnlev #if defined(__xpv) 416843e1988Sjohnlev 417843e1988Sjohnlev /* 418843e1988Sjohnlev * Converts hw format gate descriptor into pseudo-IDT format for the hypervisor. 419843e1988Sjohnlev * Returns true if a valid entry was written. 420843e1988Sjohnlev */ 421843e1988Sjohnlev int 422843e1988Sjohnlev xen_idt_to_trap_info(uint_t vec, gate_desc_t *sgd, void *ti_arg) 423843e1988Sjohnlev { 424843e1988Sjohnlev trap_info_t *ti = ti_arg; /* XXPV Aargh - segments.h comment */ 425843e1988Sjohnlev 426843e1988Sjohnlev /* 427843e1988Sjohnlev * skip holes in the IDT 428843e1988Sjohnlev */ 429843e1988Sjohnlev if (GATESEG_GETOFFSET(sgd) == 0) 430843e1988Sjohnlev return (0); 431843e1988Sjohnlev 432843e1988Sjohnlev ASSERT(sgd->sgd_type == SDT_SYSIGT); 433843e1988Sjohnlev ti->vector = vec; 434843e1988Sjohnlev TI_SET_DPL(ti, sgd->sgd_dpl); 435843e1988Sjohnlev 436843e1988Sjohnlev /* 437843e1988Sjohnlev * Is this an interrupt gate? 438843e1988Sjohnlev */ 439843e1988Sjohnlev if (sgd->sgd_type == SDT_SYSIGT) { 440843e1988Sjohnlev /* LINTED */ 441843e1988Sjohnlev TI_SET_IF(ti, 1); 442843e1988Sjohnlev } 443843e1988Sjohnlev ti->cs = sgd->sgd_selector; 444843e1988Sjohnlev #if defined(__amd64) 445843e1988Sjohnlev ti->cs |= SEL_KPL; /* force into ring 3. see KCS_SEL */ 446843e1988Sjohnlev #endif 447843e1988Sjohnlev ti->address = GATESEG_GETOFFSET(sgd); 448843e1988Sjohnlev return (1); 449843e1988Sjohnlev } 450843e1988Sjohnlev 451843e1988Sjohnlev /* 452843e1988Sjohnlev * Convert a single hw format gate descriptor and write it into our virtual IDT. 453843e1988Sjohnlev */ 454843e1988Sjohnlev void 455843e1988Sjohnlev xen_idt_write(gate_desc_t *sgd, uint_t vec) 456843e1988Sjohnlev { 457843e1988Sjohnlev trap_info_t trapinfo[2]; 458843e1988Sjohnlev 459843e1988Sjohnlev bzero(trapinfo, sizeof (trapinfo)); 460843e1988Sjohnlev if (xen_idt_to_trap_info(vec, sgd, &trapinfo[0]) == 0) 461843e1988Sjohnlev return; 462843e1988Sjohnlev if (xen_set_trap_table(trapinfo) != 0) 463843e1988Sjohnlev panic("xen_idt_write: xen_set_trap_table() failed"); 464843e1988Sjohnlev } 465843e1988Sjohnlev 466843e1988Sjohnlev #endif /* __xpv */ 467843e1988Sjohnlev 468ae115bc7Smrj #if defined(__amd64) 469ae115bc7Smrj 4707c478bd9Sstevel@tonic-gate /* 4717c478bd9Sstevel@tonic-gate * Build kernel GDT. 4727c478bd9Sstevel@tonic-gate */ 4737c478bd9Sstevel@tonic-gate 4747c478bd9Sstevel@tonic-gate static void 475ae115bc7Smrj init_gdt_common(user_desc_t *gdt) 4767c478bd9Sstevel@tonic-gate { 4779acbbeafSnn35248 int i; 4787c478bd9Sstevel@tonic-gate 4797c478bd9Sstevel@tonic-gate /* 4807c478bd9Sstevel@tonic-gate * 64-bit kernel code segment. 4817c478bd9Sstevel@tonic-gate */ 482ae115bc7Smrj set_usegd(&gdt[GDT_KCODE], SDP_LONG, NULL, 0, SDT_MEMERA, SEL_KPL, 4837c478bd9Sstevel@tonic-gate SDP_PAGES, SDP_OP32); 4847c478bd9Sstevel@tonic-gate 4857c478bd9Sstevel@tonic-gate /* 4867c478bd9Sstevel@tonic-gate * 64-bit kernel data segment. The limit attribute is ignored in 64-bit 4877c478bd9Sstevel@tonic-gate * mode, but we set it here to 0xFFFF so that we can use the SYSRET 4887c478bd9Sstevel@tonic-gate * instruction to return from system calls back to 32-bit applications. 4897c478bd9Sstevel@tonic-gate * SYSRET doesn't update the base, limit, or attributes of %ss or %ds 4907c478bd9Sstevel@tonic-gate * descriptors. We therefore must ensure that the kernel uses something, 4917c478bd9Sstevel@tonic-gate * though it will be ignored by hardware, that is compatible with 32-bit 4927c478bd9Sstevel@tonic-gate * apps. For the same reason we must set the default op size of this 4937c478bd9Sstevel@tonic-gate * descriptor to 32-bit operands. 4947c478bd9Sstevel@tonic-gate */ 495ae115bc7Smrj set_usegd(&gdt[GDT_KDATA], SDP_LONG, NULL, -1, SDT_MEMRWA, 4967c478bd9Sstevel@tonic-gate SEL_KPL, SDP_PAGES, SDP_OP32); 497ae115bc7Smrj gdt[GDT_KDATA].usd_def32 = 1; 4987c478bd9Sstevel@tonic-gate 4997c478bd9Sstevel@tonic-gate /* 5007c478bd9Sstevel@tonic-gate * 64-bit user code segment. 5017c478bd9Sstevel@tonic-gate */ 502ae115bc7Smrj set_usegd(&gdt[GDT_UCODE], SDP_LONG, NULL, 0, SDT_MEMERA, SEL_UPL, 5037c478bd9Sstevel@tonic-gate SDP_PAGES, SDP_OP32); 5047c478bd9Sstevel@tonic-gate 5057c478bd9Sstevel@tonic-gate /* 5067c478bd9Sstevel@tonic-gate * 32-bit user code segment. 5077c478bd9Sstevel@tonic-gate */ 508ae115bc7Smrj set_usegd(&gdt[GDT_U32CODE], SDP_SHORT, NULL, -1, SDT_MEMERA, 5097c478bd9Sstevel@tonic-gate SEL_UPL, SDP_PAGES, SDP_OP32); 5107c478bd9Sstevel@tonic-gate 5117c478bd9Sstevel@tonic-gate /* 512843e1988Sjohnlev * See gdt_ucode32() and gdt_ucode_native(). 513843e1988Sjohnlev */ 514843e1988Sjohnlev ucs_on = ucs_off = gdt[GDT_UCODE]; 515843e1988Sjohnlev ucs_off.usd_p = 0; /* forces #np fault */ 516843e1988Sjohnlev 517843e1988Sjohnlev ucs32_on = ucs32_off = gdt[GDT_U32CODE]; 518843e1988Sjohnlev ucs32_off.usd_p = 0; /* forces #np fault */ 519843e1988Sjohnlev 520843e1988Sjohnlev /* 5217c478bd9Sstevel@tonic-gate * 32 and 64 bit data segments can actually share the same descriptor. 5227c478bd9Sstevel@tonic-gate * In long mode only the present bit is checked but all other fields 5237c478bd9Sstevel@tonic-gate * are loaded. But in compatibility mode all fields are interpreted 5247c478bd9Sstevel@tonic-gate * as in legacy mode so they must be set correctly for a 32-bit data 5257c478bd9Sstevel@tonic-gate * segment. 5267c478bd9Sstevel@tonic-gate */ 527ae115bc7Smrj set_usegd(&gdt[GDT_UDATA], SDP_SHORT, NULL, -1, SDT_MEMRWA, SEL_UPL, 5287c478bd9Sstevel@tonic-gate SDP_PAGES, SDP_OP32); 5297c478bd9Sstevel@tonic-gate 530843e1988Sjohnlev #if !defined(__xpv) 531843e1988Sjohnlev 5327c478bd9Sstevel@tonic-gate /* 5330baeff3dSrab * The 64-bit kernel has no default LDT. By default, the LDT descriptor 5340baeff3dSrab * in the GDT is 0. 5357c478bd9Sstevel@tonic-gate */ 5367c478bd9Sstevel@tonic-gate 5377c478bd9Sstevel@tonic-gate /* 5387c478bd9Sstevel@tonic-gate * Kernel TSS 5397c478bd9Sstevel@tonic-gate */ 5400cfdb603Sjosephb set_syssegd((system_desc_t *)&gdt[GDT_KTSS], ktss0, 5410cfdb603Sjosephb sizeof (*ktss0) - 1, SDT_SYSTSS, SEL_KPL); 5427c478bd9Sstevel@tonic-gate 543843e1988Sjohnlev #endif /* !__xpv */ 544843e1988Sjohnlev 5457c478bd9Sstevel@tonic-gate /* 5467c478bd9Sstevel@tonic-gate * Initialize fs and gs descriptors for 32 bit processes. 5477c478bd9Sstevel@tonic-gate * Only attributes and limits are initialized, the effective 5487c478bd9Sstevel@tonic-gate * base address is programmed via fsbase/gsbase. 5497c478bd9Sstevel@tonic-gate */ 550ae115bc7Smrj set_usegd(&gdt[GDT_LWPFS], SDP_SHORT, NULL, -1, SDT_MEMRWA, 5517c478bd9Sstevel@tonic-gate SEL_UPL, SDP_PAGES, SDP_OP32); 552ae115bc7Smrj set_usegd(&gdt[GDT_LWPGS], SDP_SHORT, NULL, -1, SDT_MEMRWA, 5537c478bd9Sstevel@tonic-gate SEL_UPL, SDP_PAGES, SDP_OP32); 5547c478bd9Sstevel@tonic-gate 5557c478bd9Sstevel@tonic-gate /* 5569acbbeafSnn35248 * Initialize the descriptors set aside for brand usage. 5579acbbeafSnn35248 * Only attributes and limits are initialized. 5589acbbeafSnn35248 */ 5599acbbeafSnn35248 for (i = GDT_BRANDMIN; i <= GDT_BRANDMAX; i++) 560ae115bc7Smrj set_usegd(&gdt0[i], SDP_SHORT, NULL, -1, SDT_MEMRWA, 5619acbbeafSnn35248 SEL_UPL, SDP_PAGES, SDP_OP32); 5629acbbeafSnn35248 5639acbbeafSnn35248 /* 5647c478bd9Sstevel@tonic-gate * Initialize convenient zero base user descriptors for clearing 5657c478bd9Sstevel@tonic-gate * lwp private %fs and %gs descriptors in GDT. See setregs() for 5667c478bd9Sstevel@tonic-gate * an example. 5677c478bd9Sstevel@tonic-gate */ 5687c478bd9Sstevel@tonic-gate set_usegd(&zero_udesc, SDP_LONG, 0, 0, SDT_MEMRWA, SEL_UPL, 5697c478bd9Sstevel@tonic-gate SDP_BYTES, SDP_OP32); 5707c478bd9Sstevel@tonic-gate set_usegd(&zero_u32desc, SDP_SHORT, 0, -1, SDT_MEMRWA, SEL_UPL, 5717c478bd9Sstevel@tonic-gate SDP_PAGES, SDP_OP32); 5727c478bd9Sstevel@tonic-gate } 5737c478bd9Sstevel@tonic-gate 574843e1988Sjohnlev #if defined(__xpv) 575843e1988Sjohnlev 576843e1988Sjohnlev static user_desc_t * 577843e1988Sjohnlev init_gdt(void) 578843e1988Sjohnlev { 579843e1988Sjohnlev uint64_t gdtpa; 580843e1988Sjohnlev ulong_t ma[1]; /* XXPV should be a memory_t */ 581843e1988Sjohnlev ulong_t addr; 582843e1988Sjohnlev 583843e1988Sjohnlev #if !defined(__lint) 584843e1988Sjohnlev /* 585843e1988Sjohnlev * Our gdt is never larger than a single page. 586843e1988Sjohnlev */ 587843e1988Sjohnlev ASSERT((sizeof (*gdt0) * NGDT) <= PAGESIZE); 588843e1988Sjohnlev #endif 589843e1988Sjohnlev gdt0 = (user_desc_t *)BOP_ALLOC(bootops, (caddr_t)GDT_VA, 590843e1988Sjohnlev PAGESIZE, PAGESIZE); 591843e1988Sjohnlev bzero(gdt0, PAGESIZE); 592843e1988Sjohnlev 593843e1988Sjohnlev init_gdt_common(gdt0); 594843e1988Sjohnlev 595843e1988Sjohnlev /* 596843e1988Sjohnlev * XXX Since we never invoke kmdb until after the kernel takes 597843e1988Sjohnlev * over the descriptor tables why not have it use the kernel's 598843e1988Sjohnlev * selectors? 599843e1988Sjohnlev */ 600843e1988Sjohnlev if (boothowto & RB_DEBUG) { 601843e1988Sjohnlev set_usegd(&gdt0[GDT_B32DATA], SDP_LONG, NULL, -1, SDT_MEMRWA, 602843e1988Sjohnlev SEL_KPL, SDP_PAGES, SDP_OP32); 603843e1988Sjohnlev set_usegd(&gdt0[GDT_B64CODE], SDP_LONG, NULL, -1, SDT_MEMERA, 604843e1988Sjohnlev SEL_KPL, SDP_PAGES, SDP_OP32); 605843e1988Sjohnlev } 606843e1988Sjohnlev 607843e1988Sjohnlev /* 608843e1988Sjohnlev * Clear write permission for page containing the gdt and install it. 609843e1988Sjohnlev */ 610843e1988Sjohnlev gdtpa = pfn_to_pa(va_to_pfn(gdt0)); 611843e1988Sjohnlev ma[0] = (ulong_t)(pa_to_ma(gdtpa) >> PAGESHIFT); 612843e1988Sjohnlev kbm_read_only((uintptr_t)gdt0, gdtpa); 613843e1988Sjohnlev xen_set_gdt(ma, NGDT); 614843e1988Sjohnlev 615843e1988Sjohnlev /* 616843e1988Sjohnlev * Reload the segment registers to use the new GDT. 617843e1988Sjohnlev * On 64-bit, fixup KCS_SEL to be in ring 3. 618843e1988Sjohnlev * See KCS_SEL in segments.h. 619843e1988Sjohnlev */ 620843e1988Sjohnlev load_segment_registers((KCS_SEL | SEL_KPL), KFS_SEL, KGS_SEL, KDS_SEL); 621843e1988Sjohnlev 622843e1988Sjohnlev /* 623843e1988Sjohnlev * setup %gs for kernel 624843e1988Sjohnlev */ 625843e1988Sjohnlev xen_set_segment_base(SEGBASE_GS_KERNEL, (ulong_t)&cpus[0]); 626843e1988Sjohnlev 627843e1988Sjohnlev /* 628843e1988Sjohnlev * XX64 We should never dereference off "other gsbase" or 629843e1988Sjohnlev * "fsbase". So, we should arrange to point FSBASE and 630843e1988Sjohnlev * KGSBASE somewhere truly awful e.g. point it at the last 631843e1988Sjohnlev * valid address below the hole so that any attempts to index 632843e1988Sjohnlev * off them cause an exception. 633843e1988Sjohnlev * 634843e1988Sjohnlev * For now, point it at 8G -- at least it should be unmapped 635843e1988Sjohnlev * until some 64-bit processes run. 636843e1988Sjohnlev */ 637843e1988Sjohnlev addr = 0x200000000ul; 638843e1988Sjohnlev xen_set_segment_base(SEGBASE_FS, addr); 639843e1988Sjohnlev xen_set_segment_base(SEGBASE_GS_USER, addr); 640843e1988Sjohnlev xen_set_segment_base(SEGBASE_GS_USER_SEL, 0); 641843e1988Sjohnlev 642843e1988Sjohnlev return (gdt0); 643843e1988Sjohnlev } 644843e1988Sjohnlev 645843e1988Sjohnlev #else /* __xpv */ 646843e1988Sjohnlev 647ae115bc7Smrj static user_desc_t * 6487c478bd9Sstevel@tonic-gate init_gdt(void) 6497c478bd9Sstevel@tonic-gate { 6507c478bd9Sstevel@tonic-gate desctbr_t r_bgdt, r_gdt; 6517c478bd9Sstevel@tonic-gate user_desc_t *bgdt; 652ae115bc7Smrj 653ae115bc7Smrj #if !defined(__lint) 654ae115bc7Smrj /* 655ae115bc7Smrj * Our gdt is never larger than a single page. 656ae115bc7Smrj */ 657ae115bc7Smrj ASSERT((sizeof (*gdt0) * NGDT) <= PAGESIZE); 658ae115bc7Smrj #endif 659ae115bc7Smrj gdt0 = (user_desc_t *)BOP_ALLOC(bootops, (caddr_t)GDT_VA, 660ae115bc7Smrj PAGESIZE, PAGESIZE); 661ae115bc7Smrj bzero(gdt0, PAGESIZE); 662ae115bc7Smrj 663ae115bc7Smrj init_gdt_common(gdt0); 6647c478bd9Sstevel@tonic-gate 6657c478bd9Sstevel@tonic-gate /* 666ae115bc7Smrj * Copy in from boot's gdt to our gdt. 667ae115bc7Smrj * Entry 0 is the null descriptor by definition. 6687c478bd9Sstevel@tonic-gate */ 6697c478bd9Sstevel@tonic-gate rd_gdtr(&r_bgdt); 6707c478bd9Sstevel@tonic-gate bgdt = (user_desc_t *)r_bgdt.dtr_base; 6717c478bd9Sstevel@tonic-gate if (bgdt == NULL) 6727c478bd9Sstevel@tonic-gate panic("null boot gdt"); 6737c478bd9Sstevel@tonic-gate 674ae115bc7Smrj gdt0[GDT_B32DATA] = bgdt[GDT_B32DATA]; 675ae115bc7Smrj gdt0[GDT_B32CODE] = bgdt[GDT_B32CODE]; 676ae115bc7Smrj gdt0[GDT_B16CODE] = bgdt[GDT_B16CODE]; 677ae115bc7Smrj gdt0[GDT_B16DATA] = bgdt[GDT_B16DATA]; 678ae115bc7Smrj gdt0[GDT_B64CODE] = bgdt[GDT_B64CODE]; 679ae115bc7Smrj 680ae115bc7Smrj /* 681ae115bc7Smrj * Install our new GDT 682ae115bc7Smrj */ 683ae115bc7Smrj r_gdt.dtr_limit = (sizeof (*gdt0) * NGDT) - 1; 684ae115bc7Smrj r_gdt.dtr_base = (uintptr_t)gdt0; 685ae115bc7Smrj wr_gdtr(&r_gdt); 686ae115bc7Smrj 687ae115bc7Smrj /* 688ae115bc7Smrj * Reload the segment registers to use the new GDT 689ae115bc7Smrj */ 690ae115bc7Smrj load_segment_registers(KCS_SEL, KFS_SEL, KGS_SEL, KDS_SEL); 691ae115bc7Smrj 692ae115bc7Smrj /* 693ae115bc7Smrj * setup %gs for kernel 694ae115bc7Smrj */ 695ae115bc7Smrj wrmsr(MSR_AMD_GSBASE, (uint64_t)&cpus[0]); 696ae115bc7Smrj 697ae115bc7Smrj /* 698ae115bc7Smrj * XX64 We should never dereference off "other gsbase" or 699ae115bc7Smrj * "fsbase". So, we should arrange to point FSBASE and 700ae115bc7Smrj * KGSBASE somewhere truly awful e.g. point it at the last 701ae115bc7Smrj * valid address below the hole so that any attempts to index 702ae115bc7Smrj * off them cause an exception. 703ae115bc7Smrj * 704ae115bc7Smrj * For now, point it at 8G -- at least it should be unmapped 705ae115bc7Smrj * until some 64-bit processes run. 706ae115bc7Smrj */ 707ae115bc7Smrj wrmsr(MSR_AMD_FSBASE, 0x200000000ul); 708ae115bc7Smrj wrmsr(MSR_AMD_KGSBASE, 0x200000000ul); 709ae115bc7Smrj return (gdt0); 710ae115bc7Smrj } 711ae115bc7Smrj 712843e1988Sjohnlev #endif /* __xpv */ 713843e1988Sjohnlev 714ae115bc7Smrj #elif defined(__i386) 715ae115bc7Smrj 716ae115bc7Smrj static void 717ae115bc7Smrj init_gdt_common(user_desc_t *gdt) 718ae115bc7Smrj { 719ae115bc7Smrj int i; 7207c478bd9Sstevel@tonic-gate 7217c478bd9Sstevel@tonic-gate /* 7227c478bd9Sstevel@tonic-gate * Text and data for both kernel and user span entire 32 bit 7237c478bd9Sstevel@tonic-gate * address space. 7247c478bd9Sstevel@tonic-gate */ 7257c478bd9Sstevel@tonic-gate 7267c478bd9Sstevel@tonic-gate /* 7277c478bd9Sstevel@tonic-gate * kernel code segment. 7287c478bd9Sstevel@tonic-gate */ 729ae115bc7Smrj set_usegd(&gdt[GDT_KCODE], NULL, -1, SDT_MEMERA, SEL_KPL, SDP_PAGES, 7307c478bd9Sstevel@tonic-gate SDP_OP32); 7317c478bd9Sstevel@tonic-gate 7327c478bd9Sstevel@tonic-gate /* 7337c478bd9Sstevel@tonic-gate * kernel data segment. 7347c478bd9Sstevel@tonic-gate */ 735ae115bc7Smrj set_usegd(&gdt[GDT_KDATA], NULL, -1, SDT_MEMRWA, SEL_KPL, SDP_PAGES, 7367c478bd9Sstevel@tonic-gate SDP_OP32); 7377c478bd9Sstevel@tonic-gate 7387c478bd9Sstevel@tonic-gate /* 7397c478bd9Sstevel@tonic-gate * user code segment. 7407c478bd9Sstevel@tonic-gate */ 741ae115bc7Smrj set_usegd(&gdt[GDT_UCODE], NULL, -1, SDT_MEMERA, SEL_UPL, SDP_PAGES, 7427c478bd9Sstevel@tonic-gate SDP_OP32); 7437c478bd9Sstevel@tonic-gate 7447c478bd9Sstevel@tonic-gate /* 7457c478bd9Sstevel@tonic-gate * user data segment. 7467c478bd9Sstevel@tonic-gate */ 747ae115bc7Smrj set_usegd(&gdt[GDT_UDATA], NULL, -1, SDT_MEMRWA, SEL_UPL, SDP_PAGES, 7487c478bd9Sstevel@tonic-gate SDP_OP32); 7497c478bd9Sstevel@tonic-gate 750843e1988Sjohnlev #if !defined(__xpv) 751843e1988Sjohnlev 7527c478bd9Sstevel@tonic-gate /* 7537c478bd9Sstevel@tonic-gate * TSS for T_DBLFLT (double fault) handler 7547c478bd9Sstevel@tonic-gate */ 7550cfdb603Sjosephb set_syssegd((system_desc_t *)&gdt[GDT_DBFLT], dftss0, 7560cfdb603Sjosephb sizeof (*dftss0) - 1, SDT_SYSTSS, SEL_KPL); 7577c478bd9Sstevel@tonic-gate 7587c478bd9Sstevel@tonic-gate /* 7597c478bd9Sstevel@tonic-gate * TSS for kernel 7607c478bd9Sstevel@tonic-gate */ 7610cfdb603Sjosephb set_syssegd((system_desc_t *)&gdt[GDT_KTSS], ktss0, 7620cfdb603Sjosephb sizeof (*ktss0) - 1, SDT_SYSTSS, SEL_KPL); 7637c478bd9Sstevel@tonic-gate 764843e1988Sjohnlev #endif /* !__xpv */ 765843e1988Sjohnlev 7667c478bd9Sstevel@tonic-gate /* 7677c478bd9Sstevel@tonic-gate * %gs selector for kernel 7687c478bd9Sstevel@tonic-gate */ 769ae115bc7Smrj set_usegd(&gdt[GDT_GS], &cpus[0], sizeof (struct cpu) -1, SDT_MEMRWA, 7707c478bd9Sstevel@tonic-gate SEL_KPL, SDP_BYTES, SDP_OP32); 7717c478bd9Sstevel@tonic-gate 7727c478bd9Sstevel@tonic-gate /* 7737c478bd9Sstevel@tonic-gate * Initialize lwp private descriptors. 7747c478bd9Sstevel@tonic-gate * Only attributes and limits are initialized, the effective 7757c478bd9Sstevel@tonic-gate * base address is programmed via fsbase/gsbase. 7767c478bd9Sstevel@tonic-gate */ 777ae115bc7Smrj set_usegd(&gdt[GDT_LWPFS], NULL, (size_t)-1, SDT_MEMRWA, SEL_UPL, 7787c478bd9Sstevel@tonic-gate SDP_PAGES, SDP_OP32); 779ae115bc7Smrj set_usegd(&gdt[GDT_LWPGS], NULL, (size_t)-1, SDT_MEMRWA, SEL_UPL, 7807c478bd9Sstevel@tonic-gate SDP_PAGES, SDP_OP32); 7817c478bd9Sstevel@tonic-gate 7827c478bd9Sstevel@tonic-gate /* 7839acbbeafSnn35248 * Initialize the descriptors set aside for brand usage. 7849acbbeafSnn35248 * Only attributes and limits are initialized. 7859acbbeafSnn35248 */ 7869acbbeafSnn35248 for (i = GDT_BRANDMIN; i <= GDT_BRANDMAX; i++) 7879acbbeafSnn35248 set_usegd(&gdt0[i], NULL, (size_t)-1, SDT_MEMRWA, SEL_UPL, 7889acbbeafSnn35248 SDP_PAGES, SDP_OP32); 789ae115bc7Smrj /* 790ae115bc7Smrj * Initialize convenient zero base user descriptor for clearing 791ae115bc7Smrj * lwp private %fs and %gs descriptors in GDT. See setregs() for 792ae115bc7Smrj * an example. 793ae115bc7Smrj */ 794ae115bc7Smrj set_usegd(&zero_udesc, NULL, -1, SDT_MEMRWA, SEL_UPL, 795ae115bc7Smrj SDP_BYTES, SDP_OP32); 796ae115bc7Smrj } 797ae115bc7Smrj 798843e1988Sjohnlev #if defined(__xpv) 799843e1988Sjohnlev 800843e1988Sjohnlev static user_desc_t * 801843e1988Sjohnlev init_gdt(void) 802843e1988Sjohnlev { 803843e1988Sjohnlev uint64_t gdtpa; 804843e1988Sjohnlev ulong_t ma[1]; /* XXPV should be a memory_t */ 805843e1988Sjohnlev 806843e1988Sjohnlev #if !defined(__lint) 807843e1988Sjohnlev /* 808843e1988Sjohnlev * Our gdt is never larger than a single page. 809843e1988Sjohnlev */ 810843e1988Sjohnlev ASSERT((sizeof (*gdt0) * NGDT) <= PAGESIZE); 811843e1988Sjohnlev #endif 812843e1988Sjohnlev gdt0 = (user_desc_t *)BOP_ALLOC(bootops, (caddr_t)GDT_VA, 813843e1988Sjohnlev PAGESIZE, PAGESIZE); 814843e1988Sjohnlev bzero(gdt0, PAGESIZE); 815843e1988Sjohnlev 816843e1988Sjohnlev init_gdt_common(gdt0); 817843e1988Sjohnlev gdtpa = pfn_to_pa(va_to_pfn(gdt0)); 818843e1988Sjohnlev 819843e1988Sjohnlev /* 820843e1988Sjohnlev * XXX Since we never invoke kmdb until after the kernel takes 821843e1988Sjohnlev * over the descriptor tables why not have it use the kernel's 822843e1988Sjohnlev * selectors? 823843e1988Sjohnlev */ 824843e1988Sjohnlev if (boothowto & RB_DEBUG) { 825843e1988Sjohnlev set_usegd(&gdt0[GDT_B32DATA], NULL, -1, SDT_MEMRWA, SEL_KPL, 826843e1988Sjohnlev SDP_PAGES, SDP_OP32); 827843e1988Sjohnlev set_usegd(&gdt0[GDT_B32CODE], NULL, -1, SDT_MEMERA, SEL_KPL, 828843e1988Sjohnlev SDP_PAGES, SDP_OP32); 829843e1988Sjohnlev } 830843e1988Sjohnlev 831843e1988Sjohnlev /* 832843e1988Sjohnlev * Clear write permission for page containing the gdt and install it. 833843e1988Sjohnlev */ 834843e1988Sjohnlev ma[0] = (ulong_t)(pa_to_ma(gdtpa) >> PAGESHIFT); 835843e1988Sjohnlev kbm_read_only((uintptr_t)gdt0, gdtpa); 836843e1988Sjohnlev xen_set_gdt(ma, NGDT); 837843e1988Sjohnlev 838843e1988Sjohnlev /* 839843e1988Sjohnlev * Reload the segment registers to use the new GDT 840843e1988Sjohnlev */ 841843e1988Sjohnlev load_segment_registers( 842843e1988Sjohnlev KCS_SEL, KDS_SEL, KDS_SEL, KFS_SEL, KGS_SEL, KDS_SEL); 843843e1988Sjohnlev 844843e1988Sjohnlev return (gdt0); 845843e1988Sjohnlev } 846843e1988Sjohnlev 847843e1988Sjohnlev #else /* __xpv */ 848843e1988Sjohnlev 849ae115bc7Smrj static user_desc_t * 850ae115bc7Smrj init_gdt(void) 851ae115bc7Smrj { 852ae115bc7Smrj desctbr_t r_bgdt, r_gdt; 853ae115bc7Smrj user_desc_t *bgdt; 854ae115bc7Smrj 855ae115bc7Smrj #if !defined(__lint) 856ae115bc7Smrj /* 857ae115bc7Smrj * Our gdt is never larger than a single page. 858ae115bc7Smrj */ 859ae115bc7Smrj ASSERT((sizeof (*gdt0) * NGDT) <= PAGESIZE); 860ae115bc7Smrj #endif 861ae115bc7Smrj /* 862ae115bc7Smrj * XXX this allocation belongs in our caller, not here. 863ae115bc7Smrj */ 864ae115bc7Smrj gdt0 = (user_desc_t *)BOP_ALLOC(bootops, (caddr_t)GDT_VA, 865ae115bc7Smrj PAGESIZE, PAGESIZE); 866ae115bc7Smrj bzero(gdt0, PAGESIZE); 867ae115bc7Smrj 868ae115bc7Smrj init_gdt_common(gdt0); 869ae115bc7Smrj 870ae115bc7Smrj /* 871ae115bc7Smrj * Copy in from boot's gdt to our gdt entries. 872ae115bc7Smrj * Entry 0 is null descriptor by definition. 873ae115bc7Smrj */ 874ae115bc7Smrj rd_gdtr(&r_bgdt); 875ae115bc7Smrj bgdt = (user_desc_t *)r_bgdt.dtr_base; 876ae115bc7Smrj if (bgdt == NULL) 877ae115bc7Smrj panic("null boot gdt"); 878ae115bc7Smrj 879ae115bc7Smrj gdt0[GDT_B32DATA] = bgdt[GDT_B32DATA]; 880ae115bc7Smrj gdt0[GDT_B32CODE] = bgdt[GDT_B32CODE]; 881ae115bc7Smrj gdt0[GDT_B16CODE] = bgdt[GDT_B16CODE]; 882ae115bc7Smrj gdt0[GDT_B16DATA] = bgdt[GDT_B16DATA]; 8839acbbeafSnn35248 8849acbbeafSnn35248 /* 8857c478bd9Sstevel@tonic-gate * Install our new GDT 8867c478bd9Sstevel@tonic-gate */ 887ae115bc7Smrj r_gdt.dtr_limit = (sizeof (*gdt0) * NGDT) - 1; 8887c478bd9Sstevel@tonic-gate r_gdt.dtr_base = (uintptr_t)gdt0; 8897c478bd9Sstevel@tonic-gate wr_gdtr(&r_gdt); 8907c478bd9Sstevel@tonic-gate 8917c478bd9Sstevel@tonic-gate /* 892ae115bc7Smrj * Reload the segment registers to use the new GDT 8937c478bd9Sstevel@tonic-gate */ 894ae115bc7Smrj load_segment_registers( 895ae115bc7Smrj KCS_SEL, KDS_SEL, KDS_SEL, KFS_SEL, KGS_SEL, KDS_SEL); 896ae115bc7Smrj 897ae115bc7Smrj return (gdt0); 8987c478bd9Sstevel@tonic-gate } 8997c478bd9Sstevel@tonic-gate 900843e1988Sjohnlev #endif /* __xpv */ 9017c478bd9Sstevel@tonic-gate #endif /* __i386 */ 9027c478bd9Sstevel@tonic-gate 9037c478bd9Sstevel@tonic-gate /* 9047c478bd9Sstevel@tonic-gate * Build kernel IDT. 9057c478bd9Sstevel@tonic-gate * 906ae115bc7Smrj * Note that for amd64 we pretty much require every gate to be an interrupt 907ae115bc7Smrj * gate which blocks interrupts atomically on entry; that's because of our 908ae115bc7Smrj * dependency on using 'swapgs' every time we come into the kernel to find 909ae115bc7Smrj * the cpu structure. If we get interrupted just before doing that, %cs could 910ae115bc7Smrj * be in kernel mode (so that the trap prolog doesn't do a swapgs), but 911ae115bc7Smrj * %gsbase is really still pointing at something in userland. Bad things will 912ae115bc7Smrj * ensue. We also use interrupt gates for i386 as well even though this is not 913ae115bc7Smrj * required for some traps. 9147c478bd9Sstevel@tonic-gate * 9157c478bd9Sstevel@tonic-gate * Perhaps they should have invented a trap gate that does an atomic swapgs? 9167c478bd9Sstevel@tonic-gate */ 9177c478bd9Sstevel@tonic-gate static void 918ae115bc7Smrj init_idt_common(gate_desc_t *idt) 9197c478bd9Sstevel@tonic-gate { 9209844da31SSeth Goldberg set_gatesegd(&idt[T_ZERODIV], &div0trap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9219844da31SSeth Goldberg 0); 9229844da31SSeth Goldberg set_gatesegd(&idt[T_SGLSTP], &dbgtrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9239844da31SSeth Goldberg 0); 9249844da31SSeth Goldberg set_gatesegd(&idt[T_NMIFLT], &nmiint, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9259844da31SSeth Goldberg 0); 9269844da31SSeth Goldberg set_gatesegd(&idt[T_BPTFLT], &brktrap, KCS_SEL, SDT_SYSIGT, TRP_UPL, 9279844da31SSeth Goldberg 0); 9289844da31SSeth Goldberg set_gatesegd(&idt[T_OVFLW], &ovflotrap, KCS_SEL, SDT_SYSIGT, TRP_UPL, 9299844da31SSeth Goldberg 0); 930ae115bc7Smrj set_gatesegd(&idt[T_BOUNDFLT], &boundstrap, KCS_SEL, SDT_SYSIGT, 9319844da31SSeth Goldberg TRP_KPL, 0); 9329844da31SSeth Goldberg set_gatesegd(&idt[T_ILLINST], &invoptrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9339844da31SSeth Goldberg 0); 9349844da31SSeth Goldberg set_gatesegd(&idt[T_NOEXTFLT], &ndptrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9359844da31SSeth Goldberg 0); 9367c478bd9Sstevel@tonic-gate 9377c478bd9Sstevel@tonic-gate /* 9387c478bd9Sstevel@tonic-gate * double fault handler. 939843e1988Sjohnlev * 940843e1988Sjohnlev * Note that on the hypervisor a guest does not receive #df faults. 941843e1988Sjohnlev * Instead a failsafe event is injected into the guest if its selectors 942843e1988Sjohnlev * and/or stack is in a broken state. See xen_failsafe_callback. 9437c478bd9Sstevel@tonic-gate */ 944843e1988Sjohnlev #if !defined(__xpv) 945ae115bc7Smrj #if defined(__amd64) 946843e1988Sjohnlev 9479844da31SSeth Goldberg set_gatesegd(&idt[T_DBLFLT], &syserrtrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9489844da31SSeth Goldberg T_DBLFLT); 949843e1988Sjohnlev 950ae115bc7Smrj #elif defined(__i386) 951843e1988Sjohnlev 952ae115bc7Smrj /* 953ae115bc7Smrj * task gate required. 954ae115bc7Smrj */ 9559844da31SSeth Goldberg set_gatesegd(&idt[T_DBLFLT], NULL, DFTSS_SEL, SDT_SYSTASKGT, TRP_KPL, 9569844da31SSeth Goldberg 0); 957ae115bc7Smrj 958ae115bc7Smrj #endif /* __i386 */ 959843e1988Sjohnlev #endif /* !__xpv */ 9607c478bd9Sstevel@tonic-gate 9617c478bd9Sstevel@tonic-gate /* 9627c478bd9Sstevel@tonic-gate * T_EXTOVRFLT coprocessor-segment-overrun not supported. 9637c478bd9Sstevel@tonic-gate */ 9647c478bd9Sstevel@tonic-gate 9659844da31SSeth Goldberg set_gatesegd(&idt[T_TSSFLT], &invtsstrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9669844da31SSeth Goldberg 0); 9679844da31SSeth Goldberg set_gatesegd(&idt[T_SEGFLT], &segnptrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9689844da31SSeth Goldberg 0); 9699844da31SSeth Goldberg set_gatesegd(&idt[T_STKFLT], &stktrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 0); 9709844da31SSeth Goldberg set_gatesegd(&idt[T_GPFLT], &gptrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 0); 9719844da31SSeth Goldberg set_gatesegd(&idt[T_PGFLT], &pftrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 0); 9729844da31SSeth Goldberg set_gatesegd(&idt[T_EXTERRFLT], &ndperr, KCS_SEL, SDT_SYSIGT, TRP_KPL, 9739844da31SSeth Goldberg 0); 974ae115bc7Smrj set_gatesegd(&idt[T_ALIGNMENT], &achktrap, KCS_SEL, SDT_SYSIGT, 9759844da31SSeth Goldberg TRP_KPL, 0); 9769844da31SSeth Goldberg set_gatesegd(&idt[T_MCE], &mcetrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 0); 9779844da31SSeth Goldberg set_gatesegd(&idt[T_SIMDFPE], &xmtrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 0); 9787c478bd9Sstevel@tonic-gate 9797c478bd9Sstevel@tonic-gate /* 9807c478bd9Sstevel@tonic-gate * install fast trap handler at 210. 9817c478bd9Sstevel@tonic-gate */ 9829844da31SSeth Goldberg set_gatesegd(&idt[T_FASTTRAP], &fasttrap, KCS_SEL, SDT_SYSIGT, TRP_UPL, 9839844da31SSeth Goldberg 0); 9847c478bd9Sstevel@tonic-gate 9857c478bd9Sstevel@tonic-gate /* 9867c478bd9Sstevel@tonic-gate * System call handler. 9877c478bd9Sstevel@tonic-gate */ 988ae115bc7Smrj #if defined(__amd64) 989ae115bc7Smrj set_gatesegd(&idt[T_SYSCALLINT], &sys_syscall_int, KCS_SEL, SDT_SYSIGT, 9909844da31SSeth Goldberg TRP_UPL, 0); 991ae115bc7Smrj 992ae115bc7Smrj #elif defined(__i386) 993ae115bc7Smrj set_gatesegd(&idt[T_SYSCALLINT], &sys_call, KCS_SEL, SDT_SYSIGT, 9949844da31SSeth Goldberg TRP_UPL, 0); 995ae115bc7Smrj #endif /* __i386 */ 9967c478bd9Sstevel@tonic-gate 9977c478bd9Sstevel@tonic-gate /* 998f498645aSahl * Install the DTrace interrupt handler for the pid provider. 9997c478bd9Sstevel@tonic-gate */ 1000ae115bc7Smrj set_gatesegd(&idt[T_DTRACE_RET], &dtrace_ret, KCS_SEL, 10019844da31SSeth Goldberg SDT_SYSIGT, TRP_UPL, 0); 10027c478bd9Sstevel@tonic-gate 10039acbbeafSnn35248 /* 1004eb5a5c78SSurya Prakki * Prepare interposing descriptor for the syscall handler 1005eb5a5c78SSurya Prakki * and cache copy of the default descriptor. 10069acbbeafSnn35248 */ 1007eb5a5c78SSurya Prakki brand_tbl[0].ih_inum = T_SYSCALLINT; 1008eb5a5c78SSurya Prakki brand_tbl[0].ih_default_desc = idt0[T_SYSCALLINT]; 1009ae115bc7Smrj 1010ae115bc7Smrj #if defined(__amd64) 1011eb5a5c78SSurya Prakki set_gatesegd(&(brand_tbl[0].ih_interp_desc), &brand_sys_syscall_int, 10129844da31SSeth Goldberg KCS_SEL, SDT_SYSIGT, TRP_UPL, 0); 1013ae115bc7Smrj #elif defined(__i386) 1014eb5a5c78SSurya Prakki set_gatesegd(&(brand_tbl[0].ih_interp_desc), &brand_sys_call, 10159844da31SSeth Goldberg KCS_SEL, SDT_SYSIGT, TRP_UPL, 0); 1016ae115bc7Smrj #endif /* __i386 */ 10179acbbeafSnn35248 1018eb5a5c78SSurya Prakki brand_tbl[1].ih_inum = 0; 10197c478bd9Sstevel@tonic-gate } 10207c478bd9Sstevel@tonic-gate 1021843e1988Sjohnlev #if defined(__xpv) 1022843e1988Sjohnlev 1023843e1988Sjohnlev static void 1024843e1988Sjohnlev init_idt(gate_desc_t *idt) 1025843e1988Sjohnlev { 1026843e1988Sjohnlev init_idt_common(idt); 1027843e1988Sjohnlev } 1028843e1988Sjohnlev 1029843e1988Sjohnlev #else /* __xpv */ 1030843e1988Sjohnlev 10317c478bd9Sstevel@tonic-gate static void 1032ae115bc7Smrj init_idt(gate_desc_t *idt) 10337c478bd9Sstevel@tonic-gate { 10347c478bd9Sstevel@tonic-gate char ivctname[80]; 10357c478bd9Sstevel@tonic-gate void (*ivctptr)(void); 10367c478bd9Sstevel@tonic-gate int i; 10377c478bd9Sstevel@tonic-gate 10387c478bd9Sstevel@tonic-gate /* 10397c478bd9Sstevel@tonic-gate * Initialize entire table with 'reserved' trap and then overwrite 10407c478bd9Sstevel@tonic-gate * specific entries. T_EXTOVRFLT (9) is unsupported and reserved 10417c478bd9Sstevel@tonic-gate * since it can only be generated on a 386 processor. 15 is also 10427c478bd9Sstevel@tonic-gate * unsupported and reserved. 10437c478bd9Sstevel@tonic-gate */ 10447c478bd9Sstevel@tonic-gate for (i = 0; i < NIDT; i++) 10459844da31SSeth Goldberg set_gatesegd(&idt[i], &resvtrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 10469844da31SSeth Goldberg 0); 10477c478bd9Sstevel@tonic-gate 10487c478bd9Sstevel@tonic-gate /* 10497c478bd9Sstevel@tonic-gate * 20-31 reserved 10507c478bd9Sstevel@tonic-gate */ 10517c478bd9Sstevel@tonic-gate for (i = 20; i < 32; i++) 10529844da31SSeth Goldberg set_gatesegd(&idt[i], &invaltrap, KCS_SEL, SDT_SYSIGT, TRP_KPL, 10539844da31SSeth Goldberg 0); 10547c478bd9Sstevel@tonic-gate 10557c478bd9Sstevel@tonic-gate /* 10567c478bd9Sstevel@tonic-gate * interrupts 32 - 255 10577c478bd9Sstevel@tonic-gate */ 10587c478bd9Sstevel@tonic-gate for (i = 32; i < 256; i++) { 10597c478bd9Sstevel@tonic-gate (void) snprintf(ivctname, sizeof (ivctname), "ivct%d", i); 10607c478bd9Sstevel@tonic-gate ivctptr = (void (*)(void))kobj_getsymvalue(ivctname, 0); 10617c478bd9Sstevel@tonic-gate if (ivctptr == NULL) 10627c478bd9Sstevel@tonic-gate panic("kobj_getsymvalue(%s) failed", ivctname); 10637c478bd9Sstevel@tonic-gate 10649844da31SSeth Goldberg set_gatesegd(&idt[i], ivctptr, KCS_SEL, SDT_SYSIGT, TRP_KPL, 0); 10657c478bd9Sstevel@tonic-gate } 10667c478bd9Sstevel@tonic-gate 10677c478bd9Sstevel@tonic-gate /* 1068ae115bc7Smrj * Now install the common ones. Note that it will overlay some 1069ae115bc7Smrj * entries installed above like T_SYSCALLINT, T_FASTTRAP etc. 10709acbbeafSnn35248 */ 1071ae115bc7Smrj init_idt_common(idt); 10727c478bd9Sstevel@tonic-gate } 10737c478bd9Sstevel@tonic-gate 1074843e1988Sjohnlev #endif /* __xpv */ 1075843e1988Sjohnlev 10767c478bd9Sstevel@tonic-gate /* 10770baeff3dSrab * The kernel does not deal with LDTs unless a user explicitly creates 10780baeff3dSrab * one. Under normal circumstances, the LDTR contains 0. Any process attempting 10790baeff3dSrab * to reference the LDT will therefore cause a #gp. System calls made via the 10800baeff3dSrab * obsolete lcall mechanism are emulated by the #gp fault handler. 10817c478bd9Sstevel@tonic-gate */ 10827c478bd9Sstevel@tonic-gate static void 10837c478bd9Sstevel@tonic-gate init_ldt(void) 10847c478bd9Sstevel@tonic-gate { 1085843e1988Sjohnlev #if defined(__xpv) 1086843e1988Sjohnlev xen_set_ldt(NULL, 0); 1087843e1988Sjohnlev #else 10880baeff3dSrab wr_ldtr(0); 1089843e1988Sjohnlev #endif 10907c478bd9Sstevel@tonic-gate } 10917c478bd9Sstevel@tonic-gate 1092843e1988Sjohnlev #if !defined(__xpv) 10937c478bd9Sstevel@tonic-gate #if defined(__amd64) 10947c478bd9Sstevel@tonic-gate 10957c478bd9Sstevel@tonic-gate static void 10967c478bd9Sstevel@tonic-gate init_tss(void) 10977c478bd9Sstevel@tonic-gate { 10987c478bd9Sstevel@tonic-gate /* 10997c478bd9Sstevel@tonic-gate * tss_rsp0 is dynamically filled in by resume() on each context switch. 11007c478bd9Sstevel@tonic-gate * All exceptions but #DF will run on the thread stack. 11017c478bd9Sstevel@tonic-gate * Set up the double fault stack here. 11027c478bd9Sstevel@tonic-gate */ 11030cfdb603Sjosephb ktss0->tss_ist1 = 11047c478bd9Sstevel@tonic-gate (uint64_t)&dblfault_stack0[sizeof (dblfault_stack0)]; 11057c478bd9Sstevel@tonic-gate 11067c478bd9Sstevel@tonic-gate /* 11077c478bd9Sstevel@tonic-gate * Set I/O bit map offset equal to size of TSS segment limit 11087c478bd9Sstevel@tonic-gate * for no I/O permission map. This will force all user I/O 11097c478bd9Sstevel@tonic-gate * instructions to generate #gp fault. 11107c478bd9Sstevel@tonic-gate */ 11110cfdb603Sjosephb ktss0->tss_bitmapbase = sizeof (*ktss0); 11127c478bd9Sstevel@tonic-gate 11137c478bd9Sstevel@tonic-gate /* 11147c478bd9Sstevel@tonic-gate * Point %tr to descriptor for ktss0 in gdt. 11157c478bd9Sstevel@tonic-gate */ 11167c478bd9Sstevel@tonic-gate wr_tsr(KTSS_SEL); 11177c478bd9Sstevel@tonic-gate } 11187c478bd9Sstevel@tonic-gate 11197c478bd9Sstevel@tonic-gate #elif defined(__i386) 11207c478bd9Sstevel@tonic-gate 11217c478bd9Sstevel@tonic-gate static void 11227c478bd9Sstevel@tonic-gate init_tss(void) 11237c478bd9Sstevel@tonic-gate { 11247c478bd9Sstevel@tonic-gate /* 11250cfdb603Sjosephb * ktss0->tss_esp dynamically filled in by resume() on each 11267c478bd9Sstevel@tonic-gate * context switch. 11277c478bd9Sstevel@tonic-gate */ 11280cfdb603Sjosephb ktss0->tss_ss0 = KDS_SEL; 11290cfdb603Sjosephb ktss0->tss_eip = (uint32_t)_start; 11300cfdb603Sjosephb ktss0->tss_ds = ktss0->tss_es = ktss0->tss_ss = KDS_SEL; 11310cfdb603Sjosephb ktss0->tss_cs = KCS_SEL; 11320cfdb603Sjosephb ktss0->tss_fs = KFS_SEL; 11330cfdb603Sjosephb ktss0->tss_gs = KGS_SEL; 11340cfdb603Sjosephb ktss0->tss_ldt = ULDT_SEL; 11357c478bd9Sstevel@tonic-gate 11367c478bd9Sstevel@tonic-gate /* 11377c478bd9Sstevel@tonic-gate * Initialize double fault tss. 11387c478bd9Sstevel@tonic-gate */ 11390cfdb603Sjosephb dftss0->tss_esp0 = (uint32_t)&dblfault_stack0[sizeof (dblfault_stack0)]; 11400cfdb603Sjosephb dftss0->tss_ss0 = KDS_SEL; 11417c478bd9Sstevel@tonic-gate 11427c478bd9Sstevel@tonic-gate /* 11437c478bd9Sstevel@tonic-gate * tss_cr3 will get initialized in hat_kern_setup() once our page 11447c478bd9Sstevel@tonic-gate * tables have been setup. 11457c478bd9Sstevel@tonic-gate */ 11460cfdb603Sjosephb dftss0->tss_eip = (uint32_t)syserrtrap; 11470cfdb603Sjosephb dftss0->tss_esp = (uint32_t)&dblfault_stack0[sizeof (dblfault_stack0)]; 11480cfdb603Sjosephb dftss0->tss_cs = KCS_SEL; 11490cfdb603Sjosephb dftss0->tss_ds = KDS_SEL; 11500cfdb603Sjosephb dftss0->tss_es = KDS_SEL; 11510cfdb603Sjosephb dftss0->tss_ss = KDS_SEL; 11520cfdb603Sjosephb dftss0->tss_fs = KFS_SEL; 11530cfdb603Sjosephb dftss0->tss_gs = KGS_SEL; 11547c478bd9Sstevel@tonic-gate 11557c478bd9Sstevel@tonic-gate /* 11567c478bd9Sstevel@tonic-gate * Set I/O bit map offset equal to size of TSS segment limit 11577c478bd9Sstevel@tonic-gate * for no I/O permission map. This will force all user I/O 11587c478bd9Sstevel@tonic-gate * instructions to generate #gp fault. 11597c478bd9Sstevel@tonic-gate */ 11600cfdb603Sjosephb ktss0->tss_bitmapbase = sizeof (*ktss0); 11617c478bd9Sstevel@tonic-gate 11627c478bd9Sstevel@tonic-gate /* 11637c478bd9Sstevel@tonic-gate * Point %tr to descriptor for ktss0 in gdt. 11647c478bd9Sstevel@tonic-gate */ 11657c478bd9Sstevel@tonic-gate wr_tsr(KTSS_SEL); 11667c478bd9Sstevel@tonic-gate } 11677c478bd9Sstevel@tonic-gate 11687c478bd9Sstevel@tonic-gate #endif /* __i386 */ 1169843e1988Sjohnlev #endif /* !__xpv */ 1170843e1988Sjohnlev 1171843e1988Sjohnlev #if defined(__xpv) 1172843e1988Sjohnlev 1173843e1988Sjohnlev void 1174843e1988Sjohnlev init_desctbls(void) 1175843e1988Sjohnlev { 1176843e1988Sjohnlev uint_t vec; 1177843e1988Sjohnlev user_desc_t *gdt; 1178843e1988Sjohnlev 1179843e1988Sjohnlev /* 1180843e1988Sjohnlev * Setup and install our GDT. 1181843e1988Sjohnlev */ 1182843e1988Sjohnlev gdt = init_gdt(); 1183843e1988Sjohnlev 1184843e1988Sjohnlev /* 1185843e1988Sjohnlev * Store static pa of gdt to speed up pa_to_ma() translations 1186843e1988Sjohnlev * on lwp context switches. 1187843e1988Sjohnlev */ 1188843e1988Sjohnlev ASSERT(IS_P2ALIGNED((uintptr_t)gdt, PAGESIZE)); 11890cfdb603Sjosephb CPU->cpu_gdt = gdt; 1190843e1988Sjohnlev CPU->cpu_m.mcpu_gdtpa = pfn_to_pa(va_to_pfn(gdt)); 1191843e1988Sjohnlev 1192843e1988Sjohnlev /* 1193843e1988Sjohnlev * Setup and install our IDT. 1194843e1988Sjohnlev */ 11950cfdb603Sjosephb #if !defined(__lint) 11960cfdb603Sjosephb ASSERT(NIDT * sizeof (*idt0) <= PAGESIZE); 11970cfdb603Sjosephb #endif 11980cfdb603Sjosephb idt0 = (gate_desc_t *)BOP_ALLOC(bootops, (caddr_t)IDT_VA, 11990cfdb603Sjosephb PAGESIZE, PAGESIZE); 12009844da31SSeth Goldberg bzero(idt0, PAGESIZE); 12010cfdb603Sjosephb init_idt(idt0); 1202843e1988Sjohnlev for (vec = 0; vec < NIDT; vec++) 1203843e1988Sjohnlev xen_idt_write(&idt0[vec], vec); 1204843e1988Sjohnlev 12050cfdb603Sjosephb CPU->cpu_idt = idt0; 1206843e1988Sjohnlev 1207843e1988Sjohnlev /* 1208843e1988Sjohnlev * set default kernel stack 1209843e1988Sjohnlev */ 1210843e1988Sjohnlev xen_stack_switch(KDS_SEL, 1211843e1988Sjohnlev (ulong_t)&dblfault_stack0[sizeof (dblfault_stack0)]); 1212843e1988Sjohnlev 1213843e1988Sjohnlev xen_init_callbacks(); 1214843e1988Sjohnlev 1215843e1988Sjohnlev init_ldt(); 1216843e1988Sjohnlev } 1217843e1988Sjohnlev 1218843e1988Sjohnlev #else /* __xpv */ 12197c478bd9Sstevel@tonic-gate 12207c478bd9Sstevel@tonic-gate void 1221ae115bc7Smrj init_desctbls(void) 12227c478bd9Sstevel@tonic-gate { 1223ae115bc7Smrj user_desc_t *gdt; 1224ae115bc7Smrj desctbr_t idtr; 1225ae115bc7Smrj 1226ae115bc7Smrj /* 12270cfdb603Sjosephb * Allocate IDT and TSS structures on unique pages for better 12280cfdb603Sjosephb * performance in virtual machines. 12290cfdb603Sjosephb */ 12300cfdb603Sjosephb #if !defined(__lint) 12310cfdb603Sjosephb ASSERT(NIDT * sizeof (*idt0) <= PAGESIZE); 12320cfdb603Sjosephb #endif 12330cfdb603Sjosephb idt0 = (gate_desc_t *)BOP_ALLOC(bootops, (caddr_t)IDT_VA, 12340cfdb603Sjosephb PAGESIZE, PAGESIZE); 12359844da31SSeth Goldberg bzero(idt0, PAGESIZE); 12360cfdb603Sjosephb #if !defined(__lint) 12370cfdb603Sjosephb ASSERT(sizeof (*ktss0) <= PAGESIZE); 12380cfdb603Sjosephb #endif 1239*f16a0f4cSRobert Mustacchi ktss0 = (tss_t *)BOP_ALLOC(bootops, (caddr_t)KTSS_VA, 12400cfdb603Sjosephb PAGESIZE, PAGESIZE); 12419844da31SSeth Goldberg bzero(ktss0, PAGESIZE); 12420cfdb603Sjosephb 12430cfdb603Sjosephb #if defined(__i386) 12440cfdb603Sjosephb #if !defined(__lint) 12450cfdb603Sjosephb ASSERT(sizeof (*dftss0) <= PAGESIZE); 12460cfdb603Sjosephb #endif 1247*f16a0f4cSRobert Mustacchi dftss0 = (tss_t *)BOP_ALLOC(bootops, (caddr_t)DFTSS_VA, 12480cfdb603Sjosephb PAGESIZE, PAGESIZE); 12499844da31SSeth Goldberg bzero(dftss0, PAGESIZE); 12500cfdb603Sjosephb #endif 12510cfdb603Sjosephb 12520cfdb603Sjosephb /* 1253ae115bc7Smrj * Setup and install our GDT. 1254ae115bc7Smrj */ 1255ae115bc7Smrj gdt = init_gdt(); 1256ae115bc7Smrj ASSERT(IS_P2ALIGNED((uintptr_t)gdt, PAGESIZE)); 12570cfdb603Sjosephb CPU->cpu_gdt = gdt; 1258ae115bc7Smrj 1259ae115bc7Smrj /* 1260ae115bc7Smrj * Setup and install our IDT. 1261ae115bc7Smrj */ 12620cfdb603Sjosephb init_idt(idt0); 1263ae115bc7Smrj 1264ae115bc7Smrj idtr.dtr_base = (uintptr_t)idt0; 12650cfdb603Sjosephb idtr.dtr_limit = (NIDT * sizeof (*idt0)) - 1; 1266ae115bc7Smrj wr_idtr(&idtr); 12670cfdb603Sjosephb CPU->cpu_idt = idt0; 1268ae115bc7Smrj 1269ae115bc7Smrj #if defined(__i386) 1270ae115bc7Smrj /* 1271ae115bc7Smrj * We maintain a description of idt0 in convenient IDTR format 1272ae115bc7Smrj * for #pf's on some older pentium processors. See pentium_pftrap(). 1273ae115bc7Smrj */ 1274ae115bc7Smrj idt0_default_r = idtr; 1275ae115bc7Smrj #endif /* __i386 */ 1276ae115bc7Smrj 12777c478bd9Sstevel@tonic-gate init_tss(); 12780cfdb603Sjosephb CPU->cpu_tss = ktss0; 12797c478bd9Sstevel@tonic-gate init_ldt(); 12807c478bd9Sstevel@tonic-gate } 12819acbbeafSnn35248 1282843e1988Sjohnlev #endif /* __xpv */ 1283843e1988Sjohnlev 12849acbbeafSnn35248 /* 1285ae115bc7Smrj * In the early kernel, we need to set up a simple GDT to run on. 1286843e1988Sjohnlev * 1287843e1988Sjohnlev * XXPV Can dboot use this too? See dboot_gdt.s 1288ae115bc7Smrj */ 1289ae115bc7Smrj void 1290ae115bc7Smrj init_boot_gdt(user_desc_t *bgdt) 1291ae115bc7Smrj { 1292ae115bc7Smrj #if defined(__amd64) 1293ae115bc7Smrj set_usegd(&bgdt[GDT_B32DATA], SDP_LONG, NULL, -1, SDT_MEMRWA, SEL_KPL, 1294ae115bc7Smrj SDP_PAGES, SDP_OP32); 1295ae115bc7Smrj set_usegd(&bgdt[GDT_B64CODE], SDP_LONG, NULL, -1, SDT_MEMERA, SEL_KPL, 1296ae115bc7Smrj SDP_PAGES, SDP_OP32); 1297ae115bc7Smrj #elif defined(__i386) 1298ae115bc7Smrj set_usegd(&bgdt[GDT_B32DATA], NULL, -1, SDT_MEMRWA, SEL_KPL, 1299ae115bc7Smrj SDP_PAGES, SDP_OP32); 1300ae115bc7Smrj set_usegd(&bgdt[GDT_B32CODE], NULL, -1, SDT_MEMERA, SEL_KPL, 1301ae115bc7Smrj SDP_PAGES, SDP_OP32); 1302ae115bc7Smrj #endif /* __i386 */ 1303ae115bc7Smrj } 1304ae115bc7Smrj 1305ae115bc7Smrj /* 13069acbbeafSnn35248 * Enable interpositioning on the system call path by rewriting the 13079acbbeafSnn35248 * sys{call|enter} MSRs and the syscall-related entries in the IDT to use 13089acbbeafSnn35248 * the branded entry points. 13099acbbeafSnn35248 */ 13109acbbeafSnn35248 void 13119acbbeafSnn35248 brand_interpositioning_enable(void) 13129acbbeafSnn35248 { 1313843e1988Sjohnlev gate_desc_t *idt = CPU->cpu_idt; 13149acbbeafSnn35248 int i; 13159acbbeafSnn35248 1316843e1988Sjohnlev ASSERT(curthread->t_preempt != 0 || getpil() >= DISP_LEVEL); 1317843e1988Sjohnlev 1318843e1988Sjohnlev for (i = 0; brand_tbl[i].ih_inum; i++) { 1319843e1988Sjohnlev idt[brand_tbl[i].ih_inum] = brand_tbl[i].ih_interp_desc; 1320843e1988Sjohnlev #if defined(__xpv) 1321843e1988Sjohnlev xen_idt_write(&idt[brand_tbl[i].ih_inum], 1322843e1988Sjohnlev brand_tbl[i].ih_inum); 1323843e1988Sjohnlev #endif 1324843e1988Sjohnlev } 13259acbbeafSnn35248 13269acbbeafSnn35248 #if defined(__amd64) 1327843e1988Sjohnlev #if defined(__xpv) 1328843e1988Sjohnlev 1329843e1988Sjohnlev /* 1330843e1988Sjohnlev * Currently the hypervisor only supports 64-bit syscalls via 1331843e1988Sjohnlev * syscall instruction. The 32-bit syscalls are handled by 1332843e1988Sjohnlev * interrupt gate above. 1333843e1988Sjohnlev */ 1334843e1988Sjohnlev xen_set_callback(brand_sys_syscall, CALLBACKTYPE_syscall, 1335843e1988Sjohnlev CALLBACKF_mask_events); 1336843e1988Sjohnlev 1337843e1988Sjohnlev #else 1338843e1988Sjohnlev 13397417cfdeSKuriakose Kuruvilla if (is_x86_feature(x86_featureset, X86FSET_ASYSC)) { 13409acbbeafSnn35248 wrmsr(MSR_AMD_LSTAR, (uintptr_t)brand_sys_syscall); 13419acbbeafSnn35248 wrmsr(MSR_AMD_CSTAR, (uintptr_t)brand_sys_syscall32); 1342843e1988Sjohnlev } 1343843e1988Sjohnlev 13449acbbeafSnn35248 #endif 1345843e1988Sjohnlev #endif /* __amd64 */ 13469acbbeafSnn35248 13477417cfdeSKuriakose Kuruvilla if (is_x86_feature(x86_featureset, X86FSET_SEP)) 13489acbbeafSnn35248 wrmsr(MSR_INTC_SEP_EIP, (uintptr_t)brand_sys_sysenter); 13499acbbeafSnn35248 } 13509acbbeafSnn35248 13519acbbeafSnn35248 /* 13529acbbeafSnn35248 * Disable interpositioning on the system call path by rewriting the 13539acbbeafSnn35248 * sys{call|enter} MSRs and the syscall-related entries in the IDT to use 13549acbbeafSnn35248 * the standard entry points, which bypass the interpositioning hooks. 13559acbbeafSnn35248 */ 13569acbbeafSnn35248 void 13579acbbeafSnn35248 brand_interpositioning_disable(void) 13589acbbeafSnn35248 { 1359843e1988Sjohnlev gate_desc_t *idt = CPU->cpu_idt; 13609acbbeafSnn35248 int i; 13619acbbeafSnn35248 1362843e1988Sjohnlev ASSERT(curthread->t_preempt != 0 || getpil() >= DISP_LEVEL); 1363843e1988Sjohnlev 1364843e1988Sjohnlev for (i = 0; brand_tbl[i].ih_inum; i++) { 1365843e1988Sjohnlev idt[brand_tbl[i].ih_inum] = brand_tbl[i].ih_default_desc; 1366843e1988Sjohnlev #if defined(__xpv) 1367843e1988Sjohnlev xen_idt_write(&idt[brand_tbl[i].ih_inum], 1368843e1988Sjohnlev brand_tbl[i].ih_inum); 1369843e1988Sjohnlev #endif 1370843e1988Sjohnlev } 13719acbbeafSnn35248 13729acbbeafSnn35248 #if defined(__amd64) 1373843e1988Sjohnlev #if defined(__xpv) 1374843e1988Sjohnlev 1375843e1988Sjohnlev /* 1376843e1988Sjohnlev * See comment above in brand_interpositioning_enable. 1377843e1988Sjohnlev */ 1378843e1988Sjohnlev xen_set_callback(sys_syscall, CALLBACKTYPE_syscall, 1379843e1988Sjohnlev CALLBACKF_mask_events); 1380843e1988Sjohnlev 1381843e1988Sjohnlev #else 1382843e1988Sjohnlev 13837417cfdeSKuriakose Kuruvilla if (is_x86_feature(x86_featureset, X86FSET_ASYSC)) { 13849acbbeafSnn35248 wrmsr(MSR_AMD_LSTAR, (uintptr_t)sys_syscall); 13859acbbeafSnn35248 wrmsr(MSR_AMD_CSTAR, (uintptr_t)sys_syscall32); 1386843e1988Sjohnlev } 1387843e1988Sjohnlev 13889acbbeafSnn35248 #endif 1389843e1988Sjohnlev #endif /* __amd64 */ 13909acbbeafSnn35248 13917417cfdeSKuriakose Kuruvilla if (is_x86_feature(x86_featureset, X86FSET_SEP)) 13929acbbeafSnn35248 wrmsr(MSR_INTC_SEP_EIP, (uintptr_t)sys_sysenter); 13939acbbeafSnn35248 } 1394