11a9cdd37SRoger Pau Monné /* 21a9cdd37SRoger Pau Monné * Copyright (c) 2004 Christian Limpach. 31a9cdd37SRoger Pau Monné * Copyright (c) 2004-2006,2008 Kip Macy 41a9cdd37SRoger Pau Monné * Copyright (c) 2013 Roger Pau Monné <roger.pau@citrix.com> 51a9cdd37SRoger Pau Monné * All rights reserved. 61a9cdd37SRoger Pau Monné * 71a9cdd37SRoger Pau Monné * Redistribution and use in source and binary forms, with or without 81a9cdd37SRoger Pau Monné * modification, are permitted provided that the following conditions 91a9cdd37SRoger Pau Monné * are met: 101a9cdd37SRoger Pau Monné * 1. Redistributions of source code must retain the above copyright 111a9cdd37SRoger Pau Monné * notice, this list of conditions and the following disclaimer. 121a9cdd37SRoger Pau Monné * 2. Redistributions in binary form must reproduce the above copyright 131a9cdd37SRoger Pau Monné * notice, this list of conditions and the following disclaimer in the 141a9cdd37SRoger Pau Monné * documentation and/or other materials provided with the distribution. 151a9cdd37SRoger Pau Monné * 161a9cdd37SRoger Pau Monné * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS AS IS'' AND 171a9cdd37SRoger Pau Monné * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 181a9cdd37SRoger Pau Monné * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 191a9cdd37SRoger Pau Monné * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 201a9cdd37SRoger Pau Monné * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 211a9cdd37SRoger Pau Monné * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 221a9cdd37SRoger Pau Monné * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 231a9cdd37SRoger Pau Monné * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 241a9cdd37SRoger Pau Monné * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 251a9cdd37SRoger Pau Monné * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 261a9cdd37SRoger Pau Monné * SUCH DAMAGE. 271a9cdd37SRoger Pau Monné */ 281a9cdd37SRoger Pau Monné 291a9cdd37SRoger Pau Monné #include <sys/cdefs.h> 301a9cdd37SRoger Pau Monné __FBSDID("$FreeBSD$"); 311a9cdd37SRoger Pau Monné 321a9cdd37SRoger Pau Monné #include <sys/param.h> 331a9cdd37SRoger Pau Monné #include <sys/bus.h> 341a9cdd37SRoger Pau Monné #include <sys/kernel.h> 351a9cdd37SRoger Pau Monné #include <sys/reboot.h> 361a9cdd37SRoger Pau Monné #include <sys/systm.h> 37079f7ef8SRoger Pau Monné #include <sys/malloc.h> 381a9cdd37SRoger Pau Monné #include <sys/lock.h> 391a9cdd37SRoger Pau Monné #include <sys/rwlock.h> 40aa389b4fSRoger Pau Monné #include <sys/boot.h> 4197baeefdSRoger Pau Monné #include <sys/ctype.h> 42079f7ef8SRoger Pau Monné #include <sys/mutex.h> 43079f7ef8SRoger Pau Monné #include <sys/smp.h> 441a9cdd37SRoger Pau Monné 451a9cdd37SRoger Pau Monné #include <vm/vm.h> 461a9cdd37SRoger Pau Monné #include <vm/vm_extern.h> 471a9cdd37SRoger Pau Monné #include <vm/vm_kern.h> 481a9cdd37SRoger Pau Monné #include <vm/vm_page.h> 491a9cdd37SRoger Pau Monné #include <vm/vm_map.h> 501a9cdd37SRoger Pau Monné #include <vm/vm_object.h> 511a9cdd37SRoger Pau Monné #include <vm/vm_pager.h> 521a9cdd37SRoger Pau Monné #include <vm/vm_param.h> 531a9cdd37SRoger Pau Monné 5497baeefdSRoger Pau Monné #include <x86/init.h> 551e69553eSRoger Pau Monné #include <machine/pc/bios.h> 56079f7ef8SRoger Pau Monné #include <machine/smp.h> 5797baeefdSRoger Pau Monné 581a9cdd37SRoger Pau Monné #include <xen/xen-os.h> 591a9cdd37SRoger Pau Monné #include <xen/hypervisor.h> 60*b7df74eeSWarner Losh #include <xen/xenstore/xenstorevar.h> 611a9cdd37SRoger Pau Monné 62079f7ef8SRoger Pau Monné #include <xen/interface/vcpu.h> 63079f7ef8SRoger Pau Monné 645f05c794SRoger Pau Monné #include <dev/xen/timer/timer.h> 655f05c794SRoger Pau Monné 661a9cdd37SRoger Pau Monné /* Native initial function */ 671a9cdd37SRoger Pau Monné extern u_int64_t hammer_time(u_int64_t, u_int64_t); 681a9cdd37SRoger Pau Monné /* Xen initial function */ 691a9cdd37SRoger Pau Monné uint64_t hammer_time_xen(start_info_t *, uint64_t); 701a9cdd37SRoger Pau Monné 711e69553eSRoger Pau Monné #define MAX_E820_ENTRIES 128 721e69553eSRoger Pau Monné 7397baeefdSRoger Pau Monné /*--------------------------- Forward Declarations ---------------------------*/ 7497baeefdSRoger Pau Monné static caddr_t xen_pv_parse_preload_data(u_int64_t); 751e69553eSRoger Pau Monné static void xen_pv_parse_memmap(caddr_t, vm_paddr_t *, int *); 7697baeefdSRoger Pau Monné 77079f7ef8SRoger Pau Monné #ifdef SMP 78079f7ef8SRoger Pau Monné static int xen_pv_start_all_aps(void); 79079f7ef8SRoger Pau Monné #endif 80079f7ef8SRoger Pau Monné 81079f7ef8SRoger Pau Monné /*---------------------------- Extern Declarations ---------------------------*/ 82079f7ef8SRoger Pau Monné #ifdef SMP 83079f7ef8SRoger Pau Monné /* Variables used by amd64 mp_machdep to start APs */ 84079f7ef8SRoger Pau Monné extern struct mtx ap_boot_mtx; 85079f7ef8SRoger Pau Monné extern void *bootstacks[]; 86079f7ef8SRoger Pau Monné extern char *doublefault_stack; 87079f7ef8SRoger Pau Monné extern char *nmi_stack; 88079f7ef8SRoger Pau Monné extern void *dpcpu; 89079f7ef8SRoger Pau Monné extern int bootAP; 90079f7ef8SRoger Pau Monné extern char *bootSTK; 91079f7ef8SRoger Pau Monné #endif 92079f7ef8SRoger Pau Monné 9397baeefdSRoger Pau Monné /*-------------------------------- Global Data -------------------------------*/ 9497baeefdSRoger Pau Monné /* Xen init_ops implementation. */ 9597baeefdSRoger Pau Monné struct init_ops xen_init_ops = { 9697baeefdSRoger Pau Monné .parse_preload_data = xen_pv_parse_preload_data, 975f05c794SRoger Pau Monné .early_clock_source_init = xen_clock_init, 985f05c794SRoger Pau Monné .early_delay = xen_delay, 991e69553eSRoger Pau Monné .parse_memmap = xen_pv_parse_memmap, 100079f7ef8SRoger Pau Monné #ifdef SMP 101079f7ef8SRoger Pau Monné .start_all_aps = xen_pv_start_all_aps, 102079f7ef8SRoger Pau Monné #endif 10397baeefdSRoger Pau Monné }; 10497baeefdSRoger Pau Monné 1051e69553eSRoger Pau Monné static struct bios_smap xen_smap[MAX_E820_ENTRIES]; 1061e69553eSRoger Pau Monné 10797baeefdSRoger Pau Monné /*-------------------------------- Xen PV init -------------------------------*/ 1081a9cdd37SRoger Pau Monné /* 1091a9cdd37SRoger Pau Monné * First function called by the Xen PVH boot sequence. 1101a9cdd37SRoger Pau Monné * 1111a9cdd37SRoger Pau Monné * Set some Xen global variables and prepare the environment so it is 1121a9cdd37SRoger Pau Monné * as similar as possible to what native FreeBSD init function expects. 1131a9cdd37SRoger Pau Monné */ 1141a9cdd37SRoger Pau Monné uint64_t 1151a9cdd37SRoger Pau Monné hammer_time_xen(start_info_t *si, uint64_t xenstack) 1161a9cdd37SRoger Pau Monné { 1171a9cdd37SRoger Pau Monné uint64_t physfree; 1181a9cdd37SRoger Pau Monné uint64_t *PT4 = (u_int64_t *)xenstack; 1191a9cdd37SRoger Pau Monné uint64_t *PT3 = (u_int64_t *)(xenstack + PAGE_SIZE); 1201a9cdd37SRoger Pau Monné uint64_t *PT2 = (u_int64_t *)(xenstack + 2 * PAGE_SIZE); 1211a9cdd37SRoger Pau Monné int i; 1221a9cdd37SRoger Pau Monné 1231a9cdd37SRoger Pau Monné xen_domain_type = XEN_PV_DOMAIN; 1241a9cdd37SRoger Pau Monné vm_guest = VM_GUEST_XEN; 1251a9cdd37SRoger Pau Monné 1261a9cdd37SRoger Pau Monné if ((si == NULL) || (xenstack == 0)) { 127c203fa69SRoger Pau Monné xc_printf("ERROR: invalid start_info or xen stack, halting\n"); 1281a9cdd37SRoger Pau Monné HYPERVISOR_shutdown(SHUTDOWN_crash); 1291a9cdd37SRoger Pau Monné } 1301a9cdd37SRoger Pau Monné 131c203fa69SRoger Pau Monné xc_printf("FreeBSD PVH running on %s\n", si->magic); 132c203fa69SRoger Pau Monné 1331a9cdd37SRoger Pau Monné /* We use 3 pages of xen stack for the boot pagetables */ 1341a9cdd37SRoger Pau Monné physfree = xenstack + 3 * PAGE_SIZE - KERNBASE; 1351a9cdd37SRoger Pau Monné 1361a9cdd37SRoger Pau Monné /* Setup Xen global variables */ 1371a9cdd37SRoger Pau Monné HYPERVISOR_start_info = si; 1381a9cdd37SRoger Pau Monné HYPERVISOR_shared_info = 1391a9cdd37SRoger Pau Monné (shared_info_t *)(si->shared_info + KERNBASE); 1401a9cdd37SRoger Pau Monné 1411a9cdd37SRoger Pau Monné /* 1421a9cdd37SRoger Pau Monné * Setup some misc global variables for Xen devices 1431a9cdd37SRoger Pau Monné * 1441a9cdd37SRoger Pau Monné * XXX: Devices that need these specific variables should 1451a9cdd37SRoger Pau Monné * be rewritten to fetch this info by themselves from the 1461a9cdd37SRoger Pau Monné * start_info page. 1471a9cdd37SRoger Pau Monné */ 1481a9cdd37SRoger Pau Monné xen_store = (struct xenstore_domain_interface *) 1491a9cdd37SRoger Pau Monné (ptoa(si->store_mfn) + KERNBASE); 150c203fa69SRoger Pau Monné console_page = (char *)(ptoa(si->console.domU.mfn) + KERNBASE); 1511a9cdd37SRoger Pau Monné 1521a9cdd37SRoger Pau Monné /* 1531a9cdd37SRoger Pau Monné * Use the stack Xen gives us to build the page tables 1541a9cdd37SRoger Pau Monné * as native FreeBSD expects to find them (created 1551a9cdd37SRoger Pau Monné * by the boot trampoline). 1561a9cdd37SRoger Pau Monné */ 1571a9cdd37SRoger Pau Monné for (i = 0; i < (PAGE_SIZE / sizeof(uint64_t)); i++) { 1581a9cdd37SRoger Pau Monné /* Each slot of the level 4 pages points to the same level 3 page */ 1591a9cdd37SRoger Pau Monné PT4[i] = ((uint64_t)&PT3[0]) - KERNBASE; 1601a9cdd37SRoger Pau Monné PT4[i] |= PG_V | PG_RW | PG_U; 1611a9cdd37SRoger Pau Monné 1621a9cdd37SRoger Pau Monné /* Each slot of the level 3 pages points to the same level 2 page */ 1631a9cdd37SRoger Pau Monné PT3[i] = ((uint64_t)&PT2[0]) - KERNBASE; 1641a9cdd37SRoger Pau Monné PT3[i] |= PG_V | PG_RW | PG_U; 1651a9cdd37SRoger Pau Monné 1661a9cdd37SRoger Pau Monné /* The level 2 page slots are mapped with 2MB pages for 1GB. */ 1671a9cdd37SRoger Pau Monné PT2[i] = i * (2 * 1024 * 1024); 1681a9cdd37SRoger Pau Monné PT2[i] |= PG_V | PG_RW | PG_PS | PG_U; 1691a9cdd37SRoger Pau Monné } 1701a9cdd37SRoger Pau Monné load_cr3(((uint64_t)&PT4[0]) - KERNBASE); 1711a9cdd37SRoger Pau Monné 17297baeefdSRoger Pau Monné /* Set the hooks for early functions that diverge from bare metal */ 17397baeefdSRoger Pau Monné init_ops = xen_init_ops; 17497baeefdSRoger Pau Monné 1751a9cdd37SRoger Pau Monné /* Now we can jump into the native init function */ 1761a9cdd37SRoger Pau Monné return (hammer_time(0, physfree)); 1771a9cdd37SRoger Pau Monné } 17897baeefdSRoger Pau Monné 17997baeefdSRoger Pau Monné /*-------------------------------- PV specific -------------------------------*/ 180079f7ef8SRoger Pau Monné #ifdef SMP 181079f7ef8SRoger Pau Monné static bool 182079f7ef8SRoger Pau Monné start_xen_ap(int cpu) 183079f7ef8SRoger Pau Monné { 184079f7ef8SRoger Pau Monné struct vcpu_guest_context *ctxt; 185079f7ef8SRoger Pau Monné int ms, cpus = mp_naps; 186079f7ef8SRoger Pau Monné const size_t stacksize = KSTACK_PAGES * PAGE_SIZE; 187079f7ef8SRoger Pau Monné 188079f7ef8SRoger Pau Monné /* allocate and set up an idle stack data page */ 189079f7ef8SRoger Pau Monné bootstacks[cpu] = 190079f7ef8SRoger Pau Monné (void *)kmem_malloc(kernel_arena, stacksize, M_WAITOK | M_ZERO); 191079f7ef8SRoger Pau Monné doublefault_stack = 192079f7ef8SRoger Pau Monné (char *)kmem_malloc(kernel_arena, PAGE_SIZE, M_WAITOK | M_ZERO); 193079f7ef8SRoger Pau Monné nmi_stack = 194079f7ef8SRoger Pau Monné (char *)kmem_malloc(kernel_arena, PAGE_SIZE, M_WAITOK | M_ZERO); 195079f7ef8SRoger Pau Monné dpcpu = 196079f7ef8SRoger Pau Monné (void *)kmem_malloc(kernel_arena, DPCPU_SIZE, M_WAITOK | M_ZERO); 197079f7ef8SRoger Pau Monné 198079f7ef8SRoger Pau Monné bootSTK = (char *)bootstacks[cpu] + KSTACK_PAGES * PAGE_SIZE - 8; 199079f7ef8SRoger Pau Monné bootAP = cpu; 200079f7ef8SRoger Pau Monné 201079f7ef8SRoger Pau Monné ctxt = malloc(sizeof(*ctxt), M_TEMP, M_WAITOK | M_ZERO); 202079f7ef8SRoger Pau Monné if (ctxt == NULL) 203079f7ef8SRoger Pau Monné panic("unable to allocate memory"); 204079f7ef8SRoger Pau Monné 205079f7ef8SRoger Pau Monné ctxt->flags = VGCF_IN_KERNEL; 206079f7ef8SRoger Pau Monné ctxt->user_regs.rip = (unsigned long) init_secondary; 207079f7ef8SRoger Pau Monné ctxt->user_regs.rsp = (unsigned long) bootSTK; 208079f7ef8SRoger Pau Monné 209079f7ef8SRoger Pau Monné /* Set the AP to use the same page tables */ 210079f7ef8SRoger Pau Monné ctxt->ctrlreg[3] = KPML4phys; 211079f7ef8SRoger Pau Monné 212079f7ef8SRoger Pau Monné if (HYPERVISOR_vcpu_op(VCPUOP_initialise, cpu, ctxt)) 213079f7ef8SRoger Pau Monné panic("unable to initialize AP#%d", cpu); 214079f7ef8SRoger Pau Monné 215079f7ef8SRoger Pau Monné free(ctxt, M_TEMP); 216079f7ef8SRoger Pau Monné 217079f7ef8SRoger Pau Monné /* Launch the vCPU */ 218079f7ef8SRoger Pau Monné if (HYPERVISOR_vcpu_op(VCPUOP_up, cpu, NULL)) 219079f7ef8SRoger Pau Monné panic("unable to start AP#%d", cpu); 220079f7ef8SRoger Pau Monné 221079f7ef8SRoger Pau Monné /* Wait up to 5 seconds for it to start. */ 222079f7ef8SRoger Pau Monné for (ms = 0; ms < 5000; ms++) { 223079f7ef8SRoger Pau Monné if (mp_naps > cpus) 224079f7ef8SRoger Pau Monné return (true); 225079f7ef8SRoger Pau Monné DELAY(1000); 226079f7ef8SRoger Pau Monné } 227079f7ef8SRoger Pau Monné 228079f7ef8SRoger Pau Monné return (false); 229079f7ef8SRoger Pau Monné } 230079f7ef8SRoger Pau Monné 231079f7ef8SRoger Pau Monné static int 232079f7ef8SRoger Pau Monné xen_pv_start_all_aps(void) 233079f7ef8SRoger Pau Monné { 234079f7ef8SRoger Pau Monné int cpu; 235079f7ef8SRoger Pau Monné 236079f7ef8SRoger Pau Monné mtx_init(&ap_boot_mtx, "ap boot", NULL, MTX_SPIN); 237079f7ef8SRoger Pau Monné 238079f7ef8SRoger Pau Monné for (cpu = 1; cpu < mp_ncpus; cpu++) { 239079f7ef8SRoger Pau Monné 240079f7ef8SRoger Pau Monné /* attempt to start the Application Processor */ 241079f7ef8SRoger Pau Monné if (!start_xen_ap(cpu)) 242079f7ef8SRoger Pau Monné panic("AP #%d failed to start!", cpu); 243079f7ef8SRoger Pau Monné 244079f7ef8SRoger Pau Monné CPU_SET(cpu, &all_cpus); /* record AP in CPU map */ 245079f7ef8SRoger Pau Monné } 246079f7ef8SRoger Pau Monné 247079f7ef8SRoger Pau Monné return (mp_naps); 248079f7ef8SRoger Pau Monné } 249079f7ef8SRoger Pau Monné #endif /* SMP */ 250079f7ef8SRoger Pau Monné 25197baeefdSRoger Pau Monné /* 25297baeefdSRoger Pau Monné * Functions to convert the "extra" parameters passed by Xen 25397baeefdSRoger Pau Monné * into FreeBSD boot options. 25497baeefdSRoger Pau Monné */ 25597baeefdSRoger Pau Monné static void 25697baeefdSRoger Pau Monné xen_pv_set_env(void) 25797baeefdSRoger Pau Monné { 25897baeefdSRoger Pau Monné char *cmd_line_next, *cmd_line; 25997baeefdSRoger Pau Monné size_t env_size; 26097baeefdSRoger Pau Monné 26197baeefdSRoger Pau Monné cmd_line = HYPERVISOR_start_info->cmd_line; 26297baeefdSRoger Pau Monné env_size = sizeof(HYPERVISOR_start_info->cmd_line); 26397baeefdSRoger Pau Monné 26497baeefdSRoger Pau Monné /* Skip leading spaces */ 26597baeefdSRoger Pau Monné for (; isspace(*cmd_line) && (env_size != 0); cmd_line++) 26697baeefdSRoger Pau Monné env_size--; 26797baeefdSRoger Pau Monné 26897baeefdSRoger Pau Monné /* Replace ',' with '\0' */ 26997baeefdSRoger Pau Monné for (cmd_line_next = cmd_line; strsep(&cmd_line_next, ",") != NULL;) 27097baeefdSRoger Pau Monné ; 27197baeefdSRoger Pau Monné 27297baeefdSRoger Pau Monné init_static_kenv(cmd_line, env_size); 27397baeefdSRoger Pau Monné } 27497baeefdSRoger Pau Monné 27597baeefdSRoger Pau Monné static void 27697baeefdSRoger Pau Monné xen_pv_set_boothowto(void) 27797baeefdSRoger Pau Monné { 27897baeefdSRoger Pau Monné int i; 27997baeefdSRoger Pau Monné 28097baeefdSRoger Pau Monné /* get equivalents from the environment */ 28197baeefdSRoger Pau Monné for (i = 0; howto_names[i].ev != NULL; i++) { 28297baeefdSRoger Pau Monné if (getenv(howto_names[i].ev) != NULL) 28397baeefdSRoger Pau Monné boothowto |= howto_names[i].mask; 28497baeefdSRoger Pau Monné } 28597baeefdSRoger Pau Monné } 28697baeefdSRoger Pau Monné 28797baeefdSRoger Pau Monné static caddr_t 28897baeefdSRoger Pau Monné xen_pv_parse_preload_data(u_int64_t modulep) 28997baeefdSRoger Pau Monné { 29097baeefdSRoger Pau Monné /* Parse the extra boot information given by Xen */ 29197baeefdSRoger Pau Monné xen_pv_set_env(); 29297baeefdSRoger Pau Monné xen_pv_set_boothowto(); 29397baeefdSRoger Pau Monné 29497baeefdSRoger Pau Monné return (NULL); 29597baeefdSRoger Pau Monné } 2961e69553eSRoger Pau Monné 2971e69553eSRoger Pau Monné static void 2981e69553eSRoger Pau Monné xen_pv_parse_memmap(caddr_t kmdp, vm_paddr_t *physmap, int *physmap_idx) 2991e69553eSRoger Pau Monné { 3001e69553eSRoger Pau Monné struct xen_memory_map memmap; 3011e69553eSRoger Pau Monné u_int32_t size; 3021e69553eSRoger Pau Monné int rc; 3031e69553eSRoger Pau Monné 3041e69553eSRoger Pau Monné /* Fetch the E820 map from Xen */ 3051e69553eSRoger Pau Monné memmap.nr_entries = MAX_E820_ENTRIES; 3061e69553eSRoger Pau Monné set_xen_guest_handle(memmap.buffer, xen_smap); 3071e69553eSRoger Pau Monné rc = HYPERVISOR_memory_op(XENMEM_memory_map, &memmap); 3081e69553eSRoger Pau Monné if (rc) 3091e69553eSRoger Pau Monné panic("unable to fetch Xen E820 memory map"); 3101e69553eSRoger Pau Monné size = memmap.nr_entries * sizeof(xen_smap[0]); 3111e69553eSRoger Pau Monné 3121e69553eSRoger Pau Monné bios_add_smap_entries(xen_smap, size, physmap, physmap_idx); 3131e69553eSRoger Pau Monné } 314