17c478bd9Sstevel@tonic-gate /* 27c478bd9Sstevel@tonic-gate * CDDL HEADER START 37c478bd9Sstevel@tonic-gate * 47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the 545916cd2Sjpk * Common Development and Distribution License (the "License"). 645916cd2Sjpk * You may not use this file except in compliance with the License. 77c478bd9Sstevel@tonic-gate * 87c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 97c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing. 107c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions 117c478bd9Sstevel@tonic-gate * and limitations under the License. 127c478bd9Sstevel@tonic-gate * 137c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each 147c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 157c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the 167c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying 177c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner] 187c478bd9Sstevel@tonic-gate * 197c478bd9Sstevel@tonic-gate * CDDL HEADER END 207c478bd9Sstevel@tonic-gate */ 216eb30ec3SRoger A. Faulkner 227c478bd9Sstevel@tonic-gate /* 23c3f63b71SAlexandre Chartre * Copyright (c) 1988, 2010, Oracle and/or its affiliates. All rights reserved. 247c478bd9Sstevel@tonic-gate */ 257c478bd9Sstevel@tonic-gate 267c478bd9Sstevel@tonic-gate /* Copyright (c) 1988 AT&T */ 277c478bd9Sstevel@tonic-gate /* All Rights Reserved */ 287c478bd9Sstevel@tonic-gate 29a288e5a9SJoshua M. Clulow /* 30a288e5a9SJoshua M. Clulow * Copyright (c) 2013, Joyent, Inc. All rights reserved. 31a288e5a9SJoshua M. Clulow */ 32a288e5a9SJoshua M. Clulow 337c478bd9Sstevel@tonic-gate #include <sys/types.h> 347c478bd9Sstevel@tonic-gate #include <sys/param.h> 357c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h> 367c478bd9Sstevel@tonic-gate #include <sys/pcb.h> 377c478bd9Sstevel@tonic-gate #include <sys/systm.h> 387c478bd9Sstevel@tonic-gate #include <sys/signal.h> 397c478bd9Sstevel@tonic-gate #include <sys/cred.h> 407c478bd9Sstevel@tonic-gate #include <sys/user.h> 417c478bd9Sstevel@tonic-gate #include <sys/vfs.h> 427c478bd9Sstevel@tonic-gate #include <sys/vnode.h> 437c478bd9Sstevel@tonic-gate #include <sys/proc.h> 447c478bd9Sstevel@tonic-gate #include <sys/time.h> 457c478bd9Sstevel@tonic-gate #include <sys/file.h> 467c478bd9Sstevel@tonic-gate #include <sys/priocntl.h> 477c478bd9Sstevel@tonic-gate #include <sys/procset.h> 487c478bd9Sstevel@tonic-gate #include <sys/disp.h> 497c478bd9Sstevel@tonic-gate #include <sys/callo.h> 507c478bd9Sstevel@tonic-gate #include <sys/callb.h> 517c478bd9Sstevel@tonic-gate #include <sys/debug.h> 527c478bd9Sstevel@tonic-gate #include <sys/conf.h> 537c478bd9Sstevel@tonic-gate #include <sys/bootconf.h> 547c478bd9Sstevel@tonic-gate #include <sys/utsname.h> 557c478bd9Sstevel@tonic-gate #include <sys/cmn_err.h> 567c478bd9Sstevel@tonic-gate #include <sys/vmparam.h> 577c478bd9Sstevel@tonic-gate #include <sys/modctl.h> 587c478bd9Sstevel@tonic-gate #include <sys/vm.h> 597c478bd9Sstevel@tonic-gate #include <sys/callb.h> 60a288e5a9SJoshua M. Clulow #include <sys/ddi_periodic.h> 617c478bd9Sstevel@tonic-gate #include <sys/kmem.h> 627c478bd9Sstevel@tonic-gate #include <sys/vmem.h> 637c478bd9Sstevel@tonic-gate #include <sys/cpuvar.h> 647c478bd9Sstevel@tonic-gate #include <sys/cladm.h> 657c478bd9Sstevel@tonic-gate #include <sys/corectl.h> 667c478bd9Sstevel@tonic-gate #include <sys/exec.h> 677c478bd9Sstevel@tonic-gate #include <sys/syscall.h> 687c478bd9Sstevel@tonic-gate #include <sys/reboot.h> 697c478bd9Sstevel@tonic-gate #include <sys/task.h> 707c478bd9Sstevel@tonic-gate #include <sys/exacct.h> 717c478bd9Sstevel@tonic-gate #include <sys/autoconf.h> 727c478bd9Sstevel@tonic-gate #include <sys/errorq.h> 737c478bd9Sstevel@tonic-gate #include <sys/class.h> 747c478bd9Sstevel@tonic-gate #include <sys/stack.h> 759acbbeafSnn35248 #include <sys/brand.h> 760616c1c3SMichael Corcoran #include <sys/mmapobj.h> 777c478bd9Sstevel@tonic-gate 787c478bd9Sstevel@tonic-gate #include <vm/as.h> 797c478bd9Sstevel@tonic-gate #include <vm/seg_kmem.h> 807c478bd9Sstevel@tonic-gate #include <sys/dc_ki.h> 817c478bd9Sstevel@tonic-gate 827c478bd9Sstevel@tonic-gate #include <c2/audit.h> 836cefaae1SJack Meng #include <sys/bootprops.h> 847c478bd9Sstevel@tonic-gate 857c478bd9Sstevel@tonic-gate /* well known processes */ 867c478bd9Sstevel@tonic-gate proc_t *proc_sched; /* memory scheduler */ 877c478bd9Sstevel@tonic-gate proc_t *proc_init; /* init */ 887c478bd9Sstevel@tonic-gate proc_t *proc_pageout; /* pageout daemon */ 897c478bd9Sstevel@tonic-gate proc_t *proc_fsflush; /* fsflush daemon */ 907c478bd9Sstevel@tonic-gate 917c478bd9Sstevel@tonic-gate pgcnt_t maxmem; /* Maximum available memory in pages. */ 927c478bd9Sstevel@tonic-gate pgcnt_t freemem; /* Current available memory in pages. */ 937c478bd9Sstevel@tonic-gate int interrupts_unleashed; /* set when we do the first spl0() */ 947c478bd9Sstevel@tonic-gate 957c478bd9Sstevel@tonic-gate kmem_cache_t *process_cache; /* kmem cache for proc structures */ 967c478bd9Sstevel@tonic-gate 977c478bd9Sstevel@tonic-gate /* 98005d3febSMarek Pospisil * Indicates whether the auditing module (c2audit) is loaded. Possible 99005d3febSMarek Pospisil * values are: 100005d3febSMarek Pospisil * 0 - c2audit module is excluded in /etc/system and cannot be loaded 101005d3febSMarek Pospisil * 1 - c2audit module is not loaded but can be anytime 102005d3febSMarek Pospisil * 2 - c2audit module is loaded 103005d3febSMarek Pospisil */ 104005d3febSMarek Pospisil int audit_active = C2AUDIT_DISABLED; 105005d3febSMarek Pospisil 106005d3febSMarek Pospisil /* 1077c478bd9Sstevel@tonic-gate * Process 0's lwp directory and lwpid hash table. 1087c478bd9Sstevel@tonic-gate */ 1097c478bd9Sstevel@tonic-gate lwpdir_t p0_lwpdir[2]; 1106eb30ec3SRoger A. Faulkner tidhash_t p0_tidhash[2]; 1117c478bd9Sstevel@tonic-gate lwpent_t p0_lep; 1127c478bd9Sstevel@tonic-gate 1137c478bd9Sstevel@tonic-gate /* 1147c478bd9Sstevel@tonic-gate * Machine-independent initialization code 1157c478bd9Sstevel@tonic-gate * Called from cold start routine as 1167c478bd9Sstevel@tonic-gate * soon as a stack and segmentation 1177c478bd9Sstevel@tonic-gate * have been established. 1187c478bd9Sstevel@tonic-gate * Functions: 1197c478bd9Sstevel@tonic-gate * clear and free user core 1207c478bd9Sstevel@tonic-gate * turn on clock 1217c478bd9Sstevel@tonic-gate * hand craft 0th process 1227c478bd9Sstevel@tonic-gate * call all initialization routines 1237c478bd9Sstevel@tonic-gate * fork - process 0 to schedule 1247c478bd9Sstevel@tonic-gate * - process 1 execute bootstrap 1257c478bd9Sstevel@tonic-gate * - process 2 to page out 1267c478bd9Sstevel@tonic-gate * create system threads 1277c478bd9Sstevel@tonic-gate */ 1287c478bd9Sstevel@tonic-gate 1297c478bd9Sstevel@tonic-gate int cluster_bootflags = 0; 1307c478bd9Sstevel@tonic-gate 1317c478bd9Sstevel@tonic-gate void 1327c478bd9Sstevel@tonic-gate cluster_wrapper(void) 1337c478bd9Sstevel@tonic-gate { 1347c478bd9Sstevel@tonic-gate cluster(); 1357c478bd9Sstevel@tonic-gate panic("cluster() returned"); 1367c478bd9Sstevel@tonic-gate } 1377c478bd9Sstevel@tonic-gate 1383f2f09c1Sdp char initname[INITNAME_SZ] = "/sbin/init"; /* also referenced by zone0 */ 1393f2f09c1Sdp char initargs[BOOTARGS_MAX] = ""; /* also referenced by zone0 */ 1407c478bd9Sstevel@tonic-gate 1417c478bd9Sstevel@tonic-gate /* 1423f2f09c1Sdp * Construct a stack for init containing the arguments to it, then 1433f2f09c1Sdp * pass control to exec_common. 1447c478bd9Sstevel@tonic-gate */ 1457c478bd9Sstevel@tonic-gate int 1463f2f09c1Sdp exec_init(const char *initpath, const char *args) 1477c478bd9Sstevel@tonic-gate { 1483f2f09c1Sdp caddr32_t ucp; 1497c478bd9Sstevel@tonic-gate caddr32_t *uap; 1503f2f09c1Sdp caddr32_t *argv; 1513f2f09c1Sdp caddr32_t exec_fnamep; 1523f2f09c1Sdp char *scratchargs; 1533f2f09c1Sdp int i, sarg; 1543f2f09c1Sdp size_t argvlen, alen; 1553f2f09c1Sdp boolean_t in_arg; 1567c478bd9Sstevel@tonic-gate int argc = 0; 1573f2f09c1Sdp int error = 0, count = 0; 1587c478bd9Sstevel@tonic-gate proc_t *p = ttoproc(curthread); 1597c478bd9Sstevel@tonic-gate klwp_t *lwp = ttolwp(curthread); 1609acbbeafSnn35248 int brand_action; 1617c478bd9Sstevel@tonic-gate 1623f2f09c1Sdp if (args == NULL) 1633f2f09c1Sdp args = ""; 1647c478bd9Sstevel@tonic-gate 1653f2f09c1Sdp alen = strlen(initpath) + 1 + strlen(args) + 1; 1663f2f09c1Sdp scratchargs = kmem_alloc(alen, KM_SLEEP); 1673f2f09c1Sdp (void) snprintf(scratchargs, alen, "%s %s", initpath, args); 1687c478bd9Sstevel@tonic-gate 1697c478bd9Sstevel@tonic-gate /* 1703f2f09c1Sdp * We do a quick two state parse of the string to sort out how big 1713f2f09c1Sdp * argc should be. 1727c478bd9Sstevel@tonic-gate */ 1733f2f09c1Sdp in_arg = B_FALSE; 1743f2f09c1Sdp for (i = 0; i < strlen(scratchargs); i++) { 1753f2f09c1Sdp if (scratchargs[i] == ' ' || scratchargs[i] == '\0') { 1763f2f09c1Sdp if (in_arg) { 1773f2f09c1Sdp in_arg = B_FALSE; 1783f2f09c1Sdp argc++; 1793f2f09c1Sdp } 1803f2f09c1Sdp } else { 1813f2f09c1Sdp in_arg = B_TRUE; 1823f2f09c1Sdp } 1833f2f09c1Sdp } 1843f2f09c1Sdp argvlen = sizeof (caddr32_t) * (argc + 1); 1853f2f09c1Sdp argv = kmem_zalloc(argvlen, KM_SLEEP); 1863f2f09c1Sdp 1873f2f09c1Sdp /* 1883f2f09c1Sdp * We pull off a bit of a hack here. We work our way through the 1893f2f09c1Sdp * args string, putting nulls at the ends of space delimited tokens 1903f2f09c1Sdp * (boot args don't support quoting at this time). Then we just 1913f2f09c1Sdp * copy the whole mess to userland in one go. In other words, we 1923f2f09c1Sdp * transform this: "init -s -r\0" into this on the stack: 1933f2f09c1Sdp * 1943f2f09c1Sdp * -0x00 \0 1953f2f09c1Sdp * -0x01 r 1963f2f09c1Sdp * -0x02 - <--------. 1973f2f09c1Sdp * -0x03 \0 | 1983f2f09c1Sdp * -0x04 s | 1993f2f09c1Sdp * -0x05 - <------. | 2003f2f09c1Sdp * -0x06 \0 | | 2013f2f09c1Sdp * -0x07 t | | 2023f2f09c1Sdp * -0x08 i | | 2033f2f09c1Sdp * -0x09 n | | 2043f2f09c1Sdp * -0x0a i <---. | | 2053f2f09c1Sdp * -0x10 NULL | | | (argv[3]) 2063f2f09c1Sdp * -0x14 -----|--|-' (argv[2]) 2073f2f09c1Sdp * -0x18 ------|--' (argv[1]) 2083f2f09c1Sdp * -0x1c -------' (argv[0]) 2093f2f09c1Sdp * 2103f2f09c1Sdp * Since we know the value of ucp at the beginning of this process, 2113f2f09c1Sdp * we can trivially compute the argv[] array which we also need to 2123f2f09c1Sdp * place in userland: argv[i] = ucp - sarg(i), where ucp is the 2133f2f09c1Sdp * stack ptr, and sarg is the string index of the start of the 2143f2f09c1Sdp * argument. 2153f2f09c1Sdp */ 2163f2f09c1Sdp ucp = (caddr32_t)(uintptr_t)p->p_usrstack; 2173f2f09c1Sdp 2183f2f09c1Sdp argc = 0; 2193f2f09c1Sdp in_arg = B_FALSE; 2203f2f09c1Sdp sarg = 0; 2213f2f09c1Sdp 2223f2f09c1Sdp for (i = 0; i < alen; i++) { 2233f2f09c1Sdp if (scratchargs[i] == ' ' || scratchargs[i] == '\0') { 2243f2f09c1Sdp if (in_arg == B_TRUE) { 2253f2f09c1Sdp in_arg = B_FALSE; 2263f2f09c1Sdp scratchargs[i] = '\0'; 2273f2f09c1Sdp argv[argc++] = ucp - (alen - sarg); 2283f2f09c1Sdp } 2293f2f09c1Sdp } else if (in_arg == B_FALSE) { 2303f2f09c1Sdp in_arg = B_TRUE; 2313f2f09c1Sdp sarg = i; 2323f2f09c1Sdp } 2333f2f09c1Sdp } 2343f2f09c1Sdp ucp -= alen; 2353f2f09c1Sdp error |= copyout(scratchargs, (caddr_t)(uintptr_t)ucp, alen); 2363f2f09c1Sdp 2377c478bd9Sstevel@tonic-gate uap = (caddr32_t *)P2ALIGN((uintptr_t)ucp, sizeof (caddr32_t)); 2383f2f09c1Sdp uap--; /* advance to be below the word we're in */ 2393f2f09c1Sdp uap -= (argc + 1); /* advance argc words down, plus one for NULL */ 2403f2f09c1Sdp error |= copyout(argv, uap, argvlen); 2417c478bd9Sstevel@tonic-gate 2427c478bd9Sstevel@tonic-gate if (error != 0) { 2437c478bd9Sstevel@tonic-gate zcmn_err(p->p_zone->zone_id, CE_WARN, 2447c478bd9Sstevel@tonic-gate "Could not construct stack for init.\n"); 2453f2f09c1Sdp kmem_free(argv, argvlen); 2463f2f09c1Sdp kmem_free(scratchargs, alen); 2477c478bd9Sstevel@tonic-gate return (EFAULT); 2487c478bd9Sstevel@tonic-gate } 2497c478bd9Sstevel@tonic-gate 2503f2f09c1Sdp exec_fnamep = argv[0]; 2513f2f09c1Sdp kmem_free(argv, argvlen); 2523f2f09c1Sdp kmem_free(scratchargs, alen); 2533f2f09c1Sdp 2547c478bd9Sstevel@tonic-gate /* 2557c478bd9Sstevel@tonic-gate * Point at the arguments. 2567c478bd9Sstevel@tonic-gate */ 2577c478bd9Sstevel@tonic-gate lwp->lwp_ap = lwp->lwp_arg; 2583f2f09c1Sdp lwp->lwp_arg[0] = (uintptr_t)exec_fnamep; 2597c478bd9Sstevel@tonic-gate lwp->lwp_arg[1] = (uintptr_t)uap; 2607c478bd9Sstevel@tonic-gate lwp->lwp_arg[2] = NULL; 2617c478bd9Sstevel@tonic-gate curthread->t_post_sys = 1; 2627c478bd9Sstevel@tonic-gate curthread->t_sysnum = SYS_execve; 2637c478bd9Sstevel@tonic-gate 2649acbbeafSnn35248 /* 2659acbbeafSnn35248 * If we are executing init from zsched, we may have inherited its 2669acbbeafSnn35248 * parent process's signal mask. Clear it now so that we behave in 2679acbbeafSnn35248 * the same way as when started from the global zone. 2689acbbeafSnn35248 */ 269bdf0047cSRoger A. Faulkner sigemptyset(&curthread->t_hold); 2709acbbeafSnn35248 2719acbbeafSnn35248 brand_action = ZONE_IS_BRANDED(p->p_zone) ? EBA_BRAND : EBA_NONE; 2727c478bd9Sstevel@tonic-gate again: 2733f2f09c1Sdp error = exec_common((const char *)(uintptr_t)exec_fnamep, 2749acbbeafSnn35248 (const char **)(uintptr_t)uap, NULL, brand_action); 2757c478bd9Sstevel@tonic-gate 2767c478bd9Sstevel@tonic-gate /* 2777c478bd9Sstevel@tonic-gate * Normally we would just set lwp_argsaved and t_post_sys and 2787c478bd9Sstevel@tonic-gate * let post_syscall reset lwp_ap for us. Unfortunately, 2797c478bd9Sstevel@tonic-gate * exec_init isn't always called from a system call. Instead 2807c478bd9Sstevel@tonic-gate * of making a mess of trap_cleanup, we just reset the args 2817c478bd9Sstevel@tonic-gate * pointer here. 2827c478bd9Sstevel@tonic-gate */ 2837c478bd9Sstevel@tonic-gate reset_syscall_args(); 2847c478bd9Sstevel@tonic-gate 2857c478bd9Sstevel@tonic-gate switch (error) { 2867c478bd9Sstevel@tonic-gate case 0: 2877c478bd9Sstevel@tonic-gate return (0); 2887c478bd9Sstevel@tonic-gate 2897c478bd9Sstevel@tonic-gate case ENOENT: 2907c478bd9Sstevel@tonic-gate zcmn_err(p->p_zone->zone_id, CE_WARN, 2917c478bd9Sstevel@tonic-gate "exec(%s) failed (file not found).\n", initpath); 2927c478bd9Sstevel@tonic-gate return (ENOENT); 2937c478bd9Sstevel@tonic-gate 2947c478bd9Sstevel@tonic-gate case EAGAIN: 2957c478bd9Sstevel@tonic-gate case EINTR: 2967c478bd9Sstevel@tonic-gate ++count; 2977c478bd9Sstevel@tonic-gate if (count < 5) { 2987c478bd9Sstevel@tonic-gate zcmn_err(p->p_zone->zone_id, CE_WARN, 2997c478bd9Sstevel@tonic-gate "exec(%s) failed with errno %d. Retrying...\n", 3007c478bd9Sstevel@tonic-gate initpath, error); 3017c478bd9Sstevel@tonic-gate goto again; 3027c478bd9Sstevel@tonic-gate } 3037c478bd9Sstevel@tonic-gate } 3047c478bd9Sstevel@tonic-gate 3057c478bd9Sstevel@tonic-gate zcmn_err(p->p_zone->zone_id, CE_WARN, 3067c478bd9Sstevel@tonic-gate "exec(%s) failed with errno %d.", initpath, error); 3077c478bd9Sstevel@tonic-gate return (error); 3087c478bd9Sstevel@tonic-gate } 3097c478bd9Sstevel@tonic-gate 3103f2f09c1Sdp /* 3113f2f09c1Sdp * This routine does all of the common setup for invoking init; global 3123f2f09c1Sdp * and non-global zones employ this routine for the functionality which is 3133f2f09c1Sdp * in common. 3143f2f09c1Sdp * 3153f2f09c1Sdp * This program (init, presumably) must be a 32-bit process. 3163f2f09c1Sdp */ 3173f2f09c1Sdp int 3183f2f09c1Sdp start_init_common() 3193f2f09c1Sdp { 3203f2f09c1Sdp proc_t *p = curproc; 3213f2f09c1Sdp ASSERT_STACK_ALIGNED(); 3223f2f09c1Sdp p->p_zone->zone_proc_initpid = p->p_pid; 3233f2f09c1Sdp 3243f2f09c1Sdp p->p_cstime = p->p_stime = p->p_cutime = p->p_utime = 0; 3253f2f09c1Sdp p->p_usrstack = (caddr_t)USRSTACK32; 3263f2f09c1Sdp p->p_model = DATAMODEL_ILP32; 3273f2f09c1Sdp p->p_stkprot = PROT_ZFOD & ~PROT_EXEC; 3283f2f09c1Sdp p->p_datprot = PROT_ZFOD & ~PROT_EXEC; 3293f2f09c1Sdp p->p_stk_ctl = INT32_MAX; 3303f2f09c1Sdp 3313f2f09c1Sdp p->p_as = as_alloc(); 332c6939658Ssl108498 p->p_as->a_proc = p; 3333f2f09c1Sdp p->p_as->a_userlimit = (caddr_t)USERLIMIT32; 3343f2f09c1Sdp (void) hat_setup(p->p_as->a_hat, HAT_INIT); 3353f2f09c1Sdp 3363f2f09c1Sdp init_core(); 3373f2f09c1Sdp 3383f2f09c1Sdp init_mstate(curthread, LMS_SYSTEM); 3393f2f09c1Sdp return (exec_init(p->p_zone->zone_initname, p->p_zone->zone_bootargs)); 3403f2f09c1Sdp } 3413f2f09c1Sdp 3423f2f09c1Sdp /* 3433f2f09c1Sdp * Start the initial user process for the global zone; once running, if 3443f2f09c1Sdp * init should subsequently fail, it will be automatically be caught in the 3453f2f09c1Sdp * exit(2) path, and restarted by restart_init(). 3463f2f09c1Sdp */ 3473f2f09c1Sdp static void 3483f2f09c1Sdp start_init(void) 3493f2f09c1Sdp { 3503f2f09c1Sdp proc_init = curproc; 3513f2f09c1Sdp 3523f2f09c1Sdp ASSERT(curproc->p_zone->zone_initname != NULL); 3533f2f09c1Sdp 3543f2f09c1Sdp if (start_init_common() != 0) 3553f2f09c1Sdp halt("unix: Could not start init"); 3563f2f09c1Sdp lwp_rtt(); 3573f2f09c1Sdp } 3583f2f09c1Sdp 3597c478bd9Sstevel@tonic-gate void 3607c478bd9Sstevel@tonic-gate main(void) 3617c478bd9Sstevel@tonic-gate { 3627c478bd9Sstevel@tonic-gate proc_t *p = ttoproc(curthread); /* &p0 */ 3637c478bd9Sstevel@tonic-gate int (**initptr)(); 3647c478bd9Sstevel@tonic-gate extern void sched(); 3657c478bd9Sstevel@tonic-gate extern void fsflush(); 3667c478bd9Sstevel@tonic-gate extern int (*init_tbl[])(); 3677c478bd9Sstevel@tonic-gate extern int (*mp_init_tbl[])(); 3687c478bd9Sstevel@tonic-gate extern id_t syscid, defaultcid; 3697c478bd9Sstevel@tonic-gate extern int swaploaded; 3707c478bd9Sstevel@tonic-gate extern int netboot; 3716cefaae1SJack Meng extern ib_boot_prop_t *iscsiboot_prop; 3727c478bd9Sstevel@tonic-gate extern void vm_init(void); 373b9499e44Smrj extern void cbe_init_pre(void); 3747c478bd9Sstevel@tonic-gate extern void cbe_init(void); 3752850d85bSmv143129 extern void clock_tick_init_pre(void); 3762850d85bSmv143129 extern void clock_tick_init_post(void); 3777c478bd9Sstevel@tonic-gate extern void clock_init(void); 3787c478bd9Sstevel@tonic-gate extern void physio_bufs_init(void); 3797c478bd9Sstevel@tonic-gate extern void pm_cfb_setup_intr(void); 3807c478bd9Sstevel@tonic-gate extern int pm_adjust_timestamps(dev_info_t *, void *); 3817c478bd9Sstevel@tonic-gate extern void start_other_cpus(int); 3827c478bd9Sstevel@tonic-gate extern void sysevent_evc_thrinit(); 383c3f63b71SAlexandre Chartre extern kmutex_t ualock; 3845cff7825Smh27603 #if defined(__x86) 385753a6d45SSherry Moore extern void fastboot_post_startup(void); 386486aec20SEnrico Perla - Sun Microsystems extern void progressbar_start(void); 3875cff7825Smh27603 #endif 3887c478bd9Sstevel@tonic-gate /* 3897c478bd9Sstevel@tonic-gate * In the horrible world of x86 in-lines, you can't get symbolic 3907c478bd9Sstevel@tonic-gate * structure offsets a la genassym. This assertion is here so 3917c478bd9Sstevel@tonic-gate * that the next poor slob who innocently changes the offset of 3927c478bd9Sstevel@tonic-gate * cpu_thread doesn't waste as much time as I just did finding 3937c478bd9Sstevel@tonic-gate * out that it's hard-coded in i86/ml/i86.il. Similarly for 3947c478bd9Sstevel@tonic-gate * curcpup. You're welcome. 3957c478bd9Sstevel@tonic-gate */ 3967c478bd9Sstevel@tonic-gate ASSERT(CPU == CPU->cpu_self); 3977c478bd9Sstevel@tonic-gate ASSERT(curthread == CPU->cpu_thread); 3987c478bd9Sstevel@tonic-gate ASSERT_STACK_ALIGNED(); 3997c478bd9Sstevel@tonic-gate 4007c478bd9Sstevel@tonic-gate /* 401c3f63b71SAlexandre Chartre * We take the ualock until we have completed the startup 402c3f63b71SAlexandre Chartre * to prevent kadmin() from disrupting this work. In particular, 403c3f63b71SAlexandre Chartre * we don't want kadmin() to bring the system down while we are 404c3f63b71SAlexandre Chartre * trying to start it up. 405c3f63b71SAlexandre Chartre */ 406c3f63b71SAlexandre Chartre mutex_enter(&ualock); 407c3f63b71SAlexandre Chartre 408c3f63b71SAlexandre Chartre /* 409d5d7cf4eSJonathan Chew * Setup root lgroup and leaf lgroup for CPU 0 4107c478bd9Sstevel@tonic-gate */ 411d5d7cf4eSJonathan Chew lgrp_init(LGRP_INIT_STAGE2); 4127c478bd9Sstevel@tonic-gate 4135ce42f36Spraks /* 4145ce42f36Spraks * Once 'startup()' completes, the thread_reaper() daemon would be 4155ce42f36Spraks * created(in thread_init()). After that, it is safe to create threads 4165ce42f36Spraks * that could exit. These exited threads will get reaped. 4175ce42f36Spraks */ 4187c478bd9Sstevel@tonic-gate startup(); 4197c478bd9Sstevel@tonic-gate segkmem_gc(); 4207c478bd9Sstevel@tonic-gate callb_init(); 421b9499e44Smrj cbe_init_pre(); /* x86 must initialize gethrtimef before timer_init */ 422a288e5a9SJoshua M. Clulow ddi_periodic_init(); 4237c478bd9Sstevel@tonic-gate cbe_init(); 42487a18d3fSMadhavan Venkataraman callout_init(); /* callout table MUST be init'd after cyclics */ 4252850d85bSmv143129 clock_tick_init_pre(); 4267c478bd9Sstevel@tonic-gate clock_init(); 4277c478bd9Sstevel@tonic-gate 428486aec20SEnrico Perla - Sun Microsystems #if defined(__x86) 429486aec20SEnrico Perla - Sun Microsystems /* 430486aec20SEnrico Perla - Sun Microsystems * The progressbar thread uses cv_reltimedwait() and hence needs to be 431486aec20SEnrico Perla - Sun Microsystems * started after the callout mechanism has been initialized. 432486aec20SEnrico Perla - Sun Microsystems */ 433486aec20SEnrico Perla - Sun Microsystems progressbar_start(); 434486aec20SEnrico Perla - Sun Microsystems #endif 4357c478bd9Sstevel@tonic-gate /* 436ae115bc7Smrj * On some platforms, clkinitf() changes the timing source that 437ae115bc7Smrj * gethrtime_unscaled() uses to generate timestamps. cbe_init() calls 438ae115bc7Smrj * clkinitf(), so re-initialize the microstate counters after the 439ae115bc7Smrj * timesource has been chosen. 440ae115bc7Smrj */ 441ae115bc7Smrj init_mstate(&t0, LMS_SYSTEM); 442ae115bc7Smrj init_cpu_mstate(CPU, CMS_SYSTEM); 443ae115bc7Smrj 444ae115bc7Smrj /* 4457c478bd9Sstevel@tonic-gate * May need to probe to determine latencies from CPU 0 after 4467c478bd9Sstevel@tonic-gate * gethrtime() comes alive in cbe_init() and before enabling interrupts 447d5d7cf4eSJonathan Chew * and copy and release any temporary memory allocated with BOP_ALLOC() 448d5d7cf4eSJonathan Chew * before release_bootstrap() frees boot memory 4497c478bd9Sstevel@tonic-gate */ 450d5d7cf4eSJonathan Chew lgrp_init(LGRP_INIT_STAGE3); 4517c478bd9Sstevel@tonic-gate 4527c478bd9Sstevel@tonic-gate /* 4537c478bd9Sstevel@tonic-gate * Call all system initialization functions. 4547c478bd9Sstevel@tonic-gate */ 4557c478bd9Sstevel@tonic-gate for (initptr = &init_tbl[0]; *initptr; initptr++) 4567c478bd9Sstevel@tonic-gate (**initptr)(); 4576cefaae1SJack Meng /* 4586cefaae1SJack Meng * Load iSCSI boot properties 4596cefaae1SJack Meng */ 4606cefaae1SJack Meng ld_ib_prop(); 4617c478bd9Sstevel@tonic-gate /* 4627c478bd9Sstevel@tonic-gate * initialize vm related stuff. 4637c478bd9Sstevel@tonic-gate */ 4647c478bd9Sstevel@tonic-gate vm_init(); 4657c478bd9Sstevel@tonic-gate 4667c478bd9Sstevel@tonic-gate /* 4677c478bd9Sstevel@tonic-gate * initialize buffer pool for raw I/O requests 4687c478bd9Sstevel@tonic-gate */ 4697c478bd9Sstevel@tonic-gate physio_bufs_init(); 4707c478bd9Sstevel@tonic-gate 4717c478bd9Sstevel@tonic-gate ttolwp(curthread)->lwp_error = 0; /* XXX kludge for SCSI driver */ 4727c478bd9Sstevel@tonic-gate 4737c478bd9Sstevel@tonic-gate /* 4747c478bd9Sstevel@tonic-gate * Drop the interrupt level and allow interrupts. At this point 4757c478bd9Sstevel@tonic-gate * the DDI guarantees that interrupts are enabled. 4767c478bd9Sstevel@tonic-gate */ 4777c478bd9Sstevel@tonic-gate (void) spl0(); 4787c478bd9Sstevel@tonic-gate interrupts_unleashed = 1; 4797c478bd9Sstevel@tonic-gate 48035a5a358SJonathan Adams /* 48135a5a358SJonathan Adams * Create kmem cache for proc structures 48235a5a358SJonathan Adams */ 48335a5a358SJonathan Adams process_cache = kmem_cache_create("process_cache", sizeof (proc_t), 48435a5a358SJonathan Adams 0, NULL, NULL, NULL, NULL, NULL, 0); 48535a5a358SJonathan Adams 4867c478bd9Sstevel@tonic-gate vfs_mountroot(); /* Mount the root file system */ 4877c478bd9Sstevel@tonic-gate errorq_init(); /* after vfs_mountroot() so DDI root is ready */ 4887c478bd9Sstevel@tonic-gate cpu_kstat_init(CPU); /* after vfs_mountroot() so TOD is valid */ 4897c478bd9Sstevel@tonic-gate ddi_walk_devs(ddi_root_node(), pm_adjust_timestamps, NULL); 4907c478bd9Sstevel@tonic-gate /* after vfs_mountroot() so hrestime is valid */ 4917c478bd9Sstevel@tonic-gate 4927c478bd9Sstevel@tonic-gate post_startup(); 4937c478bd9Sstevel@tonic-gate swaploaded = 1; 4947c478bd9Sstevel@tonic-gate 4957c478bd9Sstevel@tonic-gate /* 496d3e55dcdSgww * Initialize Solaris Audit Subsystem 4977c478bd9Sstevel@tonic-gate */ 498d3e55dcdSgww audit_init(); 4997c478bd9Sstevel@tonic-gate 5007c478bd9Sstevel@tonic-gate /* 501*bbd630eeSMarcel Telka * Start the periodic hash rescale for all vmem arenas before we load 502*bbd630eeSMarcel Telka * protocol modules and drivers via strplumb() below. Some drivers 503*bbd630eeSMarcel Telka * might rely on heavy vmem operations that could hurt performance 504*bbd630eeSMarcel Telka * without the rescale. 505*bbd630eeSMarcel Telka */ 506*bbd630eeSMarcel Telka vmem_update(NULL); 507*bbd630eeSMarcel Telka 508*bbd630eeSMarcel Telka /* 5097c478bd9Sstevel@tonic-gate * Plumb the protocol modules and drivers only if we are not 5107c478bd9Sstevel@tonic-gate * networked booted, in this case we already did it in rootconf(). 5117c478bd9Sstevel@tonic-gate */ 5126cefaae1SJack Meng if (netboot == 0 && iscsiboot_prop == NULL) 5137c478bd9Sstevel@tonic-gate (void) strplumb(); 5147c478bd9Sstevel@tonic-gate 515ae115bc7Smrj gethrestime(&PTOU(curproc)->u_start); 516ae115bc7Smrj curthread->t_start = PTOU(curproc)->u_start.tv_sec; 5177c478bd9Sstevel@tonic-gate p->p_mstart = gethrtime(); 5187c478bd9Sstevel@tonic-gate 5197c478bd9Sstevel@tonic-gate /* 5207c478bd9Sstevel@tonic-gate * Perform setup functions that can only be done after root 5217c478bd9Sstevel@tonic-gate * and swap have been set up. 5227c478bd9Sstevel@tonic-gate */ 5237c478bd9Sstevel@tonic-gate consconfig(); 524fe85ab99SBijan Mottahedeh #ifndef __sparc 525fe85ab99SBijan Mottahedeh release_bootstrap(); 526fe85ab99SBijan Mottahedeh #endif 5271b83305cSjm22469 5287c478bd9Sstevel@tonic-gate /* 5297c478bd9Sstevel@tonic-gate * attach drivers with ddi-forceattach prop 5307c478bd9Sstevel@tonic-gate * It must be done early enough to load hotplug drivers (e.g. 5317c478bd9Sstevel@tonic-gate * pcmcia nexus) so that devices enumerated via hotplug is 5327c478bd9Sstevel@tonic-gate * available before I/O subsystem is fully initialized. 5337c478bd9Sstevel@tonic-gate */ 5347c478bd9Sstevel@tonic-gate i_ddi_forceattach_drivers(); 5357c478bd9Sstevel@tonic-gate 5367c478bd9Sstevel@tonic-gate /* 5377c478bd9Sstevel@tonic-gate * Set the scan rate and other parameters of the paging subsystem. 5387c478bd9Sstevel@tonic-gate */ 5397c478bd9Sstevel@tonic-gate setupclock(0); 5407c478bd9Sstevel@tonic-gate 5417c478bd9Sstevel@tonic-gate /* 5427c478bd9Sstevel@tonic-gate * Initialize process 0's lwp directory and lwpid hash table. 5437c478bd9Sstevel@tonic-gate */ 5447c478bd9Sstevel@tonic-gate p->p_lwpdir = p->p_lwpfree = p0_lwpdir; 5457c478bd9Sstevel@tonic-gate p->p_lwpdir->ld_next = p->p_lwpdir + 1; 5467c478bd9Sstevel@tonic-gate p->p_lwpdir_sz = 2; 5477c478bd9Sstevel@tonic-gate p->p_tidhash = p0_tidhash; 5487c478bd9Sstevel@tonic-gate p->p_tidhash_sz = 2; 5497c478bd9Sstevel@tonic-gate p0_lep.le_thread = curthread; 5507c478bd9Sstevel@tonic-gate p0_lep.le_lwpid = curthread->t_tid; 5517c478bd9Sstevel@tonic-gate p0_lep.le_start = curthread->t_start; 5526eb30ec3SRoger A. Faulkner lwp_hash_in(p, &p0_lep, p0_tidhash, 2, 0); 5537c478bd9Sstevel@tonic-gate 5547c478bd9Sstevel@tonic-gate /* 5557c478bd9Sstevel@tonic-gate * Initialize extended accounting. 5567c478bd9Sstevel@tonic-gate */ 5577c478bd9Sstevel@tonic-gate exacct_init(); 5587c478bd9Sstevel@tonic-gate 5597c478bd9Sstevel@tonic-gate /* 5607c478bd9Sstevel@tonic-gate * Initialize threads of sysevent event channels 5617c478bd9Sstevel@tonic-gate */ 5627c478bd9Sstevel@tonic-gate sysevent_evc_thrinit(); 5637c478bd9Sstevel@tonic-gate 5647c478bd9Sstevel@tonic-gate /* 565d5d7cf4eSJonathan Chew * This must be done after post_startup() but before 5667c478bd9Sstevel@tonic-gate * start_other_cpus() 5677c478bd9Sstevel@tonic-gate */ 568d5d7cf4eSJonathan Chew lgrp_init(LGRP_INIT_STAGE4); 5697c478bd9Sstevel@tonic-gate 5707c478bd9Sstevel@tonic-gate /* 5717c478bd9Sstevel@tonic-gate * Perform MP initialization, if any. 5727c478bd9Sstevel@tonic-gate */ 5737c478bd9Sstevel@tonic-gate start_other_cpus(0); 5747c478bd9Sstevel@tonic-gate 575fe85ab99SBijan Mottahedeh #ifdef __sparc 5767c478bd9Sstevel@tonic-gate /* 5779853d9e8SJason Beloro * Release bootstrap here since PROM interfaces are 5789853d9e8SJason Beloro * used to start other CPUs above. 5799853d9e8SJason Beloro */ 5809853d9e8SJason Beloro release_bootstrap(); 581fe85ab99SBijan Mottahedeh #endif 5829853d9e8SJason Beloro 5839853d9e8SJason Beloro /* 5847c478bd9Sstevel@tonic-gate * Finish lgrp initialization after all CPUS are brought online. 5857c478bd9Sstevel@tonic-gate */ 586d5d7cf4eSJonathan Chew lgrp_init(LGRP_INIT_STAGE5); 5877c478bd9Sstevel@tonic-gate 5887c478bd9Sstevel@tonic-gate /* 5897c478bd9Sstevel@tonic-gate * After mp_init(), number of cpus are known (this is 5907c478bd9Sstevel@tonic-gate * true for the time being, when there are actually 5917c478bd9Sstevel@tonic-gate * hot pluggable cpus then this scheme would not do). 5927c478bd9Sstevel@tonic-gate * Any per cpu initialization is done here. 5937c478bd9Sstevel@tonic-gate */ 5947c478bd9Sstevel@tonic-gate kmem_mp_init(); 5957c478bd9Sstevel@tonic-gate 5962850d85bSmv143129 clock_tick_init_post(); 5972850d85bSmv143129 5987c478bd9Sstevel@tonic-gate for (initptr = &mp_init_tbl[0]; *initptr; initptr++) 5997c478bd9Sstevel@tonic-gate (**initptr)(); 6007c478bd9Sstevel@tonic-gate 6017c478bd9Sstevel@tonic-gate /* 6025cff7825Smh27603 * These must be called after start_other_cpus 6037c478bd9Sstevel@tonic-gate */ 6047c478bd9Sstevel@tonic-gate pm_cfb_setup_intr(); 6055cff7825Smh27603 #if defined(__x86) 606753a6d45SSherry Moore fastboot_post_startup(); 6075cff7825Smh27603 #endif 6087c478bd9Sstevel@tonic-gate 6097c478bd9Sstevel@tonic-gate /* 6107c478bd9Sstevel@tonic-gate * Make init process; enter scheduling loop with system process. 61135a5a358SJonathan Adams * 61235a5a358SJonathan Adams * Note that we manually assign the pids for these processes, for 61335a5a358SJonathan Adams * historical reasons. If more pre-assigned pids are needed, 61435a5a358SJonathan Adams * FAMOUS_PIDS will have to be updated. 6157c478bd9Sstevel@tonic-gate */ 6167c478bd9Sstevel@tonic-gate 6177c478bd9Sstevel@tonic-gate /* create init process */ 61835a5a358SJonathan Adams if (newproc(start_init, NULL, defaultcid, 59, NULL, 61935a5a358SJonathan Adams FAMOUS_PID_INIT)) 6207c478bd9Sstevel@tonic-gate panic("main: unable to fork init."); 6217c478bd9Sstevel@tonic-gate 6227c478bd9Sstevel@tonic-gate /* create pageout daemon */ 62335a5a358SJonathan Adams if (newproc(pageout, NULL, syscid, maxclsyspri - 1, NULL, 62435a5a358SJonathan Adams FAMOUS_PID_PAGEOUT)) 6257c478bd9Sstevel@tonic-gate panic("main: unable to fork pageout()"); 6267c478bd9Sstevel@tonic-gate 6277c478bd9Sstevel@tonic-gate /* create fsflush daemon */ 62835a5a358SJonathan Adams if (newproc(fsflush, NULL, syscid, minclsyspri, NULL, 62935a5a358SJonathan Adams FAMOUS_PID_FSFLUSH)) 6307c478bd9Sstevel@tonic-gate panic("main: unable to fork fsflush()"); 6317c478bd9Sstevel@tonic-gate 6327c478bd9Sstevel@tonic-gate /* create cluster process if we're a member of one */ 6337c478bd9Sstevel@tonic-gate if (cluster_bootflags & CLUSTER_BOOTED) { 63435a5a358SJonathan Adams if (newproc(cluster_wrapper, NULL, syscid, minclsyspri, 63535a5a358SJonathan Adams NULL, 0)) { 6367c478bd9Sstevel@tonic-gate panic("main: unable to fork cluster()"); 6377c478bd9Sstevel@tonic-gate } 63835a5a358SJonathan Adams } 6397c478bd9Sstevel@tonic-gate 6407c478bd9Sstevel@tonic-gate /* 6417c478bd9Sstevel@tonic-gate * Create system threads (threads are associated with p0) 6427c478bd9Sstevel@tonic-gate */ 6437c478bd9Sstevel@tonic-gate 6447c478bd9Sstevel@tonic-gate /* create module uninstall daemon */ 6457c478bd9Sstevel@tonic-gate /* BugID 1132273. If swapping over NFS need a bigger stack */ 6467c478bd9Sstevel@tonic-gate (void) thread_create(NULL, 0, (void (*)())mod_uninstall_daemon, 6477c478bd9Sstevel@tonic-gate NULL, 0, &p0, TS_RUN, minclsyspri); 6487c478bd9Sstevel@tonic-gate 6497c478bd9Sstevel@tonic-gate (void) thread_create(NULL, 0, seg_pasync_thread, 6507c478bd9Sstevel@tonic-gate NULL, 0, &p0, TS_RUN, minclsyspri); 6517c478bd9Sstevel@tonic-gate 6527c478bd9Sstevel@tonic-gate pid_setmin(); 6537c478bd9Sstevel@tonic-gate 654c3f63b71SAlexandre Chartre /* system is now ready */ 655c3f63b71SAlexandre Chartre mutex_exit(&ualock); 656c3f63b71SAlexandre Chartre 657ae115bc7Smrj bcopy("sched", PTOU(curproc)->u_psargs, 6); 658ae115bc7Smrj bcopy("sched", PTOU(curproc)->u_comm, 5); 6597c478bd9Sstevel@tonic-gate sched(); 6607c478bd9Sstevel@tonic-gate /* NOTREACHED */ 6617c478bd9Sstevel@tonic-gate } 662