1df8bae1dSRodney W. Grimes /* 22b14f991SJulian Elischer * Copyright (c) 1995 Terrence R. Lambert 32b14f991SJulian Elischer * All rights reserved. 42b14f991SJulian Elischer * 5df8bae1dSRodney W. Grimes * Copyright (c) 1982, 1986, 1989, 1991, 1992, 1993 6df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 7df8bae1dSRodney W. Grimes * (c) UNIX System Laboratories, Inc. 8df8bae1dSRodney W. Grimes * All or some portions of this file are derived from material licensed 9df8bae1dSRodney W. Grimes * to the University of California by American Telephone and Telegraph 10df8bae1dSRodney W. Grimes * Co. or Unix System Laboratories, Inc. and are reproduced herein with 11df8bae1dSRodney W. Grimes * the permission of UNIX System Laboratories, Inc. 12df8bae1dSRodney W. Grimes * 13df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 14df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 15df8bae1dSRodney W. Grimes * are met: 16df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 17df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 18df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 19df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 20df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 21df8bae1dSRodney W. Grimes * 3. All advertising materials mentioning features or use of this software 22df8bae1dSRodney W. Grimes * must display the following acknowledgement: 23df8bae1dSRodney W. Grimes * This product includes software developed by the University of 24df8bae1dSRodney W. Grimes * California, Berkeley and its contributors. 25df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 26df8bae1dSRodney W. 
Grimes * may be used to endorse or promote products derived from this software 27df8bae1dSRodney W. Grimes * without specific prior written permission. 28df8bae1dSRodney W. Grimes * 29df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 30df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 31df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 32df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 33df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 34df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 35df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 36df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 37df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 38df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 39df8bae1dSRodney W. Grimes * SUCH DAMAGE. 40df8bae1dSRodney W. Grimes * 41df8bae1dSRodney W. Grimes * @(#)init_main.c 8.9 (Berkeley) 1/21/94 42df8bae1dSRodney W. Grimes */ 43df8bae1dSRodney W. Grimes 44677b542eSDavid E. O'Brien #include <sys/cdefs.h> 45677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 46677b542eSDavid E. O'Brien 4767481196SJohn Birrell #include "opt_init_path.h" 4840244964SRobert Watson #include "opt_mac.h" 494bd49128SPeter Wemm 50df8bae1dSRodney W. Grimes #include <sys/param.h> 519e209b12SAlfred Perlstein #include <sys/kernel.h> 52f36ba452SJake Burkholder #include <sys/exec.h> 53b3c5c18dSBruce Evans #include <sys/file.h> 54df8bae1dSRodney W. 
Grimes #include <sys/filedesc.h> 550384fff8SJason Evans #include <sys/ktr.h> 561005a129SJohn Baldwin #include <sys/lock.h> 5740244964SRobert Watson #include <sys/mac.h> 58ac0ad63fSBruce Evans #include <sys/mount.h> 5935e0e5b3SJohn Baldwin #include <sys/mutex.h> 608f19eb88SIan Dowse #include <sys/syscallsubr.h> 61946bb7a2SPoul-Henning Kamp #include <sys/sysctl.h> 62df8bae1dSRodney W. Grimes #include <sys/proc.h> 63df8bae1dSRodney W. Grimes #include <sys/resourcevar.h> 64df8bae1dSRodney W. Grimes #include <sys/systm.h> 6536240ea5SDoug Rabson #include <sys/signalvar.h> 66df8bae1dSRodney W. Grimes #include <sys/vnode.h> 67f3f0ca60SSøren Schmidt #include <sys/sysent.h> 68df8bae1dSRodney W. Grimes #include <sys/reboot.h> 69de028f5aSJeff Roberson #include <sys/sched.h> 701005a129SJohn Baldwin #include <sys/sx.h> 71ad7507e2SSteven Wallace #include <sys/sysproto.h> 72efeaf95aSDavid Greenman #include <sys/vmmeter.h> 7374b2192aSJohn Dyson #include <sys/unistd.h> 7494e9d7c1SPeter Wemm #include <sys/malloc.h> 75db901281SPoul-Henning Kamp #include <sys/conf.h> 76df8bae1dSRodney W. Grimes 77df8bae1dSRodney W. Grimes #include <machine/cpu.h> 78df8bae1dSRodney W. Grimes 79df8bae1dSRodney W. Grimes #include <vm/vm.h> 80efeaf95aSDavid Greenman #include <vm/vm_param.h> 81efeaf95aSDavid Greenman #include <vm/pmap.h> 82efeaf95aSDavid Greenman #include <vm/vm_map.h> 83efeaf95aSDavid Greenman #include <sys/user.h> 846faaa756SWolfram Schneider #include <sys/copyright.h> 85df8bae1dSRodney W. Grimes 8637b087a6SPeter Wemm void mi_startup(void); /* Should be elsewhere */ 87df8bae1dSRodney W. Grimes 88df8bae1dSRodney W. Grimes /* Components of the first process -- never freed. */ 89154c04e5SPoul-Henning Kamp static struct session session0; 90154c04e5SPoul-Henning Kamp static struct pgrp pgrp0; 91df8bae1dSRodney W. 
Grimes struct proc proc0; 92079b7badSJulian Elischer struct thread thread0; 934f0db5e0SJulian Elischer struct ksegrp ksegrp0; 9423734995SJake Burkholder struct vmspace vmspace0; 952b14f991SJulian Elischer struct proc *initproc; 96df8bae1dSRodney W. Grimes 97c463cf1cSBruce Evans int boothowto = 0; /* initialized so that it can be patched */ 988d0bf3d6SJordan K. Hubbard SYSCTL_INT(_debug, OID_AUTO, boothowto, CTLFLAG_RD, &boothowto, 0, ""); 997a08bae6SJohn Baldwin int bootverbose; 1007a08bae6SJohn Baldwin SYSCTL_INT(_debug, OID_AUTO, bootverbose, CTLFLAG_RW, &bootverbose, 0, ""); 101946bb7a2SPoul-Henning Kamp 1022b14f991SJulian Elischer /* 1032b14f991SJulian Elischer * This ensures that there is at least one entry so that the sysinit_set 1042b14f991SJulian Elischer * symbol is not undefined. A subsystem ID of SI_SUB_DUMMY is never 1052b14f991SJulian Elischer * executed. 10626f9a767SRodney W. Grimes */ 1072b14f991SJulian Elischer SYSINIT(placeholder, SI_SUB_DUMMY, SI_ORDER_ANY, NULL, NULL) 1088a129caeSDavid Greenman 10994e9d7c1SPeter Wemm /* 11094e9d7c1SPeter Wemm * The sysinit table itself. Items are checked off as they are run. 11194e9d7c1SPeter Wemm * If we want to register new sysinit types, add them to newsysinit. 11294e9d7c1SPeter Wemm */ 113f41325dbSPeter Wemm SET_DECLARE(sysinit_set, struct sysinit); 114f41325dbSPeter Wemm struct sysinit **sysinit, **sysinit_end; 115f41325dbSPeter Wemm struct sysinit **newsysinit, **newsysinit_end; 11694e9d7c1SPeter Wemm 11794e9d7c1SPeter Wemm /* 11894e9d7c1SPeter Wemm * Merge a new sysinit set into the current set, reallocating it if 11994e9d7c1SPeter Wemm * necessary. This can only be called after malloc is running.
12094e9d7c1SPeter Wemm */ 12194e9d7c1SPeter Wemm void 122f41325dbSPeter Wemm sysinit_add(struct sysinit **set, struct sysinit **set_end) 12394e9d7c1SPeter Wemm { 12494e9d7c1SPeter Wemm struct sysinit **newset; 12594e9d7c1SPeter Wemm struct sysinit **sipp; 12694e9d7c1SPeter Wemm struct sysinit **xipp; 127f41325dbSPeter Wemm int count; 12894e9d7c1SPeter Wemm 129f41325dbSPeter Wemm count = set_end - set; 130ddd62546SPeter Wemm if (newsysinit) 131f41325dbSPeter Wemm count += newsysinit_end - newsysinit; 132ddd62546SPeter Wemm else 133f41325dbSPeter Wemm count += sysinit_end - sysinit; 13494e9d7c1SPeter Wemm newset = malloc(count * sizeof(*sipp), M_TEMP, M_NOWAIT); 13594e9d7c1SPeter Wemm if (newset == NULL) 13694e9d7c1SPeter Wemm panic("cannot malloc for sysinit"); 13794e9d7c1SPeter Wemm xipp = newset; 138ddd62546SPeter Wemm if (newsysinit) 139f41325dbSPeter Wemm for (sipp = newsysinit; sipp < newsysinit_end; sipp++) 140ddd62546SPeter Wemm *xipp++ = *sipp; 141ddd62546SPeter Wemm else 142f41325dbSPeter Wemm for (sipp = sysinit; sipp < sysinit_end; sipp++) 14394e9d7c1SPeter Wemm *xipp++ = *sipp; 144f41325dbSPeter Wemm for (sipp = set; sipp < set_end; sipp++) 14594e9d7c1SPeter Wemm *xipp++ = *sipp; 146ddd62546SPeter Wemm if (newsysinit) 147ddd62546SPeter Wemm free(newsysinit, M_TEMP); 14894e9d7c1SPeter Wemm newsysinit = newset; 149f41325dbSPeter Wemm newsysinit_end = newset + count; 15094e9d7c1SPeter Wemm } 15126f9a767SRodney W. Grimes 152df8bae1dSRodney W. Grimes /* 153df8bae1dSRodney W. Grimes * System startup; initialize the world, create process 0, mount root 154df8bae1dSRodney W. Grimes * filesystem, and fork to create init and pagedaemon. Most of the 155df8bae1dSRodney W. Grimes * hard work is done in the lower-level initialization routines including 156df8bae1dSRodney W. Grimes * startup(), which does memory initialization and autoconfiguration. 
1572b14f991SJulian Elischer * 1582b14f991SJulian Elischer * This allows simple addition of new kernel subsystems that require 1592b14f991SJulian Elischer * boot time initialization. It also allows substitution of subsystem 1602b14f991SJulian Elischer * (for instance, a scheduler, kernel profiler, or VM system) by object 161c5b193bfSPoul-Henning Kamp * module. Finally, it allows for optional "kernel threads". 162df8bae1dSRodney W. Grimes */ 16326f9a767SRodney W. Grimes void 16437b087a6SPeter Wemm mi_startup(void) 165df8bae1dSRodney W. Grimes { 1662b14f991SJulian Elischer 1672b14f991SJulian Elischer register struct sysinit **sipp; /* system initialization*/ 1682b14f991SJulian Elischer register struct sysinit **xipp; /* interior loop of sort*/ 1692b14f991SJulian Elischer register struct sysinit *save; /* bubble*/ 1702b14f991SJulian Elischer 171f41325dbSPeter Wemm if (sysinit == NULL) { 172f41325dbSPeter Wemm sysinit = SET_BEGIN(sysinit_set); 173f41325dbSPeter Wemm sysinit_end = SET_LIMIT(sysinit_set); 174f41325dbSPeter Wemm } 175f41325dbSPeter Wemm 17694e9d7c1SPeter Wemm restart: 1772b14f991SJulian Elischer /* 1782b14f991SJulian Elischer * Perform a bubble sort of the system initialization objects by 1792b14f991SJulian Elischer * their subsystem (primary key) and order (secondary key). 
1802b14f991SJulian Elischer */ 181f41325dbSPeter Wemm for (sipp = sysinit; sipp < sysinit_end; sipp++) { 182f41325dbSPeter Wemm for (xipp = sipp + 1; xipp < sysinit_end; xipp++) { 1832b14f991SJulian Elischer if ((*sipp)->subsystem < (*xipp)->subsystem || 1842b14f991SJulian Elischer ((*sipp)->subsystem == (*xipp)->subsystem && 185af4b2d2dSPeter Wemm (*sipp)->order <= (*xipp)->order)) 1862b14f991SJulian Elischer continue; /* skip*/ 1872b14f991SJulian Elischer save = *sipp; 1882b14f991SJulian Elischer *sipp = *xipp; 1892b14f991SJulian Elischer *xipp = save; 1902b14f991SJulian Elischer } 1912b14f991SJulian Elischer } 1922b14f991SJulian Elischer 1932b14f991SJulian Elischer /* 1942b14f991SJulian Elischer * Traverse the (now) ordered list of system initialization tasks. 1952b14f991SJulian Elischer * Perform each task, and continue on to the next task. 1962b14f991SJulian Elischer * 1972b14f991SJulian Elischer * The last item on the list is expected to be the scheduler, 1982b14f991SJulian Elischer * which will not return. 
1992b14f991SJulian Elischer */ 200f41325dbSPeter Wemm for (sipp = sysinit; sipp < sysinit_end; sipp++) { 20174b2192aSJohn Dyson 2022b14f991SJulian Elischer if ((*sipp)->subsystem == SI_SUB_DUMMY) 2032b14f991SJulian Elischer continue; /* skip dummy task(s)*/ 2042b14f991SJulian Elischer 20594e9d7c1SPeter Wemm if ((*sipp)->subsystem == SI_SUB_DONE) 20694e9d7c1SPeter Wemm continue; 20794e9d7c1SPeter Wemm 2089c8b8baaSPeter Wemm /* Call function */ 2092b14f991SJulian Elischer (*((*sipp)->func))((*sipp)->udata); 21094e9d7c1SPeter Wemm 21194e9d7c1SPeter Wemm /* Check off the one we're just done */ 21294e9d7c1SPeter Wemm (*sipp)->subsystem = SI_SUB_DONE; 21394e9d7c1SPeter Wemm 21494e9d7c1SPeter Wemm /* Check if we've installed more sysinit items via KLD */ 21594e9d7c1SPeter Wemm if (newsysinit != NULL) { 216f41325dbSPeter Wemm if (sysinit != SET_BEGIN(sysinit_set)) 21794e9d7c1SPeter Wemm free(sysinit, M_TEMP); 21894e9d7c1SPeter Wemm sysinit = newsysinit; 219f41325dbSPeter Wemm sysinit_end = newsysinit_end; 22094e9d7c1SPeter Wemm newsysinit = NULL; 221f41325dbSPeter Wemm newsysinit_end = NULL; 22294e9d7c1SPeter Wemm goto restart; 22394e9d7c1SPeter Wemm } 2242b14f991SJulian Elischer } 2252b14f991SJulian Elischer 226477a642cSPeter Wemm panic("Shouldn't get here!"); 2272b14f991SJulian Elischer /* NOTREACHED*/ 2282b14f991SJulian Elischer } 2292b14f991SJulian Elischer 2302b14f991SJulian Elischer 2312b14f991SJulian Elischer /* 2322b14f991SJulian Elischer *************************************************************************** 2332b14f991SJulian Elischer **** 2342b14f991SJulian Elischer **** The following SYSINIT's belong elsewhere, but have not yet 2352b14f991SJulian Elischer **** been moved. 
2362b14f991SJulian Elischer **** 2372b14f991SJulian Elischer *************************************************************************** 2382b14f991SJulian Elischer */ 2399ef6c28aSBruce Evans static void 24037b087a6SPeter Wemm print_caddr_t(void *data __unused) 2419ef6c28aSBruce Evans { 2429ef6c28aSBruce Evans printf("%s", (char *)data); 2439ef6c28aSBruce Evans } 244d841aaa7SBruce Evans SYSINIT(announce, SI_SUB_COPYRIGHT, SI_ORDER_FIRST, print_caddr_t, copyright) 2457a08bae6SJohn Baldwin SYSINIT(version, SI_SUB_COPYRIGHT, SI_ORDER_SECOND, print_caddr_t, version) 2467a08bae6SJohn Baldwin 2472cf6bdacSPoul-Henning Kamp #ifdef WITNESS 2482cf6bdacSPoul-Henning Kamp static char wit_warn[] = 2492cf6bdacSPoul-Henning Kamp "WARNING: WITNESS option enabled, expect reduced performance.\n"; 2502cf6bdacSPoul-Henning Kamp SYSINIT(witwarn, SI_SUB_COPYRIGHT, SI_ORDER_SECOND + 1, 2512cf6bdacSPoul-Henning Kamp print_caddr_t, wit_warn) 2522cf6bdacSPoul-Henning Kamp #endif 2532cf6bdacSPoul-Henning Kamp 2542cf6bdacSPoul-Henning Kamp #ifdef DIAGNOSTIC 2552cf6bdacSPoul-Henning Kamp static char diag_warn[] = 2562cf6bdacSPoul-Henning Kamp "WARNING: DIAGNOSTIC option enabled, expect reduced performance.\n"; 2572cf6bdacSPoul-Henning Kamp SYSINIT(diagwarn, SI_SUB_COPYRIGHT, SI_ORDER_SECOND + 2, 2582cf6bdacSPoul-Henning Kamp print_caddr_t, diag_warn) 2592cf6bdacSPoul-Henning Kamp #endif 2602cf6bdacSPoul-Henning Kamp 2617a08bae6SJohn Baldwin static void 2627a08bae6SJohn Baldwin set_boot_verbose(void *data __unused) 2637a08bae6SJohn Baldwin { 2647a08bae6SJohn Baldwin 2657a08bae6SJohn Baldwin if (boothowto & RB_VERBOSE) 2667a08bae6SJohn Baldwin bootverbose++; 2677a08bae6SJohn Baldwin } 2687a08bae6SJohn Baldwin SYSINIT(boot_verbose, SI_SUB_TUNABLES, SI_ORDER_ANY, set_boot_verbose, NULL) 2692b14f991SJulian Elischer 270f36ba452SJake Burkholder struct sysentvec null_sysvec = { 271f36ba452SJake Burkholder 0, 272f36ba452SJake Burkholder NULL, 273f36ba452SJake Burkholder 0, 274f36ba452SJake Burkholder 
0, 275f36ba452SJake Burkholder NULL, 276f36ba452SJake Burkholder 0, 277f36ba452SJake Burkholder NULL, 278f36ba452SJake Burkholder NULL, 279f36ba452SJake Burkholder NULL, 280f36ba452SJake Burkholder NULL, 281f36ba452SJake Burkholder NULL, 282f36ba452SJake Burkholder NULL, 283f36ba452SJake Burkholder NULL, 284f36ba452SJake Burkholder "null", 285f36ba452SJake Burkholder NULL, 286f36ba452SJake Burkholder NULL, 287f36ba452SJake Burkholder 0, 288f36ba452SJake Burkholder PAGE_SIZE, 289f36ba452SJake Burkholder VM_MIN_ADDRESS, 290f36ba452SJake Burkholder VM_MAXUSER_ADDRESS, 291f36ba452SJake Burkholder USRSTACK, 292f36ba452SJake Burkholder PS_STRINGS, 293f36ba452SJake Burkholder VM_PROT_ALL, 294f36ba452SJake Burkholder NULL, 295c460ac3aSPeter Wemm NULL, 296f36ba452SJake Burkholder NULL 297f36ba452SJake Burkholder }; 2983ebc1248SPeter Wemm 2992b14f991SJulian Elischer /* 3002b14f991SJulian Elischer *************************************************************************** 3012b14f991SJulian Elischer **** 3020c920c0dSGiorgos Keramidas **** The two following SYSINIT's are proc0 specific glue code. I am not 3032b14f991SJulian Elischer **** convinced that they can not be safely combined, but their order of 3042b14f991SJulian Elischer **** operation has been maintained as the same as the original init_main.c 3052b14f991SJulian Elischer **** for right now. 3062b14f991SJulian Elischer **** 3072b14f991SJulian Elischer **** These probably belong in init_proc.c or kern_proc.c, since they 3082b14f991SJulian Elischer **** deal with proc0 (the fork template process). 
3092b14f991SJulian Elischer **** 3102b14f991SJulian Elischer *************************************************************************** 3112b14f991SJulian Elischer */ 3122b14f991SJulian Elischer /* ARGSUSED*/ 313154c04e5SPoul-Henning Kamp static void 31437b087a6SPeter Wemm proc0_init(void *dummy __unused) 3152b14f991SJulian Elischer { 3168ec21e3aSPoul-Henning Kamp struct proc *p; 3178ec21e3aSPoul-Henning Kamp unsigned i; 318b40ce416SJulian Elischer struct thread *td; 319079b7badSJulian Elischer struct ksegrp *kg; 320df8bae1dSRodney W. Grimes 3210cddd8f0SMatthew Dillon GIANT_REQUIRED; 322df8bae1dSRodney W. Grimes p = &proc0; 323079b7badSJulian Elischer td = &thread0; 3244f0db5e0SJulian Elischer kg = &ksegrp0; 325df8bae1dSRodney W. Grimes 326df8bae1dSRodney W. Grimes /* 3270384fff8SJason Evans * Initialize magic number. 3280384fff8SJason Evans */ 3290384fff8SJason Evans p->p_magic = P_MAGIC; 3300384fff8SJason Evans 3310384fff8SJason Evans /* 332ed062c8dSJulian Elischer * Initialize thread, process and ksegrp structures. 333a3bfb996SJeffrey Hsu */ 334ed062c8dSJulian Elischer procinit(); /* set up proc zone */ 335ed062c8dSJulian Elischer threadinit(); /* set up thead, upcall and KSEGRP zones */ 336a3bfb996SJeffrey Hsu 337a3bfb996SJeffrey Hsu /* 338ed062c8dSJulian Elischer * Initialise scheduler resources. 339ed062c8dSJulian Elischer * Add scheduler specific parts to proc, ksegrp, thread as needed. 340ed062c8dSJulian Elischer */ 341ed062c8dSJulian Elischer schedinit(); /* scheduler gets its house in order */ 342ed062c8dSJulian Elischer /* 343b1508c72SDavid Greenman * Initialize sleep queue hash table 344b1508c72SDavid Greenman */ 345b1508c72SDavid Greenman sleepinit(); 346b1508c72SDavid Greenman 347b1508c72SDavid Greenman /* 3483075778bSJohn Dyson * additional VM structures 3493075778bSJohn Dyson */ 3503075778bSJohn Dyson vm_init2(); 3513075778bSJohn Dyson 3523075778bSJohn Dyson /* 353df8bae1dSRodney W. Grimes * Create process 0 (the swapper). 354df8bae1dSRodney W. 
Grimes */ 355a3bfb996SJeffrey Hsu LIST_INSERT_HEAD(&allproc, p, p_list); 3567b531e60SJohn Baldwin LIST_INSERT_HEAD(PIDHASH(0), p, p_hash); 3576008862bSJohn Baldwin mtx_init(&pgrp0.pg_mtx, "process group", NULL, MTX_DEF | MTX_DUPOK); 358df8bae1dSRodney W. Grimes p->p_pgrp = &pgrp0; 359a3bfb996SJeffrey Hsu LIST_INSERT_HEAD(PGRPHASH(0), &pgrp0, pg_hash); 360a3bfb996SJeffrey Hsu LIST_INIT(&pgrp0.pg_members); 361a3bfb996SJeffrey Hsu LIST_INSERT_HEAD(&pgrp0.pg_members, p, p_pglist); 362a3bfb996SJeffrey Hsu 363df8bae1dSRodney W. Grimes pgrp0.pg_session = &session0; 3646008862bSJohn Baldwin mtx_init(&session0.s_mtx, "session", NULL, MTX_DEF); 365df8bae1dSRodney W. Grimes session0.s_count = 1; 366df8bae1dSRodney W. Grimes session0.s_leader = p; 367df8bae1dSRodney W. Grimes 3683ebc1248SPeter Wemm p->p_sysent = &null_sysvec; 369f202965eSJohn Baldwin p->p_flag = P_SYSTEM; 370f202965eSJohn Baldwin p->p_sflag = PS_INMEM; 371e602ba25SJulian Elischer p->p_state = PRS_NORMAL; 372ad3b9257SJohn-Mark Gurney knlist_init(&p->p_klist, &p->p_mtx); 373fa885116SJulian Elischer p->p_nice = NZERO; 374e602ba25SJulian Elischer td->td_state = TDS_RUNNING; 3752c100766SJulian Elischer kg->kg_pri_class = PRI_TIMESHARE; 3762c100766SJulian Elischer kg->kg_user_pri = PUSER; 3772c100766SJulian Elischer td->td_priority = PVM; 3782c100766SJulian Elischer td->td_base_pri = PUSER; 379060563ecSJulian Elischer td->td_oncpu = 0; 3802c1011f7SJohn Dyson p->p_peers = 0; 3812c1011f7SJohn Dyson p->p_leader = p; 382e602ba25SJulian Elischer 3832c1011f7SJohn Dyson 384df8bae1dSRodney W. Grimes bcopy("swapper", p->p_comm, sizeof ("swapper")); 385df8bae1dSRodney W. Grimes 386c06eb4e2SSam Leffler callout_init(&p->p_itcallout, CALLOUT_MPSAFE); 387c06eb4e2SSam Leffler callout_init(&td->td_slpcallout, CALLOUT_MPSAFE); 3884f559836SJake Burkholder 389df8bae1dSRodney W. Grimes /* Create credentials. */ 390df8bae1dSRodney W. Grimes p->p_ucred = crget(); 391df8bae1dSRodney W. 
Grimes p->p_ucred->cr_ngroups = 1; /* group 0 */ 392f535380cSDon Lewis p->p_ucred->cr_uidinfo = uifind(0); 393b1fc0ec1SRobert Watson p->p_ucred->cr_ruidinfo = uifind(0); 39491421ba2SRobert Watson p->p_ucred->cr_prison = NULL; /* Don't jail it. */ 39540244964SRobert Watson #ifdef MAC 39640244964SRobert Watson mac_create_proc0(p->p_ucred); 39740244964SRobert Watson #endif 3988e2e767bSJohn Baldwin td->td_ucred = crhold(p->p_ucred); 39975c13541SPoul-Henning Kamp 40090af4afaSJohn Baldwin /* Create sigacts. */ 40190af4afaSJohn Baldwin p->p_sigacts = sigacts_alloc(); 4026626c604SJulian Elischer 40337b087a6SPeter Wemm /* Initialize signal state for process 0. */ 40437b087a6SPeter Wemm siginit(&proc0); 40537b087a6SPeter Wemm 406df8bae1dSRodney W. Grimes /* Create the file descriptor table. */ 4078ec21e3aSPoul-Henning Kamp p->p_fd = fdinit(NULL); 408ad05d580STor Egge p->p_fdtol = NULL; 409df8bae1dSRodney W. Grimes 410df8bae1dSRodney W. Grimes /* Create the limits structures. */ 41191d5354aSJohn Baldwin p->p_limit = lim_alloc(); 41291d5354aSJohn Baldwin for (i = 0; i < RLIM_NLIMITS; i++) 41391d5354aSJohn Baldwin p->p_limit->pl_rlimit[i].rlim_cur = 41491d5354aSJohn Baldwin p->p_limit->pl_rlimit[i].rlim_max = RLIM_INFINITY; 41591d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_NOFILE].rlim_cur = 41691d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_NOFILE].rlim_max = maxfiles; 41791d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_NPROC].rlim_cur = 41891d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_NPROC].rlim_max = maxproc; 419df8bae1dSRodney W. Grimes i = ptoa(cnt.v_free_count); 42091d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_RSS].rlim_max = i; 42191d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_MEMLOCK].rlim_max = i; 42291d5354aSJohn Baldwin p->p_limit->pl_rlimit[RLIMIT_MEMLOCK].rlim_cur = i / 3; 4235715307fSJohn Baldwin p->p_cpulimit = RLIM_INFINITY; 424df8bae1dSRodney W. Grimes 425df8bae1dSRodney W. Grimes /* Allocate a prototype map so we have something to fork. 
*/ 426b1028ad1SLuoqi Chen pmap_pinit0(vmspace_pmap(&vmspace0)); 427df8bae1dSRodney W. Grimes p->p_vmspace = &vmspace0; 428df8bae1dSRodney W. Grimes vmspace0.vm_refcnt = 1; 42905ba50f5SJake Burkholder vm_map_init(&vmspace0.vm_map, p->p_sysent->sv_minuser, 43005ba50f5SJake Burkholder p->p_sysent->sv_maxuser); 431b1028ad1SLuoqi Chen vmspace0.vm_map.pmap = vmspace_pmap(&vmspace0); 432df8bae1dSRodney W. Grimes 43339fb8e6bSJulian Elischer /* 43490af4afaSJohn Baldwin * We continue to place resource usage info 43590af4afaSJohn Baldwin * in the user struct so that it's pageable. 436df8bae1dSRodney W. Grimes */ 437b40ce416SJulian Elischer p->p_stats = &p->p_uarea->u_stats; 438df8bae1dSRodney W. Grimes 439df8bae1dSRodney W. Grimes /* 440a3bfb996SJeffrey Hsu * Charge root for one process. 441df8bae1dSRodney W. Grimes */ 442b1fc0ec1SRobert Watson (void)chgproccnt(p->p_ucred->cr_ruidinfo, 1, 0); 44326f9a767SRodney W. Grimes } 4442b14f991SJulian Elischer SYSINIT(p0init, SI_SUB_INTRINSIC, SI_ORDER_FIRST, proc0_init, NULL) 4452b14f991SJulian Elischer 4462b14f991SJulian Elischer /* ARGSUSED*/ 447154c04e5SPoul-Henning Kamp static void 44837b087a6SPeter Wemm proc0_post(void *dummy __unused) 4492b14f991SJulian Elischer { 45000af9731SPoul-Henning Kamp struct timespec ts; 45137b087a6SPeter Wemm struct proc *p; 452a6fc8288SPeter Wemm 4532b14f991SJulian Elischer /* 4541b0b259eSBruce Evans * Now we can look at the time, having had a chance to verify the 4551b0b259eSBruce Evans * time from the filesystem. Pretend that proc0 started now. 
4562b14f991SJulian Elischer */ 4571005a129SJohn Baldwin sx_slock(&allproc_lock); 45837b087a6SPeter Wemm LIST_FOREACH(p, &allproc, p_list) { 45987ccef7bSDag-Erling Smørgrav microuptime(&p->p_stats->p_start); 46078c85e8dSJohn Baldwin p->p_rux.rux_runtime.sec = 0; 46178c85e8dSJohn Baldwin p->p_rux.rux_runtime.frac = 0; 46237b087a6SPeter Wemm } 4631005a129SJohn Baldwin sx_sunlock(&allproc_lock); 464e2256f43SPeter Wemm binuptime(PCPU_PTR(switchtime)); 4650384fff8SJason Evans PCPU_SET(switchticks, ticks); 4662b14f991SJulian Elischer 467a6fc8288SPeter Wemm /* 468a6fc8288SPeter Wemm * Give the ``random'' number generator a thump. 469a6fc8288SPeter Wemm */ 47000af9731SPoul-Henning Kamp nanotime(&ts); 47100af9731SPoul-Henning Kamp srandom(ts.tv_sec ^ ts.tv_nsec); 4722b14f991SJulian Elischer } 4732b14f991SJulian Elischer SYSINIT(p0post, SI_SUB_INTRINSIC_POST, SI_ORDER_FIRST, proc0_post, NULL) 4742b14f991SJulian Elischer 475df8bae1dSRodney W. Grimes /* 4762b14f991SJulian Elischer *************************************************************************** 4772b14f991SJulian Elischer **** 4782b14f991SJulian Elischer **** The following SYSINIT's and glue code should be moved to the 4792b14f991SJulian Elischer **** respective files on a per subsystem basis. 4802b14f991SJulian Elischer **** 4812b14f991SJulian Elischer *************************************************************************** 482df8bae1dSRodney W. Grimes */ 483df8bae1dSRodney W. Grimes 484df8bae1dSRodney W. Grimes 485df8bae1dSRodney W. Grimes /* 4862b14f991SJulian Elischer *************************************************************************** 4872b14f991SJulian Elischer **** 4882b14f991SJulian Elischer **** The following code probably belongs in another file, like 48937b087a6SPeter Wemm **** kern/init_init.c. 4902b14f991SJulian Elischer **** 4912b14f991SJulian Elischer *************************************************************************** 492df8bae1dSRodney W. Grimes */ 493df8bae1dSRodney W. 
Grimes 494df8bae1dSRodney W. Grimes /* 495df8bae1dSRodney W. Grimes * List of paths to try when searching for "init". 496df8bae1dSRodney W. Grimes */ 4975f967b24SDag-Erling Smørgrav static char init_path[MAXPATHLEN] = 49867481196SJohn Birrell #ifdef INIT_PATH 49967481196SJohn Birrell __XSTRING(INIT_PATH); 50067481196SJohn Birrell #else 501e4082284SJohn Birrell "/sbin/init:/sbin/oinit:/sbin/init.bak:/stand/sysinstall"; 50267481196SJohn Birrell #endif 503af1408e3SLuigi Rizzo SYSCTL_STRING(_kern, OID_AUTO, init_path, CTLFLAG_RD, init_path, 0, 504af1408e3SLuigi Rizzo "Path used to search the init process"); 505df8bae1dSRodney W. Grimes 506df8bae1dSRodney W. Grimes /* 5075f967b24SDag-Erling Smørgrav * Start the initial user process; try exec'ing each pathname in init_path. 508df8bae1dSRodney W. Grimes * The program is invoked with one argument containing the boot flags. 509df8bae1dSRodney W. Grimes */ 510df8bae1dSRodney W. Grimes static void 51137b087a6SPeter Wemm start_init(void *dummy) 512df8bae1dSRodney W. Grimes { 513df8bae1dSRodney W. Grimes vm_offset_t addr; 514df8bae1dSRodney W. Grimes struct execve_args args; 5155f967b24SDag-Erling Smørgrav int options, error; 5165f967b24SDag-Erling Smørgrav char *var, *path, *next, *s; 5175f967b24SDag-Erling Smørgrav char *ucp, **uap, *arg0, *arg1; 518b40ce416SJulian Elischer struct thread *td; 5199c8b8baaSPeter Wemm struct proc *p; 520b7116168SPeter Wemm int init_does_devfs = 0; 521df8bae1dSRodney W. Grimes 5229ed346baSBosko Milekic mtx_lock(&Giant); 5230384fff8SJason Evans 5240cddd8f0SMatthew Dillon GIANT_REQUIRED; 5250cddd8f0SMatthew Dillon 526b40ce416SJulian Elischer td = curthread; 527b40ce416SJulian Elischer p = td->td_proc; 528df8bae1dSRodney W. Grimes 529563af2ecSMaxime Henrion vfs_mountroot(); 530fb92273bSPoul-Henning Kamp 53137b087a6SPeter Wemm /* Get the vnode for '/'. Set p->p_fd->fd_cdir to reference it. 
*/ 532f257b7a5SAlfred Perlstein if (VFS_ROOT(TAILQ_FIRST(&mountlist), &rootvnode, td)) 53337b087a6SPeter Wemm panic("cannot find root vnode"); 534426da3bcSAlfred Perlstein FILEDESC_LOCK(p->p_fd); 53537b087a6SPeter Wemm p->p_fd->fd_cdir = rootvnode; 53637b087a6SPeter Wemm VREF(p->p_fd->fd_cdir); 53737b087a6SPeter Wemm p->p_fd->fd_rdir = rootvnode; 538a90ef2aeSIan Dowse VREF(p->p_fd->fd_rdir); 539426da3bcSAlfred Perlstein FILEDESC_UNLOCK(p->p_fd); 540b40ce416SJulian Elischer VOP_UNLOCK(rootvnode, 0, td); 541a87cdf83SRobert Watson #ifdef MAC 542a87cdf83SRobert Watson mac_create_root_mount(td->td_ucred, TAILQ_FIRST(&mountlist)); 543a87cdf83SRobert Watson #endif 54437b087a6SPeter Wemm 545b7116168SPeter Wemm /* 546b7116168SPeter Wemm * For disk based systems, we probably cannot do this yet 547b7116168SPeter Wemm * since the fs will be read-only. But a NFS root 548b7116168SPeter Wemm * might be ok. It is worth a shot. 549b7116168SPeter Wemm */ 5508f19eb88SIan Dowse error = kern_mkdir(td, "/dev", UIO_SYSSPACE, 0700); 551b7116168SPeter Wemm if (error == EEXIST) 552b7116168SPeter Wemm error = 0; 553b7116168SPeter Wemm if (error == 0) 5546dbde1feSMaxime Henrion error = kernel_vmount(0, "fstype", "devfs", 5556dbde1feSMaxime Henrion "fspath", "/dev", NULL); 556b7116168SPeter Wemm if (error != 0) 557b7116168SPeter Wemm init_does_devfs = 1; 558b7116168SPeter Wemm 559df8bae1dSRodney W. Grimes /* 560df8bae1dSRodney W. Grimes * Need just enough stack to hold the faked-up "execve()" arguments. 561df8bae1dSRodney W. Grimes */ 56205ba50f5SJake Burkholder addr = p->p_sysent->sv_usrstack - PAGE_SIZE; 5635f967b24SDag-Erling Smørgrav if (vm_map_find(&p->p_vmspace->vm_map, NULL, 0, &addr, PAGE_SIZE, 5645f967b24SDag-Erling Smørgrav FALSE, VM_PROT_ALL, VM_PROT_ALL, 0) != 0) 565df8bae1dSRodney W. Grimes panic("init: couldn't allocate argument space"); 566df8bae1dSRodney W. Grimes p->p_vmspace->vm_maxsaddr = (caddr_t)addr; 56726f9a767SRodney W. 
Grimes p->p_vmspace->vm_ssize = 1; 568df8bae1dSRodney W. Grimes 5695f967b24SDag-Erling Smørgrav if ((var = getenv("init_path")) != NULL) { 570e80fb434SRobert Drehmel strlcpy(init_path, var, sizeof(init_path)); 571d786139cSMaxime Henrion freeenv(var); 5725f967b24SDag-Erling Smørgrav } 5735f967b24SDag-Erling Smørgrav 57467481196SJohn Birrell for (path = init_path; *path != '\0'; path = next) { 575e4082284SJohn Birrell while (*path == ':') 5765f967b24SDag-Erling Smørgrav path++; 57767481196SJohn Birrell if (*path == '\0') 5785f967b24SDag-Erling Smørgrav break; 579e4082284SJohn Birrell for (next = path; *next != '\0' && *next != ':'; next++) 5805f967b24SDag-Erling Smørgrav /* nothing */ ; 5815f967b24SDag-Erling Smørgrav if (bootverbose) 582ba41a07dSDmitrij Tejblum printf("start_init: trying %.*s\n", (int)(next - path), 583ba41a07dSDmitrij Tejblum path); 5845f967b24SDag-Erling Smørgrav 585df8bae1dSRodney W. Grimes /* 586df8bae1dSRodney W. Grimes * Move out the boot flag argument. 587df8bae1dSRodney W. Grimes */ 588df8bae1dSRodney W. Grimes options = 0; 58905ba50f5SJake Burkholder ucp = (char *)p->p_sysent->sv_usrstack; 590df8bae1dSRodney W. Grimes (void)subyte(--ucp, 0); /* trailing zero */ 591df8bae1dSRodney W. Grimes if (boothowto & RB_SINGLE) { 592df8bae1dSRodney W. Grimes (void)subyte(--ucp, 's'); 593df8bae1dSRodney W. Grimes options = 1; 594df8bae1dSRodney W. Grimes } 595df8bae1dSRodney W. Grimes #ifdef notyet 596df8bae1dSRodney W. Grimes if (boothowto & RB_FASTBOOT) { 597df8bae1dSRodney W. Grimes (void)subyte(--ucp, 'f'); 598df8bae1dSRodney W. Grimes options = 1; 599df8bae1dSRodney W. Grimes } 600df8bae1dSRodney W. 
Grimes #endif 60117755ac8SPoul-Henning Kamp 60217755ac8SPoul-Henning Kamp #ifdef BOOTCDROM 60317755ac8SPoul-Henning Kamp (void)subyte(--ucp, 'C'); 60417755ac8SPoul-Henning Kamp options = 1; 60517755ac8SPoul-Henning Kamp #endif 606b7116168SPeter Wemm if (init_does_devfs) { 6073f54a085SPoul-Henning Kamp (void)subyte(--ucp, 'd'); 6083f54a085SPoul-Henning Kamp options = 1; 609db901281SPoul-Henning Kamp } 610db901281SPoul-Henning Kamp 611df8bae1dSRodney W. Grimes if (options == 0) 612df8bae1dSRodney W. Grimes (void)subyte(--ucp, '-'); 613df8bae1dSRodney W. Grimes (void)subyte(--ucp, '-'); /* leading hyphen */ 614df8bae1dSRodney W. Grimes arg1 = ucp; 615df8bae1dSRodney W. Grimes 616df8bae1dSRodney W. Grimes /* 617df8bae1dSRodney W. Grimes * Move out the file name (also arg 0). 618df8bae1dSRodney W. Grimes */ 6195f967b24SDag-Erling Smørgrav (void)subyte(--ucp, 0); 6205f967b24SDag-Erling Smørgrav for (s = next - 1; s >= path; s--) 6215f967b24SDag-Erling Smørgrav (void)subyte(--ucp, *s); 622df8bae1dSRodney W. Grimes arg0 = ucp; 623df8bae1dSRodney W. Grimes 624df8bae1dSRodney W. Grimes /* 625df8bae1dSRodney W. Grimes * Move out the arg pointers. 626df8bae1dSRodney W. Grimes */ 627a20d7755SDoug Rabson uap = (char **)((intptr_t)ucp & ~(sizeof(intptr_t)-1)); 628c2da0fd9SBruce Evans (void)suword((caddr_t)--uap, (long)0); /* terminator */ 629c2da0fd9SBruce Evans (void)suword((caddr_t)--uap, (long)(intptr_t)arg1); 630c2da0fd9SBruce Evans (void)suword((caddr_t)--uap, (long)(intptr_t)arg0); 631df8bae1dSRodney W. Grimes 632df8bae1dSRodney W. Grimes /* 633df8bae1dSRodney W. Grimes * Point at the arguments. 634df8bae1dSRodney W. Grimes */ 635df8bae1dSRodney W. Grimes args.fname = arg0; 63626f9a767SRodney W. Grimes args.argv = uap; 63726f9a767SRodney W. Grimes args.envv = NULL; 638df8bae1dSRodney W. Grimes 639df8bae1dSRodney W. Grimes /* 640df8bae1dSRodney W. Grimes * Now try to exec the program. If can't for any reason 641df8bae1dSRodney W. 
Grimes * other than it doesn't exist, complain. 6422b14f991SJulian Elischer * 64337b087a6SPeter Wemm * Otherwise, return via fork_trampoline() all the way 6449c8b8baaSPeter Wemm * to user mode as init! 645df8bae1dSRodney W. Grimes */ 646b40ce416SJulian Elischer if ((error = execve(td, &args)) == 0) { 6479ed346baSBosko Milekic mtx_unlock(&Giant); 648df8bae1dSRodney W. Grimes return; 649db72809dSJohn Baldwin } 650df8bae1dSRodney W. Grimes if (error != ENOENT) 651ba41a07dSDmitrij Tejblum printf("exec %.*s: error %d\n", (int)(next - path), 652ba41a07dSDmitrij Tejblum path, error); 653df8bae1dSRodney W. Grimes } 654580e7e5aSGreg Lehey printf("init: not found in path %s\n", init_path); 655df8bae1dSRodney W. Grimes panic("no init"); 656df8bae1dSRodney W. Grimes } 65737b087a6SPeter Wemm 65837b087a6SPeter Wemm /* 65937b087a6SPeter Wemm * Like kthread_create(), but runs in it's own address space. 66037b087a6SPeter Wemm * We do this early to reserve pid 1. 66137b087a6SPeter Wemm * 66237b087a6SPeter Wemm * Note special case - do not make it runnable yet. Other work 66337b087a6SPeter Wemm * in progress will change this more. 
66437b087a6SPeter Wemm */ 66537b087a6SPeter Wemm static void 66637b087a6SPeter Wemm create_init(const void *udata __unused) 66737b087a6SPeter Wemm { 6685a06cb0cSRobert Watson struct ucred *newcred, *oldcred; 66937b087a6SPeter Wemm int error; 67037b087a6SPeter Wemm 671316ec49aSScott Long error = fork1(&thread0, RFFDG | RFPROC | RFSTOPPED, 0, &initproc); 67237b087a6SPeter Wemm if (error) 67337b087a6SPeter Wemm panic("cannot fork init: %d\n", error); 674bafc8f25SRobert Watson KASSERT(initproc->p_pid == 1, ("create_init: initproc->p_pid != 1")); 6755a06cb0cSRobert Watson /* divorce init's credentials from the kernel's */ 6765a06cb0cSRobert Watson newcred = crget(); 677f202965eSJohn Baldwin PROC_LOCK(initproc); 678f202965eSJohn Baldwin initproc->p_flag |= P_SYSTEM; 6795a06cb0cSRobert Watson oldcred = initproc->p_ucred; 6805a06cb0cSRobert Watson crcopy(newcred, oldcred); 68140244964SRobert Watson #ifdef MAC 68240244964SRobert Watson mac_create_proc1(newcred); 68340244964SRobert Watson #endif 6845a06cb0cSRobert Watson initproc->p_ucred = newcred; 685f202965eSJohn Baldwin PROC_UNLOCK(initproc); 6865a06cb0cSRobert Watson crfree(oldcred); 6874d1a4bb7SRobert Watson cred_update_thread(FIRST_THREAD_IN_PROC(initproc)); 6889ed346baSBosko Milekic mtx_lock_spin(&sched_lock); 689f202965eSJohn Baldwin initproc->p_sflag |= PS_INMEM; 6909ed346baSBosko Milekic mtx_unlock_spin(&sched_lock); 691079b7badSJulian Elischer cpu_set_fork_handler(FIRST_THREAD_IN_PROC(initproc), start_init, NULL); 69237b087a6SPeter Wemm } 69337b087a6SPeter Wemm SYSINIT(init, SI_SUB_CREATE_INIT, SI_ORDER_FIRST, create_init, NULL) 69437b087a6SPeter Wemm 69537b087a6SPeter Wemm /* 69637b087a6SPeter Wemm * Make it runnable now. 
69737b087a6SPeter Wemm */ 69837b087a6SPeter Wemm static void 69937b087a6SPeter Wemm kick_init(const void *udata __unused) 70037b087a6SPeter Wemm { 701079b7badSJulian Elischer struct thread *td; 702f202965eSJohn Baldwin 703079b7badSJulian Elischer td = FIRST_THREAD_IN_PROC(initproc); 7049ed346baSBosko Milekic mtx_lock_spin(&sched_lock); 70571fad9fdSJulian Elischer TD_SET_CAN_RUN(td); 7062630e4c9SJulian Elischer setrunqueue(td, SRQ_BORING); /* XXXKSE */ 7079ed346baSBosko Milekic mtx_unlock_spin(&sched_lock); 70837b087a6SPeter Wemm } 70937b087a6SPeter Wemm SYSINIT(kickinit, SI_SUB_KTHREAD_INIT, SI_ORDER_FIRST, kick_init, NULL) 710