xref: /freebsd/sys/kern/kern_shutdown.c (revision 5dc5dab6eb40126ad56224fb2edbac445ed38f52)
1ad4240feSJulian Elischer /*-
2ad4240feSJulian Elischer  * Copyright (c) 1986, 1988, 1991, 1993
3ad4240feSJulian Elischer  *	The Regents of the University of California.  All rights reserved.
4ad4240feSJulian Elischer  * (c) UNIX System Laboratories, Inc.
5ad4240feSJulian Elischer  * All or some portions of this file are derived from material licensed
6ad4240feSJulian Elischer  * to the University of California by American Telephone and Telegraph
7ad4240feSJulian Elischer  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
8ad4240feSJulian Elischer  * the permission of UNIX System Laboratories, Inc.
9ad4240feSJulian Elischer  *
10ad4240feSJulian Elischer  * Redistribution and use in source and binary forms, with or without
11ad4240feSJulian Elischer  * modification, are permitted provided that the following conditions
12ad4240feSJulian Elischer  * are met:
13ad4240feSJulian Elischer  * 1. Redistributions of source code must retain the above copyright
14ad4240feSJulian Elischer  *    notice, this list of conditions and the following disclaimer.
15ad4240feSJulian Elischer  * 2. Redistributions in binary form must reproduce the above copyright
16ad4240feSJulian Elischer  *    notice, this list of conditions and the following disclaimer in the
17ad4240feSJulian Elischer  *    documentation and/or other materials provided with the distribution.
18ad4240feSJulian Elischer  * 4. Neither the name of the University nor the names of its contributors
19ad4240feSJulian Elischer  *    may be used to endorse or promote products derived from this software
20ad4240feSJulian Elischer  *    without specific prior written permission.
21ad4240feSJulian Elischer  *
22ad4240feSJulian Elischer  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23ad4240feSJulian Elischer  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24ad4240feSJulian Elischer  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25ad4240feSJulian Elischer  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26ad4240feSJulian Elischer  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27ad4240feSJulian Elischer  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28ad4240feSJulian Elischer  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29ad4240feSJulian Elischer  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30ad4240feSJulian Elischer  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31ad4240feSJulian Elischer  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32ad4240feSJulian Elischer  * SUCH DAMAGE.
33ad4240feSJulian Elischer  *
34ad4240feSJulian Elischer  *	@(#)kern_shutdown.c	8.3 (Berkeley) 1/21/94
35ad4240feSJulian Elischer  */
36ad4240feSJulian Elischer 
37677b542eSDavid E. O'Brien #include <sys/cdefs.h>
38677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
39677b542eSDavid E. O'Brien 
40618c7db3SRobert Watson #include "opt_ddb.h"
412d50560aSMarcel Moolenaar #include "opt_kdb.h"
426d58e6cbSBruce Evans #include "opt_panic.h"
439923b511SScott Long #include "opt_sched.h"
442be767e0SAttilio Rao #include "opt_watchdog.h"
45ad4240feSJulian Elischer 
46ad4240feSJulian Elischer #include <sys/param.h>
47ad4240feSJulian Elischer #include <sys/systm.h>
489626b608SPoul-Henning Kamp #include <sys/bio.h>
49fc8f7066SBruce Evans #include <sys/buf.h>
501d79f1bbSJohn Baldwin #include <sys/conf.h>
511d79f1bbSJohn Baldwin #include <sys/cons.h>
521d79f1bbSJohn Baldwin #include <sys/eventhandler.h>
530d3d0cc3SEdward Tomasz Napierala #include <sys/filedesc.h>
5476ca6f88SJamie Gritton #include <sys/jail.h>
552d50560aSMarcel Moolenaar #include <sys/kdb.h>
56ad4240feSJulian Elischer #include <sys/kernel.h>
57e6592ee5SPeter Wemm #include <sys/kerneldump.h>
585e950839SLuoqi Chen #include <sys/kthread.h>
593945a964SAlfred Perlstein #include <sys/ktr.h>
60dcd7d9b7SMaxim Sobolev #include <sys/malloc.h>
61ac0ad63fSBruce Evans #include <sys/mount.h>
62acd3428bSRobert Watson #include <sys/priv.h>
631d79f1bbSJohn Baldwin #include <sys/proc.h>
641d79f1bbSJohn Baldwin #include <sys/reboot.h>
651d79f1bbSJohn Baldwin #include <sys/resourcevar.h>
6689f6b863SAttilio Rao #include <sys/rwlock.h>
6720e25d7dSPeter Wemm #include <sys/sched.h>
68248bb937SAttilio Rao #include <sys/smp.h>
69ad4240feSJulian Elischer #include <sys/sysctl.h>
70ad4240feSJulian Elischer #include <sys/sysproto.h>
71fa2b39a1SAttilio Rao #include <sys/vnode.h>
722be767e0SAttilio Rao #include <sys/watchdog.h>
73ad4240feSJulian Elischer 
74618c7db3SRobert Watson #include <ddb/ddb.h>
75618c7db3SRobert Watson 
7626502503SMarcel Moolenaar #include <machine/cpu.h>
77bdb9ab0dSMark Johnston #include <machine/dump.h>
78d39e457bSPoul-Henning Kamp #include <machine/pcb.h>
79752dff3dSJake Burkholder #include <machine/smp.h>
80ad4240feSJulian Elischer 
81aed55708SRobert Watson #include <security/mac/mac_framework.h>
82aed55708SRobert Watson 
830909f38aSPawel Jakub Dawidek #include <vm/vm.h>
840909f38aSPawel Jakub Dawidek #include <vm/vm_object.h>
850909f38aSPawel Jakub Dawidek #include <vm/vm_page.h>
860909f38aSPawel Jakub Dawidek #include <vm/vm_pager.h>
870909f38aSPawel Jakub Dawidek #include <vm/swap_pager.h>
880909f38aSPawel Jakub Dawidek 
89ad4240feSJulian Elischer #include <sys/signalvar.h>
90ad4240feSJulian Elischer 
91*5dc5dab6SConrad Meyer static MALLOC_DEFINE(M_DUMPER, "dumper", "dumper block buffer");
92*5dc5dab6SConrad Meyer 
93ad4240feSJulian Elischer #ifndef PANIC_REBOOT_WAIT_TIME
94ad4240feSJulian Elischer #define PANIC_REBOOT_WAIT_TIME 15 /* default to 15 seconds */
95ad4240feSJulian Elischer #endif
963b251028SColin Percival static int panic_reboot_wait_time = PANIC_REBOOT_WAIT_TIME;
97af3b2549SHans Petter Selasky SYSCTL_INT(_kern, OID_AUTO, panic_reboot_wait_time, CTLFLAG_RWTUN,
981cdbb9edSColin Percival     &panic_reboot_wait_time, 0,
991cdbb9edSColin Percival     "Seconds to wait before rebooting after a panic");
100ad4240feSJulian Elischer 
101ad4240feSJulian Elischer /*
102ad4240feSJulian Elischer  * Note that stdarg.h and the ANSI style va_start macro is used for both
103ad4240feSJulian Elischer  * ANSI and traditional C compilers.
104ad4240feSJulian Elischer  */
105ad4240feSJulian Elischer #include <machine/stdarg.h>
106ad4240feSJulian Elischer 
#ifdef KDB
/*
 * debug.debugger_on_panic: run the debugger on a kernel panic.  On by
 * default, unless the kernel was configured with KDB_UNATTENDED.
 */
#ifndef KDB_UNATTENDED
int debugger_on_panic = 1;
#else
int debugger_on_panic = 0;
#endif
SYSCTL_INT(_debug, OID_AUTO, debugger_on_panic,
    CTLFLAG_RWTUN | CTLFLAG_SECURE,
    &debugger_on_panic, 0, "Run debugger on kernel panic");

/*
 * debug.trace_on_panic: print a stack trace on a kernel panic.  Off by
 * default, unless the kernel was configured with KDB_TRACE.
 */
#ifndef KDB_TRACE
static int trace_on_panic = 0;
#else
static int trace_on_panic = 1;
#endif
SYSCTL_INT(_debug, OID_AUTO, trace_on_panic,
    CTLFLAG_RWTUN | CTLFLAG_SECURE,
    &trace_on_panic, 0, "Print stack trace on kernel panic");
#endif /* KDB */
126ad4240feSJulian Elischer 
12708a9c205SAndriy Gapon static int sync_on_panic = 0;
128af3b2549SHans Petter Selasky SYSCTL_INT(_kern, OID_AUTO, sync_on_panic, CTLFLAG_RWTUN,
129259ed917SPeter Wemm 	&sync_on_panic, 0, "Do a sync before rebooting from a panic");
130259ed917SPeter Wemm 
1316472ac3dSEd Schouten static SYSCTL_NODE(_kern, OID_AUTO, shutdown, CTLFLAG_RW, 0,
1326472ac3dSEd Schouten     "Shutdown environment");
133db82a982SMike Smith 
134fa2b39a1SAttilio Rao #ifndef DIAGNOSTIC
135fa2b39a1SAttilio Rao static int show_busybufs;
136fa2b39a1SAttilio Rao #else
137fa2b39a1SAttilio Rao static int show_busybufs = 1;
138fa2b39a1SAttilio Rao #endif
139fa2b39a1SAttilio Rao SYSCTL_INT(_kern_shutdown, OID_AUTO, show_busybufs, CTLFLAG_RW,
140fa2b39a1SAttilio Rao 	&show_busybufs, 0, "");
141fa2b39a1SAttilio Rao 
1422eb0015aSColin Percival int suspend_blocked = 0;
1432eb0015aSColin Percival SYSCTL_INT(_kern, OID_AUTO, suspend_blocked, CTLFLAG_RW,
1442eb0015aSColin Percival 	&suspend_blocked, 0, "Block suspend due to a pending shutdown");
1452eb0015aSColin Percival 
1465230cfd2SJulian Elischer /*
147ad4240feSJulian Elischer  * Variable panicstr contains argument to first call to panic; used as flag
148ad4240feSJulian Elischer  * to indicate that the kernel has already called panic.
149ad4240feSJulian Elischer  */
150ad4240feSJulian Elischer const char *panicstr;
151ad4240feSJulian Elischer 
15216a011f9SPaul Saab int dumping;				/* system is dumping */
15336a52c3cSJeff Roberson int rebooting;				/* system is rebooting */
15481661c94SPoul-Henning Kamp static struct dumperinfo dumper;	/* our selected dumper */
1552d50560aSMarcel Moolenaar 
1562d50560aSMarcel Moolenaar /* Context information for dump-debuggers. */
1572d50560aSMarcel Moolenaar static struct pcb dumppcb;		/* Registers. */
158ac6e25ecSHartmut Brandt lwpid_t dumptid;			/* Thread ID. */
15916a011f9SPaul Saab 
1600d3d0cc3SEdward Tomasz Napierala static struct cdevsw reroot_cdevsw = {
1610d3d0cc3SEdward Tomasz Napierala      .d_version = D_VERSION,
1620d3d0cc3SEdward Tomasz Napierala      .d_name    = "reroot",
1630d3d0cc3SEdward Tomasz Napierala };
1640d3d0cc3SEdward Tomasz Napierala 
16582acbcf5SPeter Wemm static void poweroff_wait(void *, int);
16682acbcf5SPeter Wemm static void shutdown_halt(void *junk, int howto);
16782acbcf5SPeter Wemm static void shutdown_panic(void *junk, int howto);
16882acbcf5SPeter Wemm static void shutdown_reset(void *junk, int howto);
1690d3d0cc3SEdward Tomasz Napierala static int kern_reroot(void);
170f06a54f0SPoul-Henning Kamp 
171fcb893a8SMike Smith /* register various local shutdown events */
172fcb893a8SMike Smith static void
173fcb893a8SMike Smith shutdown_conf(void *unused)
174fcb893a8SMike Smith {
175e95499bdSAlfred Perlstein 
176e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, poweroff_wait, NULL,
177fd104c15SRebecca Cran 	    SHUTDOWN_PRI_FIRST);
178e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_halt, NULL,
179e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 100);
180e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_panic, NULL,
181e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 100);
182e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_reset, NULL,
183e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 200);
184fcb893a8SMike Smith }
185ad4240feSJulian Elischer 
186237fdd78SRobert Watson SYSINIT(shutdown_conf, SI_SUB_INTRINSIC, SI_ORDER_ANY, shutdown_conf, NULL);
187fcb893a8SMike Smith 
188ad4240feSJulian Elischer /*
1890d3d0cc3SEdward Tomasz Napierala  * The only reason this exists is to create the /dev/reroot/ directory,
1900d3d0cc3SEdward Tomasz Napierala  * used by reroot code in init(8) as a mountpoint for tmpfs.
1910d3d0cc3SEdward Tomasz Napierala  */
1920d3d0cc3SEdward Tomasz Napierala static void
1930d3d0cc3SEdward Tomasz Napierala reroot_conf(void *unused)
1940d3d0cc3SEdward Tomasz Napierala {
1950d3d0cc3SEdward Tomasz Napierala 	int error;
1960d3d0cc3SEdward Tomasz Napierala 	struct cdev *cdev;
1970d3d0cc3SEdward Tomasz Napierala 
1980d3d0cc3SEdward Tomasz Napierala 	error = make_dev_p(MAKEDEV_CHECKNAME | MAKEDEV_WAITOK, &cdev,
1990d3d0cc3SEdward Tomasz Napierala 	    &reroot_cdevsw, NULL, UID_ROOT, GID_WHEEL, 0600, "reroot/reroot");
2000d3d0cc3SEdward Tomasz Napierala 	if (error != 0) {
2010d3d0cc3SEdward Tomasz Napierala 		printf("%s: failed to create device node, error %d",
2020d3d0cc3SEdward Tomasz Napierala 		    __func__, error);
2030d3d0cc3SEdward Tomasz Napierala 	}
2040d3d0cc3SEdward Tomasz Napierala }
2050d3d0cc3SEdward Tomasz Napierala 
2060d3d0cc3SEdward Tomasz Napierala SYSINIT(reroot_conf, SI_SUB_DEVFS, SI_ORDER_ANY, reroot_conf, NULL);
2070d3d0cc3SEdward Tomasz Napierala 
2080d3d0cc3SEdward Tomasz Napierala /*
2090c14ff0eSRobert Watson  * The system call that results in a reboot.
210ad4240feSJulian Elischer  */
211835a82eeSMatthew Dillon /* ARGSUSED */
212ad4240feSJulian Elischer int
2138451d0ddSKip Macy sys_reboot(struct thread *td, struct reboot_args *uap)
214ad4240feSJulian Elischer {
215ad4240feSJulian Elischer 	int error;
216ad4240feSJulian Elischer 
217a2ecb9b7SRobert Watson 	error = 0;
218a2ecb9b7SRobert Watson #ifdef MAC
21930d239bcSRobert Watson 	error = mac_system_check_reboot(td->td_ucred, uap->opt);
220a2ecb9b7SRobert Watson #endif
221a2ecb9b7SRobert Watson 	if (error == 0)
222acd3428bSRobert Watson 		error = priv_check(td, PRIV_REBOOT);
223a2ecb9b7SRobert Watson 	if (error == 0) {
2240d3d0cc3SEdward Tomasz Napierala 		if (uap->opt & RB_REROOT) {
2250d3d0cc3SEdward Tomasz Napierala 			error = kern_reroot();
2260d3d0cc3SEdward Tomasz Napierala 		} else {
227835a82eeSMatthew Dillon 			mtx_lock(&Giant);
22876e18b25SMarcel Moolenaar 			kern_reboot(uap->opt);
229835a82eeSMatthew Dillon 			mtx_unlock(&Giant);
230a2ecb9b7SRobert Watson 		}
2310d3d0cc3SEdward Tomasz Napierala 	}
232835a82eeSMatthew Dillon 	return (error);
233ad4240feSJulian Elischer }
234ad4240feSJulian Elischer 
235ad4240feSJulian Elischer /*
236ad4240feSJulian Elischer  * Called by events that want to shut down.. e.g  <CTL><ALT><DEL> on a PC
237ad4240feSJulian Elischer  */
238ad4240feSJulian Elischer void
2393e755f76SMike Smith shutdown_nice(int howto)
240ad4240feSJulian Elischer {
241e95499bdSAlfred Perlstein 
242ad4240feSJulian Elischer 	if (initproc != NULL) {
243912d5937SEd Schouten 		/* Send a signal to init(8) and have it shutdown the world. */
24487729a2bSJohn Baldwin 		PROC_LOCK(initproc);
245912d5937SEd Schouten 		if (howto & RB_POWEROFF)
246912d5937SEd Schouten 			kern_psignal(initproc, SIGUSR2);
247912d5937SEd Schouten 		else if (howto & RB_HALT)
248912d5937SEd Schouten 			kern_psignal(initproc, SIGUSR1);
249912d5937SEd Schouten 		else
2508451d0ddSKip Macy 			kern_psignal(initproc, SIGINT);
25187729a2bSJohn Baldwin 		PROC_UNLOCK(initproc);
252ad4240feSJulian Elischer 	} else {
253912d5937SEd Schouten 		/* No init(8) running, so simply reboot. */
2548f5b107bSEd Schouten 		kern_reboot(howto | RB_NOSYNC);
255ad4240feSJulian Elischer 	}
256ad4240feSJulian Elischer }
257ad4240feSJulian Elischer 
25872dfe7a3SPoul-Henning Kamp static void
25982acbcf5SPeter Wemm print_uptime(void)
26072dfe7a3SPoul-Henning Kamp {
26172dfe7a3SPoul-Henning Kamp 	int f;
26272dfe7a3SPoul-Henning Kamp 	struct timespec ts;
26372dfe7a3SPoul-Henning Kamp 
26472dfe7a3SPoul-Henning Kamp 	getnanouptime(&ts);
26572dfe7a3SPoul-Henning Kamp 	printf("Uptime: ");
26672dfe7a3SPoul-Henning Kamp 	f = 0;
26772dfe7a3SPoul-Henning Kamp 	if (ts.tv_sec >= 86400) {
2684a6404dfSJohn Baldwin 		printf("%ldd", (long)ts.tv_sec / 86400);
26972dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 86400;
27072dfe7a3SPoul-Henning Kamp 		f = 1;
27172dfe7a3SPoul-Henning Kamp 	}
27272dfe7a3SPoul-Henning Kamp 	if (f || ts.tv_sec >= 3600) {
2734a6404dfSJohn Baldwin 		printf("%ldh", (long)ts.tv_sec / 3600);
27472dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 3600;
27572dfe7a3SPoul-Henning Kamp 		f = 1;
27672dfe7a3SPoul-Henning Kamp 	}
27772dfe7a3SPoul-Henning Kamp 	if (f || ts.tv_sec >= 60) {
2784a6404dfSJohn Baldwin 		printf("%ldm", (long)ts.tv_sec / 60);
27972dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 60;
28072dfe7a3SPoul-Henning Kamp 		f = 1;
28172dfe7a3SPoul-Henning Kamp 	}
2824a6404dfSJohn Baldwin 	printf("%lds\n", (long)ts.tv_sec);
28372dfe7a3SPoul-Henning Kamp }
28472dfe7a3SPoul-Henning Kamp 
285299cceefSMarcel Moolenaar int
286299cceefSMarcel Moolenaar doadump(boolean_t textdump)
287d39e457bSPoul-Henning Kamp {
288299cceefSMarcel Moolenaar 	boolean_t coredump;
289f6b4f5caSGavin Atkinson 	int error;
290e95499bdSAlfred Perlstein 
291f6b4f5caSGavin Atkinson 	error = 0;
292299cceefSMarcel Moolenaar 	if (dumping)
293299cceefSMarcel Moolenaar 		return (EBUSY);
294299cceefSMarcel Moolenaar 	if (dumper.dumper == NULL)
295299cceefSMarcel Moolenaar 		return (ENXIO);
296f6449d9dSJulian Elischer 
297d39e457bSPoul-Henning Kamp 	savectx(&dumppcb);
2982d50560aSMarcel Moolenaar 	dumptid = curthread->td_tid;
299d39e457bSPoul-Henning Kamp 	dumping++;
300299cceefSMarcel Moolenaar 
301299cceefSMarcel Moolenaar 	coredump = TRUE;
302618c7db3SRobert Watson #ifdef DDB
303299cceefSMarcel Moolenaar 	if (textdump && textdump_pending) {
304299cceefSMarcel Moolenaar 		coredump = FALSE;
305618c7db3SRobert Watson 		textdump_dumpsys(&dumper);
306299cceefSMarcel Moolenaar 	}
307618c7db3SRobert Watson #endif
308299cceefSMarcel Moolenaar 	if (coredump)
309f6b4f5caSGavin Atkinson 		error = dumpsys(&dumper);
310299cceefSMarcel Moolenaar 
3119e473363SRuslan Ermilov 	dumping--;
312f6b4f5caSGavin Atkinson 	return (error);
313d39e457bSPoul-Henning Kamp }
314d39e457bSPoul-Henning Kamp 
315ad4240feSJulian Elischer /*
31670ce93f4SNate Lawson  * Shutdown the system cleanly to prepare for reboot, halt, or power off.
317ad4240feSJulian Elischer  */
31876e18b25SMarcel Moolenaar void
31976e18b25SMarcel Moolenaar kern_reboot(int howto)
320ad4240feSJulian Elischer {
32198082691SJeff Roberson 	static int once = 0;
322ad4240feSJulian Elischer 
323f7ebc7ceSMarcel Moolenaar #if defined(SMP)
32470ce93f4SNate Lawson 	/*
32570ce93f4SNate Lawson 	 * Bind us to CPU 0 so that all shutdown code runs there.  Some
32670ce93f4SNate Lawson 	 * systems don't shutdown properly (i.e., ACPI power off) if we
32770ce93f4SNate Lawson 	 * run on another processor.
32870ce93f4SNate Lawson 	 */
32935370593SAndriy Gapon 	if (!SCHEDULER_STOPPED()) {
330982d11f8SJeff Roberson 		thread_lock(curthread);
33120e25d7dSPeter Wemm 		sched_bind(curthread, 0);
332982d11f8SJeff Roberson 		thread_unlock(curthread);
33335370593SAndriy Gapon 		KASSERT(PCPU_GET(cpuid) == 0, ("boot: not running on cpu 0"));
33435370593SAndriy Gapon 	}
33520e25d7dSPeter Wemm #endif
33636a52c3cSJeff Roberson 	/* We're in the process of rebooting. */
33736a52c3cSJeff Roberson 	rebooting = 1;
33820e25d7dSPeter Wemm 
33961e96500SJohn Baldwin 	/* We are out of the debugger now. */
3402d50560aSMarcel Moolenaar 	kdb_active = 0;
34161e96500SJohn Baldwin 
3425230cfd2SJulian Elischer 	/*
3435230cfd2SJulian Elischer 	 * Do any callouts that should be done BEFORE syncing the filesystems.
3445230cfd2SJulian Elischer 	 */
345fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_pre_sync, howto);
3465230cfd2SJulian Elischer 
3475230cfd2SJulian Elischer 	/*
3485230cfd2SJulian Elischer 	 * Now sync filesystems
3495230cfd2SJulian Elischer 	 */
35098082691SJeff Roberson 	if (!cold && (howto & RB_NOSYNC) == 0 && once == 0) {
35198082691SJeff Roberson 		once = 1;
35298082691SJeff Roberson 		bufshutdown(show_busybufs);
353ad4240feSJulian Elischer 	}
3545230cfd2SJulian Elischer 
35572dfe7a3SPoul-Henning Kamp 	print_uptime();
35672dfe7a3SPoul-Henning Kamp 
357bf8696b4SAndriy Gapon 	cngrab();
358bf8696b4SAndriy Gapon 
3595230cfd2SJulian Elischer 	/*
3605230cfd2SJulian Elischer 	 * Ok, now do things that assume all filesystem activity has
3615230cfd2SJulian Elischer 	 * been completed.
3625230cfd2SJulian Elischer 	 */
363fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_post_sync, howto);
36470ce93f4SNate Lawson 
365f6449d9dSJulian Elischer 	if ((howto & (RB_HALT|RB_DUMP)) == RB_DUMP && !cold && !dumping)
366299cceefSMarcel Moolenaar 		doadump(TRUE);
3672cfa0a03SJustin T. Gibbs 
3682cfa0a03SJustin T. Gibbs 	/* Now that we're going to really halt the system... */
369fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_final, howto);
3702cfa0a03SJustin T. Gibbs 
371fcb893a8SMike Smith 	for(;;) ;	/* safety against shutdown_reset not working */
372fcb893a8SMike Smith 	/* NOTREACHED */
373fcb893a8SMike Smith }
374fcb893a8SMike Smith 
375fcb893a8SMike Smith /*
3760d3d0cc3SEdward Tomasz Napierala  * The system call that results in changing the rootfs.
3770d3d0cc3SEdward Tomasz Napierala  */
3780d3d0cc3SEdward Tomasz Napierala static int
3790d3d0cc3SEdward Tomasz Napierala kern_reroot(void)
3800d3d0cc3SEdward Tomasz Napierala {
3810d3d0cc3SEdward Tomasz Napierala 	struct vnode *oldrootvnode, *vp;
3820d3d0cc3SEdward Tomasz Napierala 	struct mount *mp, *devmp;
3830d3d0cc3SEdward Tomasz Napierala 	int error;
3840d3d0cc3SEdward Tomasz Napierala 
3850d3d0cc3SEdward Tomasz Napierala 	if (curproc != initproc)
3860d3d0cc3SEdward Tomasz Napierala 		return (EPERM);
3870d3d0cc3SEdward Tomasz Napierala 
3880d3d0cc3SEdward Tomasz Napierala 	/*
3890d3d0cc3SEdward Tomasz Napierala 	 * Mark the filesystem containing currently-running executable
3900d3d0cc3SEdward Tomasz Napierala 	 * (the temporary copy of init(8)) busy.
3910d3d0cc3SEdward Tomasz Napierala 	 */
3920d3d0cc3SEdward Tomasz Napierala 	vp = curproc->p_textvp;
3930d3d0cc3SEdward Tomasz Napierala 	error = vn_lock(vp, LK_SHARED);
3940d3d0cc3SEdward Tomasz Napierala 	if (error != 0)
3950d3d0cc3SEdward Tomasz Napierala 		return (error);
3960d3d0cc3SEdward Tomasz Napierala 	mp = vp->v_mount;
3970d3d0cc3SEdward Tomasz Napierala 	error = vfs_busy(mp, MBF_NOWAIT);
3980d3d0cc3SEdward Tomasz Napierala 	if (error != 0) {
3990d3d0cc3SEdward Tomasz Napierala 		vfs_ref(mp);
4000d3d0cc3SEdward Tomasz Napierala 		VOP_UNLOCK(vp, 0);
4010d3d0cc3SEdward Tomasz Napierala 		error = vfs_busy(mp, 0);
4020d3d0cc3SEdward Tomasz Napierala 		vn_lock(vp, LK_SHARED | LK_RETRY);
4030d3d0cc3SEdward Tomasz Napierala 		vfs_rel(mp);
4040d3d0cc3SEdward Tomasz Napierala 		if (error != 0) {
4050d3d0cc3SEdward Tomasz Napierala 			VOP_UNLOCK(vp, 0);
4060d3d0cc3SEdward Tomasz Napierala 			return (ENOENT);
4070d3d0cc3SEdward Tomasz Napierala 		}
4080d3d0cc3SEdward Tomasz Napierala 		if (vp->v_iflag & VI_DOOMED) {
4090d3d0cc3SEdward Tomasz Napierala 			VOP_UNLOCK(vp, 0);
4100d3d0cc3SEdward Tomasz Napierala 			vfs_unbusy(mp);
4110d3d0cc3SEdward Tomasz Napierala 			return (ENOENT);
4120d3d0cc3SEdward Tomasz Napierala 		}
4130d3d0cc3SEdward Tomasz Napierala 	}
4140d3d0cc3SEdward Tomasz Napierala 	VOP_UNLOCK(vp, 0);
4150d3d0cc3SEdward Tomasz Napierala 
4160d3d0cc3SEdward Tomasz Napierala 	/*
4170d3d0cc3SEdward Tomasz Napierala 	 * Remove the filesystem containing currently-running executable
4180d3d0cc3SEdward Tomasz Napierala 	 * from the mount list, to prevent it from being unmounted
4190d3d0cc3SEdward Tomasz Napierala 	 * by vfs_unmountall(), and to avoid confusing vfs_mountroot().
4200d3d0cc3SEdward Tomasz Napierala 	 *
4210d3d0cc3SEdward Tomasz Napierala 	 * Also preserve /dev - forcibly unmounting it could cause driver
4220d3d0cc3SEdward Tomasz Napierala 	 * reinitialization.
4230d3d0cc3SEdward Tomasz Napierala 	 */
4240d3d0cc3SEdward Tomasz Napierala 
4250d3d0cc3SEdward Tomasz Napierala 	vfs_ref(rootdevmp);
4260d3d0cc3SEdward Tomasz Napierala 	devmp = rootdevmp;
4270d3d0cc3SEdward Tomasz Napierala 	rootdevmp = NULL;
4280d3d0cc3SEdward Tomasz Napierala 
4290d3d0cc3SEdward Tomasz Napierala 	mtx_lock(&mountlist_mtx);
4300d3d0cc3SEdward Tomasz Napierala 	TAILQ_REMOVE(&mountlist, mp, mnt_list);
4310d3d0cc3SEdward Tomasz Napierala 	TAILQ_REMOVE(&mountlist, devmp, mnt_list);
4320d3d0cc3SEdward Tomasz Napierala 	mtx_unlock(&mountlist_mtx);
4330d3d0cc3SEdward Tomasz Napierala 
4340d3d0cc3SEdward Tomasz Napierala 	oldrootvnode = rootvnode;
4350d3d0cc3SEdward Tomasz Napierala 
4360d3d0cc3SEdward Tomasz Napierala 	/*
4370d3d0cc3SEdward Tomasz Napierala 	 * Unmount everything except for the two filesystems preserved above.
4380d3d0cc3SEdward Tomasz Napierala 	 */
4390d3d0cc3SEdward Tomasz Napierala 	vfs_unmountall();
4400d3d0cc3SEdward Tomasz Napierala 
4410d3d0cc3SEdward Tomasz Napierala 	/*
4420d3d0cc3SEdward Tomasz Napierala 	 * Add /dev back; vfs_mountroot() will move it into its new place.
4430d3d0cc3SEdward Tomasz Napierala 	 */
4440d3d0cc3SEdward Tomasz Napierala 	mtx_lock(&mountlist_mtx);
4450d3d0cc3SEdward Tomasz Napierala 	TAILQ_INSERT_HEAD(&mountlist, devmp, mnt_list);
4460d3d0cc3SEdward Tomasz Napierala 	mtx_unlock(&mountlist_mtx);
4470d3d0cc3SEdward Tomasz Napierala 	rootdevmp = devmp;
4480d3d0cc3SEdward Tomasz Napierala 	vfs_rel(rootdevmp);
4490d3d0cc3SEdward Tomasz Napierala 
4500d3d0cc3SEdward Tomasz Napierala 	/*
4510d3d0cc3SEdward Tomasz Napierala 	 * Mount the new rootfs.
4520d3d0cc3SEdward Tomasz Napierala 	 */
4530d3d0cc3SEdward Tomasz Napierala 	vfs_mountroot();
4540d3d0cc3SEdward Tomasz Napierala 
4550d3d0cc3SEdward Tomasz Napierala 	/*
4560d3d0cc3SEdward Tomasz Napierala 	 * Update all references to the old rootvnode.
4570d3d0cc3SEdward Tomasz Napierala 	 */
4580d3d0cc3SEdward Tomasz Napierala 	mountcheckdirs(oldrootvnode, rootvnode);
4590d3d0cc3SEdward Tomasz Napierala 
4600d3d0cc3SEdward Tomasz Napierala 	/*
4610d3d0cc3SEdward Tomasz Napierala 	 * Add the temporary filesystem back and unbusy it.
4620d3d0cc3SEdward Tomasz Napierala 	 */
4630d3d0cc3SEdward Tomasz Napierala 	mtx_lock(&mountlist_mtx);
4640d3d0cc3SEdward Tomasz Napierala 	TAILQ_INSERT_TAIL(&mountlist, mp, mnt_list);
4650d3d0cc3SEdward Tomasz Napierala 	mtx_unlock(&mountlist_mtx);
4660d3d0cc3SEdward Tomasz Napierala 	vfs_unbusy(mp);
4670d3d0cc3SEdward Tomasz Napierala 
4680d3d0cc3SEdward Tomasz Napierala 	return (0);
4690d3d0cc3SEdward Tomasz Napierala }
4700d3d0cc3SEdward Tomasz Napierala 
4710d3d0cc3SEdward Tomasz Napierala /*
472fcb893a8SMike Smith  * If the shutdown was a clean halt, behave accordingly.
473fcb893a8SMike Smith  */
474fcb893a8SMike Smith static void
475fcb893a8SMike Smith shutdown_halt(void *junk, int howto)
476fcb893a8SMike Smith {
477e95499bdSAlfred Perlstein 
478ad4240feSJulian Elischer 	if (howto & RB_HALT) {
479ad4240feSJulian Elischer 		printf("\n");
480ad4240feSJulian Elischer 		printf("The operating system has halted.\n");
481ad4240feSJulian Elischer 		printf("Please press any key to reboot.\n\n");
482d13d3630SJulian Elischer 		switch (cngetc()) {
483d13d3630SJulian Elischer 		case -1:		/* No console, just die */
484d13d3630SJulian Elischer 			cpu_halt();
485d13d3630SJulian Elischer 			/* NOTREACHED */
486d13d3630SJulian Elischer 		default:
4872cfa0a03SJustin T. Gibbs 			howto &= ~RB_HALT;
488d13d3630SJulian Elischer 			break;
489d13d3630SJulian Elischer 		}
490fcb893a8SMike Smith 	}
491fcb893a8SMike Smith }
492ad4240feSJulian Elischer 
493fcb893a8SMike Smith /*
494fcb893a8SMike Smith  * Check to see if the system paniced, pause and then reboot
495fcb893a8SMike Smith  * according to the specified delay.
496fcb893a8SMike Smith  */
497fcb893a8SMike Smith static void
498fcb893a8SMike Smith shutdown_panic(void *junk, int howto)
499fcb893a8SMike Smith {
500fcb893a8SMike Smith 	int loop;
501fcb893a8SMike Smith 
502fcb893a8SMike Smith 	if (howto & RB_DUMP) {
5031cdbb9edSColin Percival 		if (panic_reboot_wait_time != 0) {
5041cdbb9edSColin Percival 			if (panic_reboot_wait_time != -1) {
5052cfa0a03SJustin T. Gibbs 				printf("Automatic reboot in %d seconds - "
5062cfa0a03SJustin T. Gibbs 				       "press a key on the console to abort\n",
5071cdbb9edSColin Percival 					panic_reboot_wait_time);
5081cdbb9edSColin Percival 				for (loop = panic_reboot_wait_time * 10;
5092cfa0a03SJustin T. Gibbs 				     loop > 0; --loop) {
510ad4240feSJulian Elischer 					DELAY(1000 * 100); /* 1/10th second */
511a7f8f2abSBruce Evans 					/* Did user type a key? */
512a7f8f2abSBruce Evans 					if (cncheckc() != -1)
513ad4240feSJulian Elischer 						break;
514ad4240feSJulian Elischer 				}
515ad4240feSJulian Elischer 				if (!loop)
516fcb893a8SMike Smith 					return;
517ad4240feSJulian Elischer 			}
518ad4240feSJulian Elischer 		} else { /* zero time specified - reboot NOW */
519fcb893a8SMike Smith 			return;
520ad4240feSJulian Elischer 		}
521422702e9SNik Clayton 		printf("--> Press a key on the console to reboot,\n");
522422702e9SNik Clayton 		printf("--> or switch off the system now.\n");
523ad4240feSJulian Elischer 		cngetc();
524ad4240feSJulian Elischer 	}
525fcb893a8SMike Smith }
526fcb893a8SMike Smith 
/*
 * shutdown_final handler that performs the actual reset once everything
 * else has been done.
 */
static void
shutdown_reset(void *junk, int howto)
{

	printf("Rebooting...\n");
	/* Wait 1 sec for the printf's to complete and be read. */
	DELAY(1000000);

	/*
	 * Taking smp_ipi_mtx at this point serves two purposes:
	 * - interrupts are disabled, so CPU0 cannot be preempted by fast
	 *   handlers (which would deadlock against the other CPUs);
	 * - it avoids deadlocks against smp_rendezvous() or, more
	 *   generally, against threads that busy-wait with this spinlock
	 *   held for responses from threads on other CPUs
	 *   (ie. smp_tlb_shootdown()).
	 *
	 * Only the first of the two matters in the !SMP case.
	 */
#ifndef SMP
	spinlock_enter();
#else
	mtx_lock_spin(&smp_ipi_mtx);
#endif

	cpu_reset();
	/* NOTREACHED */ /* assuming reset worked */
}
558ad4240feSJulian Elischer 
5596b6bd3b7SAlfred Perlstein #if defined(WITNESS) || defined(INVARIANTS)
5603945a964SAlfred Perlstein static int kassert_warn_only = 0;
561a94053baSAlfred Perlstein #ifdef KDB
562a94053baSAlfred Perlstein static int kassert_do_kdb = 0;
563a94053baSAlfred Perlstein #endif
5643945a964SAlfred Perlstein #ifdef KTR
5653945a964SAlfred Perlstein static int kassert_do_ktr = 0;
5663945a964SAlfred Perlstein #endif
5673945a964SAlfred Perlstein static int kassert_do_log = 1;
5683945a964SAlfred Perlstein static int kassert_log_pps_limit = 4;
5693945a964SAlfred Perlstein static int kassert_log_mute_at = 0;
5703945a964SAlfred Perlstein static int kassert_log_panic_at = 0;
5713945a964SAlfred Perlstein static int kassert_warnings = 0;
5723945a964SAlfred Perlstein 
5733945a964SAlfred Perlstein SYSCTL_NODE(_debug, OID_AUTO, kassert, CTLFLAG_RW, NULL, "kassert options");
5743945a964SAlfred Perlstein 
575af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, warn_only, CTLFLAG_RWTUN,
5763945a964SAlfred Perlstein     &kassert_warn_only, 0,
5773945a964SAlfred Perlstein     "KASSERT triggers a panic (1) or just a warning (0)");
5783945a964SAlfred Perlstein 
579a94053baSAlfred Perlstein #ifdef KDB
580af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, do_kdb, CTLFLAG_RWTUN,
581a94053baSAlfred Perlstein     &kassert_do_kdb, 0, "KASSERT will enter the debugger");
582a94053baSAlfred Perlstein #endif
583a94053baSAlfred Perlstein 
5843945a964SAlfred Perlstein #ifdef KTR
585af3b2549SHans Petter Selasky SYSCTL_UINT(_debug_kassert, OID_AUTO, do_ktr, CTLFLAG_RWTUN,
5863945a964SAlfred Perlstein     &kassert_do_ktr, 0,
5873945a964SAlfred Perlstein     "KASSERT does a KTR, set this to the KTRMASK you want");
5883945a964SAlfred Perlstein #endif
5893945a964SAlfred Perlstein 
590af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, do_log, CTLFLAG_RWTUN,
5913945a964SAlfred Perlstein     &kassert_do_log, 0, "KASSERT triggers a panic (1) or just a warning (0)");
5923945a964SAlfred Perlstein 
593af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, warnings, CTLFLAG_RWTUN,
5943945a964SAlfred Perlstein     &kassert_warnings, 0, "number of KASSERTs that have been triggered");
5953945a964SAlfred Perlstein 
596af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, log_panic_at, CTLFLAG_RWTUN,
5973945a964SAlfred Perlstein     &kassert_log_panic_at, 0, "max number of KASSERTS before we will panic");
5983945a964SAlfred Perlstein 
599af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, log_pps_limit, CTLFLAG_RWTUN,
6003945a964SAlfred Perlstein     &kassert_log_pps_limit, 0, "limit number of log messages per second");
6013945a964SAlfred Perlstein 
602af3b2549SHans Petter Selasky SYSCTL_INT(_debug_kassert, OID_AUTO, log_mute_at, CTLFLAG_RWTUN,
6033945a964SAlfred Perlstein     &kassert_log_mute_at, 0, "max number of KASSERTS to log");
6043945a964SAlfred Perlstein 
6053945a964SAlfred Perlstein static int kassert_sysctl_kassert(SYSCTL_HANDLER_ARGS);
6063945a964SAlfred Perlstein 
6073945a964SAlfred Perlstein SYSCTL_PROC(_debug_kassert, OID_AUTO, kassert,
6083945a964SAlfred Perlstein     CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_SECURE, NULL, 0,
6093945a964SAlfred Perlstein     kassert_sysctl_kassert, "I", "set to trigger a test kassert");
6103945a964SAlfred Perlstein 
6113945a964SAlfred Perlstein static int
6123945a964SAlfred Perlstein kassert_sysctl_kassert(SYSCTL_HANDLER_ARGS)
6133945a964SAlfred Perlstein {
6143945a964SAlfred Perlstein 	int error, i;
6153945a964SAlfred Perlstein 
6163945a964SAlfred Perlstein 	error = sysctl_wire_old_buffer(req, sizeof(int));
6173945a964SAlfred Perlstein 	if (error == 0) {
6183945a964SAlfred Perlstein 		i = 0;
6193945a964SAlfred Perlstein 		error = sysctl_handle_int(oidp, &i, 0, req);
6203945a964SAlfred Perlstein 	}
6213945a964SAlfred Perlstein 	if (error != 0 || req->newptr == NULL)
6223945a964SAlfred Perlstein 		return (error);
6233945a964SAlfred Perlstein 	KASSERT(0, ("kassert_sysctl_kassert triggered kassert %d", i));
6243945a964SAlfred Perlstein 	return (0);
6253945a964SAlfred Perlstein }
6263945a964SAlfred Perlstein 
6273945a964SAlfred Perlstein /*
6283945a964SAlfred Perlstein  * Called by KASSERT, this decides if we will panic
6293945a964SAlfred Perlstein  * or if we will log via printf and/or ktr.
6303945a964SAlfred Perlstein  */
6313945a964SAlfred Perlstein void
6323945a964SAlfred Perlstein kassert_panic(const char *fmt, ...)
6333945a964SAlfred Perlstein {
6343945a964SAlfred Perlstein 	static char buf[256];
6353945a964SAlfred Perlstein 	va_list ap;
6363945a964SAlfred Perlstein 
6373945a964SAlfred Perlstein 	va_start(ap, fmt);
6383945a964SAlfred Perlstein 	(void)vsnprintf(buf, sizeof(buf), fmt, ap);
6393945a964SAlfred Perlstein 	va_end(ap);
6403945a964SAlfred Perlstein 
6413945a964SAlfred Perlstein 	/*
6423945a964SAlfred Perlstein 	 * panic if we're not just warning, or if we've exceeded
6433945a964SAlfred Perlstein 	 * kassert_log_panic_at warnings.
6443945a964SAlfred Perlstein 	 */
6453945a964SAlfred Perlstein 	if (!kassert_warn_only ||
6463945a964SAlfred Perlstein 	    (kassert_log_panic_at > 0 &&
6473945a964SAlfred Perlstein 	     kassert_warnings >= kassert_log_panic_at)) {
6483945a964SAlfred Perlstein 		va_start(ap, fmt);
6493945a964SAlfred Perlstein 		vpanic(fmt, ap);
6503945a964SAlfred Perlstein 		/* NORETURN */
6513945a964SAlfred Perlstein 	}
6523945a964SAlfred Perlstein #ifdef KTR
6533945a964SAlfred Perlstein 	if (kassert_do_ktr)
6543945a964SAlfred Perlstein 		CTR0(ktr_mask, buf);
6553945a964SAlfred Perlstein #endif /* KTR */
6563945a964SAlfred Perlstein 	/*
6573945a964SAlfred Perlstein 	 * log if we've not yet met the mute limit.
6583945a964SAlfred Perlstein 	 */
6593945a964SAlfred Perlstein 	if (kassert_do_log &&
6603945a964SAlfred Perlstein 	    (kassert_log_mute_at == 0 ||
6613945a964SAlfred Perlstein 	     kassert_warnings < kassert_log_mute_at)) {
6623945a964SAlfred Perlstein 		static  struct timeval lasterr;
6633945a964SAlfred Perlstein 		static  int curerr;
6643945a964SAlfred Perlstein 
6653945a964SAlfred Perlstein 		if (ppsratecheck(&lasterr, &curerr, kassert_log_pps_limit)) {
6663945a964SAlfred Perlstein 			printf("KASSERT failed: %s\n", buf);
6673945a964SAlfred Perlstein 			kdb_backtrace();
6683945a964SAlfred Perlstein 		}
6693945a964SAlfred Perlstein 	}
670a94053baSAlfred Perlstein #ifdef KDB
671a94053baSAlfred Perlstein 	if (kassert_do_kdb) {
672a94053baSAlfred Perlstein 		kdb_enter(KDB_WHY_KASSERT, buf);
673a94053baSAlfred Perlstein 	}
674a94053baSAlfred Perlstein #endif
6753945a964SAlfred Perlstein 	atomic_add_int(&kassert_warnings, 1);
6763945a964SAlfred Perlstein }
6773945a964SAlfred Perlstein #endif
6783945a964SAlfred Perlstein 
/*
 * Entry point for unrecoverable errors: prints "panic: <message>" and then
 * reboots.  This is only the variadic front end; it packages its arguments
 * and hands them to vpanic(), which does the work and does not come back
 * here.  On a repeated panic the disk sync is skipped, because syncing
 * tends to trigger yet another panic.
 */
void
panic(const char *fmt, ...)
{
	va_list args;

	va_start(args, fmt);
	vpanic(fmt, args);
}
6923945a964SAlfred Perlstein 
693da10a603SMark Johnston void
6943945a964SAlfred Perlstein vpanic(const char *fmt, va_list ap)
6953945a964SAlfred Perlstein {
69664dd590eSAndriy Gapon #ifdef SMP
69735370593SAndriy Gapon 	cpuset_t other_cpus;
69864dd590eSAndriy Gapon #endif
699fe799533SAndrew Gallatin 	struct thread *td = curthread;
700e485b64bSJohn Baldwin 	int bootopt, newpanic;
70199237364SAndrey A. Chernov 	static char buf[256];
702ad4240feSJulian Elischer 
70335370593SAndriy Gapon 	spinlock_enter();
70435370593SAndriy Gapon 
7050384fff8SJason Evans #ifdef SMP
7061a5333c3SJohn Baldwin 	/*
7076898bee9SAndriy Gapon 	 * stop_cpus_hard(other_cpus) should prevent multiple CPUs from
7086898bee9SAndriy Gapon 	 * concurrently entering panic.  Only the winner will proceed
7096898bee9SAndriy Gapon 	 * further.
7101a5333c3SJohn Baldwin 	 */
71135370593SAndriy Gapon 	if (panicstr == NULL && !kdb_active) {
71235370593SAndriy Gapon 		other_cpus = all_cpus;
71335370593SAndriy Gapon 		CPU_CLR(PCPU_GET(cpuid), &other_cpus);
71435370593SAndriy Gapon 		stop_cpus_hard(other_cpus);
71535370593SAndriy Gapon 	}
71635370593SAndriy Gapon 
71735370593SAndriy Gapon 	/*
7189ad64f27SMark Johnston 	 * Ensure that the scheduler is stopped while panicking, even if panic
7199ad64f27SMark Johnston 	 * has been entered from kdb.
72035370593SAndriy Gapon 	 */
7215d7380f8SAttilio Rao 	td->td_stopsched = 1;
7220384fff8SJason Evans #endif
7230384fff8SJason Evans 
724e3adb685SAttilio Rao 	bootopt = RB_AUTOBOOT;
725e485b64bSJohn Baldwin 	newpanic = 0;
726ad4240feSJulian Elischer 	if (panicstr)
727ad4240feSJulian Elischer 		bootopt |= RB_NOSYNC;
728e485b64bSJohn Baldwin 	else {
729e3adb685SAttilio Rao 		bootopt |= RB_DUMP;
730ad4240feSJulian Elischer 		panicstr = fmt;
731e485b64bSJohn Baldwin 		newpanic = 1;
732e485b64bSJohn Baldwin 	}
733ad4240feSJulian Elischer 
7344f1b4577SIan Dowse 	if (newpanic) {
7352127f260SArchie Cobbs 		(void)vsnprintf(buf, sizeof(buf), fmt, ap);
73699237364SAndrey A. Chernov 		panicstr = buf;
737bf8696b4SAndriy Gapon 		cngrab();
7389a6dc4b6SPoul-Henning Kamp 		printf("panic: %s\n", buf);
7394f1b4577SIan Dowse 	} else {
7404f1b4577SIan Dowse 		printf("panic: ");
7414f1b4577SIan Dowse 		vprintf(fmt, ap);
7429a6dc4b6SPoul-Henning Kamp 		printf("\n");
7434f1b4577SIan Dowse 	}
74447d81897SSteve Passe #ifdef SMP
74555c45354SJohn Baldwin 	printf("cpuid = %d\n", PCPU_GET(cpuid));
7462bcc63c5SJohn Baldwin #endif
747ad4240feSJulian Elischer 
7482d50560aSMarcel Moolenaar #ifdef KDB
749e485b64bSJohn Baldwin 	if (newpanic && trace_on_panic)
7502d50560aSMarcel Moolenaar 		kdb_backtrace();
751ad4240feSJulian Elischer 	if (debugger_on_panic)
7523de213ccSRobert Watson 		kdb_enter(KDB_WHY_PANIC, "panic");
7531432aa0cSJohn Baldwin #endif
754982d11f8SJeff Roberson 	/*thread_lock(td); */
755fe799533SAndrew Gallatin 	td->td_flags |= TDF_INPANIC;
756982d11f8SJeff Roberson 	/* thread_unlock(td); */
757259ed917SPeter Wemm 	if (!sync_on_panic)
758259ed917SPeter Wemm 		bootopt |= RB_NOSYNC;
75976e18b25SMarcel Moolenaar 	kern_reboot(bootopt);
760ad4240feSJulian Elischer }
761ad4240feSJulian Elischer 
762e0d898b4SJulian Elischer /*
763db82a982SMike Smith  * Support for poweroff delay.
764b22692bdSNick Hibma  *
765b22692bdSNick Hibma  * Please note that setting this delay too short might power off your machine
766b22692bdSNick Hibma  * before the write cache on your hard disk has been flushed, leading to
767b22692bdSNick Hibma  * soft-updates inconsistencies.
768db82a982SMike Smith  */
7699eec6969SMike Smith #ifndef POWEROFF_DELAY
7709eec6969SMike Smith # define POWEROFF_DELAY 5000
7719eec6969SMike Smith #endif
7729eec6969SMike Smith static int poweroff_delay = POWEROFF_DELAY;
7739eec6969SMike Smith 
774db82a982SMike Smith SYSCTL_INT(_kern_shutdown, OID_AUTO, poweroff_delay, CTLFLAG_RW,
7753eb9ab52SEitan Adler     &poweroff_delay, 0, "Delay before poweroff to write disk caches (msec)");
776db82a982SMike Smith 
777fcb893a8SMike Smith static void
778fcb893a8SMike Smith poweroff_wait(void *junk, int howto)
779db82a982SMike Smith {
780e95499bdSAlfred Perlstein 
781db82a982SMike Smith 	if (!(howto & RB_POWEROFF) || poweroff_delay <= 0)
782db82a982SMike Smith 		return;
783db82a982SMike Smith 	DELAY(poweroff_delay * 1000);
784db82a982SMike Smith }
7855e950839SLuoqi Chen 
7865e950839SLuoqi Chen /*
7875e950839SLuoqi Chen  * Some system processes (e.g. syncer) need to be stopped at appropriate
7885e950839SLuoqi Chen  * points in their main loops prior to a system shutdown, so that they
7895e950839SLuoqi Chen  * won't interfere with the shutdown process (e.g. by holding a disk buf
7905e950839SLuoqi Chen  * to cause sync to fail).  For each of these system processes, register
7915e950839SLuoqi Chen  * shutdown_kproc() as a handler for one of shutdown events.
7925e950839SLuoqi Chen  */
7935e950839SLuoqi Chen static int kproc_shutdown_wait = 60;
7945e950839SLuoqi Chen SYSCTL_INT(_kern_shutdown, OID_AUTO, kproc_shutdown_wait, CTLFLAG_RW,
7953eb9ab52SEitan Adler     &kproc_shutdown_wait, 0, "Max wait time (sec) to stop for each process");
7965e950839SLuoqi Chen 
7975e950839SLuoqi Chen void
798ffc831daSJohn Baldwin kproc_shutdown(void *arg, int howto)
7995e950839SLuoqi Chen {
8005e950839SLuoqi Chen 	struct proc *p;
8015e950839SLuoqi Chen 	int error;
8025e950839SLuoqi Chen 
8035e950839SLuoqi Chen 	if (panicstr)
8045e950839SLuoqi Chen 		return;
8055e950839SLuoqi Chen 
8065e950839SLuoqi Chen 	p = (struct proc *)arg;
807b1c81391SNate Lawson 	printf("Waiting (max %d seconds) for system process `%s' to stop...",
8084f9d48e4SJohn Baldwin 	    kproc_shutdown_wait, p->p_comm);
8093745c395SJulian Elischer 	error = kproc_suspend(p, kproc_shutdown_wait * hz);
8105e950839SLuoqi Chen 
8115e950839SLuoqi Chen 	if (error == EWOULDBLOCK)
812b1c81391SNate Lawson 		printf("timed out\n");
8135e950839SLuoqi Chen 	else
814b1c81391SNate Lawson 		printf("done\n");
8155e950839SLuoqi Chen }
81681661c94SPoul-Henning Kamp 
8177ab24ea3SJulian Elischer void
8187ab24ea3SJulian Elischer kthread_shutdown(void *arg, int howto)
8197ab24ea3SJulian Elischer {
8207ab24ea3SJulian Elischer 	struct thread *td;
8217ab24ea3SJulian Elischer 	int error;
8227ab24ea3SJulian Elischer 
8237ab24ea3SJulian Elischer 	if (panicstr)
8247ab24ea3SJulian Elischer 		return;
8257ab24ea3SJulian Elischer 
8267ab24ea3SJulian Elischer 	td = (struct thread *)arg;
8277ab24ea3SJulian Elischer 	printf("Waiting (max %d seconds) for system thread `%s' to stop...",
8284f9d48e4SJohn Baldwin 	    kproc_shutdown_wait, td->td_name);
8297ab24ea3SJulian Elischer 	error = kthread_suspend(td, kproc_shutdown_wait * hz);
8307ab24ea3SJulian Elischer 
8317ab24ea3SJulian Elischer 	if (error == EWOULDBLOCK)
8327ab24ea3SJulian Elischer 		printf("timed out\n");
8337ab24ea3SJulian Elischer 	else
8347ab24ea3SJulian Elischer 		printf("done\n");
8357ab24ea3SJulian Elischer }
8367ab24ea3SJulian Elischer 
837bad7e7f3SAlfred Perlstein static char dumpdevname[sizeof(((struct cdev*)NULL)->si_name)];
838bad7e7f3SAlfred Perlstein SYSCTL_STRING(_kern_shutdown, OID_AUTO, dumpdevname, CTLFLAG_RD,
839bad7e7f3SAlfred Perlstein     dumpdevname, 0, "Device for kernel dumps");
840bad7e7f3SAlfred Perlstein 
84181661c94SPoul-Henning Kamp /* Registration of dumpers */
84281661c94SPoul-Henning Kamp int
8435ebb15b9SPawel Jakub Dawidek set_dumper(struct dumperinfo *di, const char *devname, struct thread *td)
84481661c94SPoul-Henning Kamp {
8455a3a8ec0SAlfred Perlstein 	size_t wantcopy;
8465ebb15b9SPawel Jakub Dawidek 	int error;
8475ebb15b9SPawel Jakub Dawidek 
8485ebb15b9SPawel Jakub Dawidek 	error = priv_check(td, PRIV_SETDUMPER);
8495ebb15b9SPawel Jakub Dawidek 	if (error != 0)
8505ebb15b9SPawel Jakub Dawidek 		return (error);
851e95499bdSAlfred Perlstein 
85281661c94SPoul-Henning Kamp 	if (di == NULL) {
853*5dc5dab6SConrad Meyer 		if (dumper.blockbuf != NULL)
854*5dc5dab6SConrad Meyer 			free(dumper.blockbuf, M_DUMPER);
855*5dc5dab6SConrad Meyer 		bzero(&dumper, sizeof(dumper));
856bad7e7f3SAlfred Perlstein 		dumpdevname[0] = '\0';
85781661c94SPoul-Henning Kamp 		return (0);
85881661c94SPoul-Henning Kamp 	}
85981661c94SPoul-Henning Kamp 	if (dumper.dumper != NULL)
86081661c94SPoul-Henning Kamp 		return (EBUSY);
86181661c94SPoul-Henning Kamp 	dumper = *di;
8625a3a8ec0SAlfred Perlstein 	wantcopy = strlcpy(dumpdevname, devname, sizeof(dumpdevname));
8635a3a8ec0SAlfred Perlstein 	if (wantcopy >= sizeof(dumpdevname)) {
864bad7e7f3SAlfred Perlstein 		printf("set_dumper: device name truncated from '%s' -> '%s'\n",
865bad7e7f3SAlfred Perlstein 			devname, dumpdevname);
866bad7e7f3SAlfred Perlstein 	}
867*5dc5dab6SConrad Meyer 	dumper.blockbuf = malloc(di->blocksize, M_DUMPER, M_WAITOK | M_ZERO);
86881661c94SPoul-Henning Kamp 	return (0);
86981661c94SPoul-Henning Kamp }
87081661c94SPoul-Henning Kamp 
871007b1b7bSRuslan Ermilov /* Call dumper with bounds checking. */
872007b1b7bSRuslan Ermilov int
873007b1b7bSRuslan Ermilov dump_write(struct dumperinfo *di, void *virtual, vm_offset_t physical,
874007b1b7bSRuslan Ermilov     off_t offset, size_t length)
875007b1b7bSRuslan Ermilov {
876007b1b7bSRuslan Ermilov 
877007b1b7bSRuslan Ermilov 	if (length != 0 && (offset < di->mediaoffset ||
878007b1b7bSRuslan Ermilov 	    offset - di->mediaoffset + length > di->mediasize)) {
87958379067SAttilio Rao 		printf("Attempt to write outside dump device boundaries.\n"
88058379067SAttilio Rao 	    "offset(%jd), mediaoffset(%jd), length(%ju), mediasize(%jd).\n",
88158379067SAttilio Rao 		    (intmax_t)offset, (intmax_t)di->mediaoffset,
88258379067SAttilio Rao 		    (uintmax_t)length, (intmax_t)di->mediasize);
88358379067SAttilio Rao 		return (ENOSPC);
884007b1b7bSRuslan Ermilov 	}
885007b1b7bSRuslan Ermilov 	return (di->dumper(di->priv, virtual, physical, offset, length));
886007b1b7bSRuslan Ermilov }
887007b1b7bSRuslan Ermilov 
888*5dc5dab6SConrad Meyer /* Call dumper with bounds checking. */
889*5dc5dab6SConrad Meyer int
890*5dc5dab6SConrad Meyer dump_write_pad(struct dumperinfo *di, void *virtual, vm_offset_t physical,
891*5dc5dab6SConrad Meyer     off_t offset, size_t length, size_t *size)
892*5dc5dab6SConrad Meyer {
893*5dc5dab6SConrad Meyer 	char *temp;
894*5dc5dab6SConrad Meyer 	int ret;
895*5dc5dab6SConrad Meyer 
896*5dc5dab6SConrad Meyer 	if (length > di->blocksize)
897*5dc5dab6SConrad Meyer 		return (ENOMEM);
898*5dc5dab6SConrad Meyer 
899*5dc5dab6SConrad Meyer 	*size = di->blocksize;
900*5dc5dab6SConrad Meyer 	if (length == di->blocksize)
901*5dc5dab6SConrad Meyer 		temp = virtual;
902*5dc5dab6SConrad Meyer 	else {
903*5dc5dab6SConrad Meyer 		temp = di->blockbuf;
904*5dc5dab6SConrad Meyer 		memset(temp + length, 0, di->blocksize - length);
905*5dc5dab6SConrad Meyer 		memcpy(temp, virtual, length);
906*5dc5dab6SConrad Meyer 	}
907*5dc5dab6SConrad Meyer 	ret = dump_write(di, temp, physical, offset, *size);
908*5dc5dab6SConrad Meyer 
909*5dc5dab6SConrad Meyer 	return (ret);
910*5dc5dab6SConrad Meyer }
911*5dc5dab6SConrad Meyer 
912*5dc5dab6SConrad Meyer 
913e6592ee5SPeter Wemm void
914e6592ee5SPeter Wemm mkdumpheader(struct kerneldumpheader *kdh, char *magic, uint32_t archver,
915e6592ee5SPeter Wemm     uint64_t dumplen, uint32_t blksz)
916e6592ee5SPeter Wemm {
917e6592ee5SPeter Wemm 
918e6592ee5SPeter Wemm 	bzero(kdh, sizeof(*kdh));
9197a9c38e6SAlan Somers 	strlcpy(kdh->magic, magic, sizeof(kdh->magic));
9207a9c38e6SAlan Somers 	strlcpy(kdh->architecture, MACHINE_ARCH, sizeof(kdh->architecture));
921e6592ee5SPeter Wemm 	kdh->version = htod32(KERNELDUMPVERSION);
922e6592ee5SPeter Wemm 	kdh->architectureversion = htod32(archver);
923e6592ee5SPeter Wemm 	kdh->dumplength = htod64(dumplen);
924e6592ee5SPeter Wemm 	kdh->dumptime = htod64(time_second);
925e6592ee5SPeter Wemm 	kdh->blocksize = htod32(blksz);
9267a9c38e6SAlan Somers 	strlcpy(kdh->hostname, prison0.pr_hostname, sizeof(kdh->hostname));
9277a9c38e6SAlan Somers 	strlcpy(kdh->versionstring, version, sizeof(kdh->versionstring));
928e6592ee5SPeter Wemm 	if (panicstr != NULL)
9297a9c38e6SAlan Somers 		strlcpy(kdh->panicstring, panicstr, sizeof(kdh->panicstring));
930e6592ee5SPeter Wemm 	kdh->parity = kerneldump_parity(kdh);
931e6592ee5SPeter Wemm }
932