xref: /freebsd/sys/kern/kern_shutdown.c (revision 08a9c2050064cb63274f8b08943257711217ea62)
1ad4240feSJulian Elischer /*-
2ad4240feSJulian Elischer  * Copyright (c) 1986, 1988, 1991, 1993
3ad4240feSJulian Elischer  *	The Regents of the University of California.  All rights reserved.
4ad4240feSJulian Elischer  * (c) UNIX System Laboratories, Inc.
5ad4240feSJulian Elischer  * All or some portions of this file are derived from material licensed
6ad4240feSJulian Elischer  * to the University of California by American Telephone and Telegraph
7ad4240feSJulian Elischer  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
8ad4240feSJulian Elischer  * the permission of UNIX System Laboratories, Inc.
9ad4240feSJulian Elischer  *
10ad4240feSJulian Elischer  * Redistribution and use in source and binary forms, with or without
11ad4240feSJulian Elischer  * modification, are permitted provided that the following conditions
12ad4240feSJulian Elischer  * are met:
13ad4240feSJulian Elischer  * 1. Redistributions of source code must retain the above copyright
14ad4240feSJulian Elischer  *    notice, this list of conditions and the following disclaimer.
15ad4240feSJulian Elischer  * 2. Redistributions in binary form must reproduce the above copyright
16ad4240feSJulian Elischer  *    notice, this list of conditions and the following disclaimer in the
17ad4240feSJulian Elischer  *    documentation and/or other materials provided with the distribution.
18ad4240feSJulian Elischer  * 4. Neither the name of the University nor the names of its contributors
19ad4240feSJulian Elischer  *    may be used to endorse or promote products derived from this software
20ad4240feSJulian Elischer  *    without specific prior written permission.
21ad4240feSJulian Elischer  *
22ad4240feSJulian Elischer  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23ad4240feSJulian Elischer  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24ad4240feSJulian Elischer  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25ad4240feSJulian Elischer  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26ad4240feSJulian Elischer  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27ad4240feSJulian Elischer  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28ad4240feSJulian Elischer  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29ad4240feSJulian Elischer  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30ad4240feSJulian Elischer  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31ad4240feSJulian Elischer  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32ad4240feSJulian Elischer  * SUCH DAMAGE.
33ad4240feSJulian Elischer  *
34ad4240feSJulian Elischer  *	@(#)kern_shutdown.c	8.3 (Berkeley) 1/21/94
35ad4240feSJulian Elischer  */
36ad4240feSJulian Elischer 
37677b542eSDavid E. O'Brien #include <sys/cdefs.h>
38677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
39677b542eSDavid E. O'Brien 
40618c7db3SRobert Watson #include "opt_ddb.h"
412d50560aSMarcel Moolenaar #include "opt_kdb.h"
426d58e6cbSBruce Evans #include "opt_panic.h"
436d58e6cbSBruce Evans #include "opt_show_busybufs.h"
449923b511SScott Long #include "opt_sched.h"
45ad4240feSJulian Elischer 
46ad4240feSJulian Elischer #include <sys/param.h>
47ad4240feSJulian Elischer #include <sys/systm.h>
489626b608SPoul-Henning Kamp #include <sys/bio.h>
49fc8f7066SBruce Evans #include <sys/buf.h>
501d79f1bbSJohn Baldwin #include <sys/conf.h>
511d79f1bbSJohn Baldwin #include <sys/cons.h>
521d79f1bbSJohn Baldwin #include <sys/eventhandler.h>
5376ca6f88SJamie Gritton #include <sys/jail.h>
542d50560aSMarcel Moolenaar #include <sys/kdb.h>
55ad4240feSJulian Elischer #include <sys/kernel.h>
56e6592ee5SPeter Wemm #include <sys/kerneldump.h>
575e950839SLuoqi Chen #include <sys/kthread.h>
58dcd7d9b7SMaxim Sobolev #include <sys/malloc.h>
59ac0ad63fSBruce Evans #include <sys/mount.h>
60acd3428bSRobert Watson #include <sys/priv.h>
611d79f1bbSJohn Baldwin #include <sys/proc.h>
621d79f1bbSJohn Baldwin #include <sys/reboot.h>
631d79f1bbSJohn Baldwin #include <sys/resourcevar.h>
6420e25d7dSPeter Wemm #include <sys/sched.h>
65248bb937SAttilio Rao #include <sys/smp.h>
66ad4240feSJulian Elischer #include <sys/sysctl.h>
67ad4240feSJulian Elischer #include <sys/sysproto.h>
68ad4240feSJulian Elischer 
69618c7db3SRobert Watson #include <ddb/ddb.h>
70618c7db3SRobert Watson 
7126502503SMarcel Moolenaar #include <machine/cpu.h>
72d39e457bSPoul-Henning Kamp #include <machine/pcb.h>
73752dff3dSJake Burkholder #include <machine/smp.h>
74ad4240feSJulian Elischer 
75aed55708SRobert Watson #include <security/mac/mac_framework.h>
76aed55708SRobert Watson 
770909f38aSPawel Jakub Dawidek #include <vm/vm.h>
780909f38aSPawel Jakub Dawidek #include <vm/vm_object.h>
790909f38aSPawel Jakub Dawidek #include <vm/vm_page.h>
800909f38aSPawel Jakub Dawidek #include <vm/vm_pager.h>
810909f38aSPawel Jakub Dawidek #include <vm/swap_pager.h>
820909f38aSPawel Jakub Dawidek 
83ad4240feSJulian Elischer #include <sys/signalvar.h>
84ad4240feSJulian Elischer 
85ad4240feSJulian Elischer #ifndef PANIC_REBOOT_WAIT_TIME
86ad4240feSJulian Elischer #define PANIC_REBOOT_WAIT_TIME 15 /* default to 15 seconds */
87ad4240feSJulian Elischer #endif
88ad4240feSJulian Elischer 
89ad4240feSJulian Elischer /*
90ad4240feSJulian Elischer  * Note that stdarg.h and the ANSI style va_start macro is used for both
91ad4240feSJulian Elischer  * ANSI and traditional C compilers.
92ad4240feSJulian Elischer  */
93ad4240feSJulian Elischer #include <machine/stdarg.h>
94ad4240feSJulian Elischer 
952d50560aSMarcel Moolenaar #ifdef KDB
962d50560aSMarcel Moolenaar #ifdef KDB_UNATTENDED
979959b1a8SMike Smith int debugger_on_panic = 0;
98ad4240feSJulian Elischer #else
999959b1a8SMike Smith int debugger_on_panic = 1;
100ad4240feSJulian Elischer #endif
101*08a9c205SAndriy Gapon SYSCTL_INT(_debug, OID_AUTO, debugger_on_panic, CTLFLAG_RW | CTLFLAG_TUN,
1023d177f46SBill Fumerola 	&debugger_on_panic, 0, "Run debugger on kernel panic");
103*08a9c205SAndriy Gapon TUNABLE_INT("debug.debugger_on_panic", &debugger_on_panic);
104e485b64bSJohn Baldwin 
1052d50560aSMarcel Moolenaar #ifdef KDB_TRACE
106*08a9c205SAndriy Gapon static int trace_on_panic = 1;
107e485b64bSJohn Baldwin #else
108*08a9c205SAndriy Gapon static int trace_on_panic = 0;
109e485b64bSJohn Baldwin #endif
110*08a9c205SAndriy Gapon SYSCTL_INT(_debug, OID_AUTO, trace_on_panic, CTLFLAG_RW | CTLFLAG_TUN,
111e485b64bSJohn Baldwin 	&trace_on_panic, 0, "Print stack trace on kernel panic");
112*08a9c205SAndriy Gapon TUNABLE_INT("debug.trace_on_panic", &trace_on_panic);
1132d50560aSMarcel Moolenaar #endif /* KDB */
114ad4240feSJulian Elischer 
115*08a9c205SAndriy Gapon static int sync_on_panic = 0;
116*08a9c205SAndriy Gapon SYSCTL_INT(_kern, OID_AUTO, sync_on_panic, CTLFLAG_RW | CTLFLAG_TUN,
117259ed917SPeter Wemm 	&sync_on_panic, 0, "Do a sync before rebooting from a panic");
118*08a9c205SAndriy Gapon TUNABLE_INT("kern.sync_on_panic", &sync_on_panic);
119259ed917SPeter Wemm 
120db82a982SMike Smith SYSCTL_NODE(_kern, OID_AUTO, shutdown, CTLFLAG_RW, 0, "Shutdown environment");
121db82a982SMike Smith 
1225230cfd2SJulian Elischer /*
123ad4240feSJulian Elischer  * Variable panicstr contains argument to first call to panic; used as flag
124ad4240feSJulian Elischer  * to indicate that the kernel has already called panic.
125ad4240feSJulian Elischer  */
126ad4240feSJulian Elischer const char *panicstr;
127ad4240feSJulian Elischer 
12816a011f9SPaul Saab int dumping;				/* system is dumping */
12936a52c3cSJeff Roberson int rebooting;				/* system is rebooting */
13081661c94SPoul-Henning Kamp static struct dumperinfo dumper;	/* our selected dumper */
1312d50560aSMarcel Moolenaar 
1322d50560aSMarcel Moolenaar /* Context information for dump-debuggers. */
1332d50560aSMarcel Moolenaar static struct pcb dumppcb;		/* Registers. */
1342d50560aSMarcel Moolenaar static lwpid_t dumptid;			/* Thread ID. */
13516a011f9SPaul Saab 
13682acbcf5SPeter Wemm static void boot(int) __dead2;
13782acbcf5SPeter Wemm static void poweroff_wait(void *, int);
13882acbcf5SPeter Wemm static void shutdown_halt(void *junk, int howto);
13982acbcf5SPeter Wemm static void shutdown_panic(void *junk, int howto);
14082acbcf5SPeter Wemm static void shutdown_reset(void *junk, int howto);
141f06a54f0SPoul-Henning Kamp 
142fcb893a8SMike Smith /* register various local shutdown events */
143fcb893a8SMike Smith static void
144fcb893a8SMike Smith shutdown_conf(void *unused)
145fcb893a8SMike Smith {
146e95499bdSAlfred Perlstein 
147e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, poweroff_wait, NULL,
1486f15a274SAlexander Motin 	    SHUTDOWN_PRI_FIRST + 100);
149e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_halt, NULL,
150e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 100);
151e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_panic, NULL,
152e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 100);
153e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_reset, NULL,
154e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 200);
155fcb893a8SMike Smith }
156ad4240feSJulian Elischer 
157237fdd78SRobert Watson SYSINIT(shutdown_conf, SI_SUB_INTRINSIC, SI_ORDER_ANY, shutdown_conf, NULL);
158fcb893a8SMike Smith 
159ad4240feSJulian Elischer /*
1600c14ff0eSRobert Watson  * The system call that results in a reboot.
161ad4240feSJulian Elischer  */
162835a82eeSMatthew Dillon /* ARGSUSED */
163ad4240feSJulian Elischer int
164b40ce416SJulian Elischer reboot(struct thread *td, struct reboot_args *uap)
165ad4240feSJulian Elischer {
166ad4240feSJulian Elischer 	int error;
167ad4240feSJulian Elischer 
168a2ecb9b7SRobert Watson 	error = 0;
169a2ecb9b7SRobert Watson #ifdef MAC
17030d239bcSRobert Watson 	error = mac_system_check_reboot(td->td_ucred, uap->opt);
171a2ecb9b7SRobert Watson #endif
172a2ecb9b7SRobert Watson 	if (error == 0)
173acd3428bSRobert Watson 		error = priv_check(td, PRIV_REBOOT);
174a2ecb9b7SRobert Watson 	if (error == 0) {
175835a82eeSMatthew Dillon 		mtx_lock(&Giant);
176ad4240feSJulian Elischer 		boot(uap->opt);
177835a82eeSMatthew Dillon 		mtx_unlock(&Giant);
178a2ecb9b7SRobert Watson 	}
179835a82eeSMatthew Dillon 	return (error);
180ad4240feSJulian Elischer }
181ad4240feSJulian Elischer 
182ad4240feSJulian Elischer /*
183ad4240feSJulian Elischer  * Called by events that want to shut down.. e.g  <CTL><ALT><DEL> on a PC
184ad4240feSJulian Elischer  */
1853e755f76SMike Smith static int shutdown_howto = 0;
1863e755f76SMike Smith 
187ad4240feSJulian Elischer void
1883e755f76SMike Smith shutdown_nice(int howto)
189ad4240feSJulian Elischer {
190e95499bdSAlfred Perlstein 
1913e755f76SMike Smith 	shutdown_howto = howto;
1923e755f76SMike Smith 
193ad4240feSJulian Elischer 	/* Send a signal to init(8) and have it shutdown the world */
194ad4240feSJulian Elischer 	if (initproc != NULL) {
19587729a2bSJohn Baldwin 		PROC_LOCK(initproc);
196ad4240feSJulian Elischer 		psignal(initproc, SIGINT);
19787729a2bSJohn Baldwin 		PROC_UNLOCK(initproc);
198ad4240feSJulian Elischer 	} else {
199ad4240feSJulian Elischer 		/* No init(8) running, so simply reboot */
200ad4240feSJulian Elischer 		boot(RB_NOSYNC);
201ad4240feSJulian Elischer 	}
202ad4240feSJulian Elischer 	return;
203ad4240feSJulian Elischer }
204ad4240feSJulian Elischer static int	waittime = -1;
205ad4240feSJulian Elischer 
20672dfe7a3SPoul-Henning Kamp static void
20782acbcf5SPeter Wemm print_uptime(void)
20872dfe7a3SPoul-Henning Kamp {
20972dfe7a3SPoul-Henning Kamp 	int f;
21072dfe7a3SPoul-Henning Kamp 	struct timespec ts;
21172dfe7a3SPoul-Henning Kamp 
21272dfe7a3SPoul-Henning Kamp 	getnanouptime(&ts);
21372dfe7a3SPoul-Henning Kamp 	printf("Uptime: ");
21472dfe7a3SPoul-Henning Kamp 	f = 0;
21572dfe7a3SPoul-Henning Kamp 	if (ts.tv_sec >= 86400) {
2164a6404dfSJohn Baldwin 		printf("%ldd", (long)ts.tv_sec / 86400);
21772dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 86400;
21872dfe7a3SPoul-Henning Kamp 		f = 1;
21972dfe7a3SPoul-Henning Kamp 	}
22072dfe7a3SPoul-Henning Kamp 	if (f || ts.tv_sec >= 3600) {
2214a6404dfSJohn Baldwin 		printf("%ldh", (long)ts.tv_sec / 3600);
22272dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 3600;
22372dfe7a3SPoul-Henning Kamp 		f = 1;
22472dfe7a3SPoul-Henning Kamp 	}
22572dfe7a3SPoul-Henning Kamp 	if (f || ts.tv_sec >= 60) {
2264a6404dfSJohn Baldwin 		printf("%ldm", (long)ts.tv_sec / 60);
22772dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 60;
22872dfe7a3SPoul-Henning Kamp 		f = 1;
22972dfe7a3SPoul-Henning Kamp 	}
2304a6404dfSJohn Baldwin 	printf("%lds\n", (long)ts.tv_sec);
23172dfe7a3SPoul-Henning Kamp }
23272dfe7a3SPoul-Henning Kamp 
233d39e457bSPoul-Henning Kamp static void
234d39e457bSPoul-Henning Kamp doadump(void)
235d39e457bSPoul-Henning Kamp {
236e95499bdSAlfred Perlstein 
237f6449d9dSJulian Elischer 	/*
238f6449d9dSJulian Elischer 	 * Sometimes people have to call this from the kernel debugger.
239f6449d9dSJulian Elischer 	 * (if 'panic' can not dump)
240f6449d9dSJulian Elischer 	 * Give them a clue as to why they can't dump.
241f6449d9dSJulian Elischer 	 */
242f6449d9dSJulian Elischer 	if (dumper.dumper == NULL) {
24327d68f90SDavid Malone 		printf("Cannot dump. Device not defined or unavailable.\n");
244f6449d9dSJulian Elischer 		return;
245f6449d9dSJulian Elischer 	}
246f6449d9dSJulian Elischer 
247d39e457bSPoul-Henning Kamp 	savectx(&dumppcb);
2482d50560aSMarcel Moolenaar 	dumptid = curthread->td_tid;
249d39e457bSPoul-Henning Kamp 	dumping++;
250618c7db3SRobert Watson #ifdef DDB
251618c7db3SRobert Watson 	if (textdump_pending)
252618c7db3SRobert Watson 		textdump_dumpsys(&dumper);
253618c7db3SRobert Watson 	else
254618c7db3SRobert Watson #endif
255d39e457bSPoul-Henning Kamp 		dumpsys(&dumper);
2569e473363SRuslan Ermilov 	dumping--;
257d39e457bSPoul-Henning Kamp }
258d39e457bSPoul-Henning Kamp 
259d07f87a2SDon Lewis static int
260d07f87a2SDon Lewis isbufbusy(struct buf *bp)
261d07f87a2SDon Lewis {
262d07f87a2SDon Lewis 	if (((bp->b_flags & (B_INVAL | B_PERSISTENT)) == 0 &&
263d638e093SAttilio Rao 	    BUF_ISLOCKED(bp)) ||
264d07f87a2SDon Lewis 	    ((bp->b_flags & (B_DELWRI | B_INVAL)) == B_DELWRI))
265d07f87a2SDon Lewis 		return (1);
266d07f87a2SDon Lewis 	return (0);
267d07f87a2SDon Lewis }
268d07f87a2SDon Lewis 
269ad4240feSJulian Elischer /*
27070ce93f4SNate Lawson  * Shutdown the system cleanly to prepare for reboot, halt, or power off.
271ad4240feSJulian Elischer  */
272fc8f7066SBruce Evans static void
27382acbcf5SPeter Wemm boot(int howto)
274ad4240feSJulian Elischer {
275b6915bdbSDon Lewis 	static int first_buf_printf = 1;
276ad4240feSJulian Elischer 
277f7ebc7ceSMarcel Moolenaar #if defined(SMP)
27870ce93f4SNate Lawson 	/*
27970ce93f4SNate Lawson 	 * Bind us to CPU 0 so that all shutdown code runs there.  Some
28070ce93f4SNate Lawson 	 * systems don't shutdown properly (i.e., ACPI power off) if we
28170ce93f4SNate Lawson 	 * run on another processor.
28270ce93f4SNate Lawson 	 */
283982d11f8SJeff Roberson 	thread_lock(curthread);
28420e25d7dSPeter Wemm 	sched_bind(curthread, 0);
285982d11f8SJeff Roberson 	thread_unlock(curthread);
2862fd32b93SNate Lawson 	KASSERT(PCPU_GET(cpuid) == 0, ("boot: not running on cpu 0"));
28720e25d7dSPeter Wemm #endif
28836a52c3cSJeff Roberson 	/* We're in the process of rebooting. */
28936a52c3cSJeff Roberson 	rebooting = 1;
29020e25d7dSPeter Wemm 
2913e755f76SMike Smith 	/* collect extra flags that shutdown_nice might have set */
2923e755f76SMike Smith 	howto |= shutdown_howto;
2933e755f76SMike Smith 
29461e96500SJohn Baldwin 	/* We are out of the debugger now. */
2952d50560aSMarcel Moolenaar 	kdb_active = 0;
29661e96500SJohn Baldwin 
2975230cfd2SJulian Elischer 	/*
2985230cfd2SJulian Elischer 	 * Do any callouts that should be done BEFORE syncing the filesystems.
2995230cfd2SJulian Elischer 	 */
300fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_pre_sync, howto);
3015230cfd2SJulian Elischer 
3025230cfd2SJulian Elischer 	/*
3035230cfd2SJulian Elischer 	 * Now sync filesystems
3045230cfd2SJulian Elischer 	 */
305ad4240feSJulian Elischer 	if (!cold && (howto & RB_NOSYNC) == 0 && waittime < 0) {
306ad4240feSJulian Elischer 		register struct buf *bp;
30762820f25SJason Evans 		int iter, nbusy, pbusy;
3080c0b25aeSJohn Baldwin #ifndef PREEMPTION
30962820f25SJason Evans 		int subiter;
3100c0b25aeSJohn Baldwin #endif
311ad4240feSJulian Elischer 
312ad4240feSJulian Elischer 		waittime = 0;
313ad4240feSJulian Elischer 
3143fafa27bSStephan Uphoff 		sync(curthread, NULL);
315ad4240feSJulian Elischer 
316b1897c19SJulian Elischer 		/*
317b1897c19SJulian Elischer 		 * With soft updates, some buffers that are
318b1897c19SJulian Elischer 		 * written will be remarked as dirty until other
319b1897c19SJulian Elischer 		 * buffers are written.
320b1897c19SJulian Elischer 		 */
32162820f25SJason Evans 		for (iter = pbusy = 0; iter < 20; iter++) {
322ad4240feSJulian Elischer 			nbusy = 0;
323d07f87a2SDon Lewis 			for (bp = &buf[nbuf]; --bp >= buf; )
324d07f87a2SDon Lewis 				if (isbufbusy(bp))
325ad4240feSJulian Elischer 					nbusy++;
326b6915bdbSDon Lewis 			if (nbusy == 0) {
327b6915bdbSDon Lewis 				if (first_buf_printf)
32837abb77fSPoul-Henning Kamp 					printf("All buffers synced.");
329ad4240feSJulian Elischer 				break;
330b6915bdbSDon Lewis 			}
331b6915bdbSDon Lewis 			if (first_buf_printf) {
332b6915bdbSDon Lewis 				printf("Syncing disks, buffers remaining... ");
333b6915bdbSDon Lewis 				first_buf_printf = 0;
334b6915bdbSDon Lewis 			}
335ad4240feSJulian Elischer 			printf("%d ", nbusy);
33662820f25SJason Evans 			if (nbusy < pbusy)
33762820f25SJason Evans 				iter = 0;
33862820f25SJason Evans 			pbusy = nbusy;
3393fafa27bSStephan Uphoff 			sync(curthread, NULL);
3400c0b25aeSJohn Baldwin 
3410c0b25aeSJohn Baldwin #ifdef PREEMPTION
3420c0b25aeSJohn Baldwin 			/*
3430c0b25aeSJohn Baldwin 			 * Drop Giant and spin for a while to allow
3440c0b25aeSJohn Baldwin 			 * interrupt threads to run.
3450c0b25aeSJohn Baldwin 			 */
3460c0b25aeSJohn Baldwin 			DROP_GIANT();
3470c0b25aeSJohn Baldwin 			DELAY(50000 * iter);
3480c0b25aeSJohn Baldwin 			PICKUP_GIANT();
3490c0b25aeSJohn Baldwin #else
3500c0b25aeSJohn Baldwin 			/*
3510c0b25aeSJohn Baldwin 			 * Drop Giant and context switch several times to
3520c0b25aeSJohn Baldwin 			 * allow interrupt threads to run.
3530c0b25aeSJohn Baldwin 			 */
354c86b6ff5SJohn Baldwin 			DROP_GIANT();
35562820f25SJason Evans 			for (subiter = 0; subiter < 50 * iter; subiter++) {
356982d11f8SJeff Roberson 				thread_lock(curthread);
357bf0acc27SJohn Baldwin 				mi_switch(SW_VOL, NULL);
358982d11f8SJeff Roberson 				thread_unlock(curthread);
35962820f25SJason Evans 				DELAY(1000);
36062820f25SJason Evans 			}
36120cdcc5bSJohn Baldwin 			PICKUP_GIANT();
3620c0b25aeSJohn Baldwin #endif
363ad4240feSJulian Elischer 		}
364c8c216d5SNate Lawson 		printf("\n");
365d02d6d04SMike Smith 		/*
366d02d6d04SMike Smith 		 * Count only busy local buffers to prevent forcing
367d02d6d04SMike Smith 		 * a fsck if we're just a client of a wedged NFS server
368d02d6d04SMike Smith 		 */
369d02d6d04SMike Smith 		nbusy = 0;
370d02d6d04SMike Smith 		for (bp = &buf[nbuf]; --bp >= buf; ) {
371d07f87a2SDon Lewis 			if (isbufbusy(bp)) {
372c5690651SPoul-Henning Kamp #if 0
373c5690651SPoul-Henning Kamp /* XXX: This is bogus.  We should probably have a BO_REMOTE flag instead */
374f3732fd1SPoul-Henning Kamp 				if (bp->b_dev == NULL) {
3750429e37aSPoul-Henning Kamp 					TAILQ_REMOVE(&mountlist,
37667812eacSKirk McKusick 					    bp->b_vp->v_mount, mnt_list);
3779c111b31SPoul-Henning Kamp 					continue;
378dfd5dee1SPeter Wemm 				}
379c5690651SPoul-Henning Kamp #endif
3809c111b31SPoul-Henning Kamp 				nbusy++;
3819c111b31SPoul-Henning Kamp #if defined(SHOW_BUSYBUFS) || defined(DIAGNOSTIC)
3829c111b31SPoul-Henning Kamp 				printf(
383c5690651SPoul-Henning Kamp 			    "%d: bufobj:%p, flags:%0x, blkno:%ld, lblkno:%ld\n",
384c5690651SPoul-Henning Kamp 				    nbusy, bp->b_bufobj,
3859c111b31SPoul-Henning Kamp 				    bp->b_flags, (long)bp->b_blkno,
3869c111b31SPoul-Henning Kamp 				    (long)bp->b_lblkno);
3879c111b31SPoul-Henning Kamp #endif
3889c111b31SPoul-Henning Kamp 			}
389d02d6d04SMike Smith 		}
390ad4240feSJulian Elischer 		if (nbusy) {
391ad4240feSJulian Elischer 			/*
392ad4240feSJulian Elischer 			 * Failed to sync all blocks. Indicate this and don't
393ad4240feSJulian Elischer 			 * unmount filesystems (thus forcing an fsck on reboot).
394ad4240feSJulian Elischer 			 */
395b6915bdbSDon Lewis 			printf("Giving up on %d buffers\n", nbusy);
396ad4240feSJulian Elischer 			DELAY(5000000);	/* 5 seconds */
397ad4240feSJulian Elischer 		} else {
398b6915bdbSDon Lewis 			if (!first_buf_printf)
399b6915bdbSDon Lewis 				printf("Final sync complete\n");
400ad4240feSJulian Elischer 			/*
401ad4240feSJulian Elischer 			 * Unmount filesystems
402ad4240feSJulian Elischer 			 */
403ad4240feSJulian Elischer 			if (panicstr == 0)
404ad4240feSJulian Elischer 				vfs_unmountall();
405ad4240feSJulian Elischer 		}
4060909f38aSPawel Jakub Dawidek 		swapoff_all();
407ad4240feSJulian Elischer 		DELAY(100000);		/* wait for console output to finish */
408ad4240feSJulian Elischer 	}
4095230cfd2SJulian Elischer 
41072dfe7a3SPoul-Henning Kamp 	print_uptime();
41172dfe7a3SPoul-Henning Kamp 
4125230cfd2SJulian Elischer 	/*
4135230cfd2SJulian Elischer 	 * Ok, now do things that assume all filesystem activity has
4145230cfd2SJulian Elischer 	 * been completed.
4155230cfd2SJulian Elischer 	 */
416fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_post_sync, howto);
41770ce93f4SNate Lawson 
418f6449d9dSJulian Elischer 	if ((howto & (RB_HALT|RB_DUMP)) == RB_DUMP && !cold && !dumping)
419d39e457bSPoul-Henning Kamp 		doadump();
4202cfa0a03SJustin T. Gibbs 
4212cfa0a03SJustin T. Gibbs 	/* Now that we're going to really halt the system... */
422fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_final, howto);
4232cfa0a03SJustin T. Gibbs 
424fcb893a8SMike Smith 	for(;;) ;	/* safety against shutdown_reset not working */
425fcb893a8SMike Smith 	/* NOTREACHED */
426fcb893a8SMike Smith }
427fcb893a8SMike Smith 
428fcb893a8SMike Smith /*
429fcb893a8SMike Smith  * If the shutdown was a clean halt, behave accordingly.
430fcb893a8SMike Smith  */
431fcb893a8SMike Smith static void
432fcb893a8SMike Smith shutdown_halt(void *junk, int howto)
433fcb893a8SMike Smith {
434e95499bdSAlfred Perlstein 
435ad4240feSJulian Elischer 	if (howto & RB_HALT) {
436ad4240feSJulian Elischer 		printf("\n");
437ad4240feSJulian Elischer 		printf("The operating system has halted.\n");
438ad4240feSJulian Elischer 		printf("Please press any key to reboot.\n\n");
439d13d3630SJulian Elischer 		switch (cngetc()) {
440d13d3630SJulian Elischer 		case -1:		/* No console, just die */
441d13d3630SJulian Elischer 			cpu_halt();
442d13d3630SJulian Elischer 			/* NOTREACHED */
443d13d3630SJulian Elischer 		default:
4442cfa0a03SJustin T. Gibbs 			howto &= ~RB_HALT;
445d13d3630SJulian Elischer 			break;
446d13d3630SJulian Elischer 		}
447fcb893a8SMike Smith 	}
448fcb893a8SMike Smith }
449ad4240feSJulian Elischer 
450fcb893a8SMike Smith /*
451fcb893a8SMike Smith  * Check to see if the system paniced, pause and then reboot
452fcb893a8SMike Smith  * according to the specified delay.
453fcb893a8SMike Smith  */
454fcb893a8SMike Smith static void
455fcb893a8SMike Smith shutdown_panic(void *junk, int howto)
456fcb893a8SMike Smith {
457fcb893a8SMike Smith 	int loop;
458fcb893a8SMike Smith 
459fcb893a8SMike Smith 	if (howto & RB_DUMP) {
460ad4240feSJulian Elischer 		if (PANIC_REBOOT_WAIT_TIME != 0) {
461ad4240feSJulian Elischer 			if (PANIC_REBOOT_WAIT_TIME != -1) {
4622cfa0a03SJustin T. Gibbs 				printf("Automatic reboot in %d seconds - "
4632cfa0a03SJustin T. Gibbs 				       "press a key on the console to abort\n",
464ad4240feSJulian Elischer 					PANIC_REBOOT_WAIT_TIME);
4652cfa0a03SJustin T. Gibbs 				for (loop = PANIC_REBOOT_WAIT_TIME * 10;
4662cfa0a03SJustin T. Gibbs 				     loop > 0; --loop) {
467ad4240feSJulian Elischer 					DELAY(1000 * 100); /* 1/10th second */
468a7f8f2abSBruce Evans 					/* Did user type a key? */
469a7f8f2abSBruce Evans 					if (cncheckc() != -1)
470ad4240feSJulian Elischer 						break;
471ad4240feSJulian Elischer 				}
472ad4240feSJulian Elischer 				if (!loop)
473fcb893a8SMike Smith 					return;
474ad4240feSJulian Elischer 			}
475ad4240feSJulian Elischer 		} else { /* zero time specified - reboot NOW */
476fcb893a8SMike Smith 			return;
477ad4240feSJulian Elischer 		}
478422702e9SNik Clayton 		printf("--> Press a key on the console to reboot,\n");
479422702e9SNik Clayton 		printf("--> or switch off the system now.\n");
480ad4240feSJulian Elischer 		cngetc();
481ad4240feSJulian Elischer 	}
482fcb893a8SMike Smith }
483fcb893a8SMike Smith 
/*
 * shutdown_final handler: everything is done, so reset the machine.
 */
static void
shutdown_reset(void *junk, int howto)
{

	printf("Rebooting...\n");
	DELAY(1000000);	/* wait 1 sec for printf's to complete and be read */

	/*
	 * On SMP, taking smp_ipi_mtx serves two purposes:
	 * - it disables interrupts, so CPU0 cannot be preempted by fast
	 *   handlers (which would deadlock against other CPUs);
	 * - it avoids deadlocks against smp_rendezvous() or, more
	 *   generally, threads that busy-wait with this spinlock held
	 *   for responses from other CPUs (ie. smp_tlb_shootdown()).
	 *
	 * Without SMP only the first problem exists, and entering a
	 * spinlock section is enough to handle it.
	 */
#ifndef SMP
	spinlock_enter();
#else
	mtx_lock_spin(&smp_ipi_mtx);
#endif

	/* cpu_boot(howto); */ /* doesn't do anything at the moment */
	cpu_reset();
	/* NOTREACHED */ /* assuming reset worked */
}
515ad4240feSJulian Elischer 
516abd9053eSJohn Baldwin #ifdef SMP
5170711ca46SJohn Baldwin static u_int panic_cpu = NOCPU;
518abd9053eSJohn Baldwin #endif
519abd9053eSJohn Baldwin 
520ad4240feSJulian Elischer /*
521ad4240feSJulian Elischer  * Panic is called on unresolvable fatal errors.  It prints "panic: mesg",
522ad4240feSJulian Elischer  * and then reboots.  If we are called twice, then we avoid trying to sync
523ad4240feSJulian Elischer  * the disks as this often leads to recursive panics.
524ad4240feSJulian Elischer  */
525ad4240feSJulian Elischer void
5269a6dc4b6SPoul-Henning Kamp panic(const char *fmt, ...)
527ad4240feSJulian Elischer {
528fe799533SAndrew Gallatin 	struct thread *td = curthread;
529e485b64bSJohn Baldwin 	int bootopt, newpanic;
530ad4240feSJulian Elischer 	va_list ap;
53199237364SAndrey A. Chernov 	static char buf[256];
532ad4240feSJulian Elischer 
53341a4e90eSKonstantin Belousov 	critical_enter();
5340384fff8SJason Evans #ifdef SMP
5351a5333c3SJohn Baldwin 	/*
5361a5333c3SJohn Baldwin 	 * We don't want multiple CPU's to panic at the same time, so we
5370711ca46SJohn Baldwin 	 * use panic_cpu as a simple spinlock.  We have to keep checking
5380711ca46SJohn Baldwin 	 * panic_cpu if we are spinning in case the panic on the first
5391a5333c3SJohn Baldwin 	 * CPU is canceled.
5401a5333c3SJohn Baldwin 	 */
5410711ca46SJohn Baldwin 	if (panic_cpu != PCPU_GET(cpuid))
5420711ca46SJohn Baldwin 		while (atomic_cmpset_int(&panic_cpu, NOCPU,
5430711ca46SJohn Baldwin 		    PCPU_GET(cpuid)) == 0)
5440711ca46SJohn Baldwin 			while (panic_cpu != NOCPU)
5450711ca46SJohn Baldwin 				; /* nothing */
5460384fff8SJason Evans #endif
5470384fff8SJason Evans 
548ad4240feSJulian Elischer 	bootopt = RB_AUTOBOOT | RB_DUMP;
549e485b64bSJohn Baldwin 	newpanic = 0;
550ad4240feSJulian Elischer 	if (panicstr)
551ad4240feSJulian Elischer 		bootopt |= RB_NOSYNC;
552e485b64bSJohn Baldwin 	else {
553ad4240feSJulian Elischer 		panicstr = fmt;
554e485b64bSJohn Baldwin 		newpanic = 1;
555e485b64bSJohn Baldwin 	}
556ad4240feSJulian Elischer 
557ad4240feSJulian Elischer 	va_start(ap, fmt);
5584f1b4577SIan Dowse 	if (newpanic) {
5592127f260SArchie Cobbs 		(void)vsnprintf(buf, sizeof(buf), fmt, ap);
56099237364SAndrey A. Chernov 		panicstr = buf;
5619a6dc4b6SPoul-Henning Kamp 		printf("panic: %s\n", buf);
5624f1b4577SIan Dowse 	} else {
5634f1b4577SIan Dowse 		printf("panic: ");
5644f1b4577SIan Dowse 		vprintf(fmt, ap);
5659a6dc4b6SPoul-Henning Kamp 		printf("\n");
5664f1b4577SIan Dowse 	}
5674f1b4577SIan Dowse 	va_end(ap);
56847d81897SSteve Passe #ifdef SMP
56955c45354SJohn Baldwin 	printf("cpuid = %d\n", PCPU_GET(cpuid));
5702bcc63c5SJohn Baldwin #endif
571ad4240feSJulian Elischer 
5722d50560aSMarcel Moolenaar #ifdef KDB
573e485b64bSJohn Baldwin 	if (newpanic && trace_on_panic)
5742d50560aSMarcel Moolenaar 		kdb_backtrace();
575ad4240feSJulian Elischer 	if (debugger_on_panic)
5763de213ccSRobert Watson 		kdb_enter(KDB_WHY_PANIC, "panic");
5771432aa0cSJohn Baldwin #ifdef RESTARTABLE_PANICS
5781a5333c3SJohn Baldwin 	/* See if the user aborted the panic, in which case we continue. */
5791a5333c3SJohn Baldwin 	if (panicstr == NULL) {
5801a5333c3SJohn Baldwin #ifdef SMP
5810711ca46SJohn Baldwin 		atomic_store_rel_int(&panic_cpu, NOCPU);
5821a5333c3SJohn Baldwin #endif
5831a5333c3SJohn Baldwin 		return;
5841a5333c3SJohn Baldwin 	}
585ad4240feSJulian Elischer #endif
5861432aa0cSJohn Baldwin #endif
587982d11f8SJeff Roberson 	/*thread_lock(td); */
588fe799533SAndrew Gallatin 	td->td_flags |= TDF_INPANIC;
589982d11f8SJeff Roberson 	/* thread_unlock(td); */
590259ed917SPeter Wemm 	if (!sync_on_panic)
591259ed917SPeter Wemm 		bootopt |= RB_NOSYNC;
59241a4e90eSKonstantin Belousov 	critical_exit();
593ad4240feSJulian Elischer 	boot(bootopt);
594ad4240feSJulian Elischer }
595ad4240feSJulian Elischer 
596e0d898b4SJulian Elischer /*
597db82a982SMike Smith  * Support for poweroff delay.
598b22692bdSNick Hibma  *
599b22692bdSNick Hibma  * Please note that setting this delay too short might power off your machine
600b22692bdSNick Hibma  * before the write cache on your hard disk has been flushed, leading to
601b22692bdSNick Hibma  * soft-updates inconsistencies.
602db82a982SMike Smith  */
6039eec6969SMike Smith #ifndef POWEROFF_DELAY
6049eec6969SMike Smith # define POWEROFF_DELAY 5000
6059eec6969SMike Smith #endif
6069eec6969SMike Smith static int poweroff_delay = POWEROFF_DELAY;
6079eec6969SMike Smith 
608db82a982SMike Smith SYSCTL_INT(_kern_shutdown, OID_AUTO, poweroff_delay, CTLFLAG_RW,
609db82a982SMike Smith 	&poweroff_delay, 0, "");
610db82a982SMike Smith 
611fcb893a8SMike Smith static void
612fcb893a8SMike Smith poweroff_wait(void *junk, int howto)
613db82a982SMike Smith {
614e95499bdSAlfred Perlstein 
615db82a982SMike Smith 	if (!(howto & RB_POWEROFF) || poweroff_delay <= 0)
616db82a982SMike Smith 		return;
617db82a982SMike Smith 	DELAY(poweroff_delay * 1000);
618db82a982SMike Smith }
6195e950839SLuoqi Chen 
6205e950839SLuoqi Chen /*
6215e950839SLuoqi Chen  * Some system processes (e.g. syncer) need to be stopped at appropriate
6225e950839SLuoqi Chen  * points in their main loops prior to a system shutdown, so that they
6235e950839SLuoqi Chen  * won't interfere with the shutdown process (e.g. by holding a disk buf
6245e950839SLuoqi Chen  * to cause sync to fail).  For each of these system processes, register
6255e950839SLuoqi Chen  * shutdown_kproc() as a handler for one of shutdown events.
6265e950839SLuoqi Chen  */
6275e950839SLuoqi Chen static int kproc_shutdown_wait = 60;
6285e950839SLuoqi Chen SYSCTL_INT(_kern_shutdown, OID_AUTO, kproc_shutdown_wait, CTLFLAG_RW,
6295e950839SLuoqi Chen     &kproc_shutdown_wait, 0, "");
6305e950839SLuoqi Chen 
6315e950839SLuoqi Chen void
632ffc831daSJohn Baldwin kproc_shutdown(void *arg, int howto)
6335e950839SLuoqi Chen {
6345e950839SLuoqi Chen 	struct proc *p;
6355e950839SLuoqi Chen 	int error;
6365e950839SLuoqi Chen 
6375e950839SLuoqi Chen 	if (panicstr)
6385e950839SLuoqi Chen 		return;
6395e950839SLuoqi Chen 
6405e950839SLuoqi Chen 	p = (struct proc *)arg;
641b1c81391SNate Lawson 	printf("Waiting (max %d seconds) for system process `%s' to stop...",
6424f9d48e4SJohn Baldwin 	    kproc_shutdown_wait, p->p_comm);
6433745c395SJulian Elischer 	error = kproc_suspend(p, kproc_shutdown_wait * hz);
6445e950839SLuoqi Chen 
6455e950839SLuoqi Chen 	if (error == EWOULDBLOCK)
646b1c81391SNate Lawson 		printf("timed out\n");
6475e950839SLuoqi Chen 	else
648b1c81391SNate Lawson 		printf("done\n");
6495e950839SLuoqi Chen }
65081661c94SPoul-Henning Kamp 
6517ab24ea3SJulian Elischer void
6527ab24ea3SJulian Elischer kthread_shutdown(void *arg, int howto)
6537ab24ea3SJulian Elischer {
6547ab24ea3SJulian Elischer 	struct thread *td;
6557ab24ea3SJulian Elischer 	int error;
6567ab24ea3SJulian Elischer 
6577ab24ea3SJulian Elischer 	if (panicstr)
6587ab24ea3SJulian Elischer 		return;
6597ab24ea3SJulian Elischer 
6607ab24ea3SJulian Elischer 	td = (struct thread *)arg;
6617ab24ea3SJulian Elischer 	printf("Waiting (max %d seconds) for system thread `%s' to stop...",
6624f9d48e4SJohn Baldwin 	    kproc_shutdown_wait, td->td_name);
6637ab24ea3SJulian Elischer 	error = kthread_suspend(td, kproc_shutdown_wait * hz);
6647ab24ea3SJulian Elischer 
6657ab24ea3SJulian Elischer 	if (error == EWOULDBLOCK)
6667ab24ea3SJulian Elischer 		printf("timed out\n");
6677ab24ea3SJulian Elischer 	else
6687ab24ea3SJulian Elischer 		printf("done\n");
6697ab24ea3SJulian Elischer }
6707ab24ea3SJulian Elischer 
67181661c94SPoul-Henning Kamp /* Registration of dumpers */
67281661c94SPoul-Henning Kamp int
67381661c94SPoul-Henning Kamp set_dumper(struct dumperinfo *di)
67481661c94SPoul-Henning Kamp {
675e95499bdSAlfred Perlstein 
67681661c94SPoul-Henning Kamp 	if (di == NULL) {
67781661c94SPoul-Henning Kamp 		bzero(&dumper, sizeof dumper);
67881661c94SPoul-Henning Kamp 		return (0);
67981661c94SPoul-Henning Kamp 	}
68081661c94SPoul-Henning Kamp 	if (dumper.dumper != NULL)
68181661c94SPoul-Henning Kamp 		return (EBUSY);
68281661c94SPoul-Henning Kamp 	dumper = *di;
68381661c94SPoul-Henning Kamp 	return (0);
68481661c94SPoul-Henning Kamp }
68581661c94SPoul-Henning Kamp 
686007b1b7bSRuslan Ermilov /* Call dumper with bounds checking. */
687007b1b7bSRuslan Ermilov int
688007b1b7bSRuslan Ermilov dump_write(struct dumperinfo *di, void *virtual, vm_offset_t physical,
689007b1b7bSRuslan Ermilov     off_t offset, size_t length)
690007b1b7bSRuslan Ermilov {
691007b1b7bSRuslan Ermilov 
692007b1b7bSRuslan Ermilov 	if (length != 0 && (offset < di->mediaoffset ||
693007b1b7bSRuslan Ermilov 	    offset - di->mediaoffset + length > di->mediasize)) {
694007b1b7bSRuslan Ermilov 		printf("Attempt to write outside dump device boundaries.\n");
695007b1b7bSRuslan Ermilov 		return (ENXIO);
696007b1b7bSRuslan Ermilov 	}
697007b1b7bSRuslan Ermilov 	return (di->dumper(di->priv, virtual, physical, offset, length));
698007b1b7bSRuslan Ermilov }
699007b1b7bSRuslan Ermilov 
700e6592ee5SPeter Wemm void
701e6592ee5SPeter Wemm mkdumpheader(struct kerneldumpheader *kdh, char *magic, uint32_t archver,
702e6592ee5SPeter Wemm     uint64_t dumplen, uint32_t blksz)
703e6592ee5SPeter Wemm {
704e6592ee5SPeter Wemm 
705e6592ee5SPeter Wemm 	bzero(kdh, sizeof(*kdh));
706e6592ee5SPeter Wemm 	strncpy(kdh->magic, magic, sizeof(kdh->magic));
707e6592ee5SPeter Wemm 	strncpy(kdh->architecture, MACHINE_ARCH, sizeof(kdh->architecture));
708e6592ee5SPeter Wemm 	kdh->version = htod32(KERNELDUMPVERSION);
709e6592ee5SPeter Wemm 	kdh->architectureversion = htod32(archver);
710e6592ee5SPeter Wemm 	kdh->dumplength = htod64(dumplen);
711e6592ee5SPeter Wemm 	kdh->dumptime = htod64(time_second);
712e6592ee5SPeter Wemm 	kdh->blocksize = htod32(blksz);
713c1f19219SJamie Gritton 	strncpy(kdh->hostname, prison0.pr_hostname, sizeof(kdh->hostname));
714e6592ee5SPeter Wemm 	strncpy(kdh->versionstring, version, sizeof(kdh->versionstring));
715e6592ee5SPeter Wemm 	if (panicstr != NULL)
716e6592ee5SPeter Wemm 		strncpy(kdh->panicstring, panicstr, sizeof(kdh->panicstring));
717e6592ee5SPeter Wemm 	kdh->parity = kerneldump_parity(kdh);
718e6592ee5SPeter Wemm }
719