xref: /freebsd/sys/kern/kern_shutdown.c (revision 76e18b25a07d827284d0929bbbca9720ab3ab80d)
1ad4240feSJulian Elischer /*-
2ad4240feSJulian Elischer  * Copyright (c) 1986, 1988, 1991, 1993
3ad4240feSJulian Elischer  *	The Regents of the University of California.  All rights reserved.
4ad4240feSJulian Elischer  * (c) UNIX System Laboratories, Inc.
5ad4240feSJulian Elischer  * All or some portions of this file are derived from material licensed
6ad4240feSJulian Elischer  * to the University of California by American Telephone and Telegraph
7ad4240feSJulian Elischer  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
8ad4240feSJulian Elischer  * the permission of UNIX System Laboratories, Inc.
9ad4240feSJulian Elischer  *
10ad4240feSJulian Elischer  * Redistribution and use in source and binary forms, with or without
11ad4240feSJulian Elischer  * modification, are permitted provided that the following conditions
12ad4240feSJulian Elischer  * are met:
13ad4240feSJulian Elischer  * 1. Redistributions of source code must retain the above copyright
14ad4240feSJulian Elischer  *    notice, this list of conditions and the following disclaimer.
15ad4240feSJulian Elischer  * 2. Redistributions in binary form must reproduce the above copyright
16ad4240feSJulian Elischer  *    notice, this list of conditions and the following disclaimer in the
17ad4240feSJulian Elischer  *    documentation and/or other materials provided with the distribution.
18ad4240feSJulian Elischer  * 4. Neither the name of the University nor the names of its contributors
19ad4240feSJulian Elischer  *    may be used to endorse or promote products derived from this software
20ad4240feSJulian Elischer  *    without specific prior written permission.
21ad4240feSJulian Elischer  *
22ad4240feSJulian Elischer  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23ad4240feSJulian Elischer  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24ad4240feSJulian Elischer  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25ad4240feSJulian Elischer  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26ad4240feSJulian Elischer  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27ad4240feSJulian Elischer  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28ad4240feSJulian Elischer  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29ad4240feSJulian Elischer  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30ad4240feSJulian Elischer  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31ad4240feSJulian Elischer  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32ad4240feSJulian Elischer  * SUCH DAMAGE.
33ad4240feSJulian Elischer  *
34ad4240feSJulian Elischer  *	@(#)kern_shutdown.c	8.3 (Berkeley) 1/21/94
35ad4240feSJulian Elischer  */
36ad4240feSJulian Elischer 
37677b542eSDavid E. O'Brien #include <sys/cdefs.h>
38677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
39677b542eSDavid E. O'Brien 
40618c7db3SRobert Watson #include "opt_ddb.h"
412d50560aSMarcel Moolenaar #include "opt_kdb.h"
426d58e6cbSBruce Evans #include "opt_panic.h"
436d58e6cbSBruce Evans #include "opt_show_busybufs.h"
449923b511SScott Long #include "opt_sched.h"
45ad4240feSJulian Elischer 
46ad4240feSJulian Elischer #include <sys/param.h>
47ad4240feSJulian Elischer #include <sys/systm.h>
489626b608SPoul-Henning Kamp #include <sys/bio.h>
49fc8f7066SBruce Evans #include <sys/buf.h>
501d79f1bbSJohn Baldwin #include <sys/conf.h>
511d79f1bbSJohn Baldwin #include <sys/cons.h>
521d79f1bbSJohn Baldwin #include <sys/eventhandler.h>
5376ca6f88SJamie Gritton #include <sys/jail.h>
542d50560aSMarcel Moolenaar #include <sys/kdb.h>
55ad4240feSJulian Elischer #include <sys/kernel.h>
56e6592ee5SPeter Wemm #include <sys/kerneldump.h>
575e950839SLuoqi Chen #include <sys/kthread.h>
58dcd7d9b7SMaxim Sobolev #include <sys/malloc.h>
59ac0ad63fSBruce Evans #include <sys/mount.h>
60acd3428bSRobert Watson #include <sys/priv.h>
611d79f1bbSJohn Baldwin #include <sys/proc.h>
621d79f1bbSJohn Baldwin #include <sys/reboot.h>
631d79f1bbSJohn Baldwin #include <sys/resourcevar.h>
6420e25d7dSPeter Wemm #include <sys/sched.h>
65248bb937SAttilio Rao #include <sys/smp.h>
66ad4240feSJulian Elischer #include <sys/sysctl.h>
67ad4240feSJulian Elischer #include <sys/sysproto.h>
68ad4240feSJulian Elischer 
69618c7db3SRobert Watson #include <ddb/ddb.h>
70618c7db3SRobert Watson 
7126502503SMarcel Moolenaar #include <machine/cpu.h>
72d39e457bSPoul-Henning Kamp #include <machine/pcb.h>
73752dff3dSJake Burkholder #include <machine/smp.h>
74ad4240feSJulian Elischer 
75aed55708SRobert Watson #include <security/mac/mac_framework.h>
76aed55708SRobert Watson 
770909f38aSPawel Jakub Dawidek #include <vm/vm.h>
780909f38aSPawel Jakub Dawidek #include <vm/vm_object.h>
790909f38aSPawel Jakub Dawidek #include <vm/vm_page.h>
800909f38aSPawel Jakub Dawidek #include <vm/vm_pager.h>
810909f38aSPawel Jakub Dawidek #include <vm/swap_pager.h>
820909f38aSPawel Jakub Dawidek 
83ad4240feSJulian Elischer #include <sys/signalvar.h>
84ad4240feSJulian Elischer 
85ad4240feSJulian Elischer #ifndef PANIC_REBOOT_WAIT_TIME
86ad4240feSJulian Elischer #define PANIC_REBOOT_WAIT_TIME 15 /* default to 15 seconds */
87ad4240feSJulian Elischer #endif
88ad4240feSJulian Elischer 
89ad4240feSJulian Elischer /*
90ad4240feSJulian Elischer  * Note that stdarg.h and the ANSI style va_start macro is used for both
91ad4240feSJulian Elischer  * ANSI and traditional C compilers.
92ad4240feSJulian Elischer  */
93ad4240feSJulian Elischer #include <machine/stdarg.h>
94ad4240feSJulian Elischer 
952d50560aSMarcel Moolenaar #ifdef KDB
962d50560aSMarcel Moolenaar #ifdef KDB_UNATTENDED
979959b1a8SMike Smith int debugger_on_panic = 0;
98ad4240feSJulian Elischer #else
999959b1a8SMike Smith int debugger_on_panic = 1;
100ad4240feSJulian Elischer #endif
10108a9c205SAndriy Gapon SYSCTL_INT(_debug, OID_AUTO, debugger_on_panic, CTLFLAG_RW | CTLFLAG_TUN,
1023d177f46SBill Fumerola 	&debugger_on_panic, 0, "Run debugger on kernel panic");
10308a9c205SAndriy Gapon TUNABLE_INT("debug.debugger_on_panic", &debugger_on_panic);
104e485b64bSJohn Baldwin 
1052d50560aSMarcel Moolenaar #ifdef KDB_TRACE
10608a9c205SAndriy Gapon static int trace_on_panic = 1;
107e485b64bSJohn Baldwin #else
10808a9c205SAndriy Gapon static int trace_on_panic = 0;
109e485b64bSJohn Baldwin #endif
11008a9c205SAndriy Gapon SYSCTL_INT(_debug, OID_AUTO, trace_on_panic, CTLFLAG_RW | CTLFLAG_TUN,
111e485b64bSJohn Baldwin 	&trace_on_panic, 0, "Print stack trace on kernel panic");
11208a9c205SAndriy Gapon TUNABLE_INT("debug.trace_on_panic", &trace_on_panic);
1132d50560aSMarcel Moolenaar #endif /* KDB */
114ad4240feSJulian Elischer 
11508a9c205SAndriy Gapon static int sync_on_panic = 0;
11608a9c205SAndriy Gapon SYSCTL_INT(_kern, OID_AUTO, sync_on_panic, CTLFLAG_RW | CTLFLAG_TUN,
117259ed917SPeter Wemm 	&sync_on_panic, 0, "Do a sync before rebooting from a panic");
11808a9c205SAndriy Gapon TUNABLE_INT("kern.sync_on_panic", &sync_on_panic);
119259ed917SPeter Wemm 
120db82a982SMike Smith SYSCTL_NODE(_kern, OID_AUTO, shutdown, CTLFLAG_RW, 0, "Shutdown environment");
121db82a982SMike Smith 
1225230cfd2SJulian Elischer /*
123ad4240feSJulian Elischer  * Variable panicstr contains argument to first call to panic; used as flag
124ad4240feSJulian Elischer  * to indicate that the kernel has already called panic.
125ad4240feSJulian Elischer  */
126ad4240feSJulian Elischer const char *panicstr;
127ad4240feSJulian Elischer 
12816a011f9SPaul Saab int dumping;				/* system is dumping */
12936a52c3cSJeff Roberson int rebooting;				/* system is rebooting */
13081661c94SPoul-Henning Kamp static struct dumperinfo dumper;	/* our selected dumper */
1312d50560aSMarcel Moolenaar 
1322d50560aSMarcel Moolenaar /* Context information for dump-debuggers. */
1332d50560aSMarcel Moolenaar static struct pcb dumppcb;		/* Registers. */
1342d50560aSMarcel Moolenaar static lwpid_t dumptid;			/* Thread ID. */
13516a011f9SPaul Saab 
13682acbcf5SPeter Wemm static void poweroff_wait(void *, int);
13782acbcf5SPeter Wemm static void shutdown_halt(void *junk, int howto);
13882acbcf5SPeter Wemm static void shutdown_panic(void *junk, int howto);
13982acbcf5SPeter Wemm static void shutdown_reset(void *junk, int howto);
140f06a54f0SPoul-Henning Kamp 
141fcb893a8SMike Smith /* register various local shutdown events */
142fcb893a8SMike Smith static void
143fcb893a8SMike Smith shutdown_conf(void *unused)
144fcb893a8SMike Smith {
145e95499bdSAlfred Perlstein 
146e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, poweroff_wait, NULL,
1476f15a274SAlexander Motin 	    SHUTDOWN_PRI_FIRST + 100);
148e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_halt, NULL,
149e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 100);
150e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_panic, NULL,
151e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 100);
152e95499bdSAlfred Perlstein 	EVENTHANDLER_REGISTER(shutdown_final, shutdown_reset, NULL,
153e95499bdSAlfred Perlstein 	    SHUTDOWN_PRI_LAST + 200);
154fcb893a8SMike Smith }
155ad4240feSJulian Elischer 
156237fdd78SRobert Watson SYSINIT(shutdown_conf, SI_SUB_INTRINSIC, SI_ORDER_ANY, shutdown_conf, NULL);
157fcb893a8SMike Smith 
158ad4240feSJulian Elischer /*
1590c14ff0eSRobert Watson  * The system call that results in a reboot.
160ad4240feSJulian Elischer  */
161835a82eeSMatthew Dillon /* ARGSUSED */
162ad4240feSJulian Elischer int
163b40ce416SJulian Elischer reboot(struct thread *td, struct reboot_args *uap)
164ad4240feSJulian Elischer {
165ad4240feSJulian Elischer 	int error;
166ad4240feSJulian Elischer 
167a2ecb9b7SRobert Watson 	error = 0;
168a2ecb9b7SRobert Watson #ifdef MAC
16930d239bcSRobert Watson 	error = mac_system_check_reboot(td->td_ucred, uap->opt);
170a2ecb9b7SRobert Watson #endif
171a2ecb9b7SRobert Watson 	if (error == 0)
172acd3428bSRobert Watson 		error = priv_check(td, PRIV_REBOOT);
173a2ecb9b7SRobert Watson 	if (error == 0) {
174835a82eeSMatthew Dillon 		mtx_lock(&Giant);
175*76e18b25SMarcel Moolenaar 		kern_reboot(uap->opt);
176835a82eeSMatthew Dillon 		mtx_unlock(&Giant);
177a2ecb9b7SRobert Watson 	}
178835a82eeSMatthew Dillon 	return (error);
179ad4240feSJulian Elischer }
180ad4240feSJulian Elischer 
181ad4240feSJulian Elischer /*
182ad4240feSJulian Elischer  * Called by events that want to shut down.. e.g  <CTL><ALT><DEL> on a PC
183ad4240feSJulian Elischer  */
1843e755f76SMike Smith static int shutdown_howto = 0;
1853e755f76SMike Smith 
186ad4240feSJulian Elischer void
1873e755f76SMike Smith shutdown_nice(int howto)
188ad4240feSJulian Elischer {
189e95499bdSAlfred Perlstein 
1903e755f76SMike Smith 	shutdown_howto = howto;
1913e755f76SMike Smith 
192ad4240feSJulian Elischer 	/* Send a signal to init(8) and have it shutdown the world */
193ad4240feSJulian Elischer 	if (initproc != NULL) {
19487729a2bSJohn Baldwin 		PROC_LOCK(initproc);
195ad4240feSJulian Elischer 		psignal(initproc, SIGINT);
19687729a2bSJohn Baldwin 		PROC_UNLOCK(initproc);
197ad4240feSJulian Elischer 	} else {
198ad4240feSJulian Elischer 		/* No init(8) running, so simply reboot */
199*76e18b25SMarcel Moolenaar 		kern_reboot(RB_NOSYNC);
200ad4240feSJulian Elischer 	}
201ad4240feSJulian Elischer 	return;
202ad4240feSJulian Elischer }
203ad4240feSJulian Elischer static int	waittime = -1;
204ad4240feSJulian Elischer 
20572dfe7a3SPoul-Henning Kamp static void
20682acbcf5SPeter Wemm print_uptime(void)
20772dfe7a3SPoul-Henning Kamp {
20872dfe7a3SPoul-Henning Kamp 	int f;
20972dfe7a3SPoul-Henning Kamp 	struct timespec ts;
21072dfe7a3SPoul-Henning Kamp 
21172dfe7a3SPoul-Henning Kamp 	getnanouptime(&ts);
21272dfe7a3SPoul-Henning Kamp 	printf("Uptime: ");
21372dfe7a3SPoul-Henning Kamp 	f = 0;
21472dfe7a3SPoul-Henning Kamp 	if (ts.tv_sec >= 86400) {
2154a6404dfSJohn Baldwin 		printf("%ldd", (long)ts.tv_sec / 86400);
21672dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 86400;
21772dfe7a3SPoul-Henning Kamp 		f = 1;
21872dfe7a3SPoul-Henning Kamp 	}
21972dfe7a3SPoul-Henning Kamp 	if (f || ts.tv_sec >= 3600) {
2204a6404dfSJohn Baldwin 		printf("%ldh", (long)ts.tv_sec / 3600);
22172dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 3600;
22272dfe7a3SPoul-Henning Kamp 		f = 1;
22372dfe7a3SPoul-Henning Kamp 	}
22472dfe7a3SPoul-Henning Kamp 	if (f || ts.tv_sec >= 60) {
2254a6404dfSJohn Baldwin 		printf("%ldm", (long)ts.tv_sec / 60);
22672dfe7a3SPoul-Henning Kamp 		ts.tv_sec %= 60;
22772dfe7a3SPoul-Henning Kamp 		f = 1;
22872dfe7a3SPoul-Henning Kamp 	}
2294a6404dfSJohn Baldwin 	printf("%lds\n", (long)ts.tv_sec);
23072dfe7a3SPoul-Henning Kamp }
23172dfe7a3SPoul-Henning Kamp 
232d39e457bSPoul-Henning Kamp static void
233d39e457bSPoul-Henning Kamp doadump(void)
234d39e457bSPoul-Henning Kamp {
235e95499bdSAlfred Perlstein 
236f6449d9dSJulian Elischer 	/*
237f6449d9dSJulian Elischer 	 * Sometimes people have to call this from the kernel debugger.
238f6449d9dSJulian Elischer 	 * (if 'panic' can not dump)
239f6449d9dSJulian Elischer 	 * Give them a clue as to why they can't dump.
240f6449d9dSJulian Elischer 	 */
241f6449d9dSJulian Elischer 	if (dumper.dumper == NULL) {
24227d68f90SDavid Malone 		printf("Cannot dump. Device not defined or unavailable.\n");
243f6449d9dSJulian Elischer 		return;
244f6449d9dSJulian Elischer 	}
245f6449d9dSJulian Elischer 
246d39e457bSPoul-Henning Kamp 	savectx(&dumppcb);
2472d50560aSMarcel Moolenaar 	dumptid = curthread->td_tid;
248d39e457bSPoul-Henning Kamp 	dumping++;
249618c7db3SRobert Watson #ifdef DDB
250618c7db3SRobert Watson 	if (textdump_pending)
251618c7db3SRobert Watson 		textdump_dumpsys(&dumper);
252618c7db3SRobert Watson 	else
253618c7db3SRobert Watson #endif
254d39e457bSPoul-Henning Kamp 		dumpsys(&dumper);
2559e473363SRuslan Ermilov 	dumping--;
256d39e457bSPoul-Henning Kamp }
257d39e457bSPoul-Henning Kamp 
258d07f87a2SDon Lewis static int
259d07f87a2SDon Lewis isbufbusy(struct buf *bp)
260d07f87a2SDon Lewis {
261d07f87a2SDon Lewis 	if (((bp->b_flags & (B_INVAL | B_PERSISTENT)) == 0 &&
262d638e093SAttilio Rao 	    BUF_ISLOCKED(bp)) ||
263d07f87a2SDon Lewis 	    ((bp->b_flags & (B_DELWRI | B_INVAL)) == B_DELWRI))
264d07f87a2SDon Lewis 		return (1);
265d07f87a2SDon Lewis 	return (0);
266d07f87a2SDon Lewis }
267d07f87a2SDon Lewis 
268ad4240feSJulian Elischer /*
26970ce93f4SNate Lawson  * Shutdown the system cleanly to prepare for reboot, halt, or power off.
270ad4240feSJulian Elischer  */
271*76e18b25SMarcel Moolenaar void
272*76e18b25SMarcel Moolenaar kern_reboot(int howto)
273ad4240feSJulian Elischer {
274b6915bdbSDon Lewis 	static int first_buf_printf = 1;
275ad4240feSJulian Elischer 
276f7ebc7ceSMarcel Moolenaar #if defined(SMP)
27770ce93f4SNate Lawson 	/*
27870ce93f4SNate Lawson 	 * Bind us to CPU 0 so that all shutdown code runs there.  Some
27970ce93f4SNate Lawson 	 * systems don't shutdown properly (i.e., ACPI power off) if we
28070ce93f4SNate Lawson 	 * run on another processor.
28170ce93f4SNate Lawson 	 */
282982d11f8SJeff Roberson 	thread_lock(curthread);
28320e25d7dSPeter Wemm 	sched_bind(curthread, 0);
284982d11f8SJeff Roberson 	thread_unlock(curthread);
285*76e18b25SMarcel Moolenaar 	KASSERT(PCPU_GET(cpuid) == 0, ("%s: not running on cpu 0", __func__));
28620e25d7dSPeter Wemm #endif
28736a52c3cSJeff Roberson 	/* We're in the process of rebooting. */
28836a52c3cSJeff Roberson 	rebooting = 1;
28920e25d7dSPeter Wemm 
2903e755f76SMike Smith 	/* collect extra flags that shutdown_nice might have set */
2913e755f76SMike Smith 	howto |= shutdown_howto;
2923e755f76SMike Smith 
29361e96500SJohn Baldwin 	/* We are out of the debugger now. */
2942d50560aSMarcel Moolenaar 	kdb_active = 0;
29561e96500SJohn Baldwin 
2965230cfd2SJulian Elischer 	/*
2975230cfd2SJulian Elischer 	 * Do any callouts that should be done BEFORE syncing the filesystems.
2985230cfd2SJulian Elischer 	 */
299fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_pre_sync, howto);
3005230cfd2SJulian Elischer 
3015230cfd2SJulian Elischer 	/*
3025230cfd2SJulian Elischer 	 * Now sync filesystems
3035230cfd2SJulian Elischer 	 */
304ad4240feSJulian Elischer 	if (!cold && (howto & RB_NOSYNC) == 0 && waittime < 0) {
305ad4240feSJulian Elischer 		register struct buf *bp;
30662820f25SJason Evans 		int iter, nbusy, pbusy;
3070c0b25aeSJohn Baldwin #ifndef PREEMPTION
30862820f25SJason Evans 		int subiter;
3090c0b25aeSJohn Baldwin #endif
310ad4240feSJulian Elischer 
311ad4240feSJulian Elischer 		waittime = 0;
312ad4240feSJulian Elischer 
3133fafa27bSStephan Uphoff 		sync(curthread, NULL);
314ad4240feSJulian Elischer 
315b1897c19SJulian Elischer 		/*
316b1897c19SJulian Elischer 		 * With soft updates, some buffers that are
317b1897c19SJulian Elischer 		 * written will be remarked as dirty until other
318b1897c19SJulian Elischer 		 * buffers are written.
319b1897c19SJulian Elischer 		 */
32062820f25SJason Evans 		for (iter = pbusy = 0; iter < 20; iter++) {
321ad4240feSJulian Elischer 			nbusy = 0;
322d07f87a2SDon Lewis 			for (bp = &buf[nbuf]; --bp >= buf; )
323d07f87a2SDon Lewis 				if (isbufbusy(bp))
324ad4240feSJulian Elischer 					nbusy++;
325b6915bdbSDon Lewis 			if (nbusy == 0) {
326b6915bdbSDon Lewis 				if (first_buf_printf)
32737abb77fSPoul-Henning Kamp 					printf("All buffers synced.");
328ad4240feSJulian Elischer 				break;
329b6915bdbSDon Lewis 			}
330b6915bdbSDon Lewis 			if (first_buf_printf) {
331b6915bdbSDon Lewis 				printf("Syncing disks, buffers remaining... ");
332b6915bdbSDon Lewis 				first_buf_printf = 0;
333b6915bdbSDon Lewis 			}
334ad4240feSJulian Elischer 			printf("%d ", nbusy);
33562820f25SJason Evans 			if (nbusy < pbusy)
33662820f25SJason Evans 				iter = 0;
33762820f25SJason Evans 			pbusy = nbusy;
3383fafa27bSStephan Uphoff 			sync(curthread, NULL);
3390c0b25aeSJohn Baldwin 
3400c0b25aeSJohn Baldwin #ifdef PREEMPTION
3410c0b25aeSJohn Baldwin 			/*
3420c0b25aeSJohn Baldwin 			 * Drop Giant and spin for a while to allow
3430c0b25aeSJohn Baldwin 			 * interrupt threads to run.
3440c0b25aeSJohn Baldwin 			 */
3450c0b25aeSJohn Baldwin 			DROP_GIANT();
3460c0b25aeSJohn Baldwin 			DELAY(50000 * iter);
3470c0b25aeSJohn Baldwin 			PICKUP_GIANT();
3480c0b25aeSJohn Baldwin #else
3490c0b25aeSJohn Baldwin 			/*
3500c0b25aeSJohn Baldwin 			 * Drop Giant and context switch several times to
3510c0b25aeSJohn Baldwin 			 * allow interrupt threads to run.
3520c0b25aeSJohn Baldwin 			 */
353c86b6ff5SJohn Baldwin 			DROP_GIANT();
35462820f25SJason Evans 			for (subiter = 0; subiter < 50 * iter; subiter++) {
355982d11f8SJeff Roberson 				thread_lock(curthread);
356bf0acc27SJohn Baldwin 				mi_switch(SW_VOL, NULL);
357982d11f8SJeff Roberson 				thread_unlock(curthread);
35862820f25SJason Evans 				DELAY(1000);
35962820f25SJason Evans 			}
36020cdcc5bSJohn Baldwin 			PICKUP_GIANT();
3610c0b25aeSJohn Baldwin #endif
362ad4240feSJulian Elischer 		}
363c8c216d5SNate Lawson 		printf("\n");
364d02d6d04SMike Smith 		/*
365d02d6d04SMike Smith 		 * Count only busy local buffers to prevent forcing
366d02d6d04SMike Smith 		 * a fsck if we're just a client of a wedged NFS server
367d02d6d04SMike Smith 		 */
368d02d6d04SMike Smith 		nbusy = 0;
369d02d6d04SMike Smith 		for (bp = &buf[nbuf]; --bp >= buf; ) {
370d07f87a2SDon Lewis 			if (isbufbusy(bp)) {
371c5690651SPoul-Henning Kamp #if 0
372c5690651SPoul-Henning Kamp /* XXX: This is bogus.  We should probably have a BO_REMOTE flag instead */
373f3732fd1SPoul-Henning Kamp 				if (bp->b_dev == NULL) {
3740429e37aSPoul-Henning Kamp 					TAILQ_REMOVE(&mountlist,
37567812eacSKirk McKusick 					    bp->b_vp->v_mount, mnt_list);
3769c111b31SPoul-Henning Kamp 					continue;
377dfd5dee1SPeter Wemm 				}
378c5690651SPoul-Henning Kamp #endif
3799c111b31SPoul-Henning Kamp 				nbusy++;
3809c111b31SPoul-Henning Kamp #if defined(SHOW_BUSYBUFS) || defined(DIAGNOSTIC)
3819c111b31SPoul-Henning Kamp 				printf(
382c5690651SPoul-Henning Kamp 			    "%d: bufobj:%p, flags:%0x, blkno:%ld, lblkno:%ld\n",
383c5690651SPoul-Henning Kamp 				    nbusy, bp->b_bufobj,
3849c111b31SPoul-Henning Kamp 				    bp->b_flags, (long)bp->b_blkno,
3859c111b31SPoul-Henning Kamp 				    (long)bp->b_lblkno);
3869c111b31SPoul-Henning Kamp #endif
3879c111b31SPoul-Henning Kamp 			}
388d02d6d04SMike Smith 		}
389ad4240feSJulian Elischer 		if (nbusy) {
390ad4240feSJulian Elischer 			/*
391ad4240feSJulian Elischer 			 * Failed to sync all blocks. Indicate this and don't
392ad4240feSJulian Elischer 			 * unmount filesystems (thus forcing an fsck on reboot).
393ad4240feSJulian Elischer 			 */
394b6915bdbSDon Lewis 			printf("Giving up on %d buffers\n", nbusy);
395ad4240feSJulian Elischer 			DELAY(5000000);	/* 5 seconds */
396ad4240feSJulian Elischer 		} else {
397b6915bdbSDon Lewis 			if (!first_buf_printf)
398b6915bdbSDon Lewis 				printf("Final sync complete\n");
399ad4240feSJulian Elischer 			/*
400ad4240feSJulian Elischer 			 * Unmount filesystems
401ad4240feSJulian Elischer 			 */
402ad4240feSJulian Elischer 			if (panicstr == 0)
403ad4240feSJulian Elischer 				vfs_unmountall();
404ad4240feSJulian Elischer 		}
4050909f38aSPawel Jakub Dawidek 		swapoff_all();
406ad4240feSJulian Elischer 		DELAY(100000);		/* wait for console output to finish */
407ad4240feSJulian Elischer 	}
4085230cfd2SJulian Elischer 
40972dfe7a3SPoul-Henning Kamp 	print_uptime();
41072dfe7a3SPoul-Henning Kamp 
4115230cfd2SJulian Elischer 	/*
4125230cfd2SJulian Elischer 	 * Ok, now do things that assume all filesystem activity has
4135230cfd2SJulian Elischer 	 * been completed.
4145230cfd2SJulian Elischer 	 */
415fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_post_sync, howto);
41670ce93f4SNate Lawson 
417f6449d9dSJulian Elischer 	if ((howto & (RB_HALT|RB_DUMP)) == RB_DUMP && !cold && !dumping)
418d39e457bSPoul-Henning Kamp 		doadump();
4192cfa0a03SJustin T. Gibbs 
4202cfa0a03SJustin T. Gibbs 	/* Now that we're going to really halt the system... */
421fcb893a8SMike Smith 	EVENTHANDLER_INVOKE(shutdown_final, howto);
4222cfa0a03SJustin T. Gibbs 
423fcb893a8SMike Smith 	for(;;) ;	/* safety against shutdown_reset not working */
424fcb893a8SMike Smith 	/* NOTREACHED */
425fcb893a8SMike Smith }
426fcb893a8SMike Smith 
427fcb893a8SMike Smith /*
428fcb893a8SMike Smith  * If the shutdown was a clean halt, behave accordingly.
429fcb893a8SMike Smith  */
430fcb893a8SMike Smith static void
431fcb893a8SMike Smith shutdown_halt(void *junk, int howto)
432fcb893a8SMike Smith {
433e95499bdSAlfred Perlstein 
434ad4240feSJulian Elischer 	if (howto & RB_HALT) {
435ad4240feSJulian Elischer 		printf("\n");
436ad4240feSJulian Elischer 		printf("The operating system has halted.\n");
437ad4240feSJulian Elischer 		printf("Please press any key to reboot.\n\n");
438d13d3630SJulian Elischer 		switch (cngetc()) {
439d13d3630SJulian Elischer 		case -1:		/* No console, just die */
440d13d3630SJulian Elischer 			cpu_halt();
441d13d3630SJulian Elischer 			/* NOTREACHED */
442d13d3630SJulian Elischer 		default:
4432cfa0a03SJustin T. Gibbs 			howto &= ~RB_HALT;
444d13d3630SJulian Elischer 			break;
445d13d3630SJulian Elischer 		}
446fcb893a8SMike Smith 	}
447fcb893a8SMike Smith }
448ad4240feSJulian Elischer 
449fcb893a8SMike Smith /*
450fcb893a8SMike Smith  * Check to see if the system paniced, pause and then reboot
451fcb893a8SMike Smith  * according to the specified delay.
452fcb893a8SMike Smith  */
453fcb893a8SMike Smith static void
454fcb893a8SMike Smith shutdown_panic(void *junk, int howto)
455fcb893a8SMike Smith {
456fcb893a8SMike Smith 	int loop;
457fcb893a8SMike Smith 
458fcb893a8SMike Smith 	if (howto & RB_DUMP) {
459ad4240feSJulian Elischer 		if (PANIC_REBOOT_WAIT_TIME != 0) {
460ad4240feSJulian Elischer 			if (PANIC_REBOOT_WAIT_TIME != -1) {
4612cfa0a03SJustin T. Gibbs 				printf("Automatic reboot in %d seconds - "
4622cfa0a03SJustin T. Gibbs 				       "press a key on the console to abort\n",
463ad4240feSJulian Elischer 					PANIC_REBOOT_WAIT_TIME);
4642cfa0a03SJustin T. Gibbs 				for (loop = PANIC_REBOOT_WAIT_TIME * 10;
4652cfa0a03SJustin T. Gibbs 				     loop > 0; --loop) {
466ad4240feSJulian Elischer 					DELAY(1000 * 100); /* 1/10th second */
467a7f8f2abSBruce Evans 					/* Did user type a key? */
468a7f8f2abSBruce Evans 					if (cncheckc() != -1)
469ad4240feSJulian Elischer 						break;
470ad4240feSJulian Elischer 				}
471ad4240feSJulian Elischer 				if (!loop)
472fcb893a8SMike Smith 					return;
473ad4240feSJulian Elischer 			}
474ad4240feSJulian Elischer 		} else { /* zero time specified - reboot NOW */
475fcb893a8SMike Smith 			return;
476ad4240feSJulian Elischer 		}
477422702e9SNik Clayton 		printf("--> Press a key on the console to reboot,\n");
478422702e9SNik Clayton 		printf("--> or switch off the system now.\n");
479ad4240feSJulian Elischer 		cngetc();
480ad4240feSJulian Elischer 	}
481fcb893a8SMike Smith }
482fcb893a8SMike Smith 
/*
 * shutdown_final handler that resets the machine once everything else
 * is done.
 */
static void
shutdown_reset(void *junk, int howto)
{

	printf("Rebooting...\n");
	/* Wait 1 sec for the printf's to complete and be read. */
	DELAY(1000000);

	/*
	 * On SMP, taking smp_ipi_mtx serves two purposes:
	 * - interrupts are disabled, so CPU0 cannot be preempted by fast
	 *   handlers (which would deadlock against the other CPUs);
	 * - it avoids deadlocks against smp_rendezvous() or, more
	 *   generally, against threads that busy-wait with this spinlock
	 *   held for responses from threads on other CPUs
	 *   (ie. smp_tlb_shootdown()).
	 *
	 * Without SMP only the first concern applies, so entering a
	 * spinlock section is enough.
	 */
#ifndef SMP
	spinlock_enter();
#else
	mtx_lock_spin(&smp_ipi_mtx);
#endif

	cpu_reset();
	/* NOTREACHED */ /* assuming reset worked */
}
514ad4240feSJulian Elischer 
515ad4240feSJulian Elischer /*
516ad4240feSJulian Elischer  * Panic is called on unresolvable fatal errors.  It prints "panic: mesg",
517ad4240feSJulian Elischer  * and then reboots.  If we are called twice, then we avoid trying to sync
518ad4240feSJulian Elischer  * the disks as this often leads to recursive panics.
519ad4240feSJulian Elischer  */
520ad4240feSJulian Elischer void
5219a6dc4b6SPoul-Henning Kamp panic(const char *fmt, ...)
522ad4240feSJulian Elischer {
52364dd590eSAndriy Gapon #ifdef SMP
52464dd590eSAndriy Gapon 	static volatile u_int panic_cpu = NOCPU;
52564dd590eSAndriy Gapon #endif
526fe799533SAndrew Gallatin 	struct thread *td = curthread;
527e485b64bSJohn Baldwin 	int bootopt, newpanic;
528ad4240feSJulian Elischer 	va_list ap;
52999237364SAndrey A. Chernov 	static char buf[256];
530ad4240feSJulian Elischer 
53141a4e90eSKonstantin Belousov 	critical_enter();
5320384fff8SJason Evans #ifdef SMP
5331a5333c3SJohn Baldwin 	/*
5341a5333c3SJohn Baldwin 	 * We don't want multiple CPU's to panic at the same time, so we
5350711ca46SJohn Baldwin 	 * use panic_cpu as a simple spinlock.  We have to keep checking
5360711ca46SJohn Baldwin 	 * panic_cpu if we are spinning in case the panic on the first
5371a5333c3SJohn Baldwin 	 * CPU is canceled.
5381a5333c3SJohn Baldwin 	 */
5390711ca46SJohn Baldwin 	if (panic_cpu != PCPU_GET(cpuid))
5400711ca46SJohn Baldwin 		while (atomic_cmpset_int(&panic_cpu, NOCPU,
5410711ca46SJohn Baldwin 		    PCPU_GET(cpuid)) == 0)
5420711ca46SJohn Baldwin 			while (panic_cpu != NOCPU)
5430711ca46SJohn Baldwin 				; /* nothing */
5440384fff8SJason Evans #endif
5450384fff8SJason Evans 
546ad4240feSJulian Elischer 	bootopt = RB_AUTOBOOT | RB_DUMP;
547e485b64bSJohn Baldwin 	newpanic = 0;
548ad4240feSJulian Elischer 	if (panicstr)
549ad4240feSJulian Elischer 		bootopt |= RB_NOSYNC;
550e485b64bSJohn Baldwin 	else {
551ad4240feSJulian Elischer 		panicstr = fmt;
552e485b64bSJohn Baldwin 		newpanic = 1;
553e485b64bSJohn Baldwin 	}
554ad4240feSJulian Elischer 
555ad4240feSJulian Elischer 	va_start(ap, fmt);
5564f1b4577SIan Dowse 	if (newpanic) {
5572127f260SArchie Cobbs 		(void)vsnprintf(buf, sizeof(buf), fmt, ap);
55899237364SAndrey A. Chernov 		panicstr = buf;
5599a6dc4b6SPoul-Henning Kamp 		printf("panic: %s\n", buf);
5604f1b4577SIan Dowse 	} else {
5614f1b4577SIan Dowse 		printf("panic: ");
5624f1b4577SIan Dowse 		vprintf(fmt, ap);
5639a6dc4b6SPoul-Henning Kamp 		printf("\n");
5644f1b4577SIan Dowse 	}
5654f1b4577SIan Dowse 	va_end(ap);
56647d81897SSteve Passe #ifdef SMP
56755c45354SJohn Baldwin 	printf("cpuid = %d\n", PCPU_GET(cpuid));
5682bcc63c5SJohn Baldwin #endif
569ad4240feSJulian Elischer 
5702d50560aSMarcel Moolenaar #ifdef KDB
571e485b64bSJohn Baldwin 	if (newpanic && trace_on_panic)
5722d50560aSMarcel Moolenaar 		kdb_backtrace();
573ad4240feSJulian Elischer 	if (debugger_on_panic)
5743de213ccSRobert Watson 		kdb_enter(KDB_WHY_PANIC, "panic");
5751432aa0cSJohn Baldwin #ifdef RESTARTABLE_PANICS
5761a5333c3SJohn Baldwin 	/* See if the user aborted the panic, in which case we continue. */
5771a5333c3SJohn Baldwin 	if (panicstr == NULL) {
5781a5333c3SJohn Baldwin #ifdef SMP
5790711ca46SJohn Baldwin 		atomic_store_rel_int(&panic_cpu, NOCPU);
5801a5333c3SJohn Baldwin #endif
5811a5333c3SJohn Baldwin 		return;
5821a5333c3SJohn Baldwin 	}
583ad4240feSJulian Elischer #endif
5841432aa0cSJohn Baldwin #endif
585982d11f8SJeff Roberson 	/*thread_lock(td); */
586fe799533SAndrew Gallatin 	td->td_flags |= TDF_INPANIC;
587982d11f8SJeff Roberson 	/* thread_unlock(td); */
588259ed917SPeter Wemm 	if (!sync_on_panic)
589259ed917SPeter Wemm 		bootopt |= RB_NOSYNC;
59041a4e90eSKonstantin Belousov 	critical_exit();
591*76e18b25SMarcel Moolenaar 	kern_reboot(bootopt);
592ad4240feSJulian Elischer }
593ad4240feSJulian Elischer 
594e0d898b4SJulian Elischer /*
595db82a982SMike Smith  * Support for poweroff delay.
596b22692bdSNick Hibma  *
597b22692bdSNick Hibma  * Please note that setting this delay too short might power off your machine
598b22692bdSNick Hibma  * before the write cache on your hard disk has been flushed, leading to
599b22692bdSNick Hibma  * soft-updates inconsistencies.
600db82a982SMike Smith  */
6019eec6969SMike Smith #ifndef POWEROFF_DELAY
6029eec6969SMike Smith # define POWEROFF_DELAY 5000
6039eec6969SMike Smith #endif
6049eec6969SMike Smith static int poweroff_delay = POWEROFF_DELAY;
6059eec6969SMike Smith 
606db82a982SMike Smith SYSCTL_INT(_kern_shutdown, OID_AUTO, poweroff_delay, CTLFLAG_RW,
607db82a982SMike Smith 	&poweroff_delay, 0, "");
608db82a982SMike Smith 
609fcb893a8SMike Smith static void
610fcb893a8SMike Smith poweroff_wait(void *junk, int howto)
611db82a982SMike Smith {
612e95499bdSAlfred Perlstein 
613db82a982SMike Smith 	if (!(howto & RB_POWEROFF) || poweroff_delay <= 0)
614db82a982SMike Smith 		return;
615db82a982SMike Smith 	DELAY(poweroff_delay * 1000);
616db82a982SMike Smith }
6175e950839SLuoqi Chen 
6185e950839SLuoqi Chen /*
6195e950839SLuoqi Chen  * Some system processes (e.g. syncer) need to be stopped at appropriate
6205e950839SLuoqi Chen  * points in their main loops prior to a system shutdown, so that they
6215e950839SLuoqi Chen  * won't interfere with the shutdown process (e.g. by holding a disk buf
6225e950839SLuoqi Chen  * to cause sync to fail).  For each of these system processes, register
6235e950839SLuoqi Chen  * shutdown_kproc() as a handler for one of shutdown events.
6245e950839SLuoqi Chen  */
6255e950839SLuoqi Chen static int kproc_shutdown_wait = 60;
6265e950839SLuoqi Chen SYSCTL_INT(_kern_shutdown, OID_AUTO, kproc_shutdown_wait, CTLFLAG_RW,
6275e950839SLuoqi Chen     &kproc_shutdown_wait, 0, "");
6285e950839SLuoqi Chen 
6295e950839SLuoqi Chen void
630ffc831daSJohn Baldwin kproc_shutdown(void *arg, int howto)
6315e950839SLuoqi Chen {
6325e950839SLuoqi Chen 	struct proc *p;
6335e950839SLuoqi Chen 	int error;
6345e950839SLuoqi Chen 
6355e950839SLuoqi Chen 	if (panicstr)
6365e950839SLuoqi Chen 		return;
6375e950839SLuoqi Chen 
6385e950839SLuoqi Chen 	p = (struct proc *)arg;
639b1c81391SNate Lawson 	printf("Waiting (max %d seconds) for system process `%s' to stop...",
6404f9d48e4SJohn Baldwin 	    kproc_shutdown_wait, p->p_comm);
6413745c395SJulian Elischer 	error = kproc_suspend(p, kproc_shutdown_wait * hz);
6425e950839SLuoqi Chen 
6435e950839SLuoqi Chen 	if (error == EWOULDBLOCK)
644b1c81391SNate Lawson 		printf("timed out\n");
6455e950839SLuoqi Chen 	else
646b1c81391SNate Lawson 		printf("done\n");
6475e950839SLuoqi Chen }
64881661c94SPoul-Henning Kamp 
6497ab24ea3SJulian Elischer void
6507ab24ea3SJulian Elischer kthread_shutdown(void *arg, int howto)
6517ab24ea3SJulian Elischer {
6527ab24ea3SJulian Elischer 	struct thread *td;
6537ab24ea3SJulian Elischer 	int error;
6547ab24ea3SJulian Elischer 
6557ab24ea3SJulian Elischer 	if (panicstr)
6567ab24ea3SJulian Elischer 		return;
6577ab24ea3SJulian Elischer 
6587ab24ea3SJulian Elischer 	td = (struct thread *)arg;
6597ab24ea3SJulian Elischer 	printf("Waiting (max %d seconds) for system thread `%s' to stop...",
6604f9d48e4SJohn Baldwin 	    kproc_shutdown_wait, td->td_name);
6617ab24ea3SJulian Elischer 	error = kthread_suspend(td, kproc_shutdown_wait * hz);
6627ab24ea3SJulian Elischer 
6637ab24ea3SJulian Elischer 	if (error == EWOULDBLOCK)
6647ab24ea3SJulian Elischer 		printf("timed out\n");
6657ab24ea3SJulian Elischer 	else
6667ab24ea3SJulian Elischer 		printf("done\n");
6677ab24ea3SJulian Elischer }
6687ab24ea3SJulian Elischer 
66981661c94SPoul-Henning Kamp /* Registration of dumpers */
67081661c94SPoul-Henning Kamp int
67181661c94SPoul-Henning Kamp set_dumper(struct dumperinfo *di)
67281661c94SPoul-Henning Kamp {
673e95499bdSAlfred Perlstein 
67481661c94SPoul-Henning Kamp 	if (di == NULL) {
67581661c94SPoul-Henning Kamp 		bzero(&dumper, sizeof dumper);
67681661c94SPoul-Henning Kamp 		return (0);
67781661c94SPoul-Henning Kamp 	}
67881661c94SPoul-Henning Kamp 	if (dumper.dumper != NULL)
67981661c94SPoul-Henning Kamp 		return (EBUSY);
68081661c94SPoul-Henning Kamp 	dumper = *di;
68181661c94SPoul-Henning Kamp 	return (0);
68281661c94SPoul-Henning Kamp }
68381661c94SPoul-Henning Kamp 
684007b1b7bSRuslan Ermilov /* Call dumper with bounds checking. */
685007b1b7bSRuslan Ermilov int
686007b1b7bSRuslan Ermilov dump_write(struct dumperinfo *di, void *virtual, vm_offset_t physical,
687007b1b7bSRuslan Ermilov     off_t offset, size_t length)
688007b1b7bSRuslan Ermilov {
689007b1b7bSRuslan Ermilov 
690007b1b7bSRuslan Ermilov 	if (length != 0 && (offset < di->mediaoffset ||
691007b1b7bSRuslan Ermilov 	    offset - di->mediaoffset + length > di->mediasize)) {
692007b1b7bSRuslan Ermilov 		printf("Attempt to write outside dump device boundaries.\n");
693007b1b7bSRuslan Ermilov 		return (ENXIO);
694007b1b7bSRuslan Ermilov 	}
695007b1b7bSRuslan Ermilov 	return (di->dumper(di->priv, virtual, physical, offset, length));
696007b1b7bSRuslan Ermilov }
697007b1b7bSRuslan Ermilov 
698e6592ee5SPeter Wemm void
699e6592ee5SPeter Wemm mkdumpheader(struct kerneldumpheader *kdh, char *magic, uint32_t archver,
700e6592ee5SPeter Wemm     uint64_t dumplen, uint32_t blksz)
701e6592ee5SPeter Wemm {
702e6592ee5SPeter Wemm 
703e6592ee5SPeter Wemm 	bzero(kdh, sizeof(*kdh));
704e6592ee5SPeter Wemm 	strncpy(kdh->magic, magic, sizeof(kdh->magic));
705e6592ee5SPeter Wemm 	strncpy(kdh->architecture, MACHINE_ARCH, sizeof(kdh->architecture));
706e6592ee5SPeter Wemm 	kdh->version = htod32(KERNELDUMPVERSION);
707e6592ee5SPeter Wemm 	kdh->architectureversion = htod32(archver);
708e6592ee5SPeter Wemm 	kdh->dumplength = htod64(dumplen);
709e6592ee5SPeter Wemm 	kdh->dumptime = htod64(time_second);
710e6592ee5SPeter Wemm 	kdh->blocksize = htod32(blksz);
711c1f19219SJamie Gritton 	strncpy(kdh->hostname, prison0.pr_hostname, sizeof(kdh->hostname));
712e6592ee5SPeter Wemm 	strncpy(kdh->versionstring, version, sizeof(kdh->versionstring));
713e6592ee5SPeter Wemm 	if (panicstr != NULL)
714e6592ee5SPeter Wemm 		strncpy(kdh->panicstring, panicstr, sizeof(kdh->panicstring));
715e6592ee5SPeter Wemm 	kdh->parity = kerneldump_parity(kdh);
716e6592ee5SPeter Wemm }
717