xref: /freebsd/sys/kern/kern_clock.c (revision 7628402b070ca215943a3b78586764d5a07bdc5d)
1df8bae1dSRodney W. Grimes /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1982, 1986, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  * (c) UNIX System Laboratories, Inc.
5df8bae1dSRodney W. Grimes  * All or some portions of this file are derived from material licensed
6df8bae1dSRodney W. Grimes  * to the University of California by American Telephone and Telegraph
7df8bae1dSRodney W. Grimes  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
8df8bae1dSRodney W. Grimes  * the permission of UNIX System Laboratories, Inc.
9df8bae1dSRodney W. Grimes  *
10df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
11df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
12df8bae1dSRodney W. Grimes  * are met:
13df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
14df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
15df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
16df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
17df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
18df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
19df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
20df8bae1dSRodney W. Grimes  *    without specific prior written permission.
21df8bae1dSRodney W. Grimes  *
22df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
33df8bae1dSRodney W. Grimes  *
34df8bae1dSRodney W. Grimes  *	@(#)kern_clock.c	8.5 (Berkeley) 1/21/94
35df8bae1dSRodney W. Grimes  */
36df8bae1dSRodney W. Grimes 
37677b542eSDavid E. O'Brien #include <sys/cdefs.h>
38677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
39677b542eSDavid E. O'Brien 
40911d16b8SEd Maste #include "opt_kdb.h"
41f0796cd2SGleb Smirnoff #include "opt_device_polling.h"
424da0d332SPeter Wemm #include "opt_hwpmc_hooks.h"
4332c20357SPoul-Henning Kamp #include "opt_ntp.h"
44370c3cb5SSean Kelly #include "opt_watchdog.h"
4532c20357SPoul-Henning Kamp 
46df8bae1dSRodney W. Grimes #include <sys/param.h>
47df8bae1dSRodney W. Grimes #include <sys/systm.h>
48df8bae1dSRodney W. Grimes #include <sys/callout.h>
492d50560aSMarcel Moolenaar #include <sys/kdb.h>
50df8bae1dSRodney W. Grimes #include <sys/kernel.h>
51f34fa851SJohn Baldwin #include <sys/lock.h>
5261d80e90SJohn Baldwin #include <sys/ktr.h>
5335e0e5b3SJohn Baldwin #include <sys/mutex.h>
54df8bae1dSRodney W. Grimes #include <sys/proc.h>
55e4625663SJeff Roberson #include <sys/resource.h>
56df8bae1dSRodney W. Grimes #include <sys/resourcevar.h>
57b43179fbSJeff Roberson #include <sys/sched.h>
58797f2d22SPoul-Henning Kamp #include <sys/signalvar.h>
596caa8a15SJohn Baldwin #include <sys/smp.h>
608a129caeSDavid Greenman #include <vm/vm.h>
61efeaf95aSDavid Greenman #include <vm/pmap.h>
62efeaf95aSDavid Greenman #include <vm/vm_map.h>
63797f2d22SPoul-Henning Kamp #include <sys/sysctl.h>
648088699fSJohn Baldwin #include <sys/bus.h>
658088699fSJohn Baldwin #include <sys/interrupt.h>
66104a9b7eSAlexander Kabaev #include <sys/limits.h>
67e7fa55afSPoul-Henning Kamp #include <sys/timetc.h>
68df8bae1dSRodney W. Grimes 
69df8bae1dSRodney W. Grimes #ifdef GPROF
70df8bae1dSRodney W. Grimes #include <sys/gmon.h>
71df8bae1dSRodney W. Grimes #endif
72df8bae1dSRodney W. Grimes 
7336c0fd9dSJoseph Koshy #ifdef HWPMC_HOOKS
7436c0fd9dSJoseph Koshy #include <sys/pmckern.h>
7536c0fd9dSJoseph Koshy #endif
7636c0fd9dSJoseph Koshy 
77e4fc250cSLuigi Rizzo #ifdef DEVICE_POLLING
78e4fc250cSLuigi Rizzo extern void hardclock_device_poll(void);
79e4fc250cSLuigi Rizzo #endif /* DEVICE_POLLING */
80eae8fc2cSSteve Passe 
814d77a549SAlfred Perlstein static void initclocks(void *dummy);
822b14f991SJulian Elischer SYSINIT(clocks, SI_SUB_CLOCKS, SI_ORDER_FIRST, initclocks, NULL)
832b14f991SJulian Elischer 
848b98fec9SJeff Roberson /* Spin-lock protecting profiling statistics. */
8586a49deaSAttilio Rao static struct mtx time_lock;
868b98fec9SJeff Roberson 
8762919d78SPeter Wemm static int
8862919d78SPeter Wemm sysctl_kern_cp_time(SYSCTL_HANDLER_ARGS)
8962919d78SPeter Wemm {
9062919d78SPeter Wemm 	int error;
917628402bSPeter Wemm 	long cp_time[CPUSTATES];
92cff2e749SPaul Saab #ifdef SCTL_MASK32
9362919d78SPeter Wemm 	int i;
9462919d78SPeter Wemm 	unsigned int cp_time32[CPUSTATES];
957628402bSPeter Wemm #endif
9662919d78SPeter Wemm 
977628402bSPeter Wemm 	read_cpu_time(cp_time);
987628402bSPeter Wemm #ifdef SCTL_MASK32
99cff2e749SPaul Saab 	if (req->flags & SCTL_MASK32) {
10062919d78SPeter Wemm 		if (!req->oldptr)
10162919d78SPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(cp_time32));
10262919d78SPeter Wemm 		for (i = 0; i < CPUSTATES; i++)
10362919d78SPeter Wemm 			cp_time32[i] = (unsigned int)cp_time[i];
10462919d78SPeter Wemm 		error = SYSCTL_OUT(req, cp_time32, sizeof(cp_time32));
10562919d78SPeter Wemm 	} else
10662919d78SPeter Wemm #endif
10762919d78SPeter Wemm 	{
10862919d78SPeter Wemm 		if (!req->oldptr)
10962919d78SPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(cp_time));
11062919d78SPeter Wemm 		error = SYSCTL_OUT(req, cp_time, sizeof(cp_time));
11162919d78SPeter Wemm 	}
11262919d78SPeter Wemm 	return error;
11362919d78SPeter Wemm }
11462919d78SPeter Wemm 
11562919d78SPeter Wemm SYSCTL_PROC(_kern, OID_AUTO, cp_time, CTLTYPE_LONG|CTLFLAG_RD,
11662919d78SPeter Wemm     0,0, sysctl_kern_cp_time, "LU", "CPU time statistics");
1177f112b04SRobert Watson 
1187628402bSPeter Wemm static long empty[CPUSTATES];
1197628402bSPeter Wemm 
1207628402bSPeter Wemm static int
1217628402bSPeter Wemm sysctl_kern_cp_times(SYSCTL_HANDLER_ARGS)
1227628402bSPeter Wemm {
1237628402bSPeter Wemm 	struct pcpu *pcpu;
1247628402bSPeter Wemm 	int error;
1257628402bSPeter Wemm 	int i, c;
1267628402bSPeter Wemm 	long *cp_time;
1277628402bSPeter Wemm #ifdef SCTL_MASK32
1287628402bSPeter Wemm 	unsigned int cp_time32[CPUSTATES];
1297628402bSPeter Wemm #endif
1307628402bSPeter Wemm 
1317628402bSPeter Wemm 	if (!req->oldptr) {
1327628402bSPeter Wemm #ifdef SCTL_MASK32
1337628402bSPeter Wemm 		if (req->flags & SCTL_MASK32)
1347628402bSPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(cp_time32) * (mp_maxid + 1));
1357628402bSPeter Wemm 		else
1367628402bSPeter Wemm #endif
1377628402bSPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(long) * CPUSTATES * (mp_maxid + 1));
1387628402bSPeter Wemm 	}
1397628402bSPeter Wemm 	for (error = 0, c = 0; error == 0 && c <= mp_maxid; c++) {
1407628402bSPeter Wemm 		if (!CPU_ABSENT(c)) {
1417628402bSPeter Wemm 			pcpu = pcpu_find(c);
1427628402bSPeter Wemm 			cp_time = pcpu->pc_cp_time;
1437628402bSPeter Wemm 		} else {
1447628402bSPeter Wemm 			cp_time = empty;
1457628402bSPeter Wemm 		}
1467628402bSPeter Wemm #ifdef SCTL_MASK32
1477628402bSPeter Wemm 		if (req->flags & SCTL_MASK32) {
1487628402bSPeter Wemm 			for (i = 0; i < CPUSTATES; i++)
1497628402bSPeter Wemm 				cp_time32[i] = (unsigned int)cp_time[i];
1507628402bSPeter Wemm 			error = SYSCTL_OUT(req, cp_time32, sizeof(cp_time32));
1517628402bSPeter Wemm 		} else
1527628402bSPeter Wemm #endif
1537628402bSPeter Wemm 			error = SYSCTL_OUT(req, cp_time, sizeof(long) * CPUSTATES);
1547628402bSPeter Wemm 	}
1557628402bSPeter Wemm 	return error;
1567628402bSPeter Wemm }
1577628402bSPeter Wemm 
1587628402bSPeter Wemm SYSCTL_PROC(_kern, OID_AUTO, cp_times, CTLTYPE_LONG|CTLFLAG_RD,
1597628402bSPeter Wemm     0,0, sysctl_kern_cp_times, "LU", "per-CPU time statistics");
1607628402bSPeter Wemm 
1617628402bSPeter Wemm void
1627628402bSPeter Wemm read_cpu_time(long *cp_time)
1637628402bSPeter Wemm {
1647628402bSPeter Wemm 	struct pcpu *pc;
1657628402bSPeter Wemm 	int i, j;
1667628402bSPeter Wemm 
1677628402bSPeter Wemm 	/* Sum up global cp_time[]. */
1687628402bSPeter Wemm 	bzero(cp_time, sizeof(long) * CPUSTATES);
1697628402bSPeter Wemm 	for (i = 0; i <= mp_maxid; i++) {
1707628402bSPeter Wemm 		if (CPU_ABSENT(i))
1717628402bSPeter Wemm 			continue;
1727628402bSPeter Wemm 		pc = pcpu_find(i);
1737628402bSPeter Wemm 		for (j = 0; j < CPUSTATES; j++)
1747628402bSPeter Wemm 			cp_time[j] += pc->pc_cp_time[j];
1757628402bSPeter Wemm 	}
1767628402bSPeter Wemm }
1777628402bSPeter Wemm 
#ifdef SW_WATCHDOG
#include <sys/watchdog.h>

/* Ticks left before the software watchdog fires; counted down in hardclock(). */
static int watchdog_ticks;
/* Non-zero while the software watchdog is armed. */
static int watchdog_enabled;
static void watchdog_fire(void);
static void watchdog_config(void *, u_int, int *);
#endif /* SW_WATCHDOG */
186370c3cb5SSean Kelly 
1873bac064fSPoul-Henning Kamp /*
188df8bae1dSRodney W. Grimes  * Clock handling routines.
189df8bae1dSRodney W. Grimes  *
190b05dcf3cSPoul-Henning Kamp  * This code is written to operate with two timers that run independently of
191b05dcf3cSPoul-Henning Kamp  * each other.
1927ec73f64SPoul-Henning Kamp  *
193b05dcf3cSPoul-Henning Kamp  * The main timer, running hz times per second, is used to trigger interval
194b05dcf3cSPoul-Henning Kamp  * timers, timeouts and rescheduling as needed.
1957ec73f64SPoul-Henning Kamp  *
196b05dcf3cSPoul-Henning Kamp  * The second timer handles kernel and user profiling,
197b05dcf3cSPoul-Henning Kamp  * and does resource use estimation.  If the second timer is programmable,
198b05dcf3cSPoul-Henning Kamp  * it is randomized to avoid aliasing between the two clocks.  For example,
199b05dcf3cSPoul-Henning Kamp  * the randomization prevents an adversary from always giving up the cpu
200df8bae1dSRodney W. Grimes  * just before its quantum expires.  Otherwise, it would never accumulate
201df8bae1dSRodney W. Grimes  * cpu ticks.  The mean frequency of the second timer is stathz.
202b05dcf3cSPoul-Henning Kamp  *
203b05dcf3cSPoul-Henning Kamp  * If no second timer exists, stathz will be zero; in this case we drive
204b05dcf3cSPoul-Henning Kamp  * profiling and statistics off the main clock.  This WILL NOT be accurate;
205b05dcf3cSPoul-Henning Kamp  * do not do it unless absolutely necessary.
206b05dcf3cSPoul-Henning Kamp  *
207df8bae1dSRodney W. Grimes  * The statistics clock may (or may not) be run at a higher rate while
208b05dcf3cSPoul-Henning Kamp  * profiling.  This profile clock runs at profhz.  We require that profhz
209b05dcf3cSPoul-Henning Kamp  * be an integral multiple of stathz.
210b05dcf3cSPoul-Henning Kamp  *
211b05dcf3cSPoul-Henning Kamp  * If the statistics clock is running fast, it must be divided by the ratio
212b05dcf3cSPoul-Henning Kamp  * profhz/stathz for statistics.  (For profiling, every tick counts.)
213df8bae1dSRodney W. Grimes  *
2147ec73f64SPoul-Henning Kamp  * Time-of-day is maintained using a "timecounter", which may or may
2157ec73f64SPoul-Henning Kamp  * not be related to the hardware generating the above mentioned
2167ec73f64SPoul-Henning Kamp  * interrupts.
217df8bae1dSRodney W. Grimes  */
218df8bae1dSRodney W. Grimes 
int	stathz;		/* mean statistics clock frequency; 0 if no second timer */
int	profhz;		/* profiling clock frequency */
int	profprocs;	/* number of processes with the profile clock started */
int	ticks;		/* incremented once per hardclock() call */
int	psratio;	/* profhz divided by the statistics frequency */
224df8bae1dSRodney W. Grimes 
225df8bae1dSRodney W. Grimes /*
226df8bae1dSRodney W. Grimes  * Initialize clock frequencies and start both clocks running.
227df8bae1dSRodney W. Grimes  */
2282b14f991SJulian Elischer /* ARGSUSED*/
2292b14f991SJulian Elischer static void
230d841aaa7SBruce Evans initclocks(dummy)
231d841aaa7SBruce Evans 	void *dummy;
232df8bae1dSRodney W. Grimes {
233df8bae1dSRodney W. Grimes 	register int i;
234df8bae1dSRodney W. Grimes 
235df8bae1dSRodney W. Grimes 	/*
236df8bae1dSRodney W. Grimes 	 * Set divisors to 1 (normal case) and let the machine-specific
237df8bae1dSRodney W. Grimes 	 * code do its bit.
238df8bae1dSRodney W. Grimes 	 */
2398b98fec9SJeff Roberson 	mtx_init(&time_lock, "time lock", NULL, MTX_SPIN);
24063d69d25SRobert Watson 	cpu_initclocks();
241df8bae1dSRodney W. Grimes 
242df8bae1dSRodney W. Grimes 	/*
243df8bae1dSRodney W. Grimes 	 * Compute profhz/stathz, and fix profhz if needed.
244df8bae1dSRodney W. Grimes 	 */
245df8bae1dSRodney W. Grimes 	i = stathz ? stathz : hz;
246df8bae1dSRodney W. Grimes 	if (profhz == 0)
247df8bae1dSRodney W. Grimes 		profhz = i;
248df8bae1dSRodney W. Grimes 	psratio = profhz / i;
2494103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG
2504103b765SPoul-Henning Kamp 	EVENTHANDLER_REGISTER(watchdog_list, watchdog_config, NULL, 0);
2514103b765SPoul-Henning Kamp #endif
252df8bae1dSRodney W. Grimes }
253df8bae1dSRodney W. Grimes 
254df8bae1dSRodney W. Grimes /*
255238dd320SJake Burkholder  * Each time the real-time timer fires, this function is called on all CPUs.
256b439e431SJohn Baldwin  * Note that hardclock() calls hardclock_cpu() for the boot CPU, so only
257238dd320SJake Burkholder  * the other CPUs in the system need to call this function.
2586caa8a15SJohn Baldwin  */
2596caa8a15SJohn Baldwin void
260b439e431SJohn Baldwin hardclock_cpu(int usermode)
2616caa8a15SJohn Baldwin {
2626caa8a15SJohn Baldwin 	struct pstats *pstats;
263238dd320SJake Burkholder 	struct thread *td = curthread;
264b40ce416SJulian Elischer 	struct proc *p = td->td_proc;
265b61ce5b0SJeff Roberson 	int flags;
2666caa8a15SJohn Baldwin 
2676caa8a15SJohn Baldwin 	/*
2686caa8a15SJohn Baldwin 	 * Run current process's virtual and profile time, as needed.
2696caa8a15SJohn Baldwin 	 */
270ad1e7d28SJulian Elischer 	pstats = p->p_stats;
271b61ce5b0SJeff Roberson 	flags = 0;
272ad1e7d28SJulian Elischer 	if (usermode &&
27340acdeabSJeff Roberson 	    timevalisset(&pstats->p_timer[ITIMER_VIRTUAL].it_value)) {
27440acdeabSJeff Roberson 		PROC_SLOCK(p);
275b61ce5b0SJeff Roberson 		if (itimerdecr(&pstats->p_timer[ITIMER_VIRTUAL], tick) == 0)
276b61ce5b0SJeff Roberson 			flags |= TDF_ALRMPEND | TDF_ASTPENDING;
27740acdeabSJeff Roberson 		PROC_SUNLOCK(p);
27840acdeabSJeff Roberson 	}
27940acdeabSJeff Roberson 	if (timevalisset(&pstats->p_timer[ITIMER_PROF].it_value)) {
28040acdeabSJeff Roberson 		PROC_SLOCK(p);
281b61ce5b0SJeff Roberson 		if (itimerdecr(&pstats->p_timer[ITIMER_PROF], tick) == 0)
282b61ce5b0SJeff Roberson 			flags |= TDF_PROFPEND | TDF_ASTPENDING;
28340acdeabSJeff Roberson 		PROC_SUNLOCK(p);
28440acdeabSJeff Roberson 	}
28540acdeabSJeff Roberson 	thread_lock(td);
28640acdeabSJeff Roberson 	sched_tick();
287b61ce5b0SJeff Roberson 	td->td_flags |= flags;
28840acdeabSJeff Roberson 	thread_unlock(td);
28936c0fd9dSJoseph Koshy 
29036c0fd9dSJoseph Koshy #ifdef	HWPMC_HOOKS
29136c0fd9dSJoseph Koshy 	if (PMC_CPU_HAS_SAMPLES(PCPU_GET(cpuid)))
29236c0fd9dSJoseph Koshy 		PMC_CALL_HOOK_UNLOCKED(curthread, PMC_FN_DO_SAMPLES, NULL);
29336c0fd9dSJoseph Koshy #endif
2946caa8a15SJohn Baldwin }
2956caa8a15SJohn Baldwin 
2966caa8a15SJohn Baldwin /*
297df8bae1dSRodney W. Grimes  * The real-time timer, interrupting hz times per second.
298df8bae1dSRodney W. Grimes  */
299df8bae1dSRodney W. Grimes void
300b439e431SJohn Baldwin hardclock(int usermode, uintfptr_t pc)
301df8bae1dSRodney W. Grimes {
302fa2fbc3dSJake Burkholder 	int need_softclock = 0;
303df8bae1dSRodney W. Grimes 
304b439e431SJohn Baldwin 	hardclock_cpu(usermode);
305b05dcf3cSPoul-Henning Kamp 
306e7fa55afSPoul-Henning Kamp 	tc_ticktock();
307df8bae1dSRodney W. Grimes 	/*
308df8bae1dSRodney W. Grimes 	 * If no separate statistics clock is available, run it from here.
3096caa8a15SJohn Baldwin 	 *
3106caa8a15SJohn Baldwin 	 * XXX: this only works for UP
311df8bae1dSRodney W. Grimes 	 */
312238dd320SJake Burkholder 	if (stathz == 0) {
313b439e431SJohn Baldwin 		profclock(usermode, pc);
314b439e431SJohn Baldwin 		statclock(usermode);
315238dd320SJake Burkholder 	}
316df8bae1dSRodney W. Grimes 
317e4fc250cSLuigi Rizzo #ifdef DEVICE_POLLING
318daccb638SLuigi Rizzo 	hardclock_device_poll();	/* this is very short and quick */
319e4fc250cSLuigi Rizzo #endif /* DEVICE_POLLING */
3203f31c649SGarrett Wollman 
321b05dcf3cSPoul-Henning Kamp 	/*
322b05dcf3cSPoul-Henning Kamp 	 * Process callouts at a very low cpu priority, so we don't keep the
323b05dcf3cSPoul-Henning Kamp 	 * relatively high clock interrupt priority any longer than necessary.
324b05dcf3cSPoul-Henning Kamp 	 */
32521a7a9aeSJohn Baldwin 	mtx_lock_spin_flags(&callout_lock, MTX_QUIET);
326fa2fbc3dSJake Burkholder 	ticks++;
3276ad26d83SXin LI 	if (!TAILQ_EMPTY(&callwheel[ticks & callwheelmask])) {
328fa2fbc3dSJake Burkholder 		need_softclock = 1;
329b05dcf3cSPoul-Henning Kamp 	} else if (softticks + 1 == ticks)
330b05dcf3cSPoul-Henning Kamp 		++softticks;
33121a7a9aeSJohn Baldwin 	mtx_unlock_spin_flags(&callout_lock, MTX_QUIET);
332fa2fbc3dSJake Burkholder 
333fa2fbc3dSJake Burkholder 	/*
33440acdeabSJeff Roberson 	 * swi_sched acquires the thread lock, so we don't want to call it
33540acdeabSJeff Roberson 	 * with callout_lock held; incorrect locking order.
336fa2fbc3dSJake Burkholder 	 */
337fa2fbc3dSJake Burkholder 	if (need_softclock)
338c86b6ff5SJohn Baldwin 		swi_sched(softclock_ih, 0);
339370c3cb5SSean Kelly 
3404103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG
3414103b765SPoul-Henning Kamp 	if (watchdog_enabled > 0 && --watchdog_ticks <= 0)
342370c3cb5SSean Kelly 		watchdog_fire();
3434103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */
344ab36c067SJustin T. Gibbs }
345ab36c067SJustin T. Gibbs 
346df8bae1dSRodney W. Grimes /*
347227ee8a1SPoul-Henning Kamp  * Compute number of ticks in the specified amount of time.
348df8bae1dSRodney W. Grimes  */
349df8bae1dSRodney W. Grimes int
350227ee8a1SPoul-Henning Kamp tvtohz(tv)
351df8bae1dSRodney W. Grimes 	struct timeval *tv;
352df8bae1dSRodney W. Grimes {
3536976af69SBruce Evans 	register unsigned long ticks;
3546976af69SBruce Evans 	register long sec, usec;
355df8bae1dSRodney W. Grimes 
356df8bae1dSRodney W. Grimes 	/*
3576976af69SBruce Evans 	 * If the number of usecs in the whole seconds part of the time
3586976af69SBruce Evans 	 * difference fits in a long, then the total number of usecs will
3596976af69SBruce Evans 	 * fit in an unsigned long.  Compute the total and convert it to
3606976af69SBruce Evans 	 * ticks, rounding up and adding 1 to allow for the current tick
3616976af69SBruce Evans 	 * to expire.  Rounding also depends on unsigned long arithmetic
3626976af69SBruce Evans 	 * to avoid overflow.
363df8bae1dSRodney W. Grimes 	 *
3646976af69SBruce Evans 	 * Otherwise, if the number of ticks in the whole seconds part of
3656976af69SBruce Evans 	 * the time difference fits in a long, then convert the parts to
3666976af69SBruce Evans 	 * ticks separately and add, using similar rounding methods and
3676976af69SBruce Evans 	 * overflow avoidance.  This method would work in the previous
3686976af69SBruce Evans 	 * case but it is slightly slower and assumes that hz is integral.
3696976af69SBruce Evans 	 *
3706976af69SBruce Evans 	 * Otherwise, round the time difference down to the maximum
3716976af69SBruce Evans 	 * representable value.
3726976af69SBruce Evans 	 *
3736976af69SBruce Evans 	 * If ints have 32 bits, then the maximum value for any timeout in
3746976af69SBruce Evans 	 * 10ms ticks is 248 days.
375df8bae1dSRodney W. Grimes 	 */
376227ee8a1SPoul-Henning Kamp 	sec = tv->tv_sec;
377227ee8a1SPoul-Henning Kamp 	usec = tv->tv_usec;
3786976af69SBruce Evans 	if (usec < 0) {
3796976af69SBruce Evans 		sec--;
3806976af69SBruce Evans 		usec += 1000000;
3816976af69SBruce Evans 	}
3826976af69SBruce Evans 	if (sec < 0) {
3836976af69SBruce Evans #ifdef DIAGNOSTIC
384b05dcf3cSPoul-Henning Kamp 		if (usec > 0) {
3857ec73f64SPoul-Henning Kamp 			sec++;
3867ec73f64SPoul-Henning Kamp 			usec -= 1000000;
3877ec73f64SPoul-Henning Kamp 		}
388227ee8a1SPoul-Henning Kamp 		printf("tvotohz: negative time difference %ld sec %ld usec\n",
3896976af69SBruce Evans 		       sec, usec);
3906976af69SBruce Evans #endif
3916976af69SBruce Evans 		ticks = 1;
3926976af69SBruce Evans 	} else if (sec <= LONG_MAX / 1000000)
3936976af69SBruce Evans 		ticks = (sec * 1000000 + (unsigned long)usec + (tick - 1))
3946976af69SBruce Evans 			/ tick + 1;
3956976af69SBruce Evans 	else if (sec <= LONG_MAX / hz)
3966976af69SBruce Evans 		ticks = sec * hz
3976976af69SBruce Evans 			+ ((unsigned long)usec + (tick - 1)) / tick + 1;
3986976af69SBruce Evans 	else
3996976af69SBruce Evans 		ticks = LONG_MAX;
4006976af69SBruce Evans 	if (ticks > INT_MAX)
4016976af69SBruce Evans 		ticks = INT_MAX;
402d6116663SAlexander Langer 	return ((int)ticks);
403df8bae1dSRodney W. Grimes }
404df8bae1dSRodney W. Grimes 
405df8bae1dSRodney W. Grimes /*
406df8bae1dSRodney W. Grimes  * Start profiling on a process.
407df8bae1dSRodney W. Grimes  *
408df8bae1dSRodney W. Grimes  * Kernel profiling passes proc0 which never exits and hence
409df8bae1dSRodney W. Grimes  * keeps the profile clock running constantly.
410df8bae1dSRodney W. Grimes  */
411df8bae1dSRodney W. Grimes void
412df8bae1dSRodney W. Grimes startprofclock(p)
413df8bae1dSRodney W. Grimes 	register struct proc *p;
414df8bae1dSRodney W. Grimes {
415df8bae1dSRodney W. Grimes 
4169752f794SJohn Baldwin 	PROC_LOCK_ASSERT(p, MA_OWNED);
4179752f794SJohn Baldwin 	if (p->p_flag & P_STOPPROF)
418a282253aSJulian Elischer 		return;
4199752f794SJohn Baldwin 	if ((p->p_flag & P_PROFIL) == 0) {
4209752f794SJohn Baldwin 		p->p_flag |= P_PROFIL;
4218b98fec9SJeff Roberson 		mtx_lock_spin(&time_lock);
422238dd320SJake Burkholder 		if (++profprocs == 1)
423238dd320SJake Burkholder 			cpu_startprofclock();
4248b98fec9SJeff Roberson 		mtx_unlock_spin(&time_lock);
425df8bae1dSRodney W. Grimes 	}
4269752f794SJohn Baldwin }
427df8bae1dSRodney W. Grimes 
428df8bae1dSRodney W. Grimes /*
429df8bae1dSRodney W. Grimes  * Stop profiling on a process.
430df8bae1dSRodney W. Grimes  */
431df8bae1dSRodney W. Grimes void
432df8bae1dSRodney W. Grimes stopprofclock(p)
433df8bae1dSRodney W. Grimes 	register struct proc *p;
434df8bae1dSRodney W. Grimes {
435df8bae1dSRodney W. Grimes 
436a282253aSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
4379752f794SJohn Baldwin 	if (p->p_flag & P_PROFIL) {
4389752f794SJohn Baldwin 		if (p->p_profthreads != 0) {
4399752f794SJohn Baldwin 			p->p_flag |= P_STOPPROF;
4409752f794SJohn Baldwin 			while (p->p_profthreads != 0)
441a282253aSJulian Elischer 				msleep(&p->p_profthreads, &p->p_mtx, PPAUSE,
442a89ec05eSPeter Wemm 				    "stopprof", 0);
4439752f794SJohn Baldwin 			p->p_flag &= ~P_STOPPROF;
444a282253aSJulian Elischer 		}
445b62b2304SColin Percival 		if ((p->p_flag & P_PROFIL) == 0)
446b62b2304SColin Percival 			return;
4479752f794SJohn Baldwin 		p->p_flag &= ~P_PROFIL;
4488b98fec9SJeff Roberson 		mtx_lock_spin(&time_lock);
449238dd320SJake Burkholder 		if (--profprocs == 0)
450238dd320SJake Burkholder 			cpu_stopprofclock();
4518b98fec9SJeff Roberson 		mtx_unlock_spin(&time_lock);
452df8bae1dSRodney W. Grimes 	}
4539752f794SJohn Baldwin }
454df8bae1dSRodney W. Grimes 
455df8bae1dSRodney W. Grimes /*
4561c4bcd05SJeff Roberson  * Statistics clock.  Updates rusage information and calls the scheduler
4571c4bcd05SJeff Roberson  * to adjust priorities of the active thread.
4581c4bcd05SJeff Roberson  *
459238dd320SJake Burkholder  * This should be called by all active processors.
460df8bae1dSRodney W. Grimes  */
461df8bae1dSRodney W. Grimes void
462b439e431SJohn Baldwin statclock(int usermode)
463df8bae1dSRodney W. Grimes {
4648a129caeSDavid Greenman 	struct rusage *ru;
4658a129caeSDavid Greenman 	struct vmspace *vm;
466238dd320SJake Burkholder 	struct thread *td;
467238dd320SJake Burkholder 	struct proc *p;
468238dd320SJake Burkholder 	long rss;
4697628402bSPeter Wemm 	long *cp_time;
4708a129caeSDavid Greenman 
471238dd320SJake Burkholder 	td = curthread;
472238dd320SJake Burkholder 	p = td->td_proc;
473238dd320SJake Burkholder 
4747628402bSPeter Wemm 	cp_time = (long *)PCPU_PTR(cp_time);
475b439e431SJohn Baldwin 	if (usermode) {
476df8bae1dSRodney W. Grimes 		/*
47771a62f8aSBruce Evans 		 * Charge the time as appropriate.
478df8bae1dSRodney W. Grimes 		 */
4798460a577SJohn Birrell #ifdef KSE
4800e2a4d3aSDavid Xu 		if (p->p_flag & P_SA)
4815215b187SJeff Roberson 			thread_statclock(1);
4828460a577SJohn Birrell #endif
483e8444a7eSPoul-Henning Kamp 		td->td_uticks++;
484fa885116SJulian Elischer 		if (p->p_nice > NZERO)
4857628402bSPeter Wemm 			cp_time[CP_NICE]++;
486df8bae1dSRodney W. Grimes 		else
4877628402bSPeter Wemm 			cp_time[CP_USER]++;
488df8bae1dSRodney W. Grimes 	} else {
489df8bae1dSRodney W. Grimes 		/*
490df8bae1dSRodney W. Grimes 		 * Came from kernel mode, so we were:
491df8bae1dSRodney W. Grimes 		 * - handling an interrupt,
492df8bae1dSRodney W. Grimes 		 * - doing syscall or trap work on behalf of the current
493df8bae1dSRodney W. Grimes 		 *   user process, or
494df8bae1dSRodney W. Grimes 		 * - spinning in the idle loop.
495df8bae1dSRodney W. Grimes 		 * Whichever it is, charge the time as appropriate.
496df8bae1dSRodney W. Grimes 		 * Note that we charge interrupts to the current process,
497df8bae1dSRodney W. Grimes 		 * regardless of whether they are ``for'' that process,
498df8bae1dSRodney W. Grimes 		 * so that we know how much of its real time was spent
499df8bae1dSRodney W. Grimes 		 * in ``non-process'' (i.e., interrupt) work.
500df8bae1dSRodney W. Grimes 		 */
501e0f66ef8SJohn Baldwin 		if ((td->td_pflags & TDP_ITHREAD) ||
502e0f66ef8SJohn Baldwin 		    td->td_intr_nesting_level >= 2) {
503e8444a7eSPoul-Henning Kamp 			td->td_iticks++;
5047628402bSPeter Wemm 			cp_time[CP_INTR]++;
5050384fff8SJason Evans 		} else {
5068460a577SJohn Birrell #ifdef KSE
5070e2a4d3aSDavid Xu 			if (p->p_flag & P_SA)
5085215b187SJeff Roberson 				thread_statclock(0);
5098460a577SJohn Birrell #endif
510eb2da9a5SPoul-Henning Kamp 			td->td_pticks++;
511e8444a7eSPoul-Henning Kamp 			td->td_sticks++;
512486a9414SJulian Elischer 			if (!TD_IS_IDLETHREAD(td))
5137628402bSPeter Wemm 				cp_time[CP_SYS]++;
5140384fff8SJason Evans 			else
5157628402bSPeter Wemm 				cp_time[CP_IDLE]++;
516df8bae1dSRodney W. Grimes 		}
5170384fff8SJason Evans 	}
518f5e9e8ecSBruce Evans 
519f5e9e8ecSBruce Evans 	/* Update resource usage integrals and maximums. */
52016f9f205SJohn Baldwin 	MPASS(p->p_vmspace != NULL);
52116f9f205SJohn Baldwin 	vm = p->p_vmspace;
5221c4bcd05SJeff Roberson 	ru = &td->td_ru;
5231c6d46f9SLuoqi Chen 	ru->ru_ixrss += pgtok(vm->vm_tsize);
5241c6d46f9SLuoqi Chen 	ru->ru_idrss += pgtok(vm->vm_dsize);
5251c6d46f9SLuoqi Chen 	ru->ru_isrss += pgtok(vm->vm_ssize);
5261c6d46f9SLuoqi Chen 	rss = pgtok(vmspace_resident_count(vm));
527f5e9e8ecSBruce Evans 	if (ru->ru_maxrss < rss)
528f5e9e8ecSBruce Evans 		ru->ru_maxrss = rss;
52940acdeabSJeff Roberson 	CTR4(KTR_SCHED, "statclock: %p(%s) prio %d stathz %d",
530431f8906SJulian Elischer 	    td, td->td_name, td->td_priority, (stathz)?stathz:hz);
5317628402bSPeter Wemm 	thread_lock_flags(td, MTX_QUIET);
53240acdeabSJeff Roberson 	sched_clock(td);
53340acdeabSJeff Roberson 	thread_unlock(td);
5346caa8a15SJohn Baldwin }
5356c567274SJohn Baldwin 
5366caa8a15SJohn Baldwin void
537b439e431SJohn Baldwin profclock(int usermode, uintfptr_t pc)
5386caa8a15SJohn Baldwin {
539238dd320SJake Burkholder 	struct thread *td;
540238dd320SJake Burkholder #ifdef GPROF
541238dd320SJake Burkholder 	struct gmonparam *g;
5425c8b4441SJohn Baldwin 	uintfptr_t i;
543238dd320SJake Burkholder #endif
5446caa8a15SJohn Baldwin 
5454a338afdSJulian Elischer 	td = curthread;
546b439e431SJohn Baldwin 	if (usermode) {
547238dd320SJake Burkholder 		/*
548238dd320SJake Burkholder 		 * Came from user mode; CPU was in user state.
549238dd320SJake Burkholder 		 * If this process is being profiled, record the tick.
550a282253aSJulian Elischer 		 * if there is no related user location yet, don't
551a282253aSJulian Elischer 		 * bother trying to count it.
552238dd320SJake Burkholder 		 */
5539752f794SJohn Baldwin 		if (td->td_proc->p_flag & P_PROFIL)
554b439e431SJohn Baldwin 			addupc_intr(td, pc, 1);
555238dd320SJake Burkholder 	}
556238dd320SJake Burkholder #ifdef GPROF
557238dd320SJake Burkholder 	else {
558238dd320SJake Burkholder 		/*
559238dd320SJake Burkholder 		 * Kernel statistics are just like addupc_intr, only easier.
560238dd320SJake Burkholder 		 */
561238dd320SJake Burkholder 		g = &_gmonparam;
562b439e431SJohn Baldwin 		if (g->state == GMON_PROF_ON && pc >= g->lowpc) {
563b439e431SJohn Baldwin 			i = PC_TO_I(g, pc);
564238dd320SJake Burkholder 			if (i < g->textsize) {
565b439e431SJohn Baldwin 				KCOUNT(g, i)++;
566238dd320SJake Burkholder 			}
567238dd320SJake Burkholder 		}
568238dd320SJake Burkholder 	}
569238dd320SJake Burkholder #endif
570df8bae1dSRodney W. Grimes }
571df8bae1dSRodney W. Grimes 
572df8bae1dSRodney W. Grimes /*
573df8bae1dSRodney W. Grimes  * Return information about system clocks.
574df8bae1dSRodney W. Grimes  */
575787d58f2SPoul-Henning Kamp static int
57682d9ae4eSPoul-Henning Kamp sysctl_kern_clockrate(SYSCTL_HANDLER_ARGS)
577df8bae1dSRodney W. Grimes {
578df8bae1dSRodney W. Grimes 	struct clockinfo clkinfo;
579df8bae1dSRodney W. Grimes 	/*
580df8bae1dSRodney W. Grimes 	 * Construct clockinfo structure.
581df8bae1dSRodney W. Grimes 	 */
582a9a0f15aSBruce Evans 	bzero(&clkinfo, sizeof(clkinfo));
583df8bae1dSRodney W. Grimes 	clkinfo.hz = hz;
584df8bae1dSRodney W. Grimes 	clkinfo.tick = tick;
585df8bae1dSRodney W. Grimes 	clkinfo.profhz = profhz;
586df8bae1dSRodney W. Grimes 	clkinfo.stathz = stathz ? stathz : hz;
587ae0eb976SPoul-Henning Kamp 	return (sysctl_handle_opaque(oidp, &clkinfo, sizeof clkinfo, req));
588df8bae1dSRodney W. Grimes }
5893f31c649SGarrett Wollman 
590946bb7a2SPoul-Henning Kamp SYSCTL_PROC(_kern, KERN_CLOCKRATE, clockrate, CTLTYPE_STRUCT|CTLFLAG_RD,
591af1408e3SLuigi Rizzo 	0, 0, sysctl_kern_clockrate, "S,clockinfo",
592af1408e3SLuigi Rizzo 	"Rate and period of various kernel clocks");
593370c3cb5SSean Kelly 
5944103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG
5954103b765SPoul-Henning Kamp 
5964103b765SPoul-Henning Kamp static void
5979079fff5SNick Hibma watchdog_config(void *unused __unused, u_int cmd, int *error)
598370c3cb5SSean Kelly {
5994103b765SPoul-Henning Kamp 	u_int u;
600370c3cb5SSean Kelly 
6014103b765SPoul-Henning Kamp 	u = cmd & WD_INTERVAL;
6029079fff5SNick Hibma 	if (u >= WD_TO_1SEC) {
6034103b765SPoul-Henning Kamp 		watchdog_ticks = (1 << (u - WD_TO_1SEC)) * hz;
6044103b765SPoul-Henning Kamp 		watchdog_enabled = 1;
6059079fff5SNick Hibma 		*error = 0;
6064103b765SPoul-Henning Kamp 	} else {
6074103b765SPoul-Henning Kamp 		watchdog_enabled = 0;
608370c3cb5SSean Kelly 	}
6094103b765SPoul-Henning Kamp }
610370c3cb5SSean Kelly 
611370c3cb5SSean Kelly /*
612370c3cb5SSean Kelly  * Handle a watchdog timeout by dumping interrupt information and
613911d16b8SEd Maste  * then either dropping to DDB or panicking.
614370c3cb5SSean Kelly  */
615370c3cb5SSean Kelly static void
616370c3cb5SSean Kelly watchdog_fire(void)
617370c3cb5SSean Kelly {
618370c3cb5SSean Kelly 	int nintr;
619370c3cb5SSean Kelly 	u_int64_t inttotal;
620370c3cb5SSean Kelly 	u_long *curintr;
621370c3cb5SSean Kelly 	char *curname;
622370c3cb5SSean Kelly 
623370c3cb5SSean Kelly 	curintr = intrcnt;
624370c3cb5SSean Kelly 	curname = intrnames;
625370c3cb5SSean Kelly 	inttotal = 0;
626370c3cb5SSean Kelly 	nintr = eintrcnt - intrcnt;
627370c3cb5SSean Kelly 
628370c3cb5SSean Kelly 	printf("interrupt                   total\n");
629370c3cb5SSean Kelly 	while (--nintr >= 0) {
630370c3cb5SSean Kelly 		if (*curintr)
631370c3cb5SSean Kelly 			printf("%-12s %20lu\n", curname, *curintr);
632370c3cb5SSean Kelly 		curname += strlen(curname) + 1;
633370c3cb5SSean Kelly 		inttotal += *curintr++;
634370c3cb5SSean Kelly 	}
6356cda4155SSean Kelly 	printf("Total        %20ju\n", (uintmax_t)inttotal);
636911d16b8SEd Maste 
637911d16b8SEd Maste #if defined(KDB) && !defined(KDB_UNATTENDED)
638911d16b8SEd Maste 	kdb_backtrace();
639911d16b8SEd Maste 	kdb_enter("watchdog timeout");
640911d16b8SEd Maste #else
641370c3cb5SSean Kelly 	panic("watchdog timeout");
642911d16b8SEd Maste #endif
643370c3cb5SSean Kelly }
644370c3cb5SSean Kelly 
6454103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */
646