xref: /freebsd/sys/kern/kern_clock.c (revision ef54068b54c35b966b7017d8a8ad8b4fa35308d3)
1df8bae1dSRodney W. Grimes /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1982, 1986, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  * (c) UNIX System Laboratories, Inc.
5df8bae1dSRodney W. Grimes  * All or some portions of this file are derived from material licensed
6df8bae1dSRodney W. Grimes  * to the University of California by American Telephone and Telegraph
7df8bae1dSRodney W. Grimes  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
8df8bae1dSRodney W. Grimes  * the permission of UNIX System Laboratories, Inc.
9df8bae1dSRodney W. Grimes  *
10df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
11df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
12df8bae1dSRodney W. Grimes  * are met:
13df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
14df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
15df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
16df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
17df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
18df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
19df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
20df8bae1dSRodney W. Grimes  *    without specific prior written permission.
21df8bae1dSRodney W. Grimes  *
22df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
33df8bae1dSRodney W. Grimes  *
34df8bae1dSRodney W. Grimes  *	@(#)kern_clock.c	8.5 (Berkeley) 1/21/94
35df8bae1dSRodney W. Grimes  */
36df8bae1dSRodney W. Grimes 
37677b542eSDavid E. O'Brien #include <sys/cdefs.h>
38677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
39677b542eSDavid E. O'Brien 
40911d16b8SEd Maste #include "opt_kdb.h"
41f0796cd2SGleb Smirnoff #include "opt_device_polling.h"
424da0d332SPeter Wemm #include "opt_hwpmc_hooks.h"
4332c20357SPoul-Henning Kamp #include "opt_ntp.h"
44370c3cb5SSean Kelly #include "opt_watchdog.h"
4532c20357SPoul-Henning Kamp 
46df8bae1dSRodney W. Grimes #include <sys/param.h>
47df8bae1dSRodney W. Grimes #include <sys/systm.h>
48df8bae1dSRodney W. Grimes #include <sys/callout.h>
492d50560aSMarcel Moolenaar #include <sys/kdb.h>
50df8bae1dSRodney W. Grimes #include <sys/kernel.h>
51f34fa851SJohn Baldwin #include <sys/lock.h>
5261d80e90SJohn Baldwin #include <sys/ktr.h>
5335e0e5b3SJohn Baldwin #include <sys/mutex.h>
54df8bae1dSRodney W. Grimes #include <sys/proc.h>
55e4625663SJeff Roberson #include <sys/resource.h>
56df8bae1dSRodney W. Grimes #include <sys/resourcevar.h>
57b43179fbSJeff Roberson #include <sys/sched.h>
58797f2d22SPoul-Henning Kamp #include <sys/signalvar.h>
596caa8a15SJohn Baldwin #include <sys/smp.h>
608a129caeSDavid Greenman #include <vm/vm.h>
61efeaf95aSDavid Greenman #include <vm/pmap.h>
62efeaf95aSDavid Greenman #include <vm/vm_map.h>
63797f2d22SPoul-Henning Kamp #include <sys/sysctl.h>
648088699fSJohn Baldwin #include <sys/bus.h>
658088699fSJohn Baldwin #include <sys/interrupt.h>
66104a9b7eSAlexander Kabaev #include <sys/limits.h>
67e7fa55afSPoul-Henning Kamp #include <sys/timetc.h>
68df8bae1dSRodney W. Grimes 
69df8bae1dSRodney W. Grimes #ifdef GPROF
70df8bae1dSRodney W. Grimes #include <sys/gmon.h>
71df8bae1dSRodney W. Grimes #endif
72df8bae1dSRodney W. Grimes 
7336c0fd9dSJoseph Koshy #ifdef HWPMC_HOOKS
7436c0fd9dSJoseph Koshy #include <sys/pmckern.h>
7536c0fd9dSJoseph Koshy #endif
7636c0fd9dSJoseph Koshy 
77e4fc250cSLuigi Rizzo #ifdef DEVICE_POLLING
78e4fc250cSLuigi Rizzo extern void hardclock_device_poll(void);
79e4fc250cSLuigi Rizzo #endif /* DEVICE_POLLING */
80eae8fc2cSSteve Passe 
814d77a549SAlfred Perlstein static void initclocks(void *dummy);
822b14f991SJulian Elischer SYSINIT(clocks, SI_SUB_CLOCKS, SI_ORDER_FIRST, initclocks, NULL)
832b14f991SJulian Elischer 
848b98fec9SJeff Roberson /* Spin-lock protecting profiling statistics. */
8586a49deaSAttilio Rao static struct mtx time_lock;
868b98fec9SJeff Roberson 
8762919d78SPeter Wemm static int
8862919d78SPeter Wemm sysctl_kern_cp_time(SYSCTL_HANDLER_ARGS)
8962919d78SPeter Wemm {
9062919d78SPeter Wemm 	int error;
917628402bSPeter Wemm 	long cp_time[CPUSTATES];
92cff2e749SPaul Saab #ifdef SCTL_MASK32
9362919d78SPeter Wemm 	int i;
9462919d78SPeter Wemm 	unsigned int cp_time32[CPUSTATES];
957628402bSPeter Wemm #endif
9662919d78SPeter Wemm 
977628402bSPeter Wemm 	read_cpu_time(cp_time);
987628402bSPeter Wemm #ifdef SCTL_MASK32
99cff2e749SPaul Saab 	if (req->flags & SCTL_MASK32) {
10062919d78SPeter Wemm 		if (!req->oldptr)
10162919d78SPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(cp_time32));
10262919d78SPeter Wemm 		for (i = 0; i < CPUSTATES; i++)
10362919d78SPeter Wemm 			cp_time32[i] = (unsigned int)cp_time[i];
10462919d78SPeter Wemm 		error = SYSCTL_OUT(req, cp_time32, sizeof(cp_time32));
10562919d78SPeter Wemm 	} else
10662919d78SPeter Wemm #endif
10762919d78SPeter Wemm 	{
10862919d78SPeter Wemm 		if (!req->oldptr)
10962919d78SPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(cp_time));
11062919d78SPeter Wemm 		error = SYSCTL_OUT(req, cp_time, sizeof(cp_time));
11162919d78SPeter Wemm 	}
11262919d78SPeter Wemm 	return error;
11362919d78SPeter Wemm }
11462919d78SPeter Wemm 
11562919d78SPeter Wemm SYSCTL_PROC(_kern, OID_AUTO, cp_time, CTLTYPE_LONG|CTLFLAG_RD,
11662919d78SPeter Wemm     0,0, sysctl_kern_cp_time, "LU", "CPU time statistics");
1177f112b04SRobert Watson 
1187628402bSPeter Wemm static long empty[CPUSTATES];
1197628402bSPeter Wemm 
1207628402bSPeter Wemm static int
1217628402bSPeter Wemm sysctl_kern_cp_times(SYSCTL_HANDLER_ARGS)
1227628402bSPeter Wemm {
1237628402bSPeter Wemm 	struct pcpu *pcpu;
1247628402bSPeter Wemm 	int error;
125ef54068bSRobert Watson 	int c;
1267628402bSPeter Wemm 	long *cp_time;
1277628402bSPeter Wemm #ifdef SCTL_MASK32
1287628402bSPeter Wemm 	unsigned int cp_time32[CPUSTATES];
129ef54068bSRobert Watson 	int i;
1307628402bSPeter Wemm #endif
1317628402bSPeter Wemm 
1327628402bSPeter Wemm 	if (!req->oldptr) {
1337628402bSPeter Wemm #ifdef SCTL_MASK32
1347628402bSPeter Wemm 		if (req->flags & SCTL_MASK32)
1357628402bSPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(cp_time32) * (mp_maxid + 1));
1367628402bSPeter Wemm 		else
1377628402bSPeter Wemm #endif
1387628402bSPeter Wemm 			return SYSCTL_OUT(req, 0, sizeof(long) * CPUSTATES * (mp_maxid + 1));
1397628402bSPeter Wemm 	}
1407628402bSPeter Wemm 	for (error = 0, c = 0; error == 0 && c <= mp_maxid; c++) {
1417628402bSPeter Wemm 		if (!CPU_ABSENT(c)) {
1427628402bSPeter Wemm 			pcpu = pcpu_find(c);
1437628402bSPeter Wemm 			cp_time = pcpu->pc_cp_time;
1447628402bSPeter Wemm 		} else {
1457628402bSPeter Wemm 			cp_time = empty;
1467628402bSPeter Wemm 		}
1477628402bSPeter Wemm #ifdef SCTL_MASK32
1487628402bSPeter Wemm 		if (req->flags & SCTL_MASK32) {
1497628402bSPeter Wemm 			for (i = 0; i < CPUSTATES; i++)
1507628402bSPeter Wemm 				cp_time32[i] = (unsigned int)cp_time[i];
1517628402bSPeter Wemm 			error = SYSCTL_OUT(req, cp_time32, sizeof(cp_time32));
1527628402bSPeter Wemm 		} else
1537628402bSPeter Wemm #endif
1547628402bSPeter Wemm 			error = SYSCTL_OUT(req, cp_time, sizeof(long) * CPUSTATES);
1557628402bSPeter Wemm 	}
1567628402bSPeter Wemm 	return error;
1577628402bSPeter Wemm }
1587628402bSPeter Wemm 
1597628402bSPeter Wemm SYSCTL_PROC(_kern, OID_AUTO, cp_times, CTLTYPE_LONG|CTLFLAG_RD,
1607628402bSPeter Wemm     0,0, sysctl_kern_cp_times, "LU", "per-CPU time statistics");
1617628402bSPeter Wemm 
1627628402bSPeter Wemm void
1637628402bSPeter Wemm read_cpu_time(long *cp_time)
1647628402bSPeter Wemm {
1657628402bSPeter Wemm 	struct pcpu *pc;
1667628402bSPeter Wemm 	int i, j;
1677628402bSPeter Wemm 
1687628402bSPeter Wemm 	/* Sum up global cp_time[]. */
1697628402bSPeter Wemm 	bzero(cp_time, sizeof(long) * CPUSTATES);
1707628402bSPeter Wemm 	for (i = 0; i <= mp_maxid; i++) {
1717628402bSPeter Wemm 		if (CPU_ABSENT(i))
1727628402bSPeter Wemm 			continue;
1737628402bSPeter Wemm 		pc = pcpu_find(i);
1747628402bSPeter Wemm 		for (j = 0; j < CPUSTATES; j++)
1757628402bSPeter Wemm 			cp_time[j] += pc->pc_cp_time[j];
1767628402bSPeter Wemm 	}
1777628402bSPeter Wemm }
1787628402bSPeter Wemm 
#ifdef SW_WATCHDOG
#include <sys/watchdog.h>

/* hardclock() calls remaining before the software watchdog fires. */
static int watchdog_ticks;
/* Positive while the software watchdog is armed (see watchdog_config()). */
static int watchdog_enabled;
static void watchdog_fire(void);
static void watchdog_config(void *, u_int, int *);
#endif /* SW_WATCHDOG */
187370c3cb5SSean Kelly 
1883bac064fSPoul-Henning Kamp /*
189df8bae1dSRodney W. Grimes  * Clock handling routines.
190df8bae1dSRodney W. Grimes  *
191b05dcf3cSPoul-Henning Kamp  * This code is written to operate with two timers that run independently of
192b05dcf3cSPoul-Henning Kamp  * each other.
1937ec73f64SPoul-Henning Kamp  *
194b05dcf3cSPoul-Henning Kamp  * The main timer, running hz times per second, is used to trigger interval
195b05dcf3cSPoul-Henning Kamp  * timers, timeouts and rescheduling as needed.
1967ec73f64SPoul-Henning Kamp  *
197b05dcf3cSPoul-Henning Kamp  * The second timer handles kernel and user profiling,
198b05dcf3cSPoul-Henning Kamp  * and does resource use estimation.  If the second timer is programmable,
199b05dcf3cSPoul-Henning Kamp  * it is randomized to avoid aliasing between the two clocks.  For example,
200b05dcf3cSPoul-Henning Kamp  * the randomization prevents an adversary from always giving up the cpu
201df8bae1dSRodney W. Grimes  * just before its quantum expires.  Otherwise, it would never accumulate
202df8bae1dSRodney W. Grimes  * cpu ticks.  The mean frequency of the second timer is stathz.
203b05dcf3cSPoul-Henning Kamp  *
204b05dcf3cSPoul-Henning Kamp  * If no second timer exists, stathz will be zero; in this case we drive
205b05dcf3cSPoul-Henning Kamp  * profiling and statistics off the main clock.  This WILL NOT be accurate;
206b05dcf3cSPoul-Henning Kamp  * do not do it unless absolutely necessary.
207b05dcf3cSPoul-Henning Kamp  *
208df8bae1dSRodney W. Grimes  * The statistics clock may (or may not) be run at a higher rate while
209b05dcf3cSPoul-Henning Kamp  * profiling.  This profile clock runs at profhz.  We require that profhz
210b05dcf3cSPoul-Henning Kamp  * be an integral multiple of stathz.
211b05dcf3cSPoul-Henning Kamp  *
212b05dcf3cSPoul-Henning Kamp  * If the statistics clock is running fast, it must be divided by the ratio
213b05dcf3cSPoul-Henning Kamp  * profhz/stathz for statistics.  (For profiling, every tick counts.)
214df8bae1dSRodney W. Grimes  *
2157ec73f64SPoul-Henning Kamp  * Time-of-day is maintained using a "timecounter", which may or may
2167ec73f64SPoul-Henning Kamp  * not be related to the hardware generating the above mentioned
2177ec73f64SPoul-Henning Kamp  * interrupts.
218df8bae1dSRodney W. Grimes  */
219df8bae1dSRodney W. Grimes 
int	stathz;		/* mean statistics clock rate; 0 if no second timer */
int	profhz;		/* profiling clock rate; initclocks() defaults it */
int	profprocs;	/* number of processes with P_PROFIL set */
int	ticks;		/* incremented once per hardclock() call */
int	psratio;	/* profhz / (stathz ? stathz : hz) */
225df8bae1dSRodney W. Grimes 
226df8bae1dSRodney W. Grimes /*
227df8bae1dSRodney W. Grimes  * Initialize clock frequencies and start both clocks running.
228df8bae1dSRodney W. Grimes  */
2292b14f991SJulian Elischer /* ARGSUSED*/
2302b14f991SJulian Elischer static void
231d841aaa7SBruce Evans initclocks(dummy)
232d841aaa7SBruce Evans 	void *dummy;
233df8bae1dSRodney W. Grimes {
234df8bae1dSRodney W. Grimes 	register int i;
235df8bae1dSRodney W. Grimes 
236df8bae1dSRodney W. Grimes 	/*
237df8bae1dSRodney W. Grimes 	 * Set divisors to 1 (normal case) and let the machine-specific
238df8bae1dSRodney W. Grimes 	 * code do its bit.
239df8bae1dSRodney W. Grimes 	 */
2408b98fec9SJeff Roberson 	mtx_init(&time_lock, "time lock", NULL, MTX_SPIN);
24163d69d25SRobert Watson 	cpu_initclocks();
242df8bae1dSRodney W. Grimes 
243df8bae1dSRodney W. Grimes 	/*
244df8bae1dSRodney W. Grimes 	 * Compute profhz/stathz, and fix profhz if needed.
245df8bae1dSRodney W. Grimes 	 */
246df8bae1dSRodney W. Grimes 	i = stathz ? stathz : hz;
247df8bae1dSRodney W. Grimes 	if (profhz == 0)
248df8bae1dSRodney W. Grimes 		profhz = i;
249df8bae1dSRodney W. Grimes 	psratio = profhz / i;
2504103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG
2514103b765SPoul-Henning Kamp 	EVENTHANDLER_REGISTER(watchdog_list, watchdog_config, NULL, 0);
2524103b765SPoul-Henning Kamp #endif
253df8bae1dSRodney W. Grimes }
254df8bae1dSRodney W. Grimes 
255df8bae1dSRodney W. Grimes /*
256238dd320SJake Burkholder  * Each time the real-time timer fires, this function is called on all CPUs.
257b439e431SJohn Baldwin  * Note that hardclock() calls hardclock_cpu() for the boot CPU, so only
258238dd320SJake Burkholder  * the other CPUs in the system need to call this function.
2596caa8a15SJohn Baldwin  */
2606caa8a15SJohn Baldwin void
261b439e431SJohn Baldwin hardclock_cpu(int usermode)
2626caa8a15SJohn Baldwin {
2636caa8a15SJohn Baldwin 	struct pstats *pstats;
264238dd320SJake Burkholder 	struct thread *td = curthread;
265b40ce416SJulian Elischer 	struct proc *p = td->td_proc;
266b61ce5b0SJeff Roberson 	int flags;
2676caa8a15SJohn Baldwin 
2686caa8a15SJohn Baldwin 	/*
2696caa8a15SJohn Baldwin 	 * Run current process's virtual and profile time, as needed.
2706caa8a15SJohn Baldwin 	 */
271ad1e7d28SJulian Elischer 	pstats = p->p_stats;
272b61ce5b0SJeff Roberson 	flags = 0;
273ad1e7d28SJulian Elischer 	if (usermode &&
27440acdeabSJeff Roberson 	    timevalisset(&pstats->p_timer[ITIMER_VIRTUAL].it_value)) {
27540acdeabSJeff Roberson 		PROC_SLOCK(p);
276b61ce5b0SJeff Roberson 		if (itimerdecr(&pstats->p_timer[ITIMER_VIRTUAL], tick) == 0)
277b61ce5b0SJeff Roberson 			flags |= TDF_ALRMPEND | TDF_ASTPENDING;
27840acdeabSJeff Roberson 		PROC_SUNLOCK(p);
27940acdeabSJeff Roberson 	}
28040acdeabSJeff Roberson 	if (timevalisset(&pstats->p_timer[ITIMER_PROF].it_value)) {
28140acdeabSJeff Roberson 		PROC_SLOCK(p);
282b61ce5b0SJeff Roberson 		if (itimerdecr(&pstats->p_timer[ITIMER_PROF], tick) == 0)
283b61ce5b0SJeff Roberson 			flags |= TDF_PROFPEND | TDF_ASTPENDING;
28440acdeabSJeff Roberson 		PROC_SUNLOCK(p);
28540acdeabSJeff Roberson 	}
28640acdeabSJeff Roberson 	thread_lock(td);
28740acdeabSJeff Roberson 	sched_tick();
288b61ce5b0SJeff Roberson 	td->td_flags |= flags;
28940acdeabSJeff Roberson 	thread_unlock(td);
29036c0fd9dSJoseph Koshy 
29136c0fd9dSJoseph Koshy #ifdef	HWPMC_HOOKS
29236c0fd9dSJoseph Koshy 	if (PMC_CPU_HAS_SAMPLES(PCPU_GET(cpuid)))
29336c0fd9dSJoseph Koshy 		PMC_CALL_HOOK_UNLOCKED(curthread, PMC_FN_DO_SAMPLES, NULL);
29436c0fd9dSJoseph Koshy #endif
2956caa8a15SJohn Baldwin }
2966caa8a15SJohn Baldwin 
2976caa8a15SJohn Baldwin /*
298df8bae1dSRodney W. Grimes  * The real-time timer, interrupting hz times per second.
299df8bae1dSRodney W. Grimes  */
300df8bae1dSRodney W. Grimes void
301b439e431SJohn Baldwin hardclock(int usermode, uintfptr_t pc)
302df8bae1dSRodney W. Grimes {
303fa2fbc3dSJake Burkholder 	int need_softclock = 0;
304df8bae1dSRodney W. Grimes 
305b439e431SJohn Baldwin 	hardclock_cpu(usermode);
306b05dcf3cSPoul-Henning Kamp 
307e7fa55afSPoul-Henning Kamp 	tc_ticktock();
308df8bae1dSRodney W. Grimes 	/*
309df8bae1dSRodney W. Grimes 	 * If no separate statistics clock is available, run it from here.
3106caa8a15SJohn Baldwin 	 *
3116caa8a15SJohn Baldwin 	 * XXX: this only works for UP
312df8bae1dSRodney W. Grimes 	 */
313238dd320SJake Burkholder 	if (stathz == 0) {
314b439e431SJohn Baldwin 		profclock(usermode, pc);
315b439e431SJohn Baldwin 		statclock(usermode);
316238dd320SJake Burkholder 	}
317df8bae1dSRodney W. Grimes 
318e4fc250cSLuigi Rizzo #ifdef DEVICE_POLLING
319daccb638SLuigi Rizzo 	hardclock_device_poll();	/* this is very short and quick */
320e4fc250cSLuigi Rizzo #endif /* DEVICE_POLLING */
3213f31c649SGarrett Wollman 
322b05dcf3cSPoul-Henning Kamp 	/*
323b05dcf3cSPoul-Henning Kamp 	 * Process callouts at a very low cpu priority, so we don't keep the
324b05dcf3cSPoul-Henning Kamp 	 * relatively high clock interrupt priority any longer than necessary.
325b05dcf3cSPoul-Henning Kamp 	 */
32621a7a9aeSJohn Baldwin 	mtx_lock_spin_flags(&callout_lock, MTX_QUIET);
327fa2fbc3dSJake Burkholder 	ticks++;
3286ad26d83SXin LI 	if (!TAILQ_EMPTY(&callwheel[ticks & callwheelmask])) {
329fa2fbc3dSJake Burkholder 		need_softclock = 1;
330b05dcf3cSPoul-Henning Kamp 	} else if (softticks + 1 == ticks)
331b05dcf3cSPoul-Henning Kamp 		++softticks;
33221a7a9aeSJohn Baldwin 	mtx_unlock_spin_flags(&callout_lock, MTX_QUIET);
333fa2fbc3dSJake Burkholder 
334fa2fbc3dSJake Burkholder 	/*
33540acdeabSJeff Roberson 	 * swi_sched acquires the thread lock, so we don't want to call it
33640acdeabSJeff Roberson 	 * with callout_lock held; incorrect locking order.
337fa2fbc3dSJake Burkholder 	 */
338fa2fbc3dSJake Burkholder 	if (need_softclock)
339c86b6ff5SJohn Baldwin 		swi_sched(softclock_ih, 0);
340370c3cb5SSean Kelly 
3414103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG
3424103b765SPoul-Henning Kamp 	if (watchdog_enabled > 0 && --watchdog_ticks <= 0)
343370c3cb5SSean Kelly 		watchdog_fire();
3444103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */
345ab36c067SJustin T. Gibbs }
346ab36c067SJustin T. Gibbs 
347df8bae1dSRodney W. Grimes /*
348227ee8a1SPoul-Henning Kamp  * Compute number of ticks in the specified amount of time.
349df8bae1dSRodney W. Grimes  */
350df8bae1dSRodney W. Grimes int
351227ee8a1SPoul-Henning Kamp tvtohz(tv)
352df8bae1dSRodney W. Grimes 	struct timeval *tv;
353df8bae1dSRodney W. Grimes {
3546976af69SBruce Evans 	register unsigned long ticks;
3556976af69SBruce Evans 	register long sec, usec;
356df8bae1dSRodney W. Grimes 
357df8bae1dSRodney W. Grimes 	/*
3586976af69SBruce Evans 	 * If the number of usecs in the whole seconds part of the time
3596976af69SBruce Evans 	 * difference fits in a long, then the total number of usecs will
3606976af69SBruce Evans 	 * fit in an unsigned long.  Compute the total and convert it to
3616976af69SBruce Evans 	 * ticks, rounding up and adding 1 to allow for the current tick
3626976af69SBruce Evans 	 * to expire.  Rounding also depends on unsigned long arithmetic
3636976af69SBruce Evans 	 * to avoid overflow.
364df8bae1dSRodney W. Grimes 	 *
3656976af69SBruce Evans 	 * Otherwise, if the number of ticks in the whole seconds part of
3666976af69SBruce Evans 	 * the time difference fits in a long, then convert the parts to
3676976af69SBruce Evans 	 * ticks separately and add, using similar rounding methods and
3686976af69SBruce Evans 	 * overflow avoidance.  This method would work in the previous
3696976af69SBruce Evans 	 * case but it is slightly slower and assumes that hz is integral.
3706976af69SBruce Evans 	 *
3716976af69SBruce Evans 	 * Otherwise, round the time difference down to the maximum
3726976af69SBruce Evans 	 * representable value.
3736976af69SBruce Evans 	 *
3746976af69SBruce Evans 	 * If ints have 32 bits, then the maximum value for any timeout in
3756976af69SBruce Evans 	 * 10ms ticks is 248 days.
376df8bae1dSRodney W. Grimes 	 */
377227ee8a1SPoul-Henning Kamp 	sec = tv->tv_sec;
378227ee8a1SPoul-Henning Kamp 	usec = tv->tv_usec;
3796976af69SBruce Evans 	if (usec < 0) {
3806976af69SBruce Evans 		sec--;
3816976af69SBruce Evans 		usec += 1000000;
3826976af69SBruce Evans 	}
3836976af69SBruce Evans 	if (sec < 0) {
3846976af69SBruce Evans #ifdef DIAGNOSTIC
385b05dcf3cSPoul-Henning Kamp 		if (usec > 0) {
3867ec73f64SPoul-Henning Kamp 			sec++;
3877ec73f64SPoul-Henning Kamp 			usec -= 1000000;
3887ec73f64SPoul-Henning Kamp 		}
389227ee8a1SPoul-Henning Kamp 		printf("tvotohz: negative time difference %ld sec %ld usec\n",
3906976af69SBruce Evans 		       sec, usec);
3916976af69SBruce Evans #endif
3926976af69SBruce Evans 		ticks = 1;
3936976af69SBruce Evans 	} else if (sec <= LONG_MAX / 1000000)
3946976af69SBruce Evans 		ticks = (sec * 1000000 + (unsigned long)usec + (tick - 1))
3956976af69SBruce Evans 			/ tick + 1;
3966976af69SBruce Evans 	else if (sec <= LONG_MAX / hz)
3976976af69SBruce Evans 		ticks = sec * hz
3986976af69SBruce Evans 			+ ((unsigned long)usec + (tick - 1)) / tick + 1;
3996976af69SBruce Evans 	else
4006976af69SBruce Evans 		ticks = LONG_MAX;
4016976af69SBruce Evans 	if (ticks > INT_MAX)
4026976af69SBruce Evans 		ticks = INT_MAX;
403d6116663SAlexander Langer 	return ((int)ticks);
404df8bae1dSRodney W. Grimes }
405df8bae1dSRodney W. Grimes 
406df8bae1dSRodney W. Grimes /*
407df8bae1dSRodney W. Grimes  * Start profiling on a process.
408df8bae1dSRodney W. Grimes  *
409df8bae1dSRodney W. Grimes  * Kernel profiling passes proc0 which never exits and hence
410df8bae1dSRodney W. Grimes  * keeps the profile clock running constantly.
411df8bae1dSRodney W. Grimes  */
412df8bae1dSRodney W. Grimes void
413df8bae1dSRodney W. Grimes startprofclock(p)
414df8bae1dSRodney W. Grimes 	register struct proc *p;
415df8bae1dSRodney W. Grimes {
416df8bae1dSRodney W. Grimes 
4179752f794SJohn Baldwin 	PROC_LOCK_ASSERT(p, MA_OWNED);
4189752f794SJohn Baldwin 	if (p->p_flag & P_STOPPROF)
419a282253aSJulian Elischer 		return;
4209752f794SJohn Baldwin 	if ((p->p_flag & P_PROFIL) == 0) {
4219752f794SJohn Baldwin 		p->p_flag |= P_PROFIL;
4228b98fec9SJeff Roberson 		mtx_lock_spin(&time_lock);
423238dd320SJake Burkholder 		if (++profprocs == 1)
424238dd320SJake Burkholder 			cpu_startprofclock();
4258b98fec9SJeff Roberson 		mtx_unlock_spin(&time_lock);
426df8bae1dSRodney W. Grimes 	}
4279752f794SJohn Baldwin }
428df8bae1dSRodney W. Grimes 
429df8bae1dSRodney W. Grimes /*
430df8bae1dSRodney W. Grimes  * Stop profiling on a process.
431df8bae1dSRodney W. Grimes  */
432df8bae1dSRodney W. Grimes void
433df8bae1dSRodney W. Grimes stopprofclock(p)
434df8bae1dSRodney W. Grimes 	register struct proc *p;
435df8bae1dSRodney W. Grimes {
436df8bae1dSRodney W. Grimes 
437a282253aSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
4389752f794SJohn Baldwin 	if (p->p_flag & P_PROFIL) {
4399752f794SJohn Baldwin 		if (p->p_profthreads != 0) {
4409752f794SJohn Baldwin 			p->p_flag |= P_STOPPROF;
4419752f794SJohn Baldwin 			while (p->p_profthreads != 0)
442a282253aSJulian Elischer 				msleep(&p->p_profthreads, &p->p_mtx, PPAUSE,
443a89ec05eSPeter Wemm 				    "stopprof", 0);
4449752f794SJohn Baldwin 			p->p_flag &= ~P_STOPPROF;
445a282253aSJulian Elischer 		}
446b62b2304SColin Percival 		if ((p->p_flag & P_PROFIL) == 0)
447b62b2304SColin Percival 			return;
4489752f794SJohn Baldwin 		p->p_flag &= ~P_PROFIL;
4498b98fec9SJeff Roberson 		mtx_lock_spin(&time_lock);
450238dd320SJake Burkholder 		if (--profprocs == 0)
451238dd320SJake Burkholder 			cpu_stopprofclock();
4528b98fec9SJeff Roberson 		mtx_unlock_spin(&time_lock);
453df8bae1dSRodney W. Grimes 	}
4549752f794SJohn Baldwin }
455df8bae1dSRodney W. Grimes 
456df8bae1dSRodney W. Grimes /*
4571c4bcd05SJeff Roberson  * Statistics clock.  Updates rusage information and calls the scheduler
4581c4bcd05SJeff Roberson  * to adjust priorities of the active thread.
4591c4bcd05SJeff Roberson  *
460238dd320SJake Burkholder  * This should be called by all active processors.
461df8bae1dSRodney W. Grimes  */
462df8bae1dSRodney W. Grimes void
463b439e431SJohn Baldwin statclock(int usermode)
464df8bae1dSRodney W. Grimes {
4658a129caeSDavid Greenman 	struct rusage *ru;
4668a129caeSDavid Greenman 	struct vmspace *vm;
467238dd320SJake Burkholder 	struct thread *td;
468238dd320SJake Burkholder 	struct proc *p;
469238dd320SJake Burkholder 	long rss;
4707628402bSPeter Wemm 	long *cp_time;
4718a129caeSDavid Greenman 
472238dd320SJake Burkholder 	td = curthread;
473238dd320SJake Burkholder 	p = td->td_proc;
474238dd320SJake Burkholder 
4757628402bSPeter Wemm 	cp_time = (long *)PCPU_PTR(cp_time);
476b439e431SJohn Baldwin 	if (usermode) {
477df8bae1dSRodney W. Grimes 		/*
47871a62f8aSBruce Evans 		 * Charge the time as appropriate.
479df8bae1dSRodney W. Grimes 		 */
4808460a577SJohn Birrell #ifdef KSE
4810e2a4d3aSDavid Xu 		if (p->p_flag & P_SA)
4825215b187SJeff Roberson 			thread_statclock(1);
4838460a577SJohn Birrell #endif
484e8444a7eSPoul-Henning Kamp 		td->td_uticks++;
485fa885116SJulian Elischer 		if (p->p_nice > NZERO)
4867628402bSPeter Wemm 			cp_time[CP_NICE]++;
487df8bae1dSRodney W. Grimes 		else
4887628402bSPeter Wemm 			cp_time[CP_USER]++;
489df8bae1dSRodney W. Grimes 	} else {
490df8bae1dSRodney W. Grimes 		/*
491df8bae1dSRodney W. Grimes 		 * Came from kernel mode, so we were:
492df8bae1dSRodney W. Grimes 		 * - handling an interrupt,
493df8bae1dSRodney W. Grimes 		 * - doing syscall or trap work on behalf of the current
494df8bae1dSRodney W. Grimes 		 *   user process, or
495df8bae1dSRodney W. Grimes 		 * - spinning in the idle loop.
496df8bae1dSRodney W. Grimes 		 * Whichever it is, charge the time as appropriate.
497df8bae1dSRodney W. Grimes 		 * Note that we charge interrupts to the current process,
498df8bae1dSRodney W. Grimes 		 * regardless of whether they are ``for'' that process,
499df8bae1dSRodney W. Grimes 		 * so that we know how much of its real time was spent
500df8bae1dSRodney W. Grimes 		 * in ``non-process'' (i.e., interrupt) work.
501df8bae1dSRodney W. Grimes 		 */
502e0f66ef8SJohn Baldwin 		if ((td->td_pflags & TDP_ITHREAD) ||
503e0f66ef8SJohn Baldwin 		    td->td_intr_nesting_level >= 2) {
504e8444a7eSPoul-Henning Kamp 			td->td_iticks++;
5057628402bSPeter Wemm 			cp_time[CP_INTR]++;
5060384fff8SJason Evans 		} else {
5078460a577SJohn Birrell #ifdef KSE
5080e2a4d3aSDavid Xu 			if (p->p_flag & P_SA)
5095215b187SJeff Roberson 				thread_statclock(0);
5108460a577SJohn Birrell #endif
511eb2da9a5SPoul-Henning Kamp 			td->td_pticks++;
512e8444a7eSPoul-Henning Kamp 			td->td_sticks++;
513486a9414SJulian Elischer 			if (!TD_IS_IDLETHREAD(td))
5147628402bSPeter Wemm 				cp_time[CP_SYS]++;
5150384fff8SJason Evans 			else
5167628402bSPeter Wemm 				cp_time[CP_IDLE]++;
517df8bae1dSRodney W. Grimes 		}
5180384fff8SJason Evans 	}
519f5e9e8ecSBruce Evans 
520f5e9e8ecSBruce Evans 	/* Update resource usage integrals and maximums. */
52116f9f205SJohn Baldwin 	MPASS(p->p_vmspace != NULL);
52216f9f205SJohn Baldwin 	vm = p->p_vmspace;
5231c4bcd05SJeff Roberson 	ru = &td->td_ru;
5241c6d46f9SLuoqi Chen 	ru->ru_ixrss += pgtok(vm->vm_tsize);
5251c6d46f9SLuoqi Chen 	ru->ru_idrss += pgtok(vm->vm_dsize);
5261c6d46f9SLuoqi Chen 	ru->ru_isrss += pgtok(vm->vm_ssize);
5271c6d46f9SLuoqi Chen 	rss = pgtok(vmspace_resident_count(vm));
528f5e9e8ecSBruce Evans 	if (ru->ru_maxrss < rss)
529f5e9e8ecSBruce Evans 		ru->ru_maxrss = rss;
53040acdeabSJeff Roberson 	CTR4(KTR_SCHED, "statclock: %p(%s) prio %d stathz %d",
531431f8906SJulian Elischer 	    td, td->td_name, td->td_priority, (stathz)?stathz:hz);
5327628402bSPeter Wemm 	thread_lock_flags(td, MTX_QUIET);
53340acdeabSJeff Roberson 	sched_clock(td);
53440acdeabSJeff Roberson 	thread_unlock(td);
5356caa8a15SJohn Baldwin }
5366c567274SJohn Baldwin 
5376caa8a15SJohn Baldwin void
538b439e431SJohn Baldwin profclock(int usermode, uintfptr_t pc)
5396caa8a15SJohn Baldwin {
540238dd320SJake Burkholder 	struct thread *td;
541238dd320SJake Burkholder #ifdef GPROF
542238dd320SJake Burkholder 	struct gmonparam *g;
5435c8b4441SJohn Baldwin 	uintfptr_t i;
544238dd320SJake Burkholder #endif
5456caa8a15SJohn Baldwin 
5464a338afdSJulian Elischer 	td = curthread;
547b439e431SJohn Baldwin 	if (usermode) {
548238dd320SJake Burkholder 		/*
549238dd320SJake Burkholder 		 * Came from user mode; CPU was in user state.
550238dd320SJake Burkholder 		 * If this process is being profiled, record the tick.
551a282253aSJulian Elischer 		 * if there is no related user location yet, don't
552a282253aSJulian Elischer 		 * bother trying to count it.
553238dd320SJake Burkholder 		 */
5549752f794SJohn Baldwin 		if (td->td_proc->p_flag & P_PROFIL)
555b439e431SJohn Baldwin 			addupc_intr(td, pc, 1);
556238dd320SJake Burkholder 	}
557238dd320SJake Burkholder #ifdef GPROF
558238dd320SJake Burkholder 	else {
559238dd320SJake Burkholder 		/*
560238dd320SJake Burkholder 		 * Kernel statistics are just like addupc_intr, only easier.
561238dd320SJake Burkholder 		 */
562238dd320SJake Burkholder 		g = &_gmonparam;
563b439e431SJohn Baldwin 		if (g->state == GMON_PROF_ON && pc >= g->lowpc) {
564b439e431SJohn Baldwin 			i = PC_TO_I(g, pc);
565238dd320SJake Burkholder 			if (i < g->textsize) {
566b439e431SJohn Baldwin 				KCOUNT(g, i)++;
567238dd320SJake Burkholder 			}
568238dd320SJake Burkholder 		}
569238dd320SJake Burkholder 	}
570238dd320SJake Burkholder #endif
571df8bae1dSRodney W. Grimes }
572df8bae1dSRodney W. Grimes 
573df8bae1dSRodney W. Grimes /*
574df8bae1dSRodney W. Grimes  * Return information about system clocks.
575df8bae1dSRodney W. Grimes  */
576787d58f2SPoul-Henning Kamp static int
57782d9ae4eSPoul-Henning Kamp sysctl_kern_clockrate(SYSCTL_HANDLER_ARGS)
578df8bae1dSRodney W. Grimes {
579df8bae1dSRodney W. Grimes 	struct clockinfo clkinfo;
580df8bae1dSRodney W. Grimes 	/*
581df8bae1dSRodney W. Grimes 	 * Construct clockinfo structure.
582df8bae1dSRodney W. Grimes 	 */
583a9a0f15aSBruce Evans 	bzero(&clkinfo, sizeof(clkinfo));
584df8bae1dSRodney W. Grimes 	clkinfo.hz = hz;
585df8bae1dSRodney W. Grimes 	clkinfo.tick = tick;
586df8bae1dSRodney W. Grimes 	clkinfo.profhz = profhz;
587df8bae1dSRodney W. Grimes 	clkinfo.stathz = stathz ? stathz : hz;
588ae0eb976SPoul-Henning Kamp 	return (sysctl_handle_opaque(oidp, &clkinfo, sizeof clkinfo, req));
589df8bae1dSRodney W. Grimes }
5903f31c649SGarrett Wollman 
591946bb7a2SPoul-Henning Kamp SYSCTL_PROC(_kern, KERN_CLOCKRATE, clockrate, CTLTYPE_STRUCT|CTLFLAG_RD,
592af1408e3SLuigi Rizzo 	0, 0, sysctl_kern_clockrate, "S,clockinfo",
593af1408e3SLuigi Rizzo 	"Rate and period of various kernel clocks");
594370c3cb5SSean Kelly 
5954103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG
5964103b765SPoul-Henning Kamp 
5974103b765SPoul-Henning Kamp static void
5989079fff5SNick Hibma watchdog_config(void *unused __unused, u_int cmd, int *error)
599370c3cb5SSean Kelly {
6004103b765SPoul-Henning Kamp 	u_int u;
601370c3cb5SSean Kelly 
6024103b765SPoul-Henning Kamp 	u = cmd & WD_INTERVAL;
6039079fff5SNick Hibma 	if (u >= WD_TO_1SEC) {
6044103b765SPoul-Henning Kamp 		watchdog_ticks = (1 << (u - WD_TO_1SEC)) * hz;
6054103b765SPoul-Henning Kamp 		watchdog_enabled = 1;
6069079fff5SNick Hibma 		*error = 0;
6074103b765SPoul-Henning Kamp 	} else {
6084103b765SPoul-Henning Kamp 		watchdog_enabled = 0;
609370c3cb5SSean Kelly 	}
6104103b765SPoul-Henning Kamp }
611370c3cb5SSean Kelly 
612370c3cb5SSean Kelly /*
613370c3cb5SSean Kelly  * Handle a watchdog timeout by dumping interrupt information and
614911d16b8SEd Maste  * then either dropping to DDB or panicking.
615370c3cb5SSean Kelly  */
616370c3cb5SSean Kelly static void
617370c3cb5SSean Kelly watchdog_fire(void)
618370c3cb5SSean Kelly {
619370c3cb5SSean Kelly 	int nintr;
620370c3cb5SSean Kelly 	u_int64_t inttotal;
621370c3cb5SSean Kelly 	u_long *curintr;
622370c3cb5SSean Kelly 	char *curname;
623370c3cb5SSean Kelly 
624370c3cb5SSean Kelly 	curintr = intrcnt;
625370c3cb5SSean Kelly 	curname = intrnames;
626370c3cb5SSean Kelly 	inttotal = 0;
627370c3cb5SSean Kelly 	nintr = eintrcnt - intrcnt;
628370c3cb5SSean Kelly 
629370c3cb5SSean Kelly 	printf("interrupt                   total\n");
630370c3cb5SSean Kelly 	while (--nintr >= 0) {
631370c3cb5SSean Kelly 		if (*curintr)
632370c3cb5SSean Kelly 			printf("%-12s %20lu\n", curname, *curintr);
633370c3cb5SSean Kelly 		curname += strlen(curname) + 1;
634370c3cb5SSean Kelly 		inttotal += *curintr++;
635370c3cb5SSean Kelly 	}
6366cda4155SSean Kelly 	printf("Total        %20ju\n", (uintmax_t)inttotal);
637911d16b8SEd Maste 
638911d16b8SEd Maste #if defined(KDB) && !defined(KDB_UNATTENDED)
639911d16b8SEd Maste 	kdb_backtrace();
640911d16b8SEd Maste 	kdb_enter("watchdog timeout");
641911d16b8SEd Maste #else
642370c3cb5SSean Kelly 	panic("watchdog timeout");
643911d16b8SEd Maste #endif
644370c3cb5SSean Kelly }
645370c3cb5SSean Kelly 
6464103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */
647