1df8bae1dSRodney W. Grimes /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1982, 1986, 1991, 1993 3df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * (c) UNIX System Laboratories, Inc. 5df8bae1dSRodney W. Grimes * All or some portions of this file are derived from material licensed 6df8bae1dSRodney W. Grimes * to the University of California by American Telephone and Telegraph 7df8bae1dSRodney W. Grimes * Co. or Unix System Laboratories, Inc. and are reproduced herein with 8df8bae1dSRodney W. Grimes * the permission of UNIX System Laboratories, Inc. 9df8bae1dSRodney W. Grimes * 10df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 11df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 12df8bae1dSRodney W. Grimes * are met: 13df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 14df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 15df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 16df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 17df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 18df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 19df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 20df8bae1dSRodney W. Grimes * without specific prior written permission. 21df8bae1dSRodney W. Grimes * 22df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32df8bae1dSRodney W. Grimes * SUCH DAMAGE. 33df8bae1dSRodney W. Grimes * 34df8bae1dSRodney W. Grimes * @(#)kern_clock.c 8.5 (Berkeley) 1/21/94 35df8bae1dSRodney W. Grimes */ 36df8bae1dSRodney W. Grimes 37677b542eSDavid E. O'Brien #include <sys/cdefs.h> 38677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 39677b542eSDavid E. O'Brien 40911d16b8SEd Maste #include "opt_kdb.h" 41f0796cd2SGleb Smirnoff #include "opt_device_polling.h" 424da0d332SPeter Wemm #include "opt_hwpmc_hooks.h" 4332c20357SPoul-Henning Kamp #include "opt_ntp.h" 44370c3cb5SSean Kelly #include "opt_watchdog.h" 4532c20357SPoul-Henning Kamp 46df8bae1dSRodney W. Grimes #include <sys/param.h> 47df8bae1dSRodney W. Grimes #include <sys/systm.h> 48df8bae1dSRodney W. Grimes #include <sys/callout.h> 492d50560aSMarcel Moolenaar #include <sys/kdb.h> 50df8bae1dSRodney W. Grimes #include <sys/kernel.h> 51f34fa851SJohn Baldwin #include <sys/lock.h> 5261d80e90SJohn Baldwin #include <sys/ktr.h> 5335e0e5b3SJohn Baldwin #include <sys/mutex.h> 54df8bae1dSRodney W. Grimes #include <sys/proc.h> 55e4625663SJeff Roberson #include <sys/resource.h> 56df8bae1dSRodney W. Grimes #include <sys/resourcevar.h> 57b43179fbSJeff Roberson #include <sys/sched.h> 58797f2d22SPoul-Henning Kamp #include <sys/signalvar.h> 596caa8a15SJohn Baldwin #include <sys/smp.h> 608a129caeSDavid Greenman #include <vm/vm.h> 61efeaf95aSDavid Greenman #include <vm/pmap.h> 62efeaf95aSDavid Greenman #include <vm/vm_map.h> 63797f2d22SPoul-Henning Kamp #include <sys/sysctl.h> 648088699fSJohn Baldwin #include <sys/bus.h> 658088699fSJohn Baldwin #include <sys/interrupt.h> 66104a9b7eSAlexander Kabaev #include <sys/limits.h> 67e7fa55afSPoul-Henning Kamp #include <sys/timetc.h> 68df8bae1dSRodney W. Grimes 69df8bae1dSRodney W. Grimes #ifdef GPROF 70df8bae1dSRodney W. Grimes #include <sys/gmon.h> 71df8bae1dSRodney W. Grimes #endif 72df8bae1dSRodney W. Grimes 7336c0fd9dSJoseph Koshy #ifdef HWPMC_HOOKS 7436c0fd9dSJoseph Koshy #include <sys/pmckern.h> 7536c0fd9dSJoseph Koshy #endif 7636c0fd9dSJoseph Koshy 77e4fc250cSLuigi Rizzo #ifdef DEVICE_POLLING 78e4fc250cSLuigi Rizzo extern void hardclock_device_poll(void); 79e4fc250cSLuigi Rizzo #endif /* DEVICE_POLLING */ 80eae8fc2cSSteve Passe 814d77a549SAlfred Perlstein static void initclocks(void *dummy); 822b14f991SJulian Elischer SYSINIT(clocks, SI_SUB_CLOCKS, SI_ORDER_FIRST, initclocks, NULL) 832b14f991SJulian Elischer 848b98fec9SJeff Roberson /* Spin-lock protecting profiling statistics. */ 8586a49deaSAttilio Rao static struct mtx time_lock; 868b98fec9SJeff Roberson 8762919d78SPeter Wemm static int 8862919d78SPeter Wemm sysctl_kern_cp_time(SYSCTL_HANDLER_ARGS) 8962919d78SPeter Wemm { 9062919d78SPeter Wemm int error; 917628402bSPeter Wemm long cp_time[CPUSTATES]; 92cff2e749SPaul Saab #ifdef SCTL_MASK32 9362919d78SPeter Wemm int i; 9462919d78SPeter Wemm unsigned int cp_time32[CPUSTATES]; 957628402bSPeter Wemm #endif 9662919d78SPeter Wemm 977628402bSPeter Wemm read_cpu_time(cp_time); 987628402bSPeter Wemm #ifdef SCTL_MASK32 99cff2e749SPaul Saab if (req->flags & SCTL_MASK32) { 10062919d78SPeter Wemm if (!req->oldptr) 10162919d78SPeter Wemm return SYSCTL_OUT(req, 0, sizeof(cp_time32)); 10262919d78SPeter Wemm for (i = 0; i < CPUSTATES; i++) 10362919d78SPeter Wemm cp_time32[i] = (unsigned int)cp_time[i]; 10462919d78SPeter Wemm error = SYSCTL_OUT(req, cp_time32, sizeof(cp_time32)); 10562919d78SPeter Wemm } else 10662919d78SPeter Wemm #endif 10762919d78SPeter Wemm { 10862919d78SPeter Wemm if (!req->oldptr) 10962919d78SPeter Wemm return SYSCTL_OUT(req, 0, sizeof(cp_time)); 11062919d78SPeter Wemm error = SYSCTL_OUT(req, cp_time, sizeof(cp_time)); 11162919d78SPeter Wemm } 11262919d78SPeter Wemm return error; 11362919d78SPeter Wemm } 11462919d78SPeter Wemm 11562919d78SPeter Wemm SYSCTL_PROC(_kern, OID_AUTO, cp_time, CTLTYPE_LONG|CTLFLAG_RD, 11662919d78SPeter Wemm 0,0, sysctl_kern_cp_time, "LU", "CPU time statistics"); 1177f112b04SRobert Watson 1187628402bSPeter Wemm static long empty[CPUSTATES]; 1197628402bSPeter Wemm 1207628402bSPeter Wemm static int 1217628402bSPeter Wemm sysctl_kern_cp_times(SYSCTL_HANDLER_ARGS) 1227628402bSPeter Wemm { 1237628402bSPeter Wemm struct pcpu *pcpu; 1247628402bSPeter Wemm int error; 125ef54068bSRobert Watson int c; 1267628402bSPeter Wemm long *cp_time; 1277628402bSPeter Wemm #ifdef SCTL_MASK32 1287628402bSPeter Wemm unsigned int cp_time32[CPUSTATES]; 129ef54068bSRobert Watson int i; 1307628402bSPeter Wemm #endif 1317628402bSPeter Wemm 1327628402bSPeter Wemm if (!req->oldptr) { 1337628402bSPeter Wemm #ifdef SCTL_MASK32 1347628402bSPeter Wemm if (req->flags & SCTL_MASK32) 1357628402bSPeter Wemm return SYSCTL_OUT(req, 0, sizeof(cp_time32) * (mp_maxid + 1)); 1367628402bSPeter Wemm else 1377628402bSPeter Wemm #endif 1387628402bSPeter Wemm return SYSCTL_OUT(req, 0, sizeof(long) * CPUSTATES * (mp_maxid + 1)); 1397628402bSPeter Wemm } 1407628402bSPeter Wemm for (error = 0, c = 0; error == 0 && c <= mp_maxid; c++) { 1417628402bSPeter Wemm if (!CPU_ABSENT(c)) { 1427628402bSPeter Wemm pcpu = pcpu_find(c); 1437628402bSPeter Wemm cp_time = pcpu->pc_cp_time; 1447628402bSPeter Wemm } else { 1457628402bSPeter Wemm cp_time = empty; 1467628402bSPeter Wemm } 1477628402bSPeter Wemm #ifdef SCTL_MASK32 1487628402bSPeter Wemm if (req->flags & SCTL_MASK32) { 1497628402bSPeter Wemm for (i = 0; i < CPUSTATES; i++) 1507628402bSPeter Wemm cp_time32[i] = (unsigned int)cp_time[i]; 1517628402bSPeter Wemm error = SYSCTL_OUT(req, cp_time32, sizeof(cp_time32)); 1527628402bSPeter Wemm } else 1537628402bSPeter Wemm #endif 1547628402bSPeter Wemm error = SYSCTL_OUT(req, cp_time, sizeof(long) * CPUSTATES); 1557628402bSPeter Wemm } 1567628402bSPeter Wemm return error; 1577628402bSPeter Wemm } 1587628402bSPeter Wemm 1597628402bSPeter Wemm SYSCTL_PROC(_kern, OID_AUTO, cp_times, CTLTYPE_LONG|CTLFLAG_RD, 1607628402bSPeter Wemm 0,0, sysctl_kern_cp_times, "LU", "per-CPU time statistics"); 1617628402bSPeter Wemm 1627628402bSPeter Wemm void 1637628402bSPeter Wemm read_cpu_time(long *cp_time) 1647628402bSPeter Wemm { 1657628402bSPeter Wemm struct pcpu *pc; 1667628402bSPeter Wemm int i, j; 1677628402bSPeter Wemm 1687628402bSPeter Wemm /* Sum up global cp_time[]. */ 1697628402bSPeter Wemm bzero(cp_time, sizeof(long) * CPUSTATES); 1707628402bSPeter Wemm for (i = 0; i <= mp_maxid; i++) { 1717628402bSPeter Wemm if (CPU_ABSENT(i)) 1727628402bSPeter Wemm continue; 1737628402bSPeter Wemm pc = pcpu_find(i); 1747628402bSPeter Wemm for (j = 0; j < CPUSTATES; j++) 1757628402bSPeter Wemm cp_time[j] += pc->pc_cp_time[j]; 1767628402bSPeter Wemm } 1777628402bSPeter Wemm } 1787628402bSPeter Wemm 1794103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG 1804103b765SPoul-Henning Kamp #include <sys/watchdog.h> 181370c3cb5SSean Kelly 1824103b765SPoul-Henning Kamp static int watchdog_ticks; 183370c3cb5SSean Kelly static int watchdog_enabled; 1844103b765SPoul-Henning Kamp static void watchdog_fire(void); 1854103b765SPoul-Henning Kamp static void watchdog_config(void *, u_int, int *); 1864103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */ 187370c3cb5SSean Kelly 1883bac064fSPoul-Henning Kamp /* 189df8bae1dSRodney W. Grimes * Clock handling routines. 190df8bae1dSRodney W. Grimes * 191b05dcf3cSPoul-Henning Kamp * This code is written to operate with two timers that run independently of 192b05dcf3cSPoul-Henning Kamp * each other. 1937ec73f64SPoul-Henning Kamp * 194b05dcf3cSPoul-Henning Kamp * The main timer, running hz times per second, is used to trigger interval 195b05dcf3cSPoul-Henning Kamp * timers, timeouts and rescheduling as needed. 1967ec73f64SPoul-Henning Kamp * 197b05dcf3cSPoul-Henning Kamp * The second timer handles kernel and user profiling, 198b05dcf3cSPoul-Henning Kamp * and does resource use estimation. If the second timer is programmable, 199b05dcf3cSPoul-Henning Kamp * it is randomized to avoid aliasing between the two clocks. For example, 200b05dcf3cSPoul-Henning Kamp * the randomization prevents an adversary from always giving up the cpu 201df8bae1dSRodney W. Grimes * just before its quantum expires. Otherwise, it would never accumulate 202df8bae1dSRodney W. Grimes * cpu ticks. The mean frequency of the second timer is stathz. 203b05dcf3cSPoul-Henning Kamp * 204b05dcf3cSPoul-Henning Kamp * If no second timer exists, stathz will be zero; in this case we drive 205b05dcf3cSPoul-Henning Kamp * profiling and statistics off the main clock. This WILL NOT be accurate; 206b05dcf3cSPoul-Henning Kamp * do not do it unless absolutely necessary. 207b05dcf3cSPoul-Henning Kamp * 208df8bae1dSRodney W. Grimes * The statistics clock may (or may not) be run at a higher rate while 209b05dcf3cSPoul-Henning Kamp * profiling. This profile clock runs at profhz. We require that profhz 210b05dcf3cSPoul-Henning Kamp * be an integral multiple of stathz. 211b05dcf3cSPoul-Henning Kamp * 212b05dcf3cSPoul-Henning Kamp * If the statistics clock is running fast, it must be divided by the ratio 213b05dcf3cSPoul-Henning Kamp * profhz/stathz for statistics. (For profiling, every tick counts.) 214df8bae1dSRodney W. Grimes * 2157ec73f64SPoul-Henning Kamp * Time-of-day is maintained using a "timecounter", which may or may 2167ec73f64SPoul-Henning Kamp * not be related to the hardware generating the above mentioned 2177ec73f64SPoul-Henning Kamp * interrupts. 218df8bae1dSRodney W. Grimes */ 219df8bae1dSRodney W. Grimes 220df8bae1dSRodney W. Grimes int stathz; 221df8bae1dSRodney W. Grimes int profhz; 222238dd320SJake Burkholder int profprocs; 223df8bae1dSRodney W. Grimes int ticks; 224238dd320SJake Burkholder int psratio; 225df8bae1dSRodney W. Grimes 226df8bae1dSRodney W. Grimes /* 227df8bae1dSRodney W. Grimes * Initialize clock frequencies and start both clocks running. 228df8bae1dSRodney W. Grimes */ 2292b14f991SJulian Elischer /* ARGSUSED*/ 2302b14f991SJulian Elischer static void 231d841aaa7SBruce Evans initclocks(dummy) 232d841aaa7SBruce Evans void *dummy; 233df8bae1dSRodney W. Grimes { 234df8bae1dSRodney W. Grimes register int i; 235df8bae1dSRodney W. Grimes 236df8bae1dSRodney W. Grimes /* 237df8bae1dSRodney W. Grimes * Set divisors to 1 (normal case) and let the machine-specific 238df8bae1dSRodney W. Grimes * code do its bit. 239df8bae1dSRodney W. Grimes */ 2408b98fec9SJeff Roberson mtx_init(&time_lock, "time lock", NULL, MTX_SPIN); 24163d69d25SRobert Watson cpu_initclocks(); 242df8bae1dSRodney W. Grimes 243df8bae1dSRodney W. Grimes /* 244df8bae1dSRodney W. Grimes * Compute profhz/stathz, and fix profhz if needed. 245df8bae1dSRodney W. Grimes */ 246df8bae1dSRodney W. Grimes i = stathz ? stathz : hz; 247df8bae1dSRodney W. Grimes if (profhz == 0) 248df8bae1dSRodney W. Grimes profhz = i; 249df8bae1dSRodney W. Grimes psratio = profhz / i; 2504103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG 2514103b765SPoul-Henning Kamp EVENTHANDLER_REGISTER(watchdog_list, watchdog_config, NULL, 0); 2524103b765SPoul-Henning Kamp #endif 253df8bae1dSRodney W. Grimes } 254df8bae1dSRodney W. Grimes 255df8bae1dSRodney W. Grimes /* 256238dd320SJake Burkholder * Each time the real-time timer fires, this function is called on all CPUs. 257b439e431SJohn Baldwin * Note that hardclock() calls hardclock_cpu() for the boot CPU, so only 258238dd320SJake Burkholder * the other CPUs in the system need to call this function. 2596caa8a15SJohn Baldwin */ 2606caa8a15SJohn Baldwin void 261b439e431SJohn Baldwin hardclock_cpu(int usermode) 2626caa8a15SJohn Baldwin { 2636caa8a15SJohn Baldwin struct pstats *pstats; 264238dd320SJake Burkholder struct thread *td = curthread; 265b40ce416SJulian Elischer struct proc *p = td->td_proc; 266b61ce5b0SJeff Roberson int flags; 2676caa8a15SJohn Baldwin 2686caa8a15SJohn Baldwin /* 2696caa8a15SJohn Baldwin * Run current process's virtual and profile time, as needed. 2706caa8a15SJohn Baldwin */ 271ad1e7d28SJulian Elischer pstats = p->p_stats; 272b61ce5b0SJeff Roberson flags = 0; 273ad1e7d28SJulian Elischer if (usermode && 27440acdeabSJeff Roberson timevalisset(&pstats->p_timer[ITIMER_VIRTUAL].it_value)) { 27540acdeabSJeff Roberson PROC_SLOCK(p); 276b61ce5b0SJeff Roberson if (itimerdecr(&pstats->p_timer[ITIMER_VIRTUAL], tick) == 0) 277b61ce5b0SJeff Roberson flags |= TDF_ALRMPEND | TDF_ASTPENDING; 27840acdeabSJeff Roberson PROC_SUNLOCK(p); 27940acdeabSJeff Roberson } 28040acdeabSJeff Roberson if (timevalisset(&pstats->p_timer[ITIMER_PROF].it_value)) { 28140acdeabSJeff Roberson PROC_SLOCK(p); 282b61ce5b0SJeff Roberson if (itimerdecr(&pstats->p_timer[ITIMER_PROF], tick) == 0) 283b61ce5b0SJeff Roberson flags |= TDF_PROFPEND | TDF_ASTPENDING; 28440acdeabSJeff Roberson PROC_SUNLOCK(p); 28540acdeabSJeff Roberson } 28640acdeabSJeff Roberson thread_lock(td); 28740acdeabSJeff Roberson sched_tick(); 288b61ce5b0SJeff Roberson td->td_flags |= flags; 28940acdeabSJeff Roberson thread_unlock(td); 29036c0fd9dSJoseph Koshy 29136c0fd9dSJoseph Koshy #ifdef HWPMC_HOOKS 29236c0fd9dSJoseph Koshy if (PMC_CPU_HAS_SAMPLES(PCPU_GET(cpuid))) 29336c0fd9dSJoseph Koshy PMC_CALL_HOOK_UNLOCKED(curthread, PMC_FN_DO_SAMPLES, NULL); 29436c0fd9dSJoseph Koshy #endif 2956caa8a15SJohn Baldwin } 2966caa8a15SJohn Baldwin 2976caa8a15SJohn Baldwin /* 298df8bae1dSRodney W. Grimes * The real-time timer, interrupting hz times per second. 299df8bae1dSRodney W. Grimes */ 300df8bae1dSRodney W. Grimes void 301b439e431SJohn Baldwin hardclock(int usermode, uintfptr_t pc) 302df8bae1dSRodney W. Grimes { 303fa2fbc3dSJake Burkholder int need_softclock = 0; 304df8bae1dSRodney W. Grimes 305b439e431SJohn Baldwin hardclock_cpu(usermode); 306b05dcf3cSPoul-Henning Kamp 307e7fa55afSPoul-Henning Kamp tc_ticktock(); 308df8bae1dSRodney W. Grimes /* 309df8bae1dSRodney W. Grimes * If no separate statistics clock is available, run it from here. 3106caa8a15SJohn Baldwin * 3116caa8a15SJohn Baldwin * XXX: this only works for UP 312df8bae1dSRodney W. Grimes */ 313238dd320SJake Burkholder if (stathz == 0) { 314b439e431SJohn Baldwin profclock(usermode, pc); 315b439e431SJohn Baldwin statclock(usermode); 316238dd320SJake Burkholder } 317df8bae1dSRodney W. Grimes 318e4fc250cSLuigi Rizzo #ifdef DEVICE_POLLING 319daccb638SLuigi Rizzo hardclock_device_poll(); /* this is very short and quick */ 320e4fc250cSLuigi Rizzo #endif /* DEVICE_POLLING */ 3213f31c649SGarrett Wollman 322b05dcf3cSPoul-Henning Kamp /* 323b05dcf3cSPoul-Henning Kamp * Process callouts at a very low cpu priority, so we don't keep the 324b05dcf3cSPoul-Henning Kamp * relatively high clock interrupt priority any longer than necessary. 325b05dcf3cSPoul-Henning Kamp */ 32621a7a9aeSJohn Baldwin mtx_lock_spin_flags(&callout_lock, MTX_QUIET); 327fa2fbc3dSJake Burkholder ticks++; 3286ad26d83SXin LI if (!TAILQ_EMPTY(&callwheel[ticks & callwheelmask])) { 329fa2fbc3dSJake Burkholder need_softclock = 1; 330b05dcf3cSPoul-Henning Kamp } else if (softticks + 1 == ticks) 331b05dcf3cSPoul-Henning Kamp ++softticks; 33221a7a9aeSJohn Baldwin mtx_unlock_spin_flags(&callout_lock, MTX_QUIET); 333fa2fbc3dSJake Burkholder 334fa2fbc3dSJake Burkholder /* 33540acdeabSJeff Roberson * swi_sched acquires the thread lock, so we don't want to call it 33640acdeabSJeff Roberson * with callout_lock held; incorrect locking order. 337fa2fbc3dSJake Burkholder */ 338fa2fbc3dSJake Burkholder if (need_softclock) 339c86b6ff5SJohn Baldwin swi_sched(softclock_ih, 0); 340370c3cb5SSean Kelly 3414103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG 3424103b765SPoul-Henning Kamp if (watchdog_enabled > 0 && --watchdog_ticks <= 0) 343370c3cb5SSean Kelly watchdog_fire(); 3444103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */ 345ab36c067SJustin T. Gibbs } 346ab36c067SJustin T. Gibbs 347df8bae1dSRodney W. Grimes /* 348227ee8a1SPoul-Henning Kamp * Compute number of ticks in the specified amount of time. 349df8bae1dSRodney W. Grimes */ 350df8bae1dSRodney W. Grimes int 351227ee8a1SPoul-Henning Kamp tvtohz(tv) 352df8bae1dSRodney W. Grimes struct timeval *tv; 353df8bae1dSRodney W. Grimes { 3546976af69SBruce Evans register unsigned long ticks; 3556976af69SBruce Evans register long sec, usec; 356df8bae1dSRodney W. Grimes 357df8bae1dSRodney W. Grimes /* 3586976af69SBruce Evans * If the number of usecs in the whole seconds part of the time 3596976af69SBruce Evans * difference fits in a long, then the total number of usecs will 3606976af69SBruce Evans * fit in an unsigned long. Compute the total and convert it to 3616976af69SBruce Evans * ticks, rounding up and adding 1 to allow for the current tick 3626976af69SBruce Evans * to expire. Rounding also depends on unsigned long arithmetic 3636976af69SBruce Evans * to avoid overflow. 364df8bae1dSRodney W. Grimes * 3656976af69SBruce Evans * Otherwise, if the number of ticks in the whole seconds part of 3666976af69SBruce Evans * the time difference fits in a long, then convert the parts to 3676976af69SBruce Evans * ticks separately and add, using similar rounding methods and 3686976af69SBruce Evans * overflow avoidance. This method would work in the previous 3696976af69SBruce Evans * case but it is slightly slower and assumes that hz is integral. 3706976af69SBruce Evans * 3716976af69SBruce Evans * Otherwise, round the time difference down to the maximum 3726976af69SBruce Evans * representable value. 3736976af69SBruce Evans * 3746976af69SBruce Evans * If ints have 32 bits, then the maximum value for any timeout in 3756976af69SBruce Evans * 10ms ticks is 248 days. 376df8bae1dSRodney W. Grimes */ 377227ee8a1SPoul-Henning Kamp sec = tv->tv_sec; 378227ee8a1SPoul-Henning Kamp usec = tv->tv_usec; 3796976af69SBruce Evans if (usec < 0) { 3806976af69SBruce Evans sec--; 3816976af69SBruce Evans usec += 1000000; 3826976af69SBruce Evans } 3836976af69SBruce Evans if (sec < 0) { 3846976af69SBruce Evans #ifdef DIAGNOSTIC 385b05dcf3cSPoul-Henning Kamp if (usec > 0) { 3867ec73f64SPoul-Henning Kamp sec++; 3877ec73f64SPoul-Henning Kamp usec -= 1000000; 3887ec73f64SPoul-Henning Kamp } 389227ee8a1SPoul-Henning Kamp printf("tvotohz: negative time difference %ld sec %ld usec\n", 3906976af69SBruce Evans sec, usec); 3916976af69SBruce Evans #endif 3926976af69SBruce Evans ticks = 1; 3936976af69SBruce Evans } else if (sec <= LONG_MAX / 1000000) 3946976af69SBruce Evans ticks = (sec * 1000000 + (unsigned long)usec + (tick - 1)) 3956976af69SBruce Evans / tick + 1; 3966976af69SBruce Evans else if (sec <= LONG_MAX / hz) 3976976af69SBruce Evans ticks = sec * hz 3986976af69SBruce Evans + ((unsigned long)usec + (tick - 1)) / tick + 1; 3996976af69SBruce Evans else 4006976af69SBruce Evans ticks = LONG_MAX; 4016976af69SBruce Evans if (ticks > INT_MAX) 4026976af69SBruce Evans ticks = INT_MAX; 403d6116663SAlexander Langer return ((int)ticks); 404df8bae1dSRodney W. Grimes } 405df8bae1dSRodney W. Grimes 406df8bae1dSRodney W. Grimes /* 407df8bae1dSRodney W. Grimes * Start profiling on a process. 408df8bae1dSRodney W. Grimes * 409df8bae1dSRodney W. Grimes * Kernel profiling passes proc0 which never exits and hence 410df8bae1dSRodney W. Grimes * keeps the profile clock running constantly. 411df8bae1dSRodney W. Grimes */ 412df8bae1dSRodney W. Grimes void 413df8bae1dSRodney W. Grimes startprofclock(p) 414df8bae1dSRodney W. Grimes register struct proc *p; 415df8bae1dSRodney W. Grimes { 416df8bae1dSRodney W. Grimes 4179752f794SJohn Baldwin PROC_LOCK_ASSERT(p, MA_OWNED); 4189752f794SJohn Baldwin if (p->p_flag & P_STOPPROF) 419a282253aSJulian Elischer return; 4209752f794SJohn Baldwin if ((p->p_flag & P_PROFIL) == 0) { 4219752f794SJohn Baldwin p->p_flag |= P_PROFIL; 4228b98fec9SJeff Roberson mtx_lock_spin(&time_lock); 423238dd320SJake Burkholder if (++profprocs == 1) 424238dd320SJake Burkholder cpu_startprofclock(); 4258b98fec9SJeff Roberson mtx_unlock_spin(&time_lock); 426df8bae1dSRodney W. Grimes } 4279752f794SJohn Baldwin } 428df8bae1dSRodney W. Grimes 429df8bae1dSRodney W. Grimes /* 430df8bae1dSRodney W. Grimes * Stop profiling on a process. 431df8bae1dSRodney W. Grimes */ 432df8bae1dSRodney W. Grimes void 433df8bae1dSRodney W. Grimes stopprofclock(p) 434df8bae1dSRodney W. Grimes register struct proc *p; 435df8bae1dSRodney W. Grimes { 436df8bae1dSRodney W. Grimes 437a282253aSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 4389752f794SJohn Baldwin if (p->p_flag & P_PROFIL) { 4399752f794SJohn Baldwin if (p->p_profthreads != 0) { 4409752f794SJohn Baldwin p->p_flag |= P_STOPPROF; 4419752f794SJohn Baldwin while (p->p_profthreads != 0) 442a282253aSJulian Elischer msleep(&p->p_profthreads, &p->p_mtx, PPAUSE, 443a89ec05eSPeter Wemm "stopprof", 0); 4449752f794SJohn Baldwin p->p_flag &= ~P_STOPPROF; 445a282253aSJulian Elischer } 446b62b2304SColin Percival if ((p->p_flag & P_PROFIL) == 0) 447b62b2304SColin Percival return; 4489752f794SJohn Baldwin p->p_flag &= ~P_PROFIL; 4498b98fec9SJeff Roberson mtx_lock_spin(&time_lock); 450238dd320SJake Burkholder if (--profprocs == 0) 451238dd320SJake Burkholder cpu_stopprofclock(); 4528b98fec9SJeff Roberson mtx_unlock_spin(&time_lock); 453df8bae1dSRodney W. Grimes } 4549752f794SJohn Baldwin } 455df8bae1dSRodney W. Grimes 456df8bae1dSRodney W. Grimes /* 4571c4bcd05SJeff Roberson * Statistics clock. Updates rusage information and calls the scheduler 4581c4bcd05SJeff Roberson * to adjust priorities of the active thread. 4591c4bcd05SJeff Roberson * 460238dd320SJake Burkholder * This should be called by all active processors. 461df8bae1dSRodney W. Grimes */ 462df8bae1dSRodney W. Grimes void 463b439e431SJohn Baldwin statclock(int usermode) 464df8bae1dSRodney W. Grimes { 4658a129caeSDavid Greenman struct rusage *ru; 4668a129caeSDavid Greenman struct vmspace *vm; 467238dd320SJake Burkholder struct thread *td; 468238dd320SJake Burkholder struct proc *p; 469238dd320SJake Burkholder long rss; 4707628402bSPeter Wemm long *cp_time; 4718a129caeSDavid Greenman 472238dd320SJake Burkholder td = curthread; 473238dd320SJake Burkholder p = td->td_proc; 474238dd320SJake Burkholder 4757628402bSPeter Wemm cp_time = (long *)PCPU_PTR(cp_time); 476b439e431SJohn Baldwin if (usermode) { 477df8bae1dSRodney W. Grimes /* 47871a62f8aSBruce Evans * Charge the time as appropriate. 479df8bae1dSRodney W. Grimes */ 4808460a577SJohn Birrell #ifdef KSE 4810e2a4d3aSDavid Xu if (p->p_flag & P_SA) 4825215b187SJeff Roberson thread_statclock(1); 4838460a577SJohn Birrell #endif 484e8444a7eSPoul-Henning Kamp td->td_uticks++; 485fa885116SJulian Elischer if (p->p_nice > NZERO) 4867628402bSPeter Wemm cp_time[CP_NICE]++; 487df8bae1dSRodney W. Grimes else 4887628402bSPeter Wemm cp_time[CP_USER]++; 489df8bae1dSRodney W. Grimes } else { 490df8bae1dSRodney W. Grimes /* 491df8bae1dSRodney W. Grimes * Came from kernel mode, so we were: 492df8bae1dSRodney W. Grimes * - handling an interrupt, 493df8bae1dSRodney W. Grimes * - doing syscall or trap work on behalf of the current 494df8bae1dSRodney W. Grimes * user process, or 495df8bae1dSRodney W. Grimes * - spinning in the idle loop. 496df8bae1dSRodney W. Grimes * Whichever it is, charge the time as appropriate. 497df8bae1dSRodney W. Grimes * Note that we charge interrupts to the current process, 498df8bae1dSRodney W. Grimes * regardless of whether they are ``for'' that process, 499df8bae1dSRodney W. Grimes * so that we know how much of its real time was spent 500df8bae1dSRodney W. Grimes * in ``non-process'' (i.e., interrupt) work. 501df8bae1dSRodney W. Grimes */ 502e0f66ef8SJohn Baldwin if ((td->td_pflags & TDP_ITHREAD) || 503e0f66ef8SJohn Baldwin td->td_intr_nesting_level >= 2) { 504e8444a7eSPoul-Henning Kamp td->td_iticks++; 5057628402bSPeter Wemm cp_time[CP_INTR]++; 5060384fff8SJason Evans } else { 5078460a577SJohn Birrell #ifdef KSE 5080e2a4d3aSDavid Xu if (p->p_flag & P_SA) 5095215b187SJeff Roberson thread_statclock(0); 5108460a577SJohn Birrell #endif 511eb2da9a5SPoul-Henning Kamp td->td_pticks++; 512e8444a7eSPoul-Henning Kamp td->td_sticks++; 513486a9414SJulian Elischer if (!TD_IS_IDLETHREAD(td)) 5147628402bSPeter Wemm cp_time[CP_SYS]++; 5150384fff8SJason Evans else 5167628402bSPeter Wemm cp_time[CP_IDLE]++; 517df8bae1dSRodney W. Grimes } 5180384fff8SJason Evans } 519f5e9e8ecSBruce Evans 520f5e9e8ecSBruce Evans /* Update resource usage integrals and maximums. */ 52116f9f205SJohn Baldwin MPASS(p->p_vmspace != NULL); 52216f9f205SJohn Baldwin vm = p->p_vmspace; 5231c4bcd05SJeff Roberson ru = &td->td_ru; 5241c6d46f9SLuoqi Chen ru->ru_ixrss += pgtok(vm->vm_tsize); 5251c6d46f9SLuoqi Chen ru->ru_idrss += pgtok(vm->vm_dsize); 5261c6d46f9SLuoqi Chen ru->ru_isrss += pgtok(vm->vm_ssize); 5271c6d46f9SLuoqi Chen rss = pgtok(vmspace_resident_count(vm)); 528f5e9e8ecSBruce Evans if (ru->ru_maxrss < rss) 529f5e9e8ecSBruce Evans ru->ru_maxrss = rss; 53040acdeabSJeff Roberson CTR4(KTR_SCHED, "statclock: %p(%s) prio %d stathz %d", 531431f8906SJulian Elischer td, td->td_name, td->td_priority, (stathz)?stathz:hz); 5327628402bSPeter Wemm thread_lock_flags(td, MTX_QUIET); 53340acdeabSJeff Roberson sched_clock(td); 53440acdeabSJeff Roberson thread_unlock(td); 5356caa8a15SJohn Baldwin } 5366c567274SJohn Baldwin 5376caa8a15SJohn Baldwin void 538b439e431SJohn Baldwin profclock(int usermode, uintfptr_t pc) 5396caa8a15SJohn Baldwin { 540238dd320SJake Burkholder struct thread *td; 541238dd320SJake Burkholder #ifdef GPROF 542238dd320SJake Burkholder struct gmonparam *g; 5435c8b4441SJohn Baldwin uintfptr_t i; 544238dd320SJake Burkholder #endif 5456caa8a15SJohn Baldwin 5464a338afdSJulian Elischer td = curthread; 547b439e431SJohn Baldwin if (usermode) { 548238dd320SJake Burkholder /* 549238dd320SJake Burkholder * Came from user mode; CPU was in user state. 550238dd320SJake Burkholder * If this process is being profiled, record the tick. 551a282253aSJulian Elischer * if there is no related user location yet, don't 552a282253aSJulian Elischer * bother trying to count it. 553238dd320SJake Burkholder */ 5549752f794SJohn Baldwin if (td->td_proc->p_flag & P_PROFIL) 555b439e431SJohn Baldwin addupc_intr(td, pc, 1); 556238dd320SJake Burkholder } 557238dd320SJake Burkholder #ifdef GPROF 558238dd320SJake Burkholder else { 559238dd320SJake Burkholder /* 560238dd320SJake Burkholder * Kernel statistics are just like addupc_intr, only easier. 561238dd320SJake Burkholder */ 562238dd320SJake Burkholder g = &_gmonparam; 563b439e431SJohn Baldwin if (g->state == GMON_PROF_ON && pc >= g->lowpc) { 564b439e431SJohn Baldwin i = PC_TO_I(g, pc); 565238dd320SJake Burkholder if (i < g->textsize) { 566b439e431SJohn Baldwin KCOUNT(g, i)++; 567238dd320SJake Burkholder } 568238dd320SJake Burkholder } 569238dd320SJake Burkholder } 570238dd320SJake Burkholder #endif 571df8bae1dSRodney W. Grimes } 572df8bae1dSRodney W. Grimes 573df8bae1dSRodney W. Grimes /* 574df8bae1dSRodney W. Grimes * Return information about system clocks. 575df8bae1dSRodney W. Grimes */ 576787d58f2SPoul-Henning Kamp static int 57782d9ae4eSPoul-Henning Kamp sysctl_kern_clockrate(SYSCTL_HANDLER_ARGS) 578df8bae1dSRodney W. Grimes { 579df8bae1dSRodney W. Grimes struct clockinfo clkinfo; 580df8bae1dSRodney W. Grimes /* 581df8bae1dSRodney W. Grimes * Construct clockinfo structure. 582df8bae1dSRodney W. Grimes */ 583a9a0f15aSBruce Evans bzero(&clkinfo, sizeof(clkinfo)); 584df8bae1dSRodney W. Grimes clkinfo.hz = hz; 585df8bae1dSRodney W. Grimes clkinfo.tick = tick; 586df8bae1dSRodney W. Grimes clkinfo.profhz = profhz; 587df8bae1dSRodney W. Grimes clkinfo.stathz = stathz ? stathz : hz; 588ae0eb976SPoul-Henning Kamp return (sysctl_handle_opaque(oidp, &clkinfo, sizeof clkinfo, req)); 589df8bae1dSRodney W. Grimes } 5903f31c649SGarrett Wollman 591946bb7a2SPoul-Henning Kamp SYSCTL_PROC(_kern, KERN_CLOCKRATE, clockrate, CTLTYPE_STRUCT|CTLFLAG_RD, 592af1408e3SLuigi Rizzo 0, 0, sysctl_kern_clockrate, "S,clockinfo", 593af1408e3SLuigi Rizzo "Rate and period of various kernel clocks"); 594370c3cb5SSean Kelly 5954103b765SPoul-Henning Kamp #ifdef SW_WATCHDOG 5964103b765SPoul-Henning Kamp 5974103b765SPoul-Henning Kamp static void 5989079fff5SNick Hibma watchdog_config(void *unused __unused, u_int cmd, int *error) 599370c3cb5SSean Kelly { 6004103b765SPoul-Henning Kamp u_int u; 601370c3cb5SSean Kelly 6024103b765SPoul-Henning Kamp u = cmd & WD_INTERVAL; 6039079fff5SNick Hibma if (u >= WD_TO_1SEC) { 6044103b765SPoul-Henning Kamp watchdog_ticks = (1 << (u - WD_TO_1SEC)) * hz; 6054103b765SPoul-Henning Kamp watchdog_enabled = 1; 6069079fff5SNick Hibma *error = 0; 6074103b765SPoul-Henning Kamp } else { 6084103b765SPoul-Henning Kamp watchdog_enabled = 0; 609370c3cb5SSean Kelly } 6104103b765SPoul-Henning Kamp } 611370c3cb5SSean Kelly 612370c3cb5SSean Kelly /* 613370c3cb5SSean Kelly * Handle a watchdog timeout by dumping interrupt information and 614911d16b8SEd Maste * then either dropping to DDB or panicking. 615370c3cb5SSean Kelly */ 616370c3cb5SSean Kelly static void 617370c3cb5SSean Kelly watchdog_fire(void) 618370c3cb5SSean Kelly { 619370c3cb5SSean Kelly int nintr; 620370c3cb5SSean Kelly u_int64_t inttotal; 621370c3cb5SSean Kelly u_long *curintr; 622370c3cb5SSean Kelly char *curname; 623370c3cb5SSean Kelly 624370c3cb5SSean Kelly curintr = intrcnt; 625370c3cb5SSean Kelly curname = intrnames; 626370c3cb5SSean Kelly inttotal = 0; 627370c3cb5SSean Kelly nintr = eintrcnt - intrcnt; 628370c3cb5SSean Kelly 629370c3cb5SSean Kelly printf("interrupt total\n"); 630370c3cb5SSean Kelly while (--nintr >= 0) { 631370c3cb5SSean Kelly if (*curintr) 632370c3cb5SSean Kelly printf("%-12s %20lu\n", curname, *curintr); 633370c3cb5SSean Kelly curname += strlen(curname) + 1; 634370c3cb5SSean Kelly inttotal += *curintr++; 635370c3cb5SSean Kelly } 6366cda4155SSean Kelly printf("Total %20ju\n", (uintmax_t)inttotal); 637911d16b8SEd Maste 638911d16b8SEd Maste #if defined(KDB) && !defined(KDB_UNATTENDED) 639911d16b8SEd Maste kdb_backtrace(); 640911d16b8SEd Maste kdb_enter("watchdog timeout"); 641911d16b8SEd Maste #else 642370c3cb5SSean Kelly panic("watchdog timeout"); 643911d16b8SEd Maste #endif 644370c3cb5SSean Kelly } 645370c3cb5SSean Kelly 6464103b765SPoul-Henning Kamp #endif /* SW_WATCHDOG */ 647