183a81bcbSJohn Baldwin /*- 283a81bcbSJohn Baldwin * Copyright (c) 2006 John Baldwin <jhb@FreeBSD.org> 383a81bcbSJohn Baldwin * All rights reserved. 483a81bcbSJohn Baldwin * 583a81bcbSJohn Baldwin * Redistribution and use in source and binary forms, with or without 683a81bcbSJohn Baldwin * modification, are permitted provided that the following conditions 783a81bcbSJohn Baldwin * are met: 883a81bcbSJohn Baldwin * 1. Redistributions of source code must retain the above copyright 983a81bcbSJohn Baldwin * notice, this list of conditions and the following disclaimer. 1083a81bcbSJohn Baldwin * 2. Redistributions in binary form must reproduce the above copyright 1183a81bcbSJohn Baldwin * notice, this list of conditions and the following disclaimer in the 1283a81bcbSJohn Baldwin * documentation and/or other materials provided with the distribution. 1383a81bcbSJohn Baldwin * 1483a81bcbSJohn Baldwin * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 1583a81bcbSJohn Baldwin * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 1683a81bcbSJohn Baldwin * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 1783a81bcbSJohn Baldwin * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 1883a81bcbSJohn Baldwin * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 1983a81bcbSJohn Baldwin * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 2083a81bcbSJohn Baldwin * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 2183a81bcbSJohn Baldwin * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 2283a81bcbSJohn Baldwin * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 2383a81bcbSJohn Baldwin * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 2483a81bcbSJohn Baldwin * SUCH DAMAGE. 2583a81bcbSJohn Baldwin */ 2683a81bcbSJohn Baldwin 2783a81bcbSJohn Baldwin /* 2883a81bcbSJohn Baldwin * This module holds the global variables and functions used to maintain 2983a81bcbSJohn Baldwin * lock_object structures. 3083a81bcbSJohn Baldwin */ 3183a81bcbSJohn Baldwin 3283a81bcbSJohn Baldwin #include <sys/cdefs.h> 3383a81bcbSJohn Baldwin __FBSDID("$FreeBSD$"); 3483a81bcbSJohn Baldwin 356ef970a9SJohn Baldwin #include "opt_ddb.h" 367c0435b9SKip Macy #include "opt_mprof.h" 376ef970a9SJohn Baldwin 3883a81bcbSJohn Baldwin #include <sys/param.h> 3983a81bcbSJohn Baldwin #include <sys/systm.h> 40eea4f254SJeff Roberson #include <sys/kernel.h> 4183a81bcbSJohn Baldwin #include <sys/ktr.h> 4283a81bcbSJohn Baldwin #include <sys/lock.h> 437c0435b9SKip Macy #include <sys/lock_profile.h> 44eea4f254SJeff Roberson #include <sys/malloc.h> 452e6b8de4SJeff Roberson #include <sys/mutex.h> 46eea4f254SJeff Roberson #include <sys/pcpu.h> 47eea4f254SJeff Roberson #include <sys/proc.h> 48eea4f254SJeff Roberson #include <sys/sbuf.h> 492e6b8de4SJeff Roberson #include <sys/sched.h> 50eea4f254SJeff Roberson #include <sys/smp.h> 51eea4f254SJeff Roberson #include <sys/sysctl.h> 5283a81bcbSJohn Baldwin 5383a81bcbSJohn Baldwin #ifdef DDB 5483a81bcbSJohn Baldwin #include <ddb/ddb.h> 5583a81bcbSJohn Baldwin #endif 5683a81bcbSJohn Baldwin 57eea4f254SJeff Roberson #include <machine/cpufunc.h> 58eea4f254SJeff Roberson 59*8e5a3e9aSMateusz Guzik SDT_PROVIDER_DEFINE(lock); 60*8e5a3e9aSMateusz Guzik SDT_PROBE_DEFINE1(lock, , , starvation, "u_int"); 61*8e5a3e9aSMateusz Guzik 6283a81bcbSJohn Baldwin CTASSERT(LOCK_CLASS_MAX == 15); 6383a81bcbSJohn Baldwin 6483a81bcbSJohn Baldwin struct lock_class *lock_classes[LOCK_CLASS_MAX + 1] = { 6583a81bcbSJohn Baldwin &lock_class_mtx_spin, 6683a81bcbSJohn Baldwin &lock_class_mtx_sleep, 6783a81bcbSJohn Baldwin &lock_class_sx, 68f53d15feSStephan Uphoff &lock_class_rm, 69cd32bd7aSJohn Baldwin &lock_class_rm_sleepable, 703f08bd8bSJohn Baldwin &lock_class_rw, 7161bd5e21SKip Macy &lock_class_lockmgr, 7283a81bcbSJohn Baldwin }; 7383a81bcbSJohn Baldwin 7483a81bcbSJohn Baldwin void 7583a81bcbSJohn Baldwin lock_init(struct lock_object *lock, struct lock_class *class, const char *name, 7683a81bcbSJohn Baldwin const char *type, int flags) 7783a81bcbSJohn Baldwin { 7883a81bcbSJohn Baldwin int i; 7983a81bcbSJohn Baldwin 8083a81bcbSJohn Baldwin /* Check for double-init and zero object. */ 81fd07ddcfSDmitry Chagin KASSERT(flags & LO_NEW || !lock_initialized(lock), 82fd07ddcfSDmitry Chagin ("lock \"%s\" %p already initialized", name, lock)); 8383a81bcbSJohn Baldwin 8483a81bcbSJohn Baldwin /* Look up lock class to find its index. */ 8583a81bcbSJohn Baldwin for (i = 0; i < LOCK_CLASS_MAX; i++) 8683a81bcbSJohn Baldwin if (lock_classes[i] == class) { 8783a81bcbSJohn Baldwin lock->lo_flags = i << LO_CLASSSHIFT; 8883a81bcbSJohn Baldwin break; 8983a81bcbSJohn Baldwin } 9083a81bcbSJohn Baldwin KASSERT(i < LOCK_CLASS_MAX, ("unknown lock class %p", class)); 9183a81bcbSJohn Baldwin 9283a81bcbSJohn Baldwin /* Initialize the lock object. */ 9383a81bcbSJohn Baldwin lock->lo_name = name; 9483a81bcbSJohn Baldwin lock->lo_flags |= flags | LO_INITIALIZED; 9583a81bcbSJohn Baldwin LOCK_LOG_INIT(lock, 0); 9690356491SAttilio Rao WITNESS_INIT(lock, (type != NULL) ? type : name); 9783a81bcbSJohn Baldwin } 9883a81bcbSJohn Baldwin 9983a81bcbSJohn Baldwin void 10083a81bcbSJohn Baldwin lock_destroy(struct lock_object *lock) 10183a81bcbSJohn Baldwin { 10283a81bcbSJohn Baldwin 1033a6cdc4eSJohn-Mark Gurney KASSERT(lock_initialized(lock), ("lock %p is not initialized", lock)); 10483a81bcbSJohn Baldwin WITNESS_DESTROY(lock); 10583a81bcbSJohn Baldwin LOCK_LOG_DESTROY(lock, 0); 10683a81bcbSJohn Baldwin lock->lo_flags &= ~LO_INITIALIZED; 10783a81bcbSJohn Baldwin } 10883a81bcbSJohn Baldwin 109*8e5a3e9aSMateusz Guzik static SYSCTL_NODE(_debug, OID_AUTO, lock, CTLFLAG_RD, NULL, "lock debugging"); 110*8e5a3e9aSMateusz Guzik static SYSCTL_NODE(_debug_lock, OID_AUTO, delay, CTLFLAG_RD, NULL, 111*8e5a3e9aSMateusz Guzik "lock delay"); 112*8e5a3e9aSMateusz Guzik 113*8e5a3e9aSMateusz Guzik static u_int __read_mostly starvation_limit = 131072; 114*8e5a3e9aSMateusz Guzik SYSCTL_INT(_debug_lock_delay, OID_AUTO, starvation_limit, CTLFLAG_RW, 115*8e5a3e9aSMateusz Guzik &starvation_limit, 0, ""); 116*8e5a3e9aSMateusz Guzik 117*8e5a3e9aSMateusz Guzik static u_int __read_mostly restrict_starvation = 0; 118*8e5a3e9aSMateusz Guzik SYSCTL_INT(_debug_lock_delay, OID_AUTO, restrict_starvation, CTLFLAG_RW, 119*8e5a3e9aSMateusz Guzik &restrict_starvation, 0, ""); 120*8e5a3e9aSMateusz Guzik 1211ada9041SMateusz Guzik void 1221ada9041SMateusz Guzik lock_delay(struct lock_delay_arg *la) 1231ada9041SMateusz Guzik { 1241ada9041SMateusz Guzik struct lock_delay_config *lc = la->config; 125*8e5a3e9aSMateusz Guzik u_int i; 1261ada9041SMateusz Guzik 127*8e5a3e9aSMateusz Guzik la->delay <<= 1; 128*8e5a3e9aSMateusz Guzik if (__predict_false(la->delay > lc->max)) 129*8e5a3e9aSMateusz Guzik la->delay = lc->max; 1301ada9041SMateusz Guzik 131*8e5a3e9aSMateusz Guzik for (i = la->delay; i > 0; i++) 1321ada9041SMateusz Guzik cpu_spinwait(); 1331ada9041SMateusz Guzik 134*8e5a3e9aSMateusz Guzik la->spin_cnt += la->delay; 135*8e5a3e9aSMateusz Guzik if (__predict_false(la->spin_cnt > starvation_limit)) { 136*8e5a3e9aSMateusz Guzik SDT_PROBE1(lock, , , starvation, la->delay); 137*8e5a3e9aSMateusz Guzik if (restrict_starvation) 138*8e5a3e9aSMateusz Guzik la->delay = lc->base; 139*8e5a3e9aSMateusz Guzik } 140*8e5a3e9aSMateusz Guzik } 141*8e5a3e9aSMateusz Guzik 142*8e5a3e9aSMateusz Guzik static u_int 143*8e5a3e9aSMateusz Guzik lock_roundup_2(u_int val) 144*8e5a3e9aSMateusz Guzik { 145*8e5a3e9aSMateusz Guzik u_int res; 146*8e5a3e9aSMateusz Guzik 147*8e5a3e9aSMateusz Guzik for (res = 1; res <= val; res <<= 1) 148*8e5a3e9aSMateusz Guzik continue; 149*8e5a3e9aSMateusz Guzik 150*8e5a3e9aSMateusz Guzik return (res); 151*8e5a3e9aSMateusz Guzik } 152*8e5a3e9aSMateusz Guzik 153*8e5a3e9aSMateusz Guzik void 154*8e5a3e9aSMateusz Guzik lock_delay_default_init(struct lock_delay_config *lc) 155*8e5a3e9aSMateusz Guzik { 156*8e5a3e9aSMateusz Guzik 157*8e5a3e9aSMateusz Guzik lc->base = lock_roundup_2(mp_ncpus) / 4; 158*8e5a3e9aSMateusz Guzik lc->max = lc->base * 1024; 1591ada9041SMateusz Guzik } 1601ada9041SMateusz Guzik 16183a81bcbSJohn Baldwin #ifdef DDB 16283a81bcbSJohn Baldwin DB_SHOW_COMMAND(lock, db_show_lock) 16383a81bcbSJohn Baldwin { 16483a81bcbSJohn Baldwin struct lock_object *lock; 16583a81bcbSJohn Baldwin struct lock_class *class; 16683a81bcbSJohn Baldwin 16783a81bcbSJohn Baldwin if (!have_addr) 16883a81bcbSJohn Baldwin return; 16983a81bcbSJohn Baldwin lock = (struct lock_object *)addr; 17083a81bcbSJohn Baldwin if (LO_CLASSINDEX(lock) > LOCK_CLASS_MAX) { 17183a81bcbSJohn Baldwin db_printf("Unknown lock class: %d\n", LO_CLASSINDEX(lock)); 17283a81bcbSJohn Baldwin return; 17383a81bcbSJohn Baldwin } 17483a81bcbSJohn Baldwin class = LOCK_CLASS(lock); 17583a81bcbSJohn Baldwin db_printf(" class: %s\n", class->lc_name); 17683a81bcbSJohn Baldwin db_printf(" name: %s\n", lock->lo_name); 17783a81bcbSJohn Baldwin class->lc_ddb_show(lock); 17883a81bcbSJohn Baldwin } 17983a81bcbSJohn Baldwin #endif 1807c0435b9SKip Macy 1817c0435b9SKip Macy #ifdef LOCK_PROFILING 182eea4f254SJeff Roberson 183eea4f254SJeff Roberson /* 184eea4f254SJeff Roberson * One object per-thread for each lock the thread owns. Tracks individual 185eea4f254SJeff Roberson * lock instances. 186eea4f254SJeff Roberson */ 187eea4f254SJeff Roberson struct lock_profile_object { 188eea4f254SJeff Roberson LIST_ENTRY(lock_profile_object) lpo_link; 189eea4f254SJeff Roberson struct lock_object *lpo_obj; 190eea4f254SJeff Roberson const char *lpo_file; 191eea4f254SJeff Roberson int lpo_line; 192eea4f254SJeff Roberson uint16_t lpo_ref; 193eea4f254SJeff Roberson uint16_t lpo_cnt; 19460ae52f7SEd Schouten uint64_t lpo_acqtime; 19560ae52f7SEd Schouten uint64_t lpo_waittime; 196eea4f254SJeff Roberson u_int lpo_contest_locking; 197eea4f254SJeff Roberson }; 198eea4f254SJeff Roberson 199eea4f254SJeff Roberson /* 200eea4f254SJeff Roberson * One lock_prof for each (file, line, lock object) triple. 201eea4f254SJeff Roberson */ 202eea4f254SJeff Roberson struct lock_prof { 203eea4f254SJeff Roberson SLIST_ENTRY(lock_prof) link; 2040c66dc67SJeff Roberson struct lock_class *class; 205eea4f254SJeff Roberson const char *file; 206eea4f254SJeff Roberson const char *name; 207eea4f254SJeff Roberson int line; 208eea4f254SJeff Roberson int ticks; 209947265b6SKip Macy uintmax_t cnt_wait_max; 210eea4f254SJeff Roberson uintmax_t cnt_max; 211eea4f254SJeff Roberson uintmax_t cnt_tot; 212eea4f254SJeff Roberson uintmax_t cnt_wait; 213eea4f254SJeff Roberson uintmax_t cnt_cur; 214eea4f254SJeff Roberson uintmax_t cnt_contest_locking; 215eea4f254SJeff Roberson }; 216eea4f254SJeff Roberson 217eea4f254SJeff Roberson SLIST_HEAD(lphead, lock_prof); 218eea4f254SJeff Roberson 219eea4f254SJeff Roberson #define LPROF_HASH_SIZE 4096 220eea4f254SJeff Roberson #define LPROF_HASH_MASK (LPROF_HASH_SIZE - 1) 221eea4f254SJeff Roberson #define LPROF_CACHE_SIZE 4096 222eea4f254SJeff Roberson 223eea4f254SJeff Roberson /* 224eea4f254SJeff Roberson * Array of objects and profs for each type of object for each cpu. Spinlocks 225b1ce21c6SRebecca Cran * are handled separately because a thread may be preempted and acquire a 226eea4f254SJeff Roberson * spinlock while in the lock profiling code of a non-spinlock. In this way 227eea4f254SJeff Roberson * we only need a critical section to protect the per-cpu lists. 228eea4f254SJeff Roberson */ 229eea4f254SJeff Roberson struct lock_prof_type { 230eea4f254SJeff Roberson struct lphead lpt_lpalloc; 231eea4f254SJeff Roberson struct lpohead lpt_lpoalloc; 232eea4f254SJeff Roberson struct lphead lpt_hash[LPROF_HASH_SIZE]; 233eea4f254SJeff Roberson struct lock_prof lpt_prof[LPROF_CACHE_SIZE]; 234eea4f254SJeff Roberson struct lock_profile_object lpt_objs[LPROF_CACHE_SIZE]; 235eea4f254SJeff Roberson }; 236eea4f254SJeff Roberson 237eea4f254SJeff Roberson struct lock_prof_cpu { 238eea4f254SJeff Roberson struct lock_prof_type lpc_types[2]; /* One for spin one for other. */ 239eea4f254SJeff Roberson }; 240eea4f254SJeff Roberson 241eea4f254SJeff Roberson struct lock_prof_cpu *lp_cpu[MAXCPU]; 242eea4f254SJeff Roberson 24329051116SMateusz Guzik volatile int __read_mostly lock_prof_enable; 2442e6b8de4SJeff Roberson static volatile int lock_prof_resetting; 245eea4f254SJeff Roberson 2464e657159SMatthew D Fleming #define LPROF_SBUF_SIZE 256 247eea4f254SJeff Roberson 248eea4f254SJeff Roberson static int lock_prof_rejected; 249eea4f254SJeff Roberson static int lock_prof_skipspin; 250eea4f254SJeff Roberson static int lock_prof_skipcount; 251eea4f254SJeff Roberson 252eea4f254SJeff Roberson #ifndef USE_CPU_NANOSECONDS 25360ae52f7SEd Schouten uint64_t 254eea4f254SJeff Roberson nanoseconds(void) 2557c0435b9SKip Macy { 256eea4f254SJeff Roberson struct bintime bt; 25760ae52f7SEd Schouten uint64_t ns; 2587c0435b9SKip Macy 259eea4f254SJeff Roberson binuptime(&bt); 260eea4f254SJeff Roberson /* From bintime2timespec */ 26160ae52f7SEd Schouten ns = bt.sec * (uint64_t)1000000000; 262eea4f254SJeff Roberson ns += ((uint64_t)1000000000 * (uint32_t)(bt.frac >> 32)) >> 32; 263eea4f254SJeff Roberson return (ns); 264eea4f254SJeff Roberson } 265eea4f254SJeff Roberson #endif 266fe68a916SKip Macy 267eea4f254SJeff Roberson static void 268eea4f254SJeff Roberson lock_prof_init_type(struct lock_prof_type *type) 269eea4f254SJeff Roberson { 270eea4f254SJeff Roberson int i; 271fe68a916SKip Macy 272eea4f254SJeff Roberson SLIST_INIT(&type->lpt_lpalloc); 273eea4f254SJeff Roberson LIST_INIT(&type->lpt_lpoalloc); 274eea4f254SJeff Roberson for (i = 0; i < LPROF_CACHE_SIZE; i++) { 275eea4f254SJeff Roberson SLIST_INSERT_HEAD(&type->lpt_lpalloc, &type->lpt_prof[i], 276eea4f254SJeff Roberson link); 277eea4f254SJeff Roberson LIST_INSERT_HEAD(&type->lpt_lpoalloc, &type->lpt_objs[i], 278eea4f254SJeff Roberson lpo_link); 279eea4f254SJeff Roberson } 280eea4f254SJeff Roberson } 281eea4f254SJeff Roberson 282eea4f254SJeff Roberson static void 283eea4f254SJeff Roberson lock_prof_init(void *arg) 284eea4f254SJeff Roberson { 285eea4f254SJeff Roberson int cpu; 286eea4f254SJeff Roberson 287eea4f254SJeff Roberson for (cpu = 0; cpu <= mp_maxid; cpu++) { 288eea4f254SJeff Roberson lp_cpu[cpu] = malloc(sizeof(*lp_cpu[cpu]), M_DEVBUF, 289eea4f254SJeff Roberson M_WAITOK | M_ZERO); 290eea4f254SJeff Roberson lock_prof_init_type(&lp_cpu[cpu]->lpc_types[0]); 291eea4f254SJeff Roberson lock_prof_init_type(&lp_cpu[cpu]->lpc_types[1]); 292eea4f254SJeff Roberson } 293eea4f254SJeff Roberson } 294eea4f254SJeff Roberson SYSINIT(lockprof, SI_SUB_SMP, SI_ORDER_ANY, lock_prof_init, NULL); 295eea4f254SJeff Roberson 2962e6b8de4SJeff Roberson static void 2972e6b8de4SJeff Roberson lock_prof_reset_wait(void) 2982e6b8de4SJeff Roberson { 2992e6b8de4SJeff Roberson 3002e6b8de4SJeff Roberson /* 30128d91af3SJeff Roberson * Spin relinquishing our cpu so that quiesce_all_cpus may 30228d91af3SJeff Roberson * complete. 3032e6b8de4SJeff Roberson */ 3042e6b8de4SJeff Roberson while (lock_prof_resetting) 3052e6b8de4SJeff Roberson sched_relinquish(curthread); 3062e6b8de4SJeff Roberson } 3072e6b8de4SJeff Roberson 308eea4f254SJeff Roberson static void 309eea4f254SJeff Roberson lock_prof_reset(void) 310eea4f254SJeff Roberson { 311eea4f254SJeff Roberson struct lock_prof_cpu *lpc; 312eea4f254SJeff Roberson int enabled, i, cpu; 313eea4f254SJeff Roberson 3142e6b8de4SJeff Roberson /* 3152e6b8de4SJeff Roberson * We not only race with acquiring and releasing locks but also 3162e6b8de4SJeff Roberson * thread exit. To be certain that threads exit without valid head 3172e6b8de4SJeff Roberson * pointers they must see resetting set before enabled is cleared. 3182e6b8de4SJeff Roberson * Otherwise a lock may not be removed from a per-thread list due 3192e6b8de4SJeff Roberson * to disabled being set but not wait for reset() to remove it below. 3202e6b8de4SJeff Roberson */ 3212e6b8de4SJeff Roberson atomic_store_rel_int(&lock_prof_resetting, 1); 322eea4f254SJeff Roberson enabled = lock_prof_enable; 323eea4f254SJeff Roberson lock_prof_enable = 0; 32428d91af3SJeff Roberson quiesce_all_cpus("profreset", 0); 3252e6b8de4SJeff Roberson /* 3262e6b8de4SJeff Roberson * Some objects may have migrated between CPUs. Clear all links 3272e6b8de4SJeff Roberson * before we zero the structures. Some items may still be linked 3282e6b8de4SJeff Roberson * into per-thread lists as well. 3292e6b8de4SJeff Roberson */ 330eea4f254SJeff Roberson for (cpu = 0; cpu <= mp_maxid; cpu++) { 331eea4f254SJeff Roberson lpc = lp_cpu[cpu]; 332eea4f254SJeff Roberson for (i = 0; i < LPROF_CACHE_SIZE; i++) { 333eea4f254SJeff Roberson LIST_REMOVE(&lpc->lpc_types[0].lpt_objs[i], lpo_link); 334eea4f254SJeff Roberson LIST_REMOVE(&lpc->lpc_types[1].lpt_objs[i], lpo_link); 335eea4f254SJeff Roberson } 3362e6b8de4SJeff Roberson } 3372e6b8de4SJeff Roberson for (cpu = 0; cpu <= mp_maxid; cpu++) { 3382e6b8de4SJeff Roberson lpc = lp_cpu[cpu]; 339eea4f254SJeff Roberson bzero(lpc, sizeof(*lpc)); 340eea4f254SJeff Roberson lock_prof_init_type(&lpc->lpc_types[0]); 341eea4f254SJeff Roberson lock_prof_init_type(&lpc->lpc_types[1]); 342eea4f254SJeff Roberson } 3432e6b8de4SJeff Roberson atomic_store_rel_int(&lock_prof_resetting, 0); 344eea4f254SJeff Roberson lock_prof_enable = enabled; 345eea4f254SJeff Roberson } 346eea4f254SJeff Roberson 347eea4f254SJeff Roberson static void 348eea4f254SJeff Roberson lock_prof_output(struct lock_prof *lp, struct sbuf *sb) 349eea4f254SJeff Roberson { 350eea4f254SJeff Roberson const char *p; 351eea4f254SJeff Roberson 352eea4f254SJeff Roberson for (p = lp->file; p != NULL && strncmp(p, "../", 3) == 0; p += 3); 353eea4f254SJeff Roberson sbuf_printf(sb, 354947265b6SKip Macy "%8ju %9ju %11ju %11ju %11ju %6ju %6ju %2ju %6ju %s:%d (%s:%s)\n", 355947265b6SKip Macy lp->cnt_max / 1000, lp->cnt_wait_max / 1000, lp->cnt_tot / 1000, 356eea4f254SJeff Roberson lp->cnt_wait / 1000, lp->cnt_cur, 357eea4f254SJeff Roberson lp->cnt_cur == 0 ? (uintmax_t)0 : 358eea4f254SJeff Roberson lp->cnt_tot / (lp->cnt_cur * 1000), 359eea4f254SJeff Roberson lp->cnt_cur == 0 ? (uintmax_t)0 : 360eea4f254SJeff Roberson lp->cnt_wait / (lp->cnt_cur * 1000), 361eea4f254SJeff Roberson (uintmax_t)0, lp->cnt_contest_locking, 3620c66dc67SJeff Roberson p, lp->line, lp->class->lc_name, lp->name); 363eea4f254SJeff Roberson } 364eea4f254SJeff Roberson 365eea4f254SJeff Roberson static void 366eea4f254SJeff Roberson lock_prof_sum(struct lock_prof *match, struct lock_prof *dst, int hash, 367eea4f254SJeff Roberson int spin, int t) 368eea4f254SJeff Roberson { 369eea4f254SJeff Roberson struct lock_prof_type *type; 370eea4f254SJeff Roberson struct lock_prof *l; 371eea4f254SJeff Roberson int cpu; 372eea4f254SJeff Roberson 373eea4f254SJeff Roberson dst->file = match->file; 374eea4f254SJeff Roberson dst->line = match->line; 3750c66dc67SJeff Roberson dst->class = match->class; 376eea4f254SJeff Roberson dst->name = match->name; 377eea4f254SJeff Roberson 378eea4f254SJeff Roberson for (cpu = 0; cpu <= mp_maxid; cpu++) { 379eea4f254SJeff Roberson if (lp_cpu[cpu] == NULL) 380eea4f254SJeff Roberson continue; 381eea4f254SJeff Roberson type = &lp_cpu[cpu]->lpc_types[spin]; 382eea4f254SJeff Roberson SLIST_FOREACH(l, &type->lpt_hash[hash], link) { 383eea4f254SJeff Roberson if (l->ticks == t) 384eea4f254SJeff Roberson continue; 385eea4f254SJeff Roberson if (l->file != match->file || l->line != match->line || 3860c66dc67SJeff Roberson l->name != match->name) 387eea4f254SJeff Roberson continue; 388eea4f254SJeff Roberson l->ticks = t; 389eea4f254SJeff Roberson if (l->cnt_max > dst->cnt_max) 390eea4f254SJeff Roberson dst->cnt_max = l->cnt_max; 391947265b6SKip Macy if (l->cnt_wait_max > dst->cnt_wait_max) 392947265b6SKip Macy dst->cnt_wait_max = l->cnt_wait_max; 393eea4f254SJeff Roberson dst->cnt_tot += l->cnt_tot; 394eea4f254SJeff Roberson dst->cnt_wait += l->cnt_wait; 395eea4f254SJeff Roberson dst->cnt_cur += l->cnt_cur; 396eea4f254SJeff Roberson dst->cnt_contest_locking += l->cnt_contest_locking; 397eea4f254SJeff Roberson } 398eea4f254SJeff Roberson } 399eea4f254SJeff Roberson 400eea4f254SJeff Roberson } 401eea4f254SJeff Roberson 402eea4f254SJeff Roberson static void 403eea4f254SJeff Roberson lock_prof_type_stats(struct lock_prof_type *type, struct sbuf *sb, int spin, 404eea4f254SJeff Roberson int t) 405eea4f254SJeff Roberson { 406eea4f254SJeff Roberson struct lock_prof *l; 407eea4f254SJeff Roberson int i; 408eea4f254SJeff Roberson 409eea4f254SJeff Roberson for (i = 0; i < LPROF_HASH_SIZE; ++i) { 410eea4f254SJeff Roberson SLIST_FOREACH(l, &type->lpt_hash[i], link) { 411eea4f254SJeff Roberson struct lock_prof lp = {}; 412eea4f254SJeff Roberson 413eea4f254SJeff Roberson if (l->ticks == t) 414eea4f254SJeff Roberson continue; 415eea4f254SJeff Roberson lock_prof_sum(l, &lp, i, spin, t); 416eea4f254SJeff Roberson lock_prof_output(&lp, sb); 417eea4f254SJeff Roberson } 418eea4f254SJeff Roberson } 419eea4f254SJeff Roberson } 420eea4f254SJeff Roberson 421eea4f254SJeff Roberson static int 422eea4f254SJeff Roberson dump_lock_prof_stats(SYSCTL_HANDLER_ARGS) 423eea4f254SJeff Roberson { 424eea4f254SJeff Roberson struct sbuf *sb; 425eea4f254SJeff Roberson int error, cpu, t; 4260c66dc67SJeff Roberson int enabled; 427eea4f254SJeff Roberson 42800f0e671SMatthew D Fleming error = sysctl_wire_old_buffer(req, 0); 42900f0e671SMatthew D Fleming if (error != 0) 43000f0e671SMatthew D Fleming return (error); 4314e657159SMatthew D Fleming sb = sbuf_new_for_sysctl(NULL, NULL, LPROF_SBUF_SIZE, req); 432947265b6SKip Macy sbuf_printf(sb, "\n%8s %9s %11s %11s %11s %6s %6s %2s %6s %s\n", 433947265b6SKip Macy "max", "wait_max", "total", "wait_total", "count", "avg", "wait_avg", "cnt_hold", "cnt_lock", "name"); 4340c66dc67SJeff Roberson enabled = lock_prof_enable; 4350c66dc67SJeff Roberson lock_prof_enable = 0; 43628d91af3SJeff Roberson quiesce_all_cpus("profstat", 0); 437eea4f254SJeff Roberson t = ticks; 438eea4f254SJeff Roberson for (cpu = 0; cpu <= mp_maxid; cpu++) { 439eea4f254SJeff Roberson if (lp_cpu[cpu] == NULL) 440eea4f254SJeff Roberson continue; 441eea4f254SJeff Roberson lock_prof_type_stats(&lp_cpu[cpu]->lpc_types[0], sb, 0, t); 442eea4f254SJeff Roberson lock_prof_type_stats(&lp_cpu[cpu]->lpc_types[1], sb, 1, t); 443eea4f254SJeff Roberson } 4440c66dc67SJeff Roberson lock_prof_enable = enabled; 445eea4f254SJeff Roberson 4464e657159SMatthew D Fleming error = sbuf_finish(sb); 4474e657159SMatthew D Fleming /* Output a trailing NUL. */ 4484e657159SMatthew D Fleming if (error == 0) 4494e657159SMatthew D Fleming error = SYSCTL_OUT(req, "", 1); 450eea4f254SJeff Roberson sbuf_delete(sb); 451eea4f254SJeff Roberson return (error); 452eea4f254SJeff Roberson } 453eea4f254SJeff Roberson 454eea4f254SJeff Roberson static int 455eea4f254SJeff Roberson enable_lock_prof(SYSCTL_HANDLER_ARGS) 456eea4f254SJeff Roberson { 457eea4f254SJeff Roberson int error, v; 458eea4f254SJeff Roberson 459eea4f254SJeff Roberson v = lock_prof_enable; 460eea4f254SJeff Roberson error = sysctl_handle_int(oidp, &v, v, req); 461eea4f254SJeff Roberson if (error) 462eea4f254SJeff Roberson return (error); 463eea4f254SJeff Roberson if (req->newptr == NULL) 464eea4f254SJeff Roberson return (error); 465eea4f254SJeff Roberson if (v == lock_prof_enable) 466eea4f254SJeff Roberson return (0); 467eea4f254SJeff Roberson if (v == 1) 468eea4f254SJeff Roberson lock_prof_reset(); 469eea4f254SJeff Roberson lock_prof_enable = !!v; 470eea4f254SJeff Roberson 471eea4f254SJeff Roberson return (0); 472eea4f254SJeff Roberson } 473eea4f254SJeff Roberson 474eea4f254SJeff Roberson static int 475eea4f254SJeff Roberson reset_lock_prof_stats(SYSCTL_HANDLER_ARGS) 476eea4f254SJeff Roberson { 477eea4f254SJeff Roberson int error, v; 478eea4f254SJeff Roberson 479eea4f254SJeff Roberson v = 0; 480eea4f254SJeff Roberson error = sysctl_handle_int(oidp, &v, 0, req); 481eea4f254SJeff Roberson if (error) 482eea4f254SJeff Roberson return (error); 483eea4f254SJeff Roberson if (req->newptr == NULL) 484eea4f254SJeff Roberson return (error); 485eea4f254SJeff Roberson if (v == 0) 486eea4f254SJeff Roberson return (0); 487eea4f254SJeff Roberson lock_prof_reset(); 488eea4f254SJeff Roberson 489eea4f254SJeff Roberson return (0); 490eea4f254SJeff Roberson } 491eea4f254SJeff Roberson 492eea4f254SJeff Roberson static struct lock_prof * 493eea4f254SJeff Roberson lock_profile_lookup(struct lock_object *lo, int spin, const char *file, 494eea4f254SJeff Roberson int line) 495eea4f254SJeff Roberson { 496eea4f254SJeff Roberson const char *unknown = "(unknown)"; 497eea4f254SJeff Roberson struct lock_prof_type *type; 498eea4f254SJeff Roberson struct lock_prof *lp; 499eea4f254SJeff Roberson struct lphead *head; 500eea4f254SJeff Roberson const char *p; 501eea4f254SJeff Roberson u_int hash; 502eea4f254SJeff Roberson 503eea4f254SJeff Roberson p = file; 504eea4f254SJeff Roberson if (p == NULL || *p == '\0') 505eea4f254SJeff Roberson p = unknown; 506eea4f254SJeff Roberson hash = (uintptr_t)lo->lo_name * 31 + (uintptr_t)p * 31 + line; 507eea4f254SJeff Roberson hash &= LPROF_HASH_MASK; 508eea4f254SJeff Roberson type = &lp_cpu[PCPU_GET(cpuid)]->lpc_types[spin]; 509eea4f254SJeff Roberson head = &type->lpt_hash[hash]; 510eea4f254SJeff Roberson SLIST_FOREACH(lp, head, link) { 511eea4f254SJeff Roberson if (lp->line == line && lp->file == p && 512eea4f254SJeff Roberson lp->name == lo->lo_name) 513eea4f254SJeff Roberson return (lp); 514eea4f254SJeff Roberson 515eea4f254SJeff Roberson } 516eea4f254SJeff Roberson lp = SLIST_FIRST(&type->lpt_lpalloc); 517eea4f254SJeff Roberson if (lp == NULL) { 518eea4f254SJeff Roberson lock_prof_rejected++; 519eea4f254SJeff Roberson return (lp); 520eea4f254SJeff Roberson } 521eea4f254SJeff Roberson SLIST_REMOVE_HEAD(&type->lpt_lpalloc, link); 522eea4f254SJeff Roberson lp->file = p; 523eea4f254SJeff Roberson lp->line = line; 5240c66dc67SJeff Roberson lp->class = LOCK_CLASS(lo); 525eea4f254SJeff Roberson lp->name = lo->lo_name; 526eea4f254SJeff Roberson SLIST_INSERT_HEAD(&type->lpt_hash[hash], lp, link); 527eea4f254SJeff Roberson return (lp); 528eea4f254SJeff Roberson } 529eea4f254SJeff Roberson 530eea4f254SJeff Roberson static struct lock_profile_object * 531eea4f254SJeff Roberson lock_profile_object_lookup(struct lock_object *lo, int spin, const char *file, 532eea4f254SJeff Roberson int line) 533eea4f254SJeff Roberson { 534eea4f254SJeff Roberson struct lock_profile_object *l; 535eea4f254SJeff Roberson struct lock_prof_type *type; 536eea4f254SJeff Roberson struct lpohead *head; 537eea4f254SJeff Roberson 538eea4f254SJeff Roberson head = &curthread->td_lprof[spin]; 539eea4f254SJeff Roberson LIST_FOREACH(l, head, lpo_link) 540eea4f254SJeff Roberson if (l->lpo_obj == lo && l->lpo_file == file && 541eea4f254SJeff Roberson l->lpo_line == line) 542eea4f254SJeff Roberson return (l); 543eea4f254SJeff Roberson type = &lp_cpu[PCPU_GET(cpuid)]->lpc_types[spin]; 544eea4f254SJeff Roberson l = LIST_FIRST(&type->lpt_lpoalloc); 545eea4f254SJeff Roberson if (l == NULL) { 546eea4f254SJeff Roberson lock_prof_rejected++; 547eea4f254SJeff Roberson return (NULL); 548eea4f254SJeff Roberson } 549eea4f254SJeff Roberson LIST_REMOVE(l, lpo_link); 550eea4f254SJeff Roberson l->lpo_obj = lo; 551eea4f254SJeff Roberson l->lpo_file = file; 552eea4f254SJeff Roberson l->lpo_line = line; 553eea4f254SJeff Roberson l->lpo_cnt = 0; 554eea4f254SJeff Roberson LIST_INSERT_HEAD(head, l, lpo_link); 555eea4f254SJeff Roberson 556eea4f254SJeff Roberson return (l); 557eea4f254SJeff Roberson } 558eea4f254SJeff Roberson 559eea4f254SJeff Roberson void 560eea4f254SJeff Roberson lock_profile_obtain_lock_success(struct lock_object *lo, int contested, 561eea4f254SJeff Roberson uint64_t waittime, const char *file, int line) 562eea4f254SJeff Roberson { 563eea4f254SJeff Roberson static int lock_prof_count; 564eea4f254SJeff Roberson struct lock_profile_object *l; 565eea4f254SJeff Roberson int spin; 566eea4f254SJeff Roberson 56735370593SAndriy Gapon if (SCHEDULER_STOPPED()) 56835370593SAndriy Gapon return; 56935370593SAndriy Gapon 570eea4f254SJeff Roberson /* don't reset the timer when/if recursing */ 571eea4f254SJeff Roberson if (!lock_prof_enable || (lo->lo_flags & LO_NOPROFILE)) 572eea4f254SJeff Roberson return; 573eea4f254SJeff Roberson if (lock_prof_skipcount && 574357911ceSKris Kennaway (++lock_prof_count % lock_prof_skipcount) != 0) 575eea4f254SJeff Roberson return; 57613ddf72dSAttilio Rao spin = (LOCK_CLASS(lo)->lc_flags & LC_SPINLOCK) ? 1 : 0; 577eea4f254SJeff Roberson if (spin && lock_prof_skipspin == 1) 578eea4f254SJeff Roberson return; 5792e6b8de4SJeff Roberson critical_enter(); 5802e6b8de4SJeff Roberson /* Recheck enabled now that we're in a critical section. */ 5812e6b8de4SJeff Roberson if (lock_prof_enable == 0) 5822e6b8de4SJeff Roberson goto out; 583eea4f254SJeff Roberson l = lock_profile_object_lookup(lo, spin, file, line); 584eea4f254SJeff Roberson if (l == NULL) 5852e6b8de4SJeff Roberson goto out; 586eea4f254SJeff Roberson l->lpo_cnt++; 587eea4f254SJeff Roberson if (++l->lpo_ref > 1) 5882e6b8de4SJeff Roberson goto out; 589eea4f254SJeff Roberson l->lpo_contest_locking = contested; 5907c0435b9SKip Macy l->lpo_acqtime = nanoseconds(); 591aa077979SKip Macy if (waittime && (l->lpo_acqtime > waittime)) 5927c0435b9SKip Macy l->lpo_waittime = l->lpo_acqtime - waittime; 593aa077979SKip Macy else 594aa077979SKip Macy l->lpo_waittime = 0; 5952e6b8de4SJeff Roberson out: 5962e6b8de4SJeff Roberson critical_exit(); 5972e6b8de4SJeff Roberson } 5982e6b8de4SJeff Roberson 5992e6b8de4SJeff Roberson void 6002e6b8de4SJeff Roberson lock_profile_thread_exit(struct thread *td) 6012e6b8de4SJeff Roberson { 6022e6b8de4SJeff Roberson #ifdef INVARIANTS 6032e6b8de4SJeff Roberson struct lock_profile_object *l; 6042e6b8de4SJeff Roberson 6052e6b8de4SJeff Roberson MPASS(curthread->td_critnest == 0); 6062e6b8de4SJeff Roberson #endif 6072e6b8de4SJeff Roberson /* 6082e6b8de4SJeff Roberson * If lock profiling was disabled we have to wait for reset to 6092e6b8de4SJeff Roberson * clear our pointers before we can exit safely. 6102e6b8de4SJeff Roberson */ 6112e6b8de4SJeff Roberson lock_prof_reset_wait(); 6122e6b8de4SJeff Roberson #ifdef INVARIANTS 6132e6b8de4SJeff Roberson LIST_FOREACH(l, &td->td_lprof[0], lpo_link) 6142e6b8de4SJeff Roberson printf("thread still holds lock acquired at %s:%d\n", 6152e6b8de4SJeff Roberson l->lpo_file, l->lpo_line); 6162e6b8de4SJeff Roberson LIST_FOREACH(l, &td->td_lprof[1], lpo_link) 6172e6b8de4SJeff Roberson printf("thread still holds lock acquired at %s:%d\n", 6182e6b8de4SJeff Roberson l->lpo_file, l->lpo_line); 6192e6b8de4SJeff Roberson #endif 6202e6b8de4SJeff Roberson MPASS(LIST_FIRST(&td->td_lprof[0]) == NULL); 6212e6b8de4SJeff Roberson MPASS(LIST_FIRST(&td->td_lprof[1]) == NULL); 6227c0435b9SKip Macy } 6237c0435b9SKip Macy 624eea4f254SJeff Roberson void 625eea4f254SJeff Roberson lock_profile_release_lock(struct lock_object *lo) 6267c0435b9SKip Macy { 627eea4f254SJeff Roberson struct lock_profile_object *l; 628eea4f254SJeff Roberson struct lock_prof_type *type; 629eea4f254SJeff Roberson struct lock_prof *lp; 63060ae52f7SEd Schouten uint64_t curtime, holdtime; 631eea4f254SJeff Roberson struct lpohead *head; 632eea4f254SJeff Roberson int spin; 6337c0435b9SKip Macy 63435370593SAndriy Gapon if (SCHEDULER_STOPPED()) 63535370593SAndriy Gapon return; 6362e6b8de4SJeff Roberson if (lo->lo_flags & LO_NOPROFILE) 6377c0435b9SKip Macy return; 63813ddf72dSAttilio Rao spin = (LOCK_CLASS(lo)->lc_flags & LC_SPINLOCK) ? 1 : 0; 639eea4f254SJeff Roberson head = &curthread->td_lprof[spin]; 6402e6b8de4SJeff Roberson if (LIST_FIRST(head) == NULL) 6412e6b8de4SJeff Roberson return; 642eea4f254SJeff Roberson critical_enter(); 6432e6b8de4SJeff Roberson /* Recheck enabled now that we're in a critical section. */ 6442e6b8de4SJeff Roberson if (lock_prof_enable == 0 && lock_prof_resetting == 1) 6452e6b8de4SJeff Roberson goto out; 6462e6b8de4SJeff Roberson /* 6472e6b8de4SJeff Roberson * If lock profiling is not enabled we still want to remove the 6482e6b8de4SJeff Roberson * lpo from our queue. 6492e6b8de4SJeff Roberson */ 650eea4f254SJeff Roberson LIST_FOREACH(l, head, lpo_link) 651eea4f254SJeff Roberson if (l->lpo_obj == lo) 6527c0435b9SKip Macy break; 653eea4f254SJeff Roberson if (l == NULL) 654eea4f254SJeff Roberson goto out; 655eea4f254SJeff Roberson if (--l->lpo_ref > 0) 656eea4f254SJeff Roberson goto out; 657eea4f254SJeff Roberson lp = lock_profile_lookup(lo, spin, l->lpo_file, l->lpo_line); 658eea4f254SJeff Roberson if (lp == NULL) 659eea4f254SJeff Roberson goto release; 660e7154e7eSAndriy Gapon curtime = nanoseconds(); 661e7154e7eSAndriy Gapon if (curtime < l->lpo_acqtime) 662eea4f254SJeff Roberson goto release; 663e7154e7eSAndriy Gapon holdtime = curtime - l->lpo_acqtime; 664e7154e7eSAndriy Gapon 6657c0435b9SKip Macy /* 66683b72e3eSKip Macy * Record if the lock has been held longer now than ever 6677c0435b9SKip Macy * before. 6687c0435b9SKip Macy */ 669eea4f254SJeff Roberson if (holdtime > lp->cnt_max) 670eea4f254SJeff Roberson lp->cnt_max = holdtime; 671947265b6SKip Macy if (l->lpo_waittime > lp->cnt_wait_max) 672947265b6SKip Macy lp->cnt_wait_max = l->lpo_waittime; 673eea4f254SJeff Roberson lp->cnt_tot += holdtime; 674eea4f254SJeff Roberson lp->cnt_wait += l->lpo_waittime; 675eea4f254SJeff Roberson lp->cnt_contest_locking += l->lpo_contest_locking; 676eea4f254SJeff Roberson lp->cnt_cur += l->lpo_cnt; 677eea4f254SJeff Roberson release: 678eea4f254SJeff Roberson LIST_REMOVE(l, lpo_link); 679eea4f254SJeff Roberson type = &lp_cpu[PCPU_GET(cpuid)]->lpc_types[spin]; 680eea4f254SJeff Roberson LIST_INSERT_HEAD(&type->lpt_lpoalloc, l, lpo_link); 681eea4f254SJeff Roberson out: 682eea4f254SJeff Roberson critical_exit(); 683eea4f254SJeff Roberson } 6847c0435b9SKip Macy 6856472ac3dSEd Schouten static SYSCTL_NODE(_debug_lock, OID_AUTO, prof, CTLFLAG_RD, NULL, 6866472ac3dSEd Schouten "lock profiling"); 687eea4f254SJeff Roberson SYSCTL_INT(_debug_lock_prof, OID_AUTO, skipspin, CTLFLAG_RW, 688eea4f254SJeff Roberson &lock_prof_skipspin, 0, "Skip profiling on spinlocks."); 689eea4f254SJeff Roberson SYSCTL_INT(_debug_lock_prof, OID_AUTO, skipcount, CTLFLAG_RW, 690eea4f254SJeff Roberson &lock_prof_skipcount, 0, "Sample approximately every N lock acquisitions."); 691eea4f254SJeff Roberson SYSCTL_INT(_debug_lock_prof, OID_AUTO, rejected, CTLFLAG_RD, 692eea4f254SJeff Roberson &lock_prof_rejected, 0, "Number of rejected profiling records"); 693eea4f254SJeff Roberson SYSCTL_PROC(_debug_lock_prof, OID_AUTO, stats, CTLTYPE_STRING | CTLFLAG_RD, 694eea4f254SJeff Roberson NULL, 0, dump_lock_prof_stats, "A", "Lock profiling statistics"); 695eea4f254SJeff Roberson SYSCTL_PROC(_debug_lock_prof, OID_AUTO, reset, CTLTYPE_INT | CTLFLAG_RW, 696eea4f254SJeff Roberson NULL, 0, reset_lock_prof_stats, "I", "Reset lock profiling statistics"); 697eea4f254SJeff Roberson SYSCTL_PROC(_debug_lock_prof, OID_AUTO, enable, CTLTYPE_INT | CTLFLAG_RW, 698eea4f254SJeff Roberson NULL, 0, enable_lock_prof, "I", "Enable lock profiling"); 699eea4f254SJeff Roberson 7007c0435b9SKip Macy #endif 701