xref: /freebsd/sys/kern/kern_mutex.c (revision fb919e4d5a2c1baca52ac70d1064f140fffdda71)
10384fff8SJason Evans /*-
20384fff8SJason Evans  * Copyright (c) 1998 Berkeley Software Design, Inc. All rights reserved.
30384fff8SJason Evans  *
40384fff8SJason Evans  * Redistribution and use in source and binary forms, with or without
50384fff8SJason Evans  * modification, are permitted provided that the following conditions
60384fff8SJason Evans  * are met:
70384fff8SJason Evans  * 1. Redistributions of source code must retain the above copyright
80384fff8SJason Evans  *    notice, this list of conditions and the following disclaimer.
90384fff8SJason Evans  * 2. Redistributions in binary form must reproduce the above copyright
100384fff8SJason Evans  *    notice, this list of conditions and the following disclaimer in the
110384fff8SJason Evans  *    documentation and/or other materials provided with the distribution.
120384fff8SJason Evans  * 3. Berkeley Software Design Inc's name may not be used to endorse or
130384fff8SJason Evans  *    promote products derived from this software without specific prior
140384fff8SJason Evans  *    written permission.
150384fff8SJason Evans  *
160384fff8SJason Evans  * THIS SOFTWARE IS PROVIDED BY BERKELEY SOFTWARE DESIGN INC ``AS IS'' AND
170384fff8SJason Evans  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
180384fff8SJason Evans  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
190384fff8SJason Evans  * ARE DISCLAIMED.  IN NO EVENT SHALL BERKELEY SOFTWARE DESIGN INC BE LIABLE
200384fff8SJason Evans  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
210384fff8SJason Evans  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
220384fff8SJason Evans  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
230384fff8SJason Evans  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
240384fff8SJason Evans  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
250384fff8SJason Evans  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
260384fff8SJason Evans  * SUCH DAMAGE.
270384fff8SJason Evans  *
280384fff8SJason Evans  *	from BSDI $Id: mutex_witness.c,v 1.1.2.20 2000/04/27 03:10:27 cp Exp $
2936412d79SJohn Baldwin  *	and BSDI $Id: synch_machdep.c,v 2.3.2.39 2000/04/27 03:10:25 cp Exp $
300384fff8SJason Evans  * $FreeBSD$
310384fff8SJason Evans  */
320384fff8SJason Evans 
330384fff8SJason Evans /*
349ed346baSBosko Milekic  * Machine independent bits of mutex implementation and implementation of
359ed346baSBosko Milekic  * `witness' structure & related debugging routines.
369ed346baSBosko Milekic  */
379ed346baSBosko Milekic 
389ed346baSBosko Milekic /*
390384fff8SJason Evans  *	Main Entry: witness
400384fff8SJason Evans  *	Pronunciation: 'wit-n&s
410384fff8SJason Evans  *	Function: noun
420384fff8SJason Evans  *	Etymology: Middle English witnesse, from Old English witnes knowledge,
430384fff8SJason Evans  *	    testimony, witness, from 2wit
440384fff8SJason Evans  *	Date: before 12th century
450384fff8SJason Evans  *	1 : attestation of a fact or event : TESTIMONY
460384fff8SJason Evans  *	2 : one that gives evidence; specifically : one who testifies in
470384fff8SJason Evans  *	    a cause or before a judicial tribunal
480384fff8SJason Evans  *	3 : one asked to be present at a transaction so as to be able to
490384fff8SJason Evans  *	    testify to its having taken place
500384fff8SJason Evans  *	4 : one who has personal knowledge of something
510384fff8SJason Evans  *	5 a : something serving as evidence or proof : SIGN
520384fff8SJason Evans  *	  b : public affirmation by word or example of usually
530384fff8SJason Evans  *	      religious faith or conviction <the heroic witness to divine
540384fff8SJason Evans  *	      life -- Pilot>
550384fff8SJason Evans  *	6 capitalized : a member of the Jehovah's Witnesses
560384fff8SJason Evans  */
570384fff8SJason Evans 
589c36c934SJohn Baldwin #include "opt_ddb.h"
59a5a96a19SJohn Baldwin 
600384fff8SJason Evans #include <sys/param.h>
6136412d79SJohn Baldwin #include <sys/bus.h>
6236412d79SJohn Baldwin #include <sys/kernel.h>
6319284646SJohn Baldwin #include <sys/lock.h>
64fb919e4dSMark Murray #include <sys/malloc.h>
6519284646SJohn Baldwin #include <sys/mutex.h>
660384fff8SJason Evans #include <sys/proc.h>
67a5a96a19SJohn Baldwin #include <sys/sysctl.h>
680384fff8SJason Evans #include <sys/systm.h>
6936412d79SJohn Baldwin #include <sys/vmmeter.h>
700384fff8SJason Evans #include <sys/ktr.h>
710384fff8SJason Evans 
7236412d79SJohn Baldwin #include <machine/atomic.h>
7336412d79SJohn Baldwin #include <machine/bus.h>
7436412d79SJohn Baldwin #include <machine/clock.h>
750384fff8SJason Evans #include <machine/cpu.h>
7636412d79SJohn Baldwin 
779c36c934SJohn Baldwin #include <ddb/ddb.h>
789c36c934SJohn Baldwin 
7936412d79SJohn Baldwin #include <vm/vm.h>
8036412d79SJohn Baldwin #include <vm/vm_extern.h>
8136412d79SJohn Baldwin 
820cde2e34SJason Evans /*
839ed346baSBosko Milekic  * Internal utility macros.
840cde2e34SJason Evans  */
/* True when the lock word of `m' equals MTX_UNOWNED. */
#define mtx_unowned(m)	((m)->mtx_lock == MTX_UNOWNED)

/*
 * Owning process of `m', or NULL when the lock word is MTX_UNOWNED.  The
 * owner pointer is the lock word masked with MTX_FLAGMASK.  Note that `m'
 * is evaluated more than once.
 */
#define mtx_owner(m)	(mtx_unowned((m)) ? NULL \
	: (struct proc *)((m)->mtx_lock & MTX_FLAGMASK))

/*
 * Store `pri' into the priority level of process `p'.  The expansion is
 * wrapped in parentheses so that the assignment stays a single operand
 * when the macro is used inside a larger expression.
 */
#define SET_PRIO(p, pri)	((p)->p_pri.pri_level = (pri))
910cde2e34SJason Evans 
920cde2e34SJason Evans /*
9319284646SJohn Baldwin  * Lock classes for sleep and spin mutexes.
940cde2e34SJason Evans  */
9519284646SJohn Baldwin struct lock_class lock_class_mtx_sleep = {
9619284646SJohn Baldwin 	"sleep mutex",
9719284646SJohn Baldwin 	LC_SLEEPLOCK | LC_RECURSABLE
9819284646SJohn Baldwin };
9919284646SJohn Baldwin struct lock_class lock_class_mtx_spin = {
10019284646SJohn Baldwin 	"spin mutex",
10119284646SJohn Baldwin 	LC_SPINLOCK | LC_RECURSABLE
1028484de75SJohn Baldwin };
1038484de75SJohn Baldwin 
1049ed346baSBosko Milekic /*
1059ed346baSBosko Milekic  * Prototypes for non-exported routines.
1069ed346baSBosko Milekic  */
1071bd0eefbSJohn Baldwin static void	propagate_priority(struct proc *);
10836412d79SJohn Baldwin 
10936412d79SJohn Baldwin static void
11036412d79SJohn Baldwin propagate_priority(struct proc *p)
11136412d79SJohn Baldwin {
112d5a08a60SJake Burkholder 	int pri = p->p_pri.pri_level;
11336412d79SJohn Baldwin 	struct mtx *m = p->p_blocked;
11436412d79SJohn Baldwin 
1151bd0eefbSJohn Baldwin 	mtx_assert(&sched_lock, MA_OWNED);
11636412d79SJohn Baldwin 	for (;;) {
11736412d79SJohn Baldwin 		struct proc *p1;
11836412d79SJohn Baldwin 
11936412d79SJohn Baldwin 		p = mtx_owner(m);
12036412d79SJohn Baldwin 
12136412d79SJohn Baldwin 		if (p == NULL) {
12236412d79SJohn Baldwin 			/*
12336412d79SJohn Baldwin 			 * This really isn't quite right. Really
12436412d79SJohn Baldwin 			 * ought to bump priority of process that
12536412d79SJohn Baldwin 			 * next acquires the mutex.
12636412d79SJohn Baldwin 			 */
12736412d79SJohn Baldwin 			MPASS(m->mtx_lock == MTX_CONTESTED);
12836412d79SJohn Baldwin 			return;
12936412d79SJohn Baldwin 		}
1309ed346baSBosko Milekic 
13136412d79SJohn Baldwin 		MPASS(p->p_magic == P_MAGIC);
1321bd0eefbSJohn Baldwin 		KASSERT(p->p_stat != SSLEEP, ("sleeping process owns a mutex"));
133d5a08a60SJake Burkholder 		if (p->p_pri.pri_level <= pri)
13436412d79SJohn Baldwin 			return;
1351bd0eefbSJohn Baldwin 
1361bd0eefbSJohn Baldwin 		/*
1371bd0eefbSJohn Baldwin 		 * Bump this process' priority.
1381bd0eefbSJohn Baldwin 		 */
1391bd0eefbSJohn Baldwin 		SET_PRIO(p, pri);
1401bd0eefbSJohn Baldwin 
14136412d79SJohn Baldwin 		/*
14236412d79SJohn Baldwin 		 * If lock holder is actually running, just bump priority.
14336412d79SJohn Baldwin 		 */
14425d209f2SJohn Baldwin 		if (p->p_oncpu != NOCPU) {
145f0b60d75SMark Murray 			MPASS(p->p_stat == SRUN || p->p_stat == SZOMB || p->p_stat == SSTOP);
14636412d79SJohn Baldwin 			return;
14736412d79SJohn Baldwin 		}
148d5a08a60SJake Burkholder 
1491b43703bSJohn Baldwin #ifndef SMP
1501b43703bSJohn Baldwin 		/*
1511b43703bSJohn Baldwin 		 * For UP, we check to see if p is curproc (this shouldn't
1521b43703bSJohn Baldwin 		 * ever happen however as it would mean we are in a deadlock.)
1531b43703bSJohn Baldwin 		 */
1541b43703bSJohn Baldwin 		KASSERT(p != curproc, ("Deadlock detected"));
1551b43703bSJohn Baldwin #endif
1561b43703bSJohn Baldwin 
15736412d79SJohn Baldwin 		/*
15836412d79SJohn Baldwin 		 * If on run queue move to new run queue, and
15936412d79SJohn Baldwin 		 * quit.
16036412d79SJohn Baldwin 		 */
16136412d79SJohn Baldwin 		if (p->p_stat == SRUN) {
16236412d79SJohn Baldwin 			MPASS(p->p_blocked == NULL);
16336412d79SJohn Baldwin 			remrunqueue(p);
16436412d79SJohn Baldwin 			setrunqueue(p);
16536412d79SJohn Baldwin 			return;
16636412d79SJohn Baldwin 		}
16736412d79SJohn Baldwin 
16836412d79SJohn Baldwin 		/*
1691bd0eefbSJohn Baldwin 		 * If we aren't blocked on a mutex, we should be.
17036412d79SJohn Baldwin 		 */
1711bd0eefbSJohn Baldwin 		KASSERT(p->p_stat == SMTX, (
1721bd0eefbSJohn Baldwin 		    "process %d(%s):%d holds %s but isn't blocked on a mutex\n",
1731bd0eefbSJohn Baldwin 		    p->p_pid, p->p_comm, p->p_stat,
17419284646SJohn Baldwin 		    m->mtx_object.lo_name));
17536412d79SJohn Baldwin 
17636412d79SJohn Baldwin 		/*
17736412d79SJohn Baldwin 		 * Pick up the mutex that p is blocked on.
17836412d79SJohn Baldwin 		 */
17936412d79SJohn Baldwin 		m = p->p_blocked;
18036412d79SJohn Baldwin 		MPASS(m != NULL);
18136412d79SJohn Baldwin 
18236412d79SJohn Baldwin 		/*
18336412d79SJohn Baldwin 		 * Check if the proc needs to be moved up on
18436412d79SJohn Baldwin 		 * the blocked chain
18536412d79SJohn Baldwin 		 */
1861bd0eefbSJohn Baldwin 		if (p == TAILQ_FIRST(&m->mtx_blocked)) {
1871bd0eefbSJohn Baldwin 			continue;
1881bd0eefbSJohn Baldwin 		}
1899ed346baSBosko Milekic 
190d5a08a60SJake Burkholder 		p1 = TAILQ_PREV(p, procqueue, p_procq);
191d5a08a60SJake Burkholder 		if (p1->p_pri.pri_level <= pri) {
19236412d79SJohn Baldwin 			continue;
19336412d79SJohn Baldwin 		}
19436412d79SJohn Baldwin 
19536412d79SJohn Baldwin 		/*
1961bd0eefbSJohn Baldwin 		 * Remove proc from blocked chain and determine where
1971bd0eefbSJohn Baldwin 		 * it should be moved up to.  Since we know that p1 has
1981bd0eefbSJohn Baldwin 		 * a lower priority than p, we know that at least one
1991bd0eefbSJohn Baldwin 		 * process in the chain has a lower priority and that
2001bd0eefbSJohn Baldwin 		 * p1 will thus not be NULL after the loop.
20136412d79SJohn Baldwin 		 */
20236412d79SJohn Baldwin 		TAILQ_REMOVE(&m->mtx_blocked, p, p_procq);
20336412d79SJohn Baldwin 		TAILQ_FOREACH(p1, &m->mtx_blocked, p_procq) {
20436412d79SJohn Baldwin 			MPASS(p1->p_magic == P_MAGIC);
205d5a08a60SJake Burkholder 			if (p1->p_pri.pri_level > pri)
20636412d79SJohn Baldwin 				break;
20736412d79SJohn Baldwin 		}
2089ed346baSBosko Milekic 
2091bd0eefbSJohn Baldwin 		MPASS(p1 != NULL);
21036412d79SJohn Baldwin 		TAILQ_INSERT_BEFORE(p1, p, p_procq);
21136412d79SJohn Baldwin 		CTR4(KTR_LOCK,
2128484de75SJohn Baldwin 		    "propagate_priority: p %p moved before %p on [%p] %s",
21319284646SJohn Baldwin 		    p, p1, m, m->mtx_object.lo_name);
21436412d79SJohn Baldwin 	}
21536412d79SJohn Baldwin }
21636412d79SJohn Baldwin 
2170cde2e34SJason Evans /*
2186283b7d0SJohn Baldwin  * Function versions of the inlined __mtx_* macros.  These are used by
2196283b7d0SJohn Baldwin  * modules and can also be called from assembly language if needed.
2206283b7d0SJohn Baldwin  */
/* Out-of-line entry point that simply expands __mtx_lock_flags(). */
void
_mtx_lock_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_lock_flags(m, opts, file, line);
}
2276283b7d0SJohn Baldwin 
/* Out-of-line entry point that simply expands __mtx_unlock_flags(). */
void
_mtx_unlock_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_unlock_flags(m, opts, file, line);
}
2346283b7d0SJohn Baldwin 
/* Out-of-line entry point that simply expands __mtx_lock_spin_flags(). */
void
_mtx_lock_spin_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_lock_spin_flags(m, opts, file, line);
}
2416283b7d0SJohn Baldwin 
/* Out-of-line entry point that simply expands __mtx_unlock_spin_flags(). */
void
_mtx_unlock_spin_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_unlock_spin_flags(m, opts, file, line);
}
2486283b7d0SJohn Baldwin 
2496283b7d0SJohn Baldwin /*
2509ed346baSBosko Milekic  * The important part of mtx_trylock{,_flags}()
2519ed346baSBosko Milekic  * Tries to acquire lock `m.' We do NOT handle recursion here; we assume that
2529ed346baSBosko Milekic  * if we're called, it's because we know we don't already own this lock.
2530cde2e34SJason Evans  */
2540cde2e34SJason Evans int
2559ed346baSBosko Milekic _mtx_trylock(struct mtx *m, int opts, const char *file, int line)
2560cde2e34SJason Evans {
2570cde2e34SJason Evans 	int rval;
2580cde2e34SJason Evans 
25927863426SBosko Milekic 	MPASS(curproc != NULL);
2609ed346baSBosko Milekic 
2619ed346baSBosko Milekic 	/*
2629ed346baSBosko Milekic 	 * _mtx_trylock does not accept MTX_NOSWITCH option.
2639ed346baSBosko Milekic 	 */
2645746a1d8SBosko Milekic 	KASSERT((opts & MTX_NOSWITCH) == 0,
2655746a1d8SBosko Milekic 	    ("mtx_trylock() called with invalid option flag(s) %d", opts));
2669ed346baSBosko Milekic 
26727863426SBosko Milekic 	rval = _obtain_lock(m, curproc);
2689ed346baSBosko Milekic 
26919284646SJohn Baldwin 	LOCK_LOG_TRY("LOCK", &m->mtx_object, opts, rval, file, line);
27019284646SJohn Baldwin 	if (rval) {
2719ed346baSBosko Milekic 		/*
2729ed346baSBosko Milekic 		 * We do not handle recursion in _mtx_trylock; see the
2739ed346baSBosko Milekic 		 * note at the top of the routine.
2749ed346baSBosko Milekic 		 */
2755746a1d8SBosko Milekic 		KASSERT(!mtx_recursed(m),
2765746a1d8SBosko Milekic 		    ("mtx_trylock() called on a recursed mutex"));
27719284646SJohn Baldwin 		mtx_update_flags(m, 1);
27819284646SJohn Baldwin 		WITNESS_LOCK(&m->mtx_object, opts | LOP_TRYLOCK, file, line);
2790cde2e34SJason Evans 	}
2809ed346baSBosko Milekic 
28119284646SJohn Baldwin 	return (rval);
2820cde2e34SJason Evans }
2830cde2e34SJason Evans 
2840cde2e34SJason Evans /*
2859ed346baSBosko Milekic  * _mtx_lock_sleep: the tougher part of acquiring an MTX_DEF lock.
2869ed346baSBosko Milekic  *
2879ed346baSBosko Milekic  * We call this if the lock is either contested (i.e. we need to go to
2889ed346baSBosko Milekic  * sleep waiting for it), or if we need to recurse on it.
2890cde2e34SJason Evans  */
2900cde2e34SJason Evans void
2919ed346baSBosko Milekic _mtx_lock_sleep(struct mtx *m, int opts, const char *file, int line)
29236412d79SJohn Baldwin {
29327863426SBosko Milekic 	struct proc *p = curproc;
29436412d79SJohn Baldwin 
29536412d79SJohn Baldwin 	if ((m->mtx_lock & MTX_FLAGMASK) == (uintptr_t)p) {
29636412d79SJohn Baldwin 		m->mtx_recurse++;
29708812b39SBosko Milekic 		atomic_set_ptr(&m->mtx_lock, MTX_RECURSED);
29819284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
2995746a1d8SBosko Milekic 			CTR1(KTR_LOCK, "_mtx_lock_sleep: %p recursing", m);
30036412d79SJohn Baldwin 		return;
30136412d79SJohn Baldwin 	}
3029ed346baSBosko Milekic 
30319284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
30415ec816aSJohn Baldwin 		CTR4(KTR_LOCK,
30515ec816aSJohn Baldwin 		    "_mtx_lock_sleep: %s contested (lock=%p) at %s:%d",
30619284646SJohn Baldwin 		    m->mtx_object.lo_name, (void *)m->mtx_lock, file, line);
3071bd0eefbSJohn Baldwin 
30836412d79SJohn Baldwin 	while (!_obtain_lock(m, p)) {
309f5271ebcSJohn Baldwin 		uintptr_t v;
31036412d79SJohn Baldwin 		struct proc *p1;
31136412d79SJohn Baldwin 
3129ed346baSBosko Milekic 		mtx_lock_spin(&sched_lock);
31336412d79SJohn Baldwin 		/*
3149ed346baSBosko Milekic 		 * Check if the lock has been released while spinning for
3159ed346baSBosko Milekic 		 * the sched_lock.
31636412d79SJohn Baldwin 		 */
31736412d79SJohn Baldwin 		if ((v = m->mtx_lock) == MTX_UNOWNED) {
3189ed346baSBosko Milekic 			mtx_unlock_spin(&sched_lock);
31936412d79SJohn Baldwin 			continue;
32036412d79SJohn Baldwin 		}
3219ed346baSBosko Milekic 
32236412d79SJohn Baldwin 		/*
3239ed346baSBosko Milekic 		 * The mutex was marked contested on release. This means that
3249ed346baSBosko Milekic 		 * there are processes blocked on it.
32536412d79SJohn Baldwin 		 */
32636412d79SJohn Baldwin 		if (v == MTX_CONTESTED) {
32736412d79SJohn Baldwin 			p1 = TAILQ_FIRST(&m->mtx_blocked);
3285746a1d8SBosko Milekic 			MPASS(p1 != NULL);
32936412d79SJohn Baldwin 			m->mtx_lock = (uintptr_t)p | MTX_CONTESTED;
3309ed346baSBosko Milekic 
331d5a08a60SJake Burkholder 			if (p1->p_pri.pri_level < p->p_pri.pri_level)
332d5a08a60SJake Burkholder 				SET_PRIO(p, p1->p_pri.pri_level);
3339ed346baSBosko Milekic 			mtx_unlock_spin(&sched_lock);
33436412d79SJohn Baldwin 			return;
33536412d79SJohn Baldwin 		}
3369ed346baSBosko Milekic 
33736412d79SJohn Baldwin 		/*
3389ed346baSBosko Milekic 		 * If the mutex isn't already contested and a failure occurs
3399ed346baSBosko Milekic 		 * setting the contested bit, the mutex was either released
3409ed346baSBosko Milekic 		 * or the state of the MTX_RECURSED bit changed.
34136412d79SJohn Baldwin 		 */
34236412d79SJohn Baldwin 		if ((v & MTX_CONTESTED) == 0 &&
34336412d79SJohn Baldwin 		    !atomic_cmpset_ptr(&m->mtx_lock, (void *)v,
34436412d79SJohn Baldwin 			(void *)(v | MTX_CONTESTED))) {
3459ed346baSBosko Milekic 			mtx_unlock_spin(&sched_lock);
34636412d79SJohn Baldwin 			continue;
34736412d79SJohn Baldwin 		}
34836412d79SJohn Baldwin 
3499ed346baSBosko Milekic 		/*
3509ed346baSBosko Milekic 		 * We deffinately must sleep for this lock.
3519ed346baSBosko Milekic 		 */
35236412d79SJohn Baldwin 		mtx_assert(m, MA_NOTOWNED);
35336412d79SJohn Baldwin 
35436412d79SJohn Baldwin #ifdef notyet
35536412d79SJohn Baldwin 		/*
3569ed346baSBosko Milekic 		 * If we're borrowing an interrupted thread's VM context, we
3579ed346baSBosko Milekic 		 * must clean up before going to sleep.
35836412d79SJohn Baldwin 		 */
35915ec816aSJohn Baldwin 		if (p->p_ithd != NULL) {
36015ec816aSJohn Baldwin 			struct ithd *it = p->p_ithd;
36136412d79SJohn Baldwin 
36236412d79SJohn Baldwin 			if (it->it_interrupted) {
36319284646SJohn Baldwin 				if (LOCK_LOG_TEST(&m->mtx_object, opts))
36436412d79SJohn Baldwin 					CTR2(KTR_LOCK,
36515ec816aSJohn Baldwin 				    "_mtx_lock_sleep: %p interrupted %p",
36636412d79SJohn Baldwin 					    it, it->it_interrupted);
36736412d79SJohn Baldwin 				intr_thd_fixup(it);
36836412d79SJohn Baldwin 			}
36936412d79SJohn Baldwin 		}
37036412d79SJohn Baldwin #endif
37136412d79SJohn Baldwin 
3729ed346baSBosko Milekic 		/*
3739ed346baSBosko Milekic 		 * Put us on the list of threads blocked on this mutex.
3749ed346baSBosko Milekic 		 */
37536412d79SJohn Baldwin 		if (TAILQ_EMPTY(&m->mtx_blocked)) {
3769ed346baSBosko Milekic 			p1 = (struct proc *)(m->mtx_lock & MTX_FLAGMASK);
3779ed346baSBosko Milekic 			LIST_INSERT_HEAD(&p1->p_contested, m, mtx_contested);
37836412d79SJohn Baldwin 			TAILQ_INSERT_TAIL(&m->mtx_blocked, p, p_procq);
37936412d79SJohn Baldwin 		} else {
38036412d79SJohn Baldwin 			TAILQ_FOREACH(p1, &m->mtx_blocked, p_procq)
381d5a08a60SJake Burkholder 				if (p1->p_pri.pri_level > p->p_pri.pri_level)
38236412d79SJohn Baldwin 					break;
38336412d79SJohn Baldwin 			if (p1)
38436412d79SJohn Baldwin 				TAILQ_INSERT_BEFORE(p1, p, p_procq);
38536412d79SJohn Baldwin 			else
3869ed346baSBosko Milekic 				TAILQ_INSERT_TAIL(&m->mtx_blocked, p, p_procq);
38736412d79SJohn Baldwin 		}
38836412d79SJohn Baldwin 
3899ed346baSBosko Milekic 		/*
3909ed346baSBosko Milekic 		 * Save who we're blocked on.
3919ed346baSBosko Milekic 		 */
3929ed346baSBosko Milekic 		p->p_blocked = m;
39319284646SJohn Baldwin 		p->p_mtxname = m->mtx_object.lo_name;
39436412d79SJohn Baldwin 		p->p_stat = SMTX;
39536412d79SJohn Baldwin 		propagate_priority(p);
3969ed346baSBosko Milekic 
39719284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
398562e4ffeSJohn Baldwin 			CTR3(KTR_LOCK,
3999ed346baSBosko Milekic 			    "_mtx_lock_sleep: p %p blocked on [%p] %s", p, m,
40019284646SJohn Baldwin 			    m->mtx_object.lo_name);
4019ed346baSBosko Milekic 
40220cdcc5bSJohn Baldwin 		mi_switch();
4039ed346baSBosko Milekic 
40419284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
40536412d79SJohn Baldwin 			CTR3(KTR_LOCK,
4069ed346baSBosko Milekic 			  "_mtx_lock_sleep: p %p free from blocked on [%p] %s",
40719284646SJohn Baldwin 			  p, m, m->mtx_object.lo_name);
4089ed346baSBosko Milekic 
4099ed346baSBosko Milekic 		mtx_unlock_spin(&sched_lock);
41036412d79SJohn Baldwin 	}
4119ed346baSBosko Milekic 
41236412d79SJohn Baldwin 	return;
4139ed346baSBosko Milekic }
4149ed346baSBosko Milekic 
4159ed346baSBosko Milekic /*
4169ed346baSBosko Milekic  * _mtx_lock_spin: the tougher part of acquiring an MTX_SPIN lock.
4179ed346baSBosko Milekic  *
4189ed346baSBosko Milekic  * This is only called if we need to actually spin for the lock. Recursion
4199ed346baSBosko Milekic  * is handled inline.
4209ed346baSBosko Milekic  */
4219ed346baSBosko Milekic void
4226283b7d0SJohn Baldwin _mtx_lock_spin(struct mtx *m, int opts, critical_t mtx_crit, const char *file,
4239ed346baSBosko Milekic 	       int line)
42436412d79SJohn Baldwin {
42536412d79SJohn Baldwin 	int i = 0;
42636412d79SJohn Baldwin 
42719284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
4285746a1d8SBosko Milekic 		CTR1(KTR_LOCK, "_mtx_lock_spin: %p spinning", m);
4299ed346baSBosko Milekic 
43036412d79SJohn Baldwin 	for (;;) {
43127863426SBosko Milekic 		if (_obtain_lock(m, curproc))
43236412d79SJohn Baldwin 			break;
4339ed346baSBosko Milekic 
4347141f2adSJohn Baldwin 		/* Give interrupts a chance while we spin. */
4357141f2adSJohn Baldwin 		critical_exit(mtx_crit);
43636412d79SJohn Baldwin 		while (m->mtx_lock != MTX_UNOWNED) {
43736412d79SJohn Baldwin 			if (i++ < 1000000)
43836412d79SJohn Baldwin 				continue;
43936412d79SJohn Baldwin 			if (i++ < 6000000)
44036412d79SJohn Baldwin 				DELAY(1);
44136412d79SJohn Baldwin #ifdef DDB
44236412d79SJohn Baldwin 			else if (!db_active)
44336412d79SJohn Baldwin #else
44436412d79SJohn Baldwin 			else
44536412d79SJohn Baldwin #endif
4469ed346baSBosko Milekic 			panic("spin lock %s held by %p for > 5 seconds",
44719284646SJohn Baldwin 			    m->mtx_object.lo_name, (void *)m->mtx_lock);
44836412d79SJohn Baldwin 		}
4497141f2adSJohn Baldwin 		mtx_crit = critical_enter();
45036412d79SJohn Baldwin 	}
45136412d79SJohn Baldwin 
4526283b7d0SJohn Baldwin 	m->mtx_savecrit = mtx_crit;
45319284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
4549ed346baSBosko Milekic 		CTR1(KTR_LOCK, "_mtx_lock_spin: %p spin done", m);
4559ed346baSBosko Milekic 
45636412d79SJohn Baldwin 	return;
45736412d79SJohn Baldwin }
45836412d79SJohn Baldwin 
4599ed346baSBosko Milekic /*
4609ed346baSBosko Milekic  * _mtx_unlock_sleep: the tougher part of releasing an MTX_DEF lock.
4619ed346baSBosko Milekic  *
4629ed346baSBosko Milekic  * We are only called here if the lock is recursed or contested (i.e. we
4639ed346baSBosko Milekic  * need to wake up a blocked thread).
4649ed346baSBosko Milekic  */
46536412d79SJohn Baldwin void
4669ed346baSBosko Milekic _mtx_unlock_sleep(struct mtx *m, int opts, const char *file, int line)
46736412d79SJohn Baldwin {
46836412d79SJohn Baldwin 	struct proc *p, *p1;
46936412d79SJohn Baldwin 	struct mtx *m1;
47036412d79SJohn Baldwin 	int pri;
47136412d79SJohn Baldwin 
47227863426SBosko Milekic 	p = curproc;
4739ed346baSBosko Milekic 
47408812b39SBosko Milekic 	if (mtx_recursed(m)) {
47536412d79SJohn Baldwin 		if (--(m->mtx_recurse) == 0)
47608812b39SBosko Milekic 			atomic_clear_ptr(&m->mtx_lock, MTX_RECURSED);
47719284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
4789ed346baSBosko Milekic 			CTR1(KTR_LOCK, "_mtx_unlock_sleep: %p unrecurse", m);
47936412d79SJohn Baldwin 		return;
48036412d79SJohn Baldwin 	}
4819ed346baSBosko Milekic 
4829ed346baSBosko Milekic 	mtx_lock_spin(&sched_lock);
48319284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
4849ed346baSBosko Milekic 		CTR1(KTR_LOCK, "_mtx_unlock_sleep: %p contested", m);
4859ed346baSBosko Milekic 
48636412d79SJohn Baldwin 	p1 = TAILQ_FIRST(&m->mtx_blocked);
48736412d79SJohn Baldwin 	MPASS(p->p_magic == P_MAGIC);
48836412d79SJohn Baldwin 	MPASS(p1->p_magic == P_MAGIC);
4899ed346baSBosko Milekic 
49036412d79SJohn Baldwin 	TAILQ_REMOVE(&m->mtx_blocked, p1, p_procq);
4919ed346baSBosko Milekic 
49236412d79SJohn Baldwin 	if (TAILQ_EMPTY(&m->mtx_blocked)) {
49336412d79SJohn Baldwin 		LIST_REMOVE(m, mtx_contested);
49436412d79SJohn Baldwin 		_release_lock_quick(m);
49519284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
4969ed346baSBosko Milekic 			CTR1(KTR_LOCK, "_mtx_unlock_sleep: %p not held", m);
49736412d79SJohn Baldwin 	} else
4989ed346baSBosko Milekic 		atomic_store_rel_ptr(&m->mtx_lock, (void *)MTX_CONTESTED);
4999ed346baSBosko Milekic 
500d5a08a60SJake Burkholder 	pri = PRI_MAX;
50136412d79SJohn Baldwin 	LIST_FOREACH(m1, &p->p_contested, mtx_contested) {
502d5a08a60SJake Burkholder 		int cp = TAILQ_FIRST(&m1->mtx_blocked)->p_pri.pri_level;
50336412d79SJohn Baldwin 		if (cp < pri)
50436412d79SJohn Baldwin 			pri = cp;
50536412d79SJohn Baldwin 	}
5069ed346baSBosko Milekic 
507d5a08a60SJake Burkholder 	if (pri > p->p_pri.pri_native)
508d5a08a60SJake Burkholder 		pri = p->p_pri.pri_native;
50936412d79SJohn Baldwin 	SET_PRIO(p, pri);
5109ed346baSBosko Milekic 
51119284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
5129ed346baSBosko Milekic 		CTR2(KTR_LOCK, "_mtx_unlock_sleep: %p contested setrunqueue %p",
5139ed346baSBosko Milekic 		    m, p1);
5149ed346baSBosko Milekic 
51536412d79SJohn Baldwin 	p1->p_blocked = NULL;
51636412d79SJohn Baldwin 	p1->p_stat = SRUN;
51736412d79SJohn Baldwin 	setrunqueue(p1);
5189ed346baSBosko Milekic 
519d5a08a60SJake Burkholder 	if ((opts & MTX_NOSWITCH) == 0 && p1->p_pri.pri_level < pri) {
52036412d79SJohn Baldwin #ifdef notyet
52115ec816aSJohn Baldwin 		if (p->p_ithd != NULL) {
52215ec816aSJohn Baldwin 			struct ithd *it = p->p_ithd;
52336412d79SJohn Baldwin 
52436412d79SJohn Baldwin 			if (it->it_interrupted) {
52519284646SJohn Baldwin 				if (LOCK_LOG_TEST(&m->mtx_object, opts))
52636412d79SJohn Baldwin 					CTR2(KTR_LOCK,
52715ec816aSJohn Baldwin 				    "_mtx_unlock_sleep: %p interrupted %p",
52836412d79SJohn Baldwin 					    it, it->it_interrupted);
52936412d79SJohn Baldwin 				intr_thd_fixup(it);
53036412d79SJohn Baldwin 			}
53136412d79SJohn Baldwin 		}
53236412d79SJohn Baldwin #endif
53336412d79SJohn Baldwin 		setrunqueue(p);
53419284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
535562e4ffeSJohn Baldwin 			CTR2(KTR_LOCK,
5369ed346baSBosko Milekic 			    "_mtx_unlock_sleep: %p switching out lock=%p", m,
5379ed346baSBosko Milekic 			    (void *)m->mtx_lock);
5389ed346baSBosko Milekic 
53936412d79SJohn Baldwin 		mi_switch();
54019284646SJohn Baldwin 		if (LOCK_LOG_TEST(&m->mtx_object, opts))
5419ed346baSBosko Milekic 			CTR2(KTR_LOCK, "_mtx_unlock_sleep: %p resuming lock=%p",
54231271627SJohn Baldwin 			    m, (void *)m->mtx_lock);
54336412d79SJohn Baldwin 	}
54436412d79SJohn Baldwin 
5459ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
5469ed346baSBosko Milekic 
5479ed346baSBosko Milekic 	return;
5489ed346baSBosko Milekic }
5499ed346baSBosko Milekic 
5509ed346baSBosko Milekic /*
5519ed346baSBosko Milekic  * All the unlocking of MTX_SPIN locks is done inline.
5529ed346baSBosko Milekic  * See the _rel_spin_lock() macro for the details.
5539ed346baSBosko Milekic  */
5549ed346baSBosko Milekic 
#ifdef WITNESS
/*
 * Bring the LO_LOCKED / LO_RECURSED bits of the lock object in line with
 * the mutex before witness is called.  `locking' is non-zero on the
 * acquire side and zero on the release side.  The mutex must be owned in
 * both cases (asserted below): on acquire this runs after the lock has
 * been obtained, on release it runs before the lock is dropped.
 */
void
_mtx_update_flags(struct mtx *m, int locking)
{

	mtx_assert(m, MA_OWNED);

	if (!locking) {
		/*
		 * Release side: a recursion count of 0 means the lock is
		 * about to be fully released, a count of 1 means it is
		 * about to stop being recursed.  Deeper recursion changes
		 * nothing.
		 */
		if (m->mtx_recurse == 0) {
			/* XXX: we shouldn't need the LO_RECURSED in theory. */
			m->mtx_object.lo_flags &= ~(LO_LOCKED | LO_RECURSED);
		} else if (m->mtx_recurse == 1) {
			m->mtx_object.lo_flags &= ~(LO_RECURSED);
		}
		return;
	}

	/* Acquire side. */
	m->mtx_object.lo_flags |= LO_LOCKED;
	if (mtx_recursed(m)) {
		m->mtx_object.lo_flags |= LO_RECURSED;
	} else {
		/* XXX: we shouldn't need this in theory. */
		m->mtx_object.lo_flags &= ~LO_RECURSED;
	}
}
#endif
58819284646SJohn Baldwin 
/*
 * Backing function for the INVARIANTS-enabled mtx_assert().
 *
 * `what' selects the condition to verify on `m': MA_OWNED (optionally
 * or'ed with MA_RECURSED or MA_NOTRECURSED) or MA_NOTOWNED.  A violated
 * condition, or an unrecognized `what', panics with the caller's
 * file and line.
 */
#ifdef INVARIANT_SUPPORT
void
_mtx_assert(struct mtx *m, int what, const char *file, int line)
{

	if (what == MA_OWNED || what == (MA_OWNED | MA_RECURSED) ||
	    what == (MA_OWNED | MA_NOTRECURSED)) {
		/* Ownership first, then the requested recursion state. */
		if (!mtx_owned(m))
			panic("mutex %s not owned at %s:%d",
			    m->mtx_object.lo_name, file, line);
		if (!mtx_recursed(m)) {
			if ((what & MA_RECURSED) != 0)
				panic("mutex %s unrecursed at %s:%d",
				    m->mtx_object.lo_name, file, line);
		} else if ((what & MA_NOTRECURSED) != 0) {
			panic("mutex %s recursed at %s:%d",
			    m->mtx_object.lo_name, file, line);
		}
	} else if (what == MA_NOTOWNED) {
		if (mtx_owned(m))
			panic("mutex %s owned at %s:%d",
			    m->mtx_object.lo_name, file, line);
	} else {
		panic("unknown mtx_assert at %s:%d", file, line);
	}
}
#endif
6220cde2e34SJason Evans 
/*
 * The MUTEX_DEBUG-enabled mtx_validate()
 *
 * Most of these checks have been moved off into the LO_INITIALIZED flag
 * maintained by the witness code.  What remains is a check that the
 * memory occupied by the mutex is readable and writable kernel memory.
 */
#ifdef MUTEX_DEBUG

void	mtx_validate __P((struct mtx *));

void
mtx_validate(struct mtx *m)
{

/*
 * XXX - When kernacc() is fixed on the alpha to handle K0_SEG memory properly
 * we can re-enable the kernacc() checks.
 */
#ifndef __alpha__
	/*
	 * Check the whole mutex structure, hence sizeof(*m): sizeof(m)
	 * would only cover as many bytes as a pointer occupies.
	 */
	if (!kernacc((caddr_t)m, sizeof(*m), VM_PROT_READ | VM_PROT_WRITE))
		panic("Can't read and write to mutex %p", m);
#endif
}
#endif
64736412d79SJohn Baldwin 
6489ed346baSBosko Milekic /*
6499ed346baSBosko Milekic  * Mutex initialization routine; initialize lock `m' of type contained in
6509ed346baSBosko Milekic  * `opts' with options contained in `opts' and description `description.'
6519ed346baSBosko Milekic  */
65236412d79SJohn Baldwin void
6539ed346baSBosko Milekic mtx_init(struct mtx *m, const char *description, int opts)
65436412d79SJohn Baldwin {
65519284646SJohn Baldwin 	struct lock_object *lock;
6569ed346baSBosko Milekic 
65719284646SJohn Baldwin 	MPASS((opts & ~(MTX_SPIN | MTX_QUIET | MTX_RECURSE |
65819284646SJohn Baldwin 	    MTX_SLEEPABLE | MTX_NOWITNESS)) == 0);
6599ed346baSBosko Milekic 
66036412d79SJohn Baldwin #ifdef MUTEX_DEBUG
6619ed346baSBosko Milekic 	/* Diagnostic and error correction */
66219284646SJohn Baldwin 	mtx_validate(m);
6636936206eSJohn Baldwin #endif
66436412d79SJohn Baldwin 
66519284646SJohn Baldwin 	bzero(m, sizeof(*m));
66619284646SJohn Baldwin 	lock = &m->mtx_object;
66719284646SJohn Baldwin 	if (opts & MTX_SPIN)
66819284646SJohn Baldwin 		lock->lo_class = &lock_class_mtx_spin;
66919284646SJohn Baldwin 	else
67019284646SJohn Baldwin 		lock->lo_class = &lock_class_mtx_sleep;
67119284646SJohn Baldwin 	lock->lo_name = description;
67219284646SJohn Baldwin 	if (opts & MTX_QUIET)
67319284646SJohn Baldwin 		lock->lo_flags = LO_QUIET;
67419284646SJohn Baldwin 	if (opts & MTX_RECURSE)
67519284646SJohn Baldwin 		lock->lo_flags |= LO_RECURSABLE;
67619284646SJohn Baldwin 	if (opts & MTX_SLEEPABLE)
67719284646SJohn Baldwin 		lock->lo_flags |= LO_SLEEPABLE;
67819284646SJohn Baldwin 	if ((opts & MTX_NOWITNESS) == 0)
67919284646SJohn Baldwin 		lock->lo_flags |= LO_WITNESS;
68019284646SJohn Baldwin 
68119284646SJohn Baldwin 	m->mtx_lock = MTX_UNOWNED;
68236412d79SJohn Baldwin 	TAILQ_INIT(&m->mtx_blocked);
6839ed346baSBosko Milekic 
68419284646SJohn Baldwin 	LOCK_LOG_INIT(lock, opts);
685d1c1b841SJason Evans 
68619284646SJohn Baldwin 	WITNESS_INIT(lock);
68736412d79SJohn Baldwin }
68836412d79SJohn Baldwin 
6899ed346baSBosko Milekic /*
69019284646SJohn Baldwin  * Remove lock `m' from all_mtx queue.  We don't allow MTX_QUIET to be
69119284646SJohn Baldwin  * passed in as a flag here because if the corresponding mtx_init() was
69219284646SJohn Baldwin  * called with MTX_QUIET set, then it will already be set in the mutex's
69319284646SJohn Baldwin  * flags.
6949ed346baSBosko Milekic  */
69536412d79SJohn Baldwin void
69636412d79SJohn Baldwin mtx_destroy(struct mtx *m)
69736412d79SJohn Baldwin {
69836412d79SJohn Baldwin 
69919284646SJohn Baldwin 	LOCK_LOG_DESTROY(&m->mtx_object, 0);
7009ed346baSBosko Milekic 
70119284646SJohn Baldwin 	if (!mtx_owned(m))
70219284646SJohn Baldwin 		MPASS(mtx_unowned(m));
70319284646SJohn Baldwin 	else {
70408812b39SBosko Milekic 		MPASS((m->mtx_lock & (MTX_RECURSED|MTX_CONTESTED)) == 0);
7059ed346baSBosko Milekic 
70619284646SJohn Baldwin 		/* Tell witness this isn't locked to make it happy. */
70719284646SJohn Baldwin 		m->mtx_object.lo_flags &= ~LO_LOCKED;
70819284646SJohn Baldwin 		WITNESS_UNLOCK(&m->mtx_object, MTX_NOSWITCH, __FILE__,
70919284646SJohn Baldwin 		    __LINE__);
71036412d79SJohn Baldwin 	}
7110384fff8SJason Evans 
71219284646SJohn Baldwin 	WITNESS_DESTROY(&m->mtx_object);
7130384fff8SJason Evans }
714