xref: /freebsd/sys/kern/kern_mutex.c (revision 5cb0fbe47e7601a3b3b7b880a5b634dddf0a9cf5)
10384fff8SJason Evans /*-
20384fff8SJason Evans  * Copyright (c) 1998 Berkeley Software Design, Inc. All rights reserved.
30384fff8SJason Evans  *
40384fff8SJason Evans  * Redistribution and use in source and binary forms, with or without
50384fff8SJason Evans  * modification, are permitted provided that the following conditions
60384fff8SJason Evans  * are met:
70384fff8SJason Evans  * 1. Redistributions of source code must retain the above copyright
80384fff8SJason Evans  *    notice, this list of conditions and the following disclaimer.
90384fff8SJason Evans  * 2. Redistributions in binary form must reproduce the above copyright
100384fff8SJason Evans  *    notice, this list of conditions and the following disclaimer in the
110384fff8SJason Evans  *    documentation and/or other materials provided with the distribution.
120384fff8SJason Evans  * 3. Berkeley Software Design Inc's name may not be used to endorse or
130384fff8SJason Evans  *    promote products derived from this software without specific prior
140384fff8SJason Evans  *    written permission.
150384fff8SJason Evans  *
160384fff8SJason Evans  * THIS SOFTWARE IS PROVIDED BY BERKELEY SOFTWARE DESIGN INC ``AS IS'' AND
170384fff8SJason Evans  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
180384fff8SJason Evans  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
190384fff8SJason Evans  * ARE DISCLAIMED.  IN NO EVENT SHALL BERKELEY SOFTWARE DESIGN INC BE LIABLE
200384fff8SJason Evans  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
210384fff8SJason Evans  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
220384fff8SJason Evans  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
230384fff8SJason Evans  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
240384fff8SJason Evans  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
250384fff8SJason Evans  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
260384fff8SJason Evans  * SUCH DAMAGE.
270384fff8SJason Evans  *
280384fff8SJason Evans  *	from BSDI $Id: mutex_witness.c,v 1.1.2.20 2000/04/27 03:10:27 cp Exp $
2936412d79SJohn Baldwin  *	and BSDI $Id: synch_machdep.c,v 2.3.2.39 2000/04/27 03:10:25 cp Exp $
300384fff8SJason Evans  * $FreeBSD$
310384fff8SJason Evans  */
320384fff8SJason Evans 
330384fff8SJason Evans /*
349ed346baSBosko Milekic  * Machine independent bits of mutex implementation and implementation of
359ed346baSBosko Milekic  * `witness' structure & related debugging routines.
369ed346baSBosko Milekic  */
379ed346baSBosko Milekic 
389ed346baSBosko Milekic /*
390384fff8SJason Evans  *	Main Entry: witness
400384fff8SJason Evans  *	Pronunciation: 'wit-n&s
410384fff8SJason Evans  *	Function: noun
420384fff8SJason Evans  *	Etymology: Middle English witnesse, from Old English witnes knowledge,
430384fff8SJason Evans  *	    testimony, witness, from 2wit
440384fff8SJason Evans  *	Date: before 12th century
450384fff8SJason Evans  *	1 : attestation of a fact or event : TESTIMONY
460384fff8SJason Evans  *	2 : one that gives evidence; specifically : one who testifies in
470384fff8SJason Evans  *	    a cause or before a judicial tribunal
480384fff8SJason Evans  *	3 : one asked to be present at a transaction so as to be able to
490384fff8SJason Evans  *	    testify to its having taken place
500384fff8SJason Evans  *	4 : one who has personal knowledge of something
510384fff8SJason Evans  *	5 a : something serving as evidence or proof : SIGN
520384fff8SJason Evans  *	  b : public affirmation by word or example of usually
530384fff8SJason Evans  *	      religious faith or conviction <the heroic witness to divine
540384fff8SJason Evans  *	      life -- Pilot>
550384fff8SJason Evans  *	6 capitalized : a member of the Jehovah's Witnesses
560384fff8SJason Evans  */
570384fff8SJason Evans 
589c36c934SJohn Baldwin #include "opt_ddb.h"
59a5a96a19SJohn Baldwin 
600384fff8SJason Evans #include <sys/param.h>
6136412d79SJohn Baldwin #include <sys/bus.h>
6236412d79SJohn Baldwin #include <sys/kernel.h>
6319284646SJohn Baldwin #include <sys/lock.h>
64fb919e4dSMark Murray #include <sys/malloc.h>
6519284646SJohn Baldwin #include <sys/mutex.h>
660384fff8SJason Evans #include <sys/proc.h>
67c4f7a187SJohn Baldwin #include <sys/resourcevar.h>
68a5a96a19SJohn Baldwin #include <sys/sysctl.h>
690384fff8SJason Evans #include <sys/systm.h>
7036412d79SJohn Baldwin #include <sys/vmmeter.h>
710384fff8SJason Evans #include <sys/ktr.h>
720384fff8SJason Evans 
7336412d79SJohn Baldwin #include <machine/atomic.h>
7436412d79SJohn Baldwin #include <machine/bus.h>
7536412d79SJohn Baldwin #include <machine/clock.h>
760384fff8SJason Evans #include <machine/cpu.h>
7736412d79SJohn Baldwin 
789c36c934SJohn Baldwin #include <ddb/ddb.h>
799c36c934SJohn Baldwin 
8036412d79SJohn Baldwin #include <vm/vm.h>
8136412d79SJohn Baldwin #include <vm/vm_extern.h>
8236412d79SJohn Baldwin 
/*
 * Internal utility macros.
 */

/* True when the lock word of `m' is exactly MTX_UNOWNED. */
#define mtx_unowned(m)	((m)->mtx_lock == MTX_UNOWNED)

/*
 * Owner of `m' as a struct proc pointer (the lock word with the bits outside
 * MTX_FLAGMASK stripped), or NULL when the mutex is unowned.
 */
#define mtx_owner(m)	(mtx_unowned((m)) ? NULL \
	: (struct proc *)((m)->mtx_lock & MTX_FLAGMASK))

/*
 * Set the current priority level of process `p' to `pri'.  The expansion is
 * fully parenthesized so that it stays a single assignment expression when
 * used as an operand of a larger expression.
 */
#define SET_PRIO(p, pri)	((p)->p_pri.pri_level = (pri))
920cde2e34SJason Evans 
/*
 * Lock classes for sleep and spin mutexes.
 *
 * mtx_init() points each mutex's lock_object at one of these two
 * descriptors, depending on whether MTX_SPIN was requested.  Both are
 * initialized positionally with a descriptive string followed by LC_* flags.
 */
struct lock_class lock_class_mtx_sleep = {
	"sleep mutex",
	LC_SLEEPLOCK | LC_RECURSABLE
};
struct lock_class lock_class_mtx_spin = {
	"spin mutex",
	LC_SPINLOCK | LC_RECURSABLE
};
1048484de75SJohn Baldwin 
/*
 * Prototypes for non-exported routines.
 */
static void	propagate_priority(struct proc *);

/*
 * Propagate the priority level of a blocked process along the chain of
 * mutex owners.
 *
 * On entry `p' is the blocked process; its pri_level and the mutex it is
 * blocked on (p_blocked) seed the walk.  Inside the loop `p' is reused to
 * mean "the owner of the mutex currently being examined".  A numerically
 * lower pri_level is treated as the more urgent one throughout.
 *
 * The walk ends when:
 *   - the mutex has no owner,
 *   - the owner's level is already <= the propagated level,
 *   - the owner is on a CPU (its level is simply lowered), or
 *   - the owner is in state SRUN (it is requeued at its new level).
 * Otherwise the owner must itself be blocked on a mutex (SMTX); it is moved
 * up in that mutex's blocked queue if needed and the walk continues with the
 * owner of that mutex.
 *
 * The caller must hold sched_lock; this is asserted.
 */
static void
propagate_priority(struct proc *p)
{
	int pri = p->p_pri.pri_level;
	struct mtx *m = p->p_blocked;

	mtx_assert(&sched_lock, MA_OWNED);
	for (;;) {
		struct proc *p1;

		/* From here on `p' is the owner of `m', not the waiter. */
		p = mtx_owner(m);

		if (p == NULL) {
			/*
			 * This really isn't quite right. Really
			 * ought to bump priority of process that
			 * next acquires the mutex.
			 */
			MPASS(m->mtx_lock == MTX_CONTESTED);
			return;
		}

		MPASS(p->p_magic == P_MAGIC);
		KASSERT(p->p_stat != SSLEEP, ("sleeping process owns a mutex"));
		/* Owner is already at least as urgent; nothing to propagate. */
		if (p->p_pri.pri_level <= pri)
			return;

		/*
		 * Bump this process' priority.
		 */
		SET_PRIO(p, pri);

		/*
		 * If lock holder is actually running, just bump priority.
		 */
		if (p->p_oncpu != NOCPU) {
			MPASS(p->p_stat == SRUN || p->p_stat == SZOMB || p->p_stat == SSTOP);
			return;
		}

#ifndef SMP
		/*
		 * For UP, we check to see if p is curproc (this shouldn't
		 * ever happen however as it would mean we are in a deadlock.)
		 */
		KASSERT(p != curproc, ("Deadlock detected"));
#endif

		/*
		 * If on run queue move to new run queue, and
		 * quit.
		 */
		if (p->p_stat == SRUN) {
			MPASS(p->p_blocked == NULL);
			/* Remove and re-add so the new level takes effect. */
			remrunqueue(p);
			setrunqueue(p);
			return;
		}

		/*
		 * If we aren't blocked on a mutex, we should be.
		 */
		KASSERT(p->p_stat == SMTX, (
		    "process %d(%s):%d holds %s but isn't blocked on a mutex\n",
		    p->p_pid, p->p_comm, p->p_stat,
		    m->mtx_object.lo_name));

		/*
		 * Pick up the mutex that p is blocked on.
		 */
		m = p->p_blocked;
		MPASS(m != NULL);

		/*
		 * Check if the proc needs to be moved up on
		 * the blocked chain
		 */
		if (p == TAILQ_FIRST(&m->mtx_blocked)) {
			/* Already at the head; go on to the owner of `m'. */
			continue;
		}

		/* The predecessor is already at least as urgent: order holds. */
		p1 = TAILQ_PREV(p, procqueue, p_procq);
		if (p1->p_pri.pri_level <= pri) {
			continue;
		}

		/*
		 * Remove proc from blocked chain and determine where
		 * it should be moved up to.  Since we know that p1 has
		 * a lower priority than p, we know that at least one
		 * process in the chain has a lower priority and that
		 * p1 will thus not be NULL after the loop.
		 */
		TAILQ_REMOVE(&m->mtx_blocked, p, p_procq);
		TAILQ_FOREACH(p1, &m->mtx_blocked, p_procq) {
			MPASS(p1->p_magic == P_MAGIC);
			if (p1->p_pri.pri_level > pri)
				break;
		}

		MPASS(p1 != NULL);
		/* Reinsert ahead of the first waiter with a larger level. */
		TAILQ_INSERT_BEFORE(p1, p, p_procq);
		CTR4(KTR_LOCK,
		    "propagate_priority: p %p moved before %p on [%p] %s",
		    p, p1, m, m->mtx_object.lo_name);
	}
}
21736412d79SJohn Baldwin 
2180cde2e34SJason Evans /*
2196283b7d0SJohn Baldwin  * Function versions of the inlined __mtx_* macros.  These are used by
2206283b7d0SJohn Baldwin  * modules and can also be called from assembly language if needed.
2216283b7d0SJohn Baldwin  */
/*
 * Out-of-line form of __mtx_lock_flags(); passes `m', `opts', `file' and
 * `line' through unchanged.
 */
void
_mtx_lock_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_lock_flags(m, opts, file, line);
}
2286283b7d0SJohn Baldwin 
/*
 * Out-of-line form of __mtx_unlock_flags(); passes `m', `opts', `file' and
 * `line' through unchanged.
 */
void
_mtx_unlock_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_unlock_flags(m, opts, file, line);
}
2356283b7d0SJohn Baldwin 
/*
 * Out-of-line form of __mtx_lock_spin_flags(); passes `m', `opts', `file'
 * and `line' through unchanged.
 */
void
_mtx_lock_spin_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_lock_spin_flags(m, opts, file, line);
}
2426283b7d0SJohn Baldwin 
/*
 * Out-of-line form of __mtx_unlock_spin_flags(); passes `m', `opts', `file'
 * and `line' through unchanged.
 */
void
_mtx_unlock_spin_flags(struct mtx *m, int opts, const char *file, int line)
{

	__mtx_unlock_spin_flags(m, opts, file, line);
}
2496283b7d0SJohn Baldwin 
2506283b7d0SJohn Baldwin /*
2519ed346baSBosko Milekic  * The important part of mtx_trylock{,_flags}()
2529ed346baSBosko Milekic  * Tries to acquire lock `m.' We do NOT handle recursion here; we assume that
2539ed346baSBosko Milekic  * if we're called, it's because we know we don't already own this lock.
2540cde2e34SJason Evans  */
2550cde2e34SJason Evans int
2569ed346baSBosko Milekic _mtx_trylock(struct mtx *m, int opts, const char *file, int line)
2570cde2e34SJason Evans {
2580cde2e34SJason Evans 	int rval;
2590cde2e34SJason Evans 
26027863426SBosko Milekic 	MPASS(curproc != NULL);
2619ed346baSBosko Milekic 
2629ed346baSBosko Milekic 	/*
2639ed346baSBosko Milekic 	 * _mtx_trylock does not accept MTX_NOSWITCH option.
2649ed346baSBosko Milekic 	 */
2655746a1d8SBosko Milekic 	KASSERT((opts & MTX_NOSWITCH) == 0,
2665746a1d8SBosko Milekic 	    ("mtx_trylock() called with invalid option flag(s) %d", opts));
2679ed346baSBosko Milekic 
26827863426SBosko Milekic 	rval = _obtain_lock(m, curproc);
2699ed346baSBosko Milekic 
27019284646SJohn Baldwin 	LOCK_LOG_TRY("LOCK", &m->mtx_object, opts, rval, file, line);
27119284646SJohn Baldwin 	if (rval) {
2729ed346baSBosko Milekic 		/*
2739ed346baSBosko Milekic 		 * We do not handle recursion in _mtx_trylock; see the
2749ed346baSBosko Milekic 		 * note at the top of the routine.
2759ed346baSBosko Milekic 		 */
2765746a1d8SBosko Milekic 		KASSERT(!mtx_recursed(m),
2775746a1d8SBosko Milekic 		    ("mtx_trylock() called on a recursed mutex"));
2782d96f0b1SJohn Baldwin 		WITNESS_LOCK(&m->mtx_object, opts | LOP_EXCLUSIVE | LOP_TRYLOCK,
2792d96f0b1SJohn Baldwin 		    file, line);
2800cde2e34SJason Evans 	}
2819ed346baSBosko Milekic 
28219284646SJohn Baldwin 	return (rval);
2830cde2e34SJason Evans }
2840cde2e34SJason Evans 
/*
 * _mtx_lock_sleep: the tougher part of acquiring an MTX_DEF lock.
 *
 * We call this if the lock is either contested (i.e. we need to go to
 * sleep waiting for it), or if we need to recurse on it.
 *
 * `m' is the mutex to acquire for curproc, `opts' is consulted for lock
 * logging, and `file'/`line' appear only in the trace record.  The function
 * returns once curproc owns `m' (or has recursed on it).  A numerically
 * lower pri_level is treated as the more urgent one.
 */
void
_mtx_lock_sleep(struct mtx *m, int opts, const char *file, int line)
{
	struct proc *p = curproc;

	/* We already own the lock: count the recursion and flag it. */
	if ((m->mtx_lock & MTX_FLAGMASK) == (uintptr_t)p) {
		m->mtx_recurse++;
		atomic_set_ptr(&m->mtx_lock, MTX_RECURSED);
		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR1(KTR_LOCK, "_mtx_lock_sleep: %p recursing", m);
		return;
	}

	if (LOCK_LOG_TEST(&m->mtx_object, opts))
		CTR4(KTR_LOCK,
		    "_mtx_lock_sleep: %s contested (lock=%p) at %s:%d",
		    m->mtx_object.lo_name, (void *)m->mtx_lock, file, line);

	/* Each pass retries the plain acquire before looking at the state. */
	while (!_obtain_lock(m, p)) {
		uintptr_t v;
		struct proc *p1;

		mtx_lock_spin(&sched_lock);
		/*
		 * Check if the lock has been released while spinning for
		 * the sched_lock.
		 */
		if ((v = m->mtx_lock) == MTX_UNOWNED) {
			mtx_unlock_spin(&sched_lock);
			continue;
		}

		/*
		 * The mutex was marked contested on release. This means that
		 * there are processes blocked on it.
		 */
		if (v == MTX_CONTESTED) {
			p1 = TAILQ_FIRST(&m->mtx_blocked);
			MPASS(p1 != NULL);
			/* Take ownership directly, keeping the contested flag. */
			m->mtx_lock = (uintptr_t)p | MTX_CONTESTED;

			/* Adopt the head waiter's level if it is more urgent. */
			if (p1->p_pri.pri_level < p->p_pri.pri_level)
				SET_PRIO(p, p1->p_pri.pri_level);
			mtx_unlock_spin(&sched_lock);
			return;
		}

		/*
		 * If the mutex isn't already contested and a failure occurs
		 * setting the contested bit, the mutex was either released
		 * or the state of the MTX_RECURSED bit changed.
		 */
		if ((v & MTX_CONTESTED) == 0 &&
		    !atomic_cmpset_ptr(&m->mtx_lock, (void *)v,
			(void *)(v | MTX_CONTESTED))) {
			mtx_unlock_spin(&sched_lock);
			continue;
		}

		/*
		 * We definitely must sleep for this lock.
		 */
		mtx_assert(m, MA_NOTOWNED);

#ifdef notyet
		/*
		 * If we're borrowing an interrupted thread's VM context, we
		 * must clean up before going to sleep.
		 */
		if (p->p_ithd != NULL) {
			struct ithd *it = p->p_ithd;

			if (it->it_interrupted) {
				if (LOCK_LOG_TEST(&m->mtx_object, opts))
					CTR2(KTR_LOCK,
				    "_mtx_lock_sleep: %p interrupted %p",
					    it, it->it_interrupted);
				intr_thd_fixup(it);
			}
		}
#endif

		/*
		 * Put us on the list of threads blocked on this mutex.
		 *
		 * The first waiter also links the mutex onto the current
		 * owner's p_contested list.  Later waiters are inserted in
		 * front of the first entry with a numerically larger
		 * pri_level, or at the tail if there is none.
		 */
		if (TAILQ_EMPTY(&m->mtx_blocked)) {
			p1 = (struct proc *)(m->mtx_lock & MTX_FLAGMASK);
			LIST_INSERT_HEAD(&p1->p_contested, m, mtx_contested);
			TAILQ_INSERT_TAIL(&m->mtx_blocked, p, p_procq);
		} else {
			TAILQ_FOREACH(p1, &m->mtx_blocked, p_procq)
				if (p1->p_pri.pri_level > p->p_pri.pri_level)
					break;
			if (p1)
				TAILQ_INSERT_BEFORE(p1, p, p_procq);
			else
				TAILQ_INSERT_TAIL(&m->mtx_blocked, p, p_procq);
		}

		/*
		 * Save who we're blocked on.
		 */
		p->p_blocked = m;
		p->p_mtxname = m->mtx_object.lo_name;
		p->p_stat = SMTX;
		/* Lend our priority level to the chain of owners. */
		propagate_priority(p);

		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR3(KTR_LOCK,
			    "_mtx_lock_sleep: p %p blocked on [%p] %s", p, m,
			    m->mtx_object.lo_name);

		/* Blocking here is accounted as a voluntary context switch. */
		p->p_stats->p_ru.ru_nvcsw++;
		mi_switch();

		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR3(KTR_LOCK,
			  "_mtx_lock_sleep: p %p free from blocked on [%p] %s",
			  p, m, m->mtx_object.lo_name);

		/* Drop sched_lock and go around to retry the acquire. */
		mtx_unlock_spin(&sched_lock);
	}

	return;
}
4169ed346baSBosko Milekic 
4179ed346baSBosko Milekic /*
4189ed346baSBosko Milekic  * _mtx_lock_spin: the tougher part of acquiring an MTX_SPIN lock.
4199ed346baSBosko Milekic  *
4209ed346baSBosko Milekic  * This is only called if we need to actually spin for the lock. Recursion
4219ed346baSBosko Milekic  * is handled inline.
4229ed346baSBosko Milekic  */
4239ed346baSBosko Milekic void
4246283b7d0SJohn Baldwin _mtx_lock_spin(struct mtx *m, int opts, critical_t mtx_crit, const char *file,
4259ed346baSBosko Milekic 	       int line)
42636412d79SJohn Baldwin {
42736412d79SJohn Baldwin 	int i = 0;
42836412d79SJohn Baldwin 
42919284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
4305746a1d8SBosko Milekic 		CTR1(KTR_LOCK, "_mtx_lock_spin: %p spinning", m);
4319ed346baSBosko Milekic 
43236412d79SJohn Baldwin 	for (;;) {
43327863426SBosko Milekic 		if (_obtain_lock(m, curproc))
43436412d79SJohn Baldwin 			break;
4359ed346baSBosko Milekic 
4367141f2adSJohn Baldwin 		/* Give interrupts a chance while we spin. */
4377141f2adSJohn Baldwin 		critical_exit(mtx_crit);
43836412d79SJohn Baldwin 		while (m->mtx_lock != MTX_UNOWNED) {
43936412d79SJohn Baldwin 			if (i++ < 1000000)
44036412d79SJohn Baldwin 				continue;
44136412d79SJohn Baldwin 			if (i++ < 6000000)
44236412d79SJohn Baldwin 				DELAY(1);
44336412d79SJohn Baldwin #ifdef DDB
44436412d79SJohn Baldwin 			else if (!db_active)
44536412d79SJohn Baldwin #else
44636412d79SJohn Baldwin 			else
44736412d79SJohn Baldwin #endif
4489ed346baSBosko Milekic 			panic("spin lock %s held by %p for > 5 seconds",
44919284646SJohn Baldwin 			    m->mtx_object.lo_name, (void *)m->mtx_lock);
45036412d79SJohn Baldwin 		}
4517141f2adSJohn Baldwin 		mtx_crit = critical_enter();
45236412d79SJohn Baldwin 	}
45336412d79SJohn Baldwin 
4546283b7d0SJohn Baldwin 	m->mtx_savecrit = mtx_crit;
45519284646SJohn Baldwin 	if (LOCK_LOG_TEST(&m->mtx_object, opts))
4569ed346baSBosko Milekic 		CTR1(KTR_LOCK, "_mtx_lock_spin: %p spin done", m);
4579ed346baSBosko Milekic 
45836412d79SJohn Baldwin 	return;
45936412d79SJohn Baldwin }
46036412d79SJohn Baldwin 
/*
 * _mtx_unlock_sleep: the tougher part of releasing an MTX_DEF lock.
 *
 * We are only called here if the lock is recursed or contested (i.e. we
 * need to wake up a blocked thread).
 *
 * `m' is the mutex being released by curproc.  `opts' is consulted for lock
 * logging and for MTX_NOSWITCH, which suppresses the switch to the woken
 * process.  `file' and `line' are not used in this function.  A numerically
 * lower pri_level is treated as the more urgent one.
 */
void
_mtx_unlock_sleep(struct mtx *m, int opts, const char *file, int line)
{
	struct proc *p, *p1;
	struct mtx *m1;
	int pri;

	p = curproc;

	/*
	 * Recursed: undo one level, clearing the flag when the count
	 * reaches zero.  The lock itself stays held.
	 */
	if (mtx_recursed(m)) {
		if (--(m->mtx_recurse) == 0)
			atomic_clear_ptr(&m->mtx_lock, MTX_RECURSED);
		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR1(KTR_LOCK, "_mtx_unlock_sleep: %p unrecurse", m);
		return;
	}

	mtx_lock_spin(&sched_lock);
	if (LOCK_LOG_TEST(&m->mtx_object, opts))
		CTR1(KTR_LOCK, "_mtx_unlock_sleep: %p contested", m);

	/*
	 * p1 is the head of the blocked queue and is the process woken up.
	 * NOTE(review): p1 is dereferenced without a NULL check; this relies
	 * on the queue being non-empty whenever the contested path is taken.
	 */
	p1 = TAILQ_FIRST(&m->mtx_blocked);
	MPASS(p->p_magic == P_MAGIC);
	MPASS(p1->p_magic == P_MAGIC);

	TAILQ_REMOVE(&m->mtx_blocked, p1, p_procq);

	/*
	 * No waiters left: unlink the mutex from the contested list and
	 * release it.  Otherwise leave the lock word as MTX_CONTESTED with
	 * no owner.
	 */
	if (TAILQ_EMPTY(&m->mtx_blocked)) {
		LIST_REMOVE(m, mtx_contested);
		_release_lock_quick(m);
		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR1(KTR_LOCK, "_mtx_unlock_sleep: %p not held", m);
	} else
		atomic_store_rel_ptr(&m->mtx_lock, (void *)MTX_CONTESTED);

	/*
	 * Recompute our own level: the smallest level among the head
	 * waiters of the mutexes still on our contested list, but never
	 * numerically larger than our native level.
	 */
	pri = PRI_MAX;
	LIST_FOREACH(m1, &p->p_contested, mtx_contested) {
		int cp = TAILQ_FIRST(&m1->mtx_blocked)->p_pri.pri_level;
		if (cp < pri)
			pri = cp;
	}

	if (pri > p->p_pri.pri_native)
		pri = p->p_pri.pri_native;
	SET_PRIO(p, pri);

	if (LOCK_LOG_TEST(&m->mtx_object, opts))
		CTR2(KTR_LOCK, "_mtx_unlock_sleep: %p contested setrunqueue %p",
		    m, p1);

	/* Make the woken process runnable. */
	p1->p_blocked = NULL;
	p1->p_stat = SRUN;
	setrunqueue(p1);

	/*
	 * Unless the caller asked for MTX_NOSWITCH, yield when the woken
	 * process is more urgent than we now are.
	 */
	if ((opts & MTX_NOSWITCH) == 0 && p1->p_pri.pri_level < pri) {
#ifdef notyet
		if (p->p_ithd != NULL) {
			struct ithd *it = p->p_ithd;

			if (it->it_interrupted) {
				if (LOCK_LOG_TEST(&m->mtx_object, opts))
					CTR2(KTR_LOCK,
				    "_mtx_unlock_sleep: %p interrupted %p",
					    it, it->it_interrupted);
				intr_thd_fixup(it);
			}
		}
#endif
		/* Put ourselves back on the run queue before switching away. */
		setrunqueue(p);
		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR2(KTR_LOCK,
			    "_mtx_unlock_sleep: %p switching out lock=%p", m,
			    (void *)m->mtx_lock);

		/* Being preempted here counts as an involuntary switch. */
		p->p_stats->p_ru.ru_nivcsw++;
		mi_switch();
		if (LOCK_LOG_TEST(&m->mtx_object, opts))
			CTR2(KTR_LOCK, "_mtx_unlock_sleep: %p resuming lock=%p",
			    m, (void *)m->mtx_lock);
	}

	mtx_unlock_spin(&sched_lock);

	return;
}
5529ed346baSBosko Milekic 
5539ed346baSBosko Milekic /*
5549ed346baSBosko Milekic  * All the unlocking of MTX_SPIN locks is done inline.
5559ed346baSBosko Milekic  * See the _rel_spin_lock() macro for the details.
5569ed346baSBosko Milekic  */
5579ed346baSBosko Milekic 
/*
 * The backing function for the INVARIANTS-enabled mtx_assert().
 *
 * Checks the ownership/recursion state of `m' against `what' and panics,
 * naming the mutex and the `file':`line' of the assertion, on a mismatch.
 * Accepted values of `what' are MA_NOTOWNED, MA_OWNED, and MA_OWNED combined
 * with either MA_RECURSED or MA_NOTRECURSED; anything else panics as an
 * unknown assertion.  Nothing is checked while a panic is in progress.
 */
#ifdef INVARIANT_SUPPORT
void
_mtx_assert(struct mtx *m, int what, const char *file, int line)
{

	/* A panic is already under way; do not pile another one on top. */
	if (panicstr != NULL)
		return;

	if (what == MA_NOTOWNED) {
		if (mtx_owned(m))
			panic("mutex %s owned at %s:%d",
			    m->mtx_object.lo_name, file, line);
		return;
	}

	if (what != MA_OWNED && what != (MA_OWNED | MA_RECURSED) &&
	    what != (MA_OWNED | MA_NOTRECURSED)) {
		panic("unknown mtx_assert at %s:%d", file, line);
		return;
	}

	/* All remaining variants require ownership first. */
	if (!mtx_owned(m))
		panic("mutex %s not owned at %s:%d",
		    m->mtx_object.lo_name, file, line);

	/* Then compare the recursion state with what was asked for. */
	if (!mtx_recursed(m)) {
		if ((what & MA_RECURSED) != 0)
			panic("mutex %s unrecursed at %s:%d",
			    m->mtx_object.lo_name, file, line);
	} else if ((what & MA_NOTRECURSED) != 0) {
		panic("mutex %s recursed at %s:%d",
		    m->mtx_object.lo_name, file, line);
	}
}
#endif
5940cde2e34SJason Evans 
/*
 * The MUTEX_DEBUG-enabled mtx_validate()
 *
 * Most of these checks have been moved off into the LO_INITIALIZED flag
 * maintained by the witness code.
 *
 * What remains is a check that the whole mutex structure pointed to by `m'
 * is readable and writable kernel memory; the function panics otherwise.
 * The check is compiled out on alpha (see below).
 */
#ifdef MUTEX_DEBUG

void	mtx_validate __P((struct mtx *));

void
mtx_validate(struct mtx *m)
{

/*
 * XXX - When kernacc() is fixed on the alpha to handle K0_SEG memory properly
 * we can re-enable the kernacc() checks.
 */
#ifndef __alpha__
	/* Check the full structure, not merely pointer-size bytes of it. */
	if (!kernacc((caddr_t)m, sizeof(*m), VM_PROT_READ | VM_PROT_WRITE))
		panic("Can't read and write to mutex %p", m);
#endif
}
#endif
61936412d79SJohn Baldwin 
6209ed346baSBosko Milekic /*
6219ed346baSBosko Milekic  * Mutex initialization routine; initialize lock `m' of type contained in
6229ed346baSBosko Milekic  * `opts' with options contained in `opts' and description `description.'
6239ed346baSBosko Milekic  */
62436412d79SJohn Baldwin void
6259ed346baSBosko Milekic mtx_init(struct mtx *m, const char *description, int opts)
62636412d79SJohn Baldwin {
62719284646SJohn Baldwin 	struct lock_object *lock;
6289ed346baSBosko Milekic 
62919284646SJohn Baldwin 	MPASS((opts & ~(MTX_SPIN | MTX_QUIET | MTX_RECURSE |
63019284646SJohn Baldwin 	    MTX_SLEEPABLE | MTX_NOWITNESS)) == 0);
6319ed346baSBosko Milekic 
63236412d79SJohn Baldwin #ifdef MUTEX_DEBUG
6339ed346baSBosko Milekic 	/* Diagnostic and error correction */
63419284646SJohn Baldwin 	mtx_validate(m);
6356936206eSJohn Baldwin #endif
63636412d79SJohn Baldwin 
63719284646SJohn Baldwin 	bzero(m, sizeof(*m));
63819284646SJohn Baldwin 	lock = &m->mtx_object;
63919284646SJohn Baldwin 	if (opts & MTX_SPIN)
64019284646SJohn Baldwin 		lock->lo_class = &lock_class_mtx_spin;
64119284646SJohn Baldwin 	else
64219284646SJohn Baldwin 		lock->lo_class = &lock_class_mtx_sleep;
64319284646SJohn Baldwin 	lock->lo_name = description;
64419284646SJohn Baldwin 	if (opts & MTX_QUIET)
64519284646SJohn Baldwin 		lock->lo_flags = LO_QUIET;
64619284646SJohn Baldwin 	if (opts & MTX_RECURSE)
64719284646SJohn Baldwin 		lock->lo_flags |= LO_RECURSABLE;
64819284646SJohn Baldwin 	if (opts & MTX_SLEEPABLE)
64919284646SJohn Baldwin 		lock->lo_flags |= LO_SLEEPABLE;
65019284646SJohn Baldwin 	if ((opts & MTX_NOWITNESS) == 0)
65119284646SJohn Baldwin 		lock->lo_flags |= LO_WITNESS;
65219284646SJohn Baldwin 
65319284646SJohn Baldwin 	m->mtx_lock = MTX_UNOWNED;
65436412d79SJohn Baldwin 	TAILQ_INIT(&m->mtx_blocked);
6559ed346baSBosko Milekic 
65619284646SJohn Baldwin 	LOCK_LOG_INIT(lock, opts);
657d1c1b841SJason Evans 
65819284646SJohn Baldwin 	WITNESS_INIT(lock);
65936412d79SJohn Baldwin }
66036412d79SJohn Baldwin 
6619ed346baSBosko Milekic /*
66219284646SJohn Baldwin  * Remove lock `m' from all_mtx queue.  We don't allow MTX_QUIET to be
66319284646SJohn Baldwin  * passed in as a flag here because if the corresponding mtx_init() was
66419284646SJohn Baldwin  * called with MTX_QUIET set, then it will already be set in the mutex's
66519284646SJohn Baldwin  * flags.
6669ed346baSBosko Milekic  */
66736412d79SJohn Baldwin void
66836412d79SJohn Baldwin mtx_destroy(struct mtx *m)
66936412d79SJohn Baldwin {
67036412d79SJohn Baldwin 
67119284646SJohn Baldwin 	LOCK_LOG_DESTROY(&m->mtx_object, 0);
6729ed346baSBosko Milekic 
67319284646SJohn Baldwin 	if (!mtx_owned(m))
67419284646SJohn Baldwin 		MPASS(mtx_unowned(m));
67519284646SJohn Baldwin 	else {
67608812b39SBosko Milekic 		MPASS((m->mtx_lock & (MTX_RECURSED|MTX_CONTESTED)) == 0);
6779ed346baSBosko Milekic 
67819284646SJohn Baldwin 		/* Tell witness this isn't locked to make it happy. */
6792d96f0b1SJohn Baldwin 		WITNESS_UNLOCK(&m->mtx_object, LOP_EXCLUSIVE | LOP_NOSWITCH,
6802d96f0b1SJohn Baldwin 		    __FILE__, __LINE__);
68136412d79SJohn Baldwin 	}
6820384fff8SJason Evans 
68319284646SJohn Baldwin 	WITNESS_DESTROY(&m->mtx_object);
6840384fff8SJason Evans }
685