xref: /freebsd/sys/kern/kern_lock.c (revision e64b4fa8580b0fd33beb34a9653149492a180951)
19454b2d8SWarner Losh /*-
2047dd67eSAttilio Rao  * Copyright (c) 2008 Attilio Rao <attilio@FreeBSD.org>
3047dd67eSAttilio Rao  * All rights reserved.
453bf4bb2SPeter Wemm  *
553bf4bb2SPeter Wemm  * Redistribution and use in source and binary forms, with or without
653bf4bb2SPeter Wemm  * modification, are permitted provided that the following conditions
753bf4bb2SPeter Wemm  * are met:
853bf4bb2SPeter Wemm  * 1. Redistributions of source code must retain the above copyright
9047dd67eSAttilio Rao  *    notice(s), this list of conditions and the following disclaimer as
10047dd67eSAttilio Rao  *    the first lines of this file unmodified other than the possible
11047dd67eSAttilio Rao  *    addition of one or more copyright notices.
1253bf4bb2SPeter Wemm  * 2. Redistributions in binary form must reproduce the above copyright
13047dd67eSAttilio Rao  *    notice(s), this list of conditions and the following disclaimer in the
1453bf4bb2SPeter Wemm  *    documentation and/or other materials provided with the distribution.
1553bf4bb2SPeter Wemm  *
16047dd67eSAttilio Rao  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) ``AS IS'' AND ANY
17047dd67eSAttilio Rao  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18047dd67eSAttilio Rao  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19047dd67eSAttilio Rao  * DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY
20047dd67eSAttilio Rao  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21047dd67eSAttilio Rao  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
22047dd67eSAttilio Rao  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
23047dd67eSAttilio Rao  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2453bf4bb2SPeter Wemm  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25047dd67eSAttilio Rao  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
26047dd67eSAttilio Rao  * DAMAGE.
2753bf4bb2SPeter Wemm  */
2853bf4bb2SPeter Wemm 
29651175c9SAttilio Rao #include "opt_adaptive_lockmgrs.h"
30047dd67eSAttilio Rao #include "opt_ddb.h"
31f5f9340bSFabien Thomas #include "opt_hwpmc_hooks.h"
32047dd67eSAttilio Rao 
33677b542eSDavid E. O'Brien #include <sys/cdefs.h>
34677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
35677b542eSDavid E. O'Brien 
3653bf4bb2SPeter Wemm #include <sys/param.h>
37cd2fe4e6SAttilio Rao #include <sys/kdb.h>
3861d80e90SJohn Baldwin #include <sys/ktr.h>
3953bf4bb2SPeter Wemm #include <sys/lock.h>
40047dd67eSAttilio Rao #include <sys/lock_profile.h>
418302d183SBruce Evans #include <sys/lockmgr.h>
42d8881ca3SJohn Baldwin #include <sys/mutex.h>
438302d183SBruce Evans #include <sys/proc.h>
44047dd67eSAttilio Rao #include <sys/sleepqueue.h>
45e8ddb61dSJeff Roberson #ifdef DEBUG_LOCKS
46e8ddb61dSJeff Roberson #include <sys/stack.h>
47e8ddb61dSJeff Roberson #endif
48651175c9SAttilio Rao #include <sys/sysctl.h>
49047dd67eSAttilio Rao #include <sys/systm.h>
5053bf4bb2SPeter Wemm 
51047dd67eSAttilio Rao #include <machine/cpu.h>
526efc8a16SAttilio Rao 
53be6847d7SJohn Baldwin #ifdef DDB
54be6847d7SJohn Baldwin #include <ddb/ddb.h>
55047dd67eSAttilio Rao #endif
56047dd67eSAttilio Rao 
57f5f9340bSFabien Thomas #ifdef HWPMC_HOOKS
58f5f9340bSFabien Thomas #include <sys/pmckern.h>
59f5f9340bSFabien Thomas PMC_SOFT_DECLARE( , , lock, failed);
60f5f9340bSFabien Thomas #endif
61f5f9340bSFabien Thomas 
62651175c9SAttilio Rao CTASSERT(((LK_ADAPTIVE | LK_NOSHARE) & LO_CLASSFLAGS) ==
63651175c9SAttilio Rao     (LK_ADAPTIVE | LK_NOSHARE));
64651175c9SAttilio Rao CTASSERT(LK_UNLOCKED == (LK_UNLOCKED &
65651175c9SAttilio Rao     ~(LK_ALL_WAITERS | LK_EXCLUSIVE_SPINNERS)));
66047dd67eSAttilio Rao 
/* Sleepqueue indices: exclusive and shared waiters sleep on separate queues. */
#define	SQ_EXCLUSIVE_QUEUE	0
#define	SQ_SHARED_QUEUE		1

/*
 * Per-thread lock accounting.  The td_locks counter is only updated when
 * INVARIANTS is defined; without it the updates, and _lockmgr_assert(),
 * expand to nothing.  The td_lk_slocks counter is always updated because
 * LK_CAN_SHARE() reads it.
 */
#ifdef INVARIANTS
#define	TD_LOCKS_INC(td)	((td)->td_locks++)
#define	TD_LOCKS_DEC(td)	((td)->td_locks--)
#else
#define	_lockmgr_assert(lk, what, file, line)
#define	TD_LOCKS_INC(td)
#define	TD_LOCKS_DEC(td)
#endif
#define	TD_SLOCKS_INC(td)	((td)->td_lk_slocks++)
#define	TD_SLOCKS_DEC(td)	((td)->td_lk_slocks--)

/*
 * Helpers operating on the lock's lk_stack member.  They expand to
 * nothing unless DEBUG_LOCKS is defined.
 */
#ifdef DEBUG_LOCKS
#define	STACK_PRINT(lk)	stack_print_ddb(&(lk)->lk_stack)
#define	STACK_SAVE(lk)	stack_save(&(lk)->lk_stack)
#define	STACK_ZERO(lk)	stack_zero(&(lk)->lk_stack)
#else
#define	STACK_PRINT(lk)
#define	STACK_SAVE(lk)
#define	STACK_ZERO(lk)
#endif
90047dd67eSAttilio Rao 
/*
 * KTR logging helpers: emit a KTR_LOCK trace record with two (LOCK_LOG2)
 * or three (LOCK_LOG3) arguments, but only when LOCK_LOG_TEST() accepts
 * the lock's lock_object.
 *
 * Each macro is wrapped in do { } while (0) so that it expands to exactly
 * one statement.  A bare "if" expansion would capture the "else" of an
 * enclosing unbraced if/else at the call site.
 */
#define	LOCK_LOG2(lk, string, arg1, arg2) do {				\
	if (LOCK_LOG_TEST(&(lk)->lock_object, 0))			\
		CTR2(KTR_LOCK, (string), (arg1), (arg2));		\
} while (0)
#define	LOCK_LOG3(lk, string, arg1, arg2, arg3) do {			\
	if (LOCK_LOG_TEST(&(lk)->lock_object, 0))			\
		CTR3(KTR_LOCK, (string), (arg1), (arg2), (arg3));	\
} while (0)
97047dd67eSAttilio Rao 
/*
 * Helpers for fully dropping Giant around a sleep or spin and taking it
 * back afterwards.
 *
 * GIANT_DECLARE   declares the recursion counter _i (plus the WITNESS save
 *                 slot); it must appear among the local declarations of
 *                 any function using the two macros below.
 * GIANT_SAVE()    if curthread owns Giant, unlocks it until it is no longer
 *                 owned, counting every unlock in _i.
 * GIANT_RESTORE() locks Giant _i times and restores the WITNESS state.
 *
 * GIANT_RESTORE() must leave _i at exactly 0.  These macros are used in
 * pairs inside retry loops, so a post-decrement loop ("while (_i--)"),
 * which exits with _i == -1, would make the next GIANT_SAVE() undercount
 * by one and the following GIANT_RESTORE() reacquire Giant one time too
 * few.
 */
#define	GIANT_DECLARE							\
	int _i = 0;							\
	WITNESS_SAVE_DECL(Giant)
#define	GIANT_RESTORE() do {						\
	if (_i > 0) {							\
		while (_i > 0) {					\
			mtx_lock(&Giant);				\
			_i--;						\
		}							\
		WITNESS_RESTORE(&Giant.lock_object, Giant);		\
	}								\
} while (0)
#define	GIANT_SAVE() do {						\
	if (mtx_owned(&Giant)) {					\
		WITNESS_SAVE(&Giant.lock_object, Giant);		\
		while (mtx_owned(&Giant)) {				\
			_i++;						\
			mtx_unlock(&Giant);				\
		}							\
	}								\
} while (0)
117e5f94314SAttilio Rao 
/*
 * LK_CAN_SHARE(x, flags): non-zero when lock word 'x' permits one more
 * shared holder.  The word must have LK_SHARE set, and in addition one of
 * the following must hold:
 *  - no exclusive waiter or exclusive spinner bit is set in 'x';
 *  - curthread already holds at least one shared lockmgr lock
 *    (td_lk_slocks != 0) and the request does not carry LK_NODDLKTREAT;
 *  - curthread has TDP_DEADLKTREAT set in td_pflags.
 *
 * Both macro arguments are fully parenthesized so that any expression may
 * be passed for them.
 */
#define	LK_CAN_SHARE(x, flags)						\
	(((x) & LK_SHARE) &&						\
	(((x) & (LK_EXCLUSIVE_WAITERS | LK_EXCLUSIVE_SPINNERS)) == 0 ||	\
	(curthread->td_lk_slocks != 0 &&				\
	!((flags) & LK_NODDLKTREAT)) ||					\
	(curthread->td_pflags & TDP_DEADLKTREAT)))

/* LK_TRYOP(x): non-zero when the request flags 'x' include LK_NOWAIT. */
#define	LK_TRYOP(x)							\
	((x) & LK_NOWAIT)
125e5f94314SAttilio Rao 
/*
 * WITNESS helpers for request flags 'x': order checking is skipped for
 * LK_NOWITNESS requests and for try operations, and try operations are
 * reported to WITNESS with LOP_TRYLOCK.
 */
#define	LK_CAN_WITNESS(x)						\
	(!((x) & LK_NOWITNESS) && !LK_TRYOP(x))
#define	LK_TRYWIT(x)							\
	(LK_TRYOP(x) != 0 ? LOP_TRYLOCK : 0)

/*
 * Adaptive spinning is allowed only on locks initialized with LK_ADAPTIVE
 * and only for requests 'f' that do not specify LK_SLEEPFAIL.
 */
#define	LK_CAN_ADAPT(lk, f)						\
	(((f) & LK_SLEEPFAIL) == 0 &&					\
	((lk)->lock_object.lo_flags & LK_ADAPTIVE) != 0)

/*
 * The lock word with every LK_FLAGMASK bit except LK_SHARE masked off.
 * Comparing it against an owner value therefore also checks that
 * LK_SHARE is clear.
 */
#define	lockmgr_ownerbits(lk)						\
	((lk)->lk_lock & ~(LK_FLAGMASK & ~LK_SHARE))

/* True when the lock word records LK_KERNPROC as the exclusive owner. */
#define	lockmgr_disowned(lk)						\
	(lockmgr_ownerbits(lk) == LK_KERNPROC)

/* True when the lock word records curthread as the exclusive owner. */
#define	lockmgr_xlocked(lk)						\
	(lockmgr_ownerbits(lk) == (uintptr_t)curthread)
140047dd67eSAttilio Rao 
141d576deedSPawel Jakub Dawidek static void	assert_lockmgr(const struct lock_object *lock, int how);
142047dd67eSAttilio Rao #ifdef DDB
143d576deedSPawel Jakub Dawidek static void	db_show_lockmgr(const struct lock_object *lock);
144be6847d7SJohn Baldwin #endif
1457faf4d90SDavide Italiano static void	lock_lockmgr(struct lock_object *lock, uintptr_t how);
146a5aedd68SStacey Son #ifdef KDTRACE_HOOKS
147d576deedSPawel Jakub Dawidek static int	owner_lockmgr(const struct lock_object *lock,
148d576deedSPawel Jakub Dawidek 		    struct thread **owner);
149a5aedd68SStacey Son #endif
1507faf4d90SDavide Italiano static uintptr_t unlock_lockmgr(struct lock_object *lock);
15161bd5e21SKip Macy 
15261bd5e21SKip Macy struct lock_class lock_class_lockmgr = {
1533ff6d229SJohn Baldwin 	.lc_name = "lockmgr",
154047dd67eSAttilio Rao 	.lc_flags = LC_RECURSABLE | LC_SLEEPABLE | LC_SLEEPLOCK | LC_UPGRADABLE,
155f9721b43SAttilio Rao 	.lc_assert = assert_lockmgr,
15661bd5e21SKip Macy #ifdef DDB
1576e21afd4SJohn Baldwin 	.lc_ddb_show = db_show_lockmgr,
15861bd5e21SKip Macy #endif
1596e21afd4SJohn Baldwin 	.lc_lock = lock_lockmgr,
160a5aedd68SStacey Son 	.lc_unlock = unlock_lockmgr,
161a5aedd68SStacey Son #ifdef KDTRACE_HOOKS
162a5aedd68SStacey Son 	.lc_owner = owner_lockmgr,
163a5aedd68SStacey Son #endif
16461bd5e21SKip Macy };
16561bd5e21SKip Macy 
#ifdef ADAPTIVE_LOCKMGRS
/*
 * Tunables for adaptive spinning on a lock held in shared mode, exported
 * read-write under debug.lockmgr:
 *  - alk_retries bounds how many spinning rounds a single request makes;
 *  - alk_loops bounds the iterations of each round.
 */
static u_int alk_retries = 10;
static u_int alk_loops = 10000;

static SYSCTL_NODE(_debug, OID_AUTO, lockmgr, CTLFLAG_RD, NULL,
    "lockmgr debugging");
SYSCTL_UINT(_debug_lockmgr, OID_AUTO, retries, CTLFLAG_RW, &alk_retries,
    0, "");
SYSCTL_UINT(_debug_lockmgr, OID_AUTO, loops, CTLFLAG_RW, &alk_loops,
    0, "");
#endif
174651175c9SAttilio Rao 
175047dd67eSAttilio Rao static __inline struct thread *
176d576deedSPawel Jakub Dawidek lockmgr_xholder(const struct lock *lk)
177047dd67eSAttilio Rao {
178047dd67eSAttilio Rao 	uintptr_t x;
179047dd67eSAttilio Rao 
180047dd67eSAttilio Rao 	x = lk->lk_lock;
181047dd67eSAttilio Rao 	return ((x & LK_SHARE) ? NULL : (struct thread *)LK_HOLDER(x));
182047dd67eSAttilio Rao }
18384887fa3SAttilio Rao 
18453bf4bb2SPeter Wemm /*
185047dd67eSAttilio Rao  * It assumes sleepq_lock held and returns with this one unheld.
186047dd67eSAttilio Rao  * It also assumes the generic interlock is sane and previously checked.
187047dd67eSAttilio Rao  * If LK_INTERLOCK is specified the interlock is not reacquired after the
188047dd67eSAttilio Rao  * sleep.
18953bf4bb2SPeter Wemm  */
190047dd67eSAttilio Rao static __inline int
191047dd67eSAttilio Rao sleeplk(struct lock *lk, u_int flags, struct lock_object *ilk,
192047dd67eSAttilio Rao     const char *wmesg, int pri, int timo, int queue)
193047dd67eSAttilio Rao {
194e5f94314SAttilio Rao 	GIANT_DECLARE;
195047dd67eSAttilio Rao 	struct lock_class *class;
196047dd67eSAttilio Rao 	int catch, error;
19753bf4bb2SPeter Wemm 
198047dd67eSAttilio Rao 	class = (flags & LK_INTERLOCK) ? LOCK_CLASS(ilk) : NULL;
1995047a8fdSAttilio Rao 	catch = pri & PCATCH;
200047dd67eSAttilio Rao 	pri &= PRIMASK;
201047dd67eSAttilio Rao 	error = 0;
202047dd67eSAttilio Rao 
203047dd67eSAttilio Rao 	LOCK_LOG3(lk, "%s: %p blocking on the %s sleepqueue", __func__, lk,
204047dd67eSAttilio Rao 	    (queue == SQ_EXCLUSIVE_QUEUE) ? "exclusive" : "shared");
205047dd67eSAttilio Rao 
206047dd67eSAttilio Rao 	if (flags & LK_INTERLOCK)
207047dd67eSAttilio Rao 		class->lc_unlock(ilk);
2082028867dSAttilio Rao 	if (queue == SQ_EXCLUSIVE_QUEUE && (flags & LK_SLEEPFAIL) != 0)
2092028867dSAttilio Rao 		lk->lk_exslpfail++;
210e5f94314SAttilio Rao 	GIANT_SAVE();
211047dd67eSAttilio Rao 	sleepq_add(&lk->lock_object, NULL, wmesg, SLEEPQ_LK | (catch ?
212047dd67eSAttilio Rao 	    SLEEPQ_INTERRUPTIBLE : 0), queue);
213047dd67eSAttilio Rao 	if ((flags & LK_TIMELOCK) && timo)
214047dd67eSAttilio Rao 		sleepq_set_timeout(&lk->lock_object, timo);
215047dd67eSAttilio Rao 
216047dd67eSAttilio Rao 	/*
217047dd67eSAttilio Rao 	 * Decisional switch for real sleeping.
218047dd67eSAttilio Rao 	 */
219047dd67eSAttilio Rao 	if ((flags & LK_TIMELOCK) && timo && catch)
220047dd67eSAttilio Rao 		error = sleepq_timedwait_sig(&lk->lock_object, pri);
221047dd67eSAttilio Rao 	else if ((flags & LK_TIMELOCK) && timo)
222047dd67eSAttilio Rao 		error = sleepq_timedwait(&lk->lock_object, pri);
223047dd67eSAttilio Rao 	else if (catch)
224047dd67eSAttilio Rao 		error = sleepq_wait_sig(&lk->lock_object, pri);
225047dd67eSAttilio Rao 	else
226047dd67eSAttilio Rao 		sleepq_wait(&lk->lock_object, pri);
227e5f94314SAttilio Rao 	GIANT_RESTORE();
228047dd67eSAttilio Rao 	if ((flags & LK_SLEEPFAIL) && error == 0)
229047dd67eSAttilio Rao 		error = ENOLCK;
230047dd67eSAttilio Rao 
231047dd67eSAttilio Rao 	return (error);
232047dd67eSAttilio Rao }
233047dd67eSAttilio Rao 
234da7bbd2cSJohn Baldwin static __inline int
235047dd67eSAttilio Rao wakeupshlk(struct lock *lk, const char *file, int line)
236047dd67eSAttilio Rao {
237047dd67eSAttilio Rao 	uintptr_t v, x;
2382028867dSAttilio Rao 	u_int realexslp;
239da7bbd2cSJohn Baldwin 	int queue, wakeup_swapper;
240047dd67eSAttilio Rao 
241e5f94314SAttilio Rao 	WITNESS_UNLOCK(&lk->lock_object, 0, file, line);
242047dd67eSAttilio Rao 	LOCK_LOG_LOCK("SUNLOCK", &lk->lock_object, 0, 0, file, line);
243047dd67eSAttilio Rao 
244da7bbd2cSJohn Baldwin 	wakeup_swapper = 0;
245047dd67eSAttilio Rao 	for (;;) {
246047dd67eSAttilio Rao 		x = lk->lk_lock;
247047dd67eSAttilio Rao 
248047dd67eSAttilio Rao 		/*
249047dd67eSAttilio Rao 		 * If there is more than one shared lock held, just drop one
250047dd67eSAttilio Rao 		 * and return.
251047dd67eSAttilio Rao 		 */
252047dd67eSAttilio Rao 		if (LK_SHARERS(x) > 1) {
2537f9f80ceSAttilio Rao 			if (atomic_cmpset_rel_ptr(&lk->lk_lock, x,
254047dd67eSAttilio Rao 			    x - LK_ONE_SHARER))
255047dd67eSAttilio Rao 				break;
256047dd67eSAttilio Rao 			continue;
257047dd67eSAttilio Rao 		}
258047dd67eSAttilio Rao 
259047dd67eSAttilio Rao 		/*
260047dd67eSAttilio Rao 		 * If there are not waiters on the exclusive queue, drop the
261047dd67eSAttilio Rao 		 * lock quickly.
262047dd67eSAttilio Rao 		 */
263047dd67eSAttilio Rao 		if ((x & LK_ALL_WAITERS) == 0) {
264651175c9SAttilio Rao 			MPASS((x & ~LK_EXCLUSIVE_SPINNERS) ==
265651175c9SAttilio Rao 			    LK_SHARERS_LOCK(1));
2667f9f80ceSAttilio Rao 			if (atomic_cmpset_rel_ptr(&lk->lk_lock, x, LK_UNLOCKED))
267047dd67eSAttilio Rao 				break;
268047dd67eSAttilio Rao 			continue;
269047dd67eSAttilio Rao 		}
270047dd67eSAttilio Rao 
271047dd67eSAttilio Rao 		/*
272047dd67eSAttilio Rao 		 * We should have a sharer with waiters, so enter the hard
273047dd67eSAttilio Rao 		 * path in order to handle wakeups correctly.
274047dd67eSAttilio Rao 		 */
275047dd67eSAttilio Rao 		sleepq_lock(&lk->lock_object);
276651175c9SAttilio Rao 		x = lk->lk_lock & (LK_ALL_WAITERS | LK_EXCLUSIVE_SPINNERS);
277047dd67eSAttilio Rao 		v = LK_UNLOCKED;
278047dd67eSAttilio Rao 
279047dd67eSAttilio Rao 		/*
280047dd67eSAttilio Rao 		 * If the lock has exclusive waiters, give them preference in
281047dd67eSAttilio Rao 		 * order to avoid deadlock with shared runners up.
2822028867dSAttilio Rao 		 * If interruptible sleeps left the exclusive queue empty
2832028867dSAttilio Rao 		 * avoid a starvation for the threads sleeping on the shared
2842028867dSAttilio Rao 		 * queue by giving them precedence and cleaning up the
2852028867dSAttilio Rao 		 * exclusive waiters bit anyway.
286c636ba83SAttilio Rao 		 * Please note that lk_exslpfail count may be lying about
287c636ba83SAttilio Rao 		 * the real number of waiters with the LK_SLEEPFAIL flag on
288c636ba83SAttilio Rao 		 * because they may be used in conjuction with interruptible
289aab9c8c2SAttilio Rao 		 * sleeps so lk_exslpfail might be considered an 'upper limit'
290aab9c8c2SAttilio Rao 		 * bound, including the edge cases.
291047dd67eSAttilio Rao 		 */
2922028867dSAttilio Rao 		realexslp = sleepq_sleepcnt(&lk->lock_object,
2932028867dSAttilio Rao 		    SQ_EXCLUSIVE_QUEUE);
2942028867dSAttilio Rao 		if ((x & LK_EXCLUSIVE_WAITERS) != 0 && realexslp != 0) {
2952028867dSAttilio Rao 			if (lk->lk_exslpfail < realexslp) {
2962028867dSAttilio Rao 				lk->lk_exslpfail = 0;
297047dd67eSAttilio Rao 				queue = SQ_EXCLUSIVE_QUEUE;
298047dd67eSAttilio Rao 				v |= (x & LK_SHARED_WAITERS);
299047dd67eSAttilio Rao 			} else {
3002028867dSAttilio Rao 				lk->lk_exslpfail = 0;
3012028867dSAttilio Rao 				LOCK_LOG2(lk,
3022028867dSAttilio Rao 				    "%s: %p has only LK_SLEEPFAIL sleepers",
3032028867dSAttilio Rao 				    __func__, lk);
3042028867dSAttilio Rao 				LOCK_LOG2(lk,
3052028867dSAttilio Rao 			    "%s: %p waking up threads on the exclusive queue",
3062028867dSAttilio Rao 				    __func__, lk);
3072028867dSAttilio Rao 				wakeup_swapper =
3082028867dSAttilio Rao 				    sleepq_broadcast(&lk->lock_object,
3092028867dSAttilio Rao 				    SLEEPQ_LK, 0, SQ_EXCLUSIVE_QUEUE);
3102028867dSAttilio Rao 				queue = SQ_SHARED_QUEUE;
3112028867dSAttilio Rao 			}
3122028867dSAttilio Rao 
3132028867dSAttilio Rao 		} else {
3149dbf7a62SAttilio Rao 
3159dbf7a62SAttilio Rao 			/*
3169dbf7a62SAttilio Rao 			 * Exclusive waiters sleeping with LK_SLEEPFAIL on
3179dbf7a62SAttilio Rao 			 * and using interruptible sleeps/timeout may have
3189dbf7a62SAttilio Rao 			 * left spourious lk_exslpfail counts on, so clean
3199dbf7a62SAttilio Rao 			 * it up anyway.
3209dbf7a62SAttilio Rao 			 */
3219dbf7a62SAttilio Rao 			lk->lk_exslpfail = 0;
322047dd67eSAttilio Rao 			queue = SQ_SHARED_QUEUE;
323047dd67eSAttilio Rao 		}
324047dd67eSAttilio Rao 
3257f9f80ceSAttilio Rao 		if (!atomic_cmpset_rel_ptr(&lk->lk_lock, LK_SHARERS_LOCK(1) | x,
326047dd67eSAttilio Rao 		    v)) {
327047dd67eSAttilio Rao 			sleepq_release(&lk->lock_object);
328047dd67eSAttilio Rao 			continue;
329047dd67eSAttilio Rao 		}
330047dd67eSAttilio Rao 		LOCK_LOG3(lk, "%s: %p waking up threads on the %s queue",
331047dd67eSAttilio Rao 		    __func__, lk, queue == SQ_SHARED_QUEUE ? "shared" :
332047dd67eSAttilio Rao 		    "exclusive");
3332028867dSAttilio Rao 		wakeup_swapper |= sleepq_broadcast(&lk->lock_object, SLEEPQ_LK,
334da7bbd2cSJohn Baldwin 		    0, queue);
335047dd67eSAttilio Rao 		sleepq_release(&lk->lock_object);
336047dd67eSAttilio Rao 		break;
337047dd67eSAttilio Rao 	}
338047dd67eSAttilio Rao 
339047dd67eSAttilio Rao 	lock_profile_release_lock(&lk->lock_object);
340b5fb43e5SJohn Baldwin 	TD_LOCKS_DEC(curthread);
341b5fb43e5SJohn Baldwin 	TD_SLOCKS_DEC(curthread);
342da7bbd2cSJohn Baldwin 	return (wakeup_swapper);
343047dd67eSAttilio Rao }
344047dd67eSAttilio Rao 
/*
 * lc_assert hook of the lockmgr lock class.  Assertions through the
 * generic lock class interface are not implemented for lockmgr locks, so
 * any call panics.
 */
static void
assert_lockmgr(const struct lock_object *lock, int what)
{

	panic("lockmgr locks do not support assertions");
}
351f9721b43SAttilio Rao 
/*
 * lc_lock hook of the lockmgr lock class.  A lockmgr lock cannot be used
 * as a sleep interlock, so any call panics.
 */
static void
lock_lockmgr(struct lock_object *lock, uintptr_t how)
{

	panic("lockmgr locks do not support sleep interlocking");
}
3586e21afd4SJohn Baldwin 
/*
 * lc_unlock hook of the lockmgr lock class.  A lockmgr lock cannot be used
 * as a sleep interlock, so any call panics and no value is ever returned.
 */
static uintptr_t
unlock_lockmgr(struct lock_object *lock)
{

	panic("lockmgr locks do not support sleep interlocking");
}
3656e21afd4SJohn Baldwin 
#ifdef KDTRACE_HOOKS
/*
 * lc_owner hook of the lockmgr lock class (only built with
 * KDTRACE_HOOKS).  Owner lookup is not implemented for lockmgr locks, so
 * any call panics.
 */
static int
owner_lockmgr(const struct lock_object *lock, struct thread **owner)
{

	panic("lockmgr locks do not support owner inquiring");
}
#endif
374a5aedd68SStacey Son 
37599448ed1SJohn Dyson void
376047dd67eSAttilio Rao lockinit(struct lock *lk, int pri, const char *wmesg, int timo, int flags)
37799448ed1SJohn Dyson {
3786efc8a16SAttilio Rao 	int iflags;
3796efc8a16SAttilio Rao 
380047dd67eSAttilio Rao 	MPASS((flags & ~LK_INIT_MASK) == 0);
381353998acSAttilio Rao 	ASSERT_ATOMIC_LOAD_PTR(lk->lk_lock,
382353998acSAttilio Rao             ("%s: lockmgr not aligned for %s: %p", __func__, wmesg,
383353998acSAttilio Rao             &lk->lk_lock));
38499448ed1SJohn Dyson 
385f0830182SAttilio Rao 	iflags = LO_SLEEPABLE | LO_UPGRADABLE;
386f0830182SAttilio Rao 	if (flags & LK_CANRECURSE)
387f0830182SAttilio Rao 		iflags |= LO_RECURSABLE;
388047dd67eSAttilio Rao 	if ((flags & LK_NODUP) == 0)
3896efc8a16SAttilio Rao 		iflags |= LO_DUPOK;
3907fbfba7bSAttilio Rao 	if (flags & LK_NOPROFILE)
3917fbfba7bSAttilio Rao 		iflags |= LO_NOPROFILE;
392047dd67eSAttilio Rao 	if ((flags & LK_NOWITNESS) == 0)
3936efc8a16SAttilio Rao 		iflags |= LO_WITNESS;
3947fbfba7bSAttilio Rao 	if (flags & LK_QUIET)
3957fbfba7bSAttilio Rao 		iflags |= LO_QUIET;
396e63091eaSMarcel Moolenaar 	if (flags & LK_IS_VNODE)
397e63091eaSMarcel Moolenaar 		iflags |= LO_IS_VNODE;
398651175c9SAttilio Rao 	iflags |= flags & (LK_ADAPTIVE | LK_NOSHARE);
399047dd67eSAttilio Rao 
400b5fb43e5SJohn Baldwin 	lock_init(&lk->lock_object, &lock_class_lockmgr, wmesg, NULL, iflags);
401047dd67eSAttilio Rao 	lk->lk_lock = LK_UNLOCKED;
402047dd67eSAttilio Rao 	lk->lk_recurse = 0;
4032028867dSAttilio Rao 	lk->lk_exslpfail = 0;
404047dd67eSAttilio Rao 	lk->lk_timo = timo;
405047dd67eSAttilio Rao 	lk->lk_pri = pri;
406047dd67eSAttilio Rao 	STACK_ZERO(lk);
40799448ed1SJohn Dyson }
40899448ed1SJohn Dyson 
4093634d5b2SJohn Baldwin /*
4103634d5b2SJohn Baldwin  * XXX: Gross hacks to manipulate external lock flags after
4113634d5b2SJohn Baldwin  * initialization.  Used for certain vnode and buf locks.
4123634d5b2SJohn Baldwin  */
4133634d5b2SJohn Baldwin void
4143634d5b2SJohn Baldwin lockallowshare(struct lock *lk)
4153634d5b2SJohn Baldwin {
4163634d5b2SJohn Baldwin 
4173634d5b2SJohn Baldwin 	lockmgr_assert(lk, KA_XLOCKED);
4183634d5b2SJohn Baldwin 	lk->lock_object.lo_flags &= ~LK_NOSHARE;
4193634d5b2SJohn Baldwin }
4203634d5b2SJohn Baldwin 
4213634d5b2SJohn Baldwin void
422575e02d9SKonstantin Belousov lockdisableshare(struct lock *lk)
423575e02d9SKonstantin Belousov {
424575e02d9SKonstantin Belousov 
425575e02d9SKonstantin Belousov 	lockmgr_assert(lk, KA_XLOCKED);
426575e02d9SKonstantin Belousov 	lk->lock_object.lo_flags |= LK_NOSHARE;
427575e02d9SKonstantin Belousov }
428575e02d9SKonstantin Belousov 
429575e02d9SKonstantin Belousov void
4303634d5b2SJohn Baldwin lockallowrecurse(struct lock *lk)
4313634d5b2SJohn Baldwin {
4323634d5b2SJohn Baldwin 
4333634d5b2SJohn Baldwin 	lockmgr_assert(lk, KA_XLOCKED);
4343634d5b2SJohn Baldwin 	lk->lock_object.lo_flags |= LO_RECURSABLE;
4353634d5b2SJohn Baldwin }
4363634d5b2SJohn Baldwin 
4373634d5b2SJohn Baldwin void
4383634d5b2SJohn Baldwin lockdisablerecurse(struct lock *lk)
4393634d5b2SJohn Baldwin {
4403634d5b2SJohn Baldwin 
4413634d5b2SJohn Baldwin 	lockmgr_assert(lk, KA_XLOCKED);
4423634d5b2SJohn Baldwin 	lk->lock_object.lo_flags &= ~LO_RECURSABLE;
4433634d5b2SJohn Baldwin }
4443634d5b2SJohn Baldwin 
445a18b1f1dSJason Evans void
446047dd67eSAttilio Rao lockdestroy(struct lock *lk)
447a18b1f1dSJason Evans {
448c91fcee7SJohn Baldwin 
449047dd67eSAttilio Rao 	KASSERT(lk->lk_lock == LK_UNLOCKED, ("lockmgr still held"));
450047dd67eSAttilio Rao 	KASSERT(lk->lk_recurse == 0, ("lockmgr still recursed"));
4512028867dSAttilio Rao 	KASSERT(lk->lk_exslpfail == 0, ("lockmgr still exclusive waiters"));
452047dd67eSAttilio Rao 	lock_destroy(&lk->lock_object);
453047dd67eSAttilio Rao }
454047dd67eSAttilio Rao 
455047dd67eSAttilio Rao int
456047dd67eSAttilio Rao __lockmgr_args(struct lock *lk, u_int flags, struct lock_object *ilk,
457047dd67eSAttilio Rao     const char *wmesg, int pri, int timo, const char *file, int line)
458047dd67eSAttilio Rao {
459e5f94314SAttilio Rao 	GIANT_DECLARE;
460047dd67eSAttilio Rao 	struct lock_class *class;
461047dd67eSAttilio Rao 	const char *iwmesg;
462047dd67eSAttilio Rao 	uintptr_t tid, v, x;
4632028867dSAttilio Rao 	u_int op, realexslp;
4641723a064SJeff Roberson 	int error, ipri, itimo, queue, wakeup_swapper;
4651723a064SJeff Roberson #ifdef LOCK_PROFILING
4661723a064SJeff Roberson 	uint64_t waittime = 0;
4671723a064SJeff Roberson 	int contested = 0;
4681723a064SJeff Roberson #endif
469651175c9SAttilio Rao #ifdef ADAPTIVE_LOCKMGRS
470651175c9SAttilio Rao 	volatile struct thread *owner;
471651175c9SAttilio Rao 	u_int i, spintries = 0;
472651175c9SAttilio Rao #endif
473047dd67eSAttilio Rao 
474047dd67eSAttilio Rao 	error = 0;
475047dd67eSAttilio Rao 	tid = (uintptr_t)curthread;
476047dd67eSAttilio Rao 	op = (flags & LK_TYPE_MASK);
477047dd67eSAttilio Rao 	iwmesg = (wmesg == LK_WMESG_DEFAULT) ? lk->lock_object.lo_name : wmesg;
478047dd67eSAttilio Rao 	ipri = (pri == LK_PRIO_DEFAULT) ? lk->lk_pri : pri;
479047dd67eSAttilio Rao 	itimo = (timo == LK_TIMO_DEFAULT) ? lk->lk_timo : timo;
480047dd67eSAttilio Rao 
481047dd67eSAttilio Rao 	MPASS((flags & ~LK_TOTAL_MASK) == 0);
482872b7289SAttilio Rao 	KASSERT((op & (op - 1)) == 0,
483872b7289SAttilio Rao 	    ("%s: Invalid requested operation @ %s:%d", __func__, file, line));
484047dd67eSAttilio Rao 	KASSERT((flags & (LK_NOWAIT | LK_SLEEPFAIL)) == 0 ||
485047dd67eSAttilio Rao 	    (op != LK_DOWNGRADE && op != LK_RELEASE),
486047dd67eSAttilio Rao 	    ("%s: Invalid flags in regard of the operation desired @ %s:%d",
487047dd67eSAttilio Rao 	    __func__, file, line));
488047dd67eSAttilio Rao 	KASSERT((flags & LK_INTERLOCK) == 0 || ilk != NULL,
489047dd67eSAttilio Rao 	    ("%s: LK_INTERLOCK passed without valid interlock @ %s:%d",
490047dd67eSAttilio Rao 	    __func__, file, line));
491cd2fe4e6SAttilio Rao 	KASSERT(kdb_active != 0 || !TD_IS_IDLETHREAD(curthread),
492e3ae0dfeSAttilio Rao 	    ("%s: idle thread %p on lockmgr %s @ %s:%d", __func__, curthread,
493e3ae0dfeSAttilio Rao 	    lk->lock_object.lo_name, file, line));
494047dd67eSAttilio Rao 
495047dd67eSAttilio Rao 	class = (flags & LK_INTERLOCK) ? LOCK_CLASS(ilk) : NULL;
496047dd67eSAttilio Rao 	if (panicstr != NULL) {
497047dd67eSAttilio Rao 		if (flags & LK_INTERLOCK)
498047dd67eSAttilio Rao 			class->lc_unlock(ilk);
499047dd67eSAttilio Rao 		return (0);
500047dd67eSAttilio Rao 	}
501047dd67eSAttilio Rao 
502d0a724c5SKonstantin Belousov 	if (lk->lock_object.lo_flags & LK_NOSHARE) {
503d0a724c5SKonstantin Belousov 		switch (op) {
504d0a724c5SKonstantin Belousov 		case LK_SHARED:
505047dd67eSAttilio Rao 			op = LK_EXCLUSIVE;
506d0a724c5SKonstantin Belousov 			break;
507d0a724c5SKonstantin Belousov 		case LK_UPGRADE:
5087c6fe803SKonstantin Belousov 		case LK_TRYUPGRADE:
509d0a724c5SKonstantin Belousov 		case LK_DOWNGRADE:
510d0a724c5SKonstantin Belousov 			_lockmgr_assert(lk, KA_XLOCKED | KA_NOTRECURSED,
511d0a724c5SKonstantin Belousov 			    file, line);
51243287e27SMateusz Guzik 			if (flags & LK_INTERLOCK)
51343287e27SMateusz Guzik 				class->lc_unlock(ilk);
514d0a724c5SKonstantin Belousov 			return (0);
515d0a724c5SKonstantin Belousov 		}
516d0a724c5SKonstantin Belousov 	}
517047dd67eSAttilio Rao 
518da7bbd2cSJohn Baldwin 	wakeup_swapper = 0;
519047dd67eSAttilio Rao 	switch (op) {
520047dd67eSAttilio Rao 	case LK_SHARED:
521e5f94314SAttilio Rao 		if (LK_CAN_WITNESS(flags))
522e5f94314SAttilio Rao 			WITNESS_CHECKORDER(&lk->lock_object, LOP_NEWORDER,
52324150d37SJohn Baldwin 			    file, line, flags & LK_INTERLOCK ? ilk : NULL);
524047dd67eSAttilio Rao 		for (;;) {
525047dd67eSAttilio Rao 			x = lk->lk_lock;
526047dd67eSAttilio Rao 
527047dd67eSAttilio Rao 			/*
528047dd67eSAttilio Rao 			 * If no other thread has an exclusive lock, or
529047dd67eSAttilio Rao 			 * no exclusive waiter is present, bump the count of
530047dd67eSAttilio Rao 			 * sharers.  Since we have to preserve the state of
531047dd67eSAttilio Rao 			 * waiters, if we fail to acquire the shared lock
532047dd67eSAttilio Rao 			 * loop back and retry.
533047dd67eSAttilio Rao 			 */
53472ba3c08SKonstantin Belousov 			if (LK_CAN_SHARE(x, flags)) {
535047dd67eSAttilio Rao 				if (atomic_cmpset_acq_ptr(&lk->lk_lock, x,
536047dd67eSAttilio Rao 				    x + LK_ONE_SHARER))
537047dd67eSAttilio Rao 					break;
538047dd67eSAttilio Rao 				continue;
539047dd67eSAttilio Rao 			}
540f5f9340bSFabien Thomas #ifdef HWPMC_HOOKS
541f5f9340bSFabien Thomas 			PMC_SOFT_CALL( , , lock, failed);
542f5f9340bSFabien Thomas #endif
543047dd67eSAttilio Rao 			lock_profile_obtain_lock_failed(&lk->lock_object,
544047dd67eSAttilio Rao 			    &contested, &waittime);
545047dd67eSAttilio Rao 
546047dd67eSAttilio Rao 			/*
54796f1567fSKonstantin Belousov 			 * If the lock is already held by curthread in
548047dd67eSAttilio Rao 			 * exclusive way avoid a deadlock.
549047dd67eSAttilio Rao 			 */
550047dd67eSAttilio Rao 			if (LK_HOLDER(x) == tid) {
551047dd67eSAttilio Rao 				LOCK_LOG2(lk,
55296f1567fSKonstantin Belousov 				    "%s: %p already held in exclusive mode",
553047dd67eSAttilio Rao 				    __func__, lk);
554047dd67eSAttilio Rao 				error = EDEADLK;
555047dd67eSAttilio Rao 				break;
556a18b1f1dSJason Evans 			}
557a18b1f1dSJason Evans 
558a18b1f1dSJason Evans 			/*
559047dd67eSAttilio Rao 			 * If the lock is expected to not sleep just give up
560047dd67eSAttilio Rao 			 * and return.
561d7a7e179SAttilio Rao 			 */
562047dd67eSAttilio Rao 			if (LK_TRYOP(flags)) {
563047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p fails the try operation",
564047dd67eSAttilio Rao 				    __func__, lk);
565047dd67eSAttilio Rao 				error = EBUSY;
566047dd67eSAttilio Rao 				break;
567047dd67eSAttilio Rao 			}
568047dd67eSAttilio Rao 
569651175c9SAttilio Rao #ifdef ADAPTIVE_LOCKMGRS
570651175c9SAttilio Rao 			/*
571651175c9SAttilio Rao 			 * If the owner is running on another CPU, spin until
572651175c9SAttilio Rao 			 * the owner stops running or the state of the lock
5738d3635c4SAttilio Rao 			 * changes.  We need a double-state handle here
5748d3635c4SAttilio Rao 			 * because for a failed acquisition the lock can be
5758d3635c4SAttilio Rao 			 * either held in exclusive mode or shared mode
5768d3635c4SAttilio Rao 			 * (for the writer starvation avoidance technique).
577651175c9SAttilio Rao 			 */
578651175c9SAttilio Rao 			if (LK_CAN_ADAPT(lk, flags) && (x & LK_SHARE) == 0 &&
579651175c9SAttilio Rao 			    LK_HOLDER(x) != LK_KERNPROC) {
580651175c9SAttilio Rao 				owner = (struct thread *)LK_HOLDER(x);
581651175c9SAttilio Rao 				if (LOCK_LOG_TEST(&lk->lock_object, 0))
582651175c9SAttilio Rao 					CTR3(KTR_LOCK,
583651175c9SAttilio Rao 					    "%s: spinning on %p held by %p",
584651175c9SAttilio Rao 					    __func__, lk, owner);
5852cba8dd3SJohn Baldwin 				KTR_STATE1(KTR_SCHED, "thread",
5862cba8dd3SJohn Baldwin 				    sched_tdname(td), "spinning",
5872cba8dd3SJohn Baldwin 				    "lockname:\"%s\"", lk->lock_object.lo_name);
588651175c9SAttilio Rao 
589651175c9SAttilio Rao 				/*
590651175c9SAttilio Rao 				 * If we are holding also an interlock drop it
591651175c9SAttilio Rao 				 * in order to avoid a deadlock if the lockmgr
592651175c9SAttilio Rao 				 * owner is adaptively spinning on the
593651175c9SAttilio Rao 				 * interlock itself.
594651175c9SAttilio Rao 				 */
595651175c9SAttilio Rao 				if (flags & LK_INTERLOCK) {
596651175c9SAttilio Rao 					class->lc_unlock(ilk);
597651175c9SAttilio Rao 					flags &= ~LK_INTERLOCK;
598651175c9SAttilio Rao 				}
599651175c9SAttilio Rao 				GIANT_SAVE();
600651175c9SAttilio Rao 				while (LK_HOLDER(lk->lk_lock) ==
601651175c9SAttilio Rao 				    (uintptr_t)owner && TD_IS_RUNNING(owner))
602651175c9SAttilio Rao 					cpu_spinwait();
6032cba8dd3SJohn Baldwin 				KTR_STATE0(KTR_SCHED, "thread",
6042cba8dd3SJohn Baldwin 				    sched_tdname(td), "running");
6058d3635c4SAttilio Rao 				GIANT_RESTORE();
6068d3635c4SAttilio Rao 				continue;
607651175c9SAttilio Rao 			} else if (LK_CAN_ADAPT(lk, flags) &&
608651175c9SAttilio Rao 			    (x & LK_SHARE) != 0 && LK_SHARERS(x) &&
609651175c9SAttilio Rao 			    spintries < alk_retries) {
6102cba8dd3SJohn Baldwin 				KTR_STATE1(KTR_SCHED, "thread",
6112cba8dd3SJohn Baldwin 				    sched_tdname(td), "spinning",
6122cba8dd3SJohn Baldwin 				    "lockname:\"%s\"", lk->lock_object.lo_name);
613651175c9SAttilio Rao 				if (flags & LK_INTERLOCK) {
614651175c9SAttilio Rao 					class->lc_unlock(ilk);
615651175c9SAttilio Rao 					flags &= ~LK_INTERLOCK;
616651175c9SAttilio Rao 				}
617651175c9SAttilio Rao 				GIANT_SAVE();
618651175c9SAttilio Rao 				spintries++;
619651175c9SAttilio Rao 				for (i = 0; i < alk_loops; i++) {
620651175c9SAttilio Rao 					if (LOCK_LOG_TEST(&lk->lock_object, 0))
621651175c9SAttilio Rao 						CTR4(KTR_LOCK,
622651175c9SAttilio Rao 				    "%s: shared spinning on %p with %u and %u",
623651175c9SAttilio Rao 						    __func__, lk, spintries, i);
624651175c9SAttilio Rao 					x = lk->lk_lock;
625651175c9SAttilio Rao 					if ((x & LK_SHARE) == 0 ||
626cc246667SKonstantin Belousov 					    LK_CAN_SHARE(x, flags) != 0)
627651175c9SAttilio Rao 						break;
628651175c9SAttilio Rao 					cpu_spinwait();
629651175c9SAttilio Rao 				}
6302cba8dd3SJohn Baldwin 				KTR_STATE0(KTR_SCHED, "thread",
6312cba8dd3SJohn Baldwin 				    sched_tdname(td), "running");
6328d3635c4SAttilio Rao 				GIANT_RESTORE();
633651175c9SAttilio Rao 				if (i != alk_loops)
634651175c9SAttilio Rao 					continue;
635651175c9SAttilio Rao 			}
636651175c9SAttilio Rao #endif
637651175c9SAttilio Rao 
638047dd67eSAttilio Rao 			/*
639047dd67eSAttilio Rao 			 * Acquire the sleepqueue chain lock because we
640047dd67eSAttilio Rao 			 * probably will need to manipulate waiters flags.
641047dd67eSAttilio Rao 			 */
642047dd67eSAttilio Rao 			sleepq_lock(&lk->lock_object);
643047dd67eSAttilio Rao 			x = lk->lk_lock;
644047dd67eSAttilio Rao 
645047dd67eSAttilio Rao 			/*
646047dd67eSAttilio Rao 			 * if the lock can be acquired in shared mode, try
647047dd67eSAttilio Rao 			 * again.
648047dd67eSAttilio Rao 			 */
64972ba3c08SKonstantin Belousov 			if (LK_CAN_SHARE(x, flags)) {
650047dd67eSAttilio Rao 				sleepq_release(&lk->lock_object);
651047dd67eSAttilio Rao 				continue;
652047dd67eSAttilio Rao 			}
653047dd67eSAttilio Rao 
654651175c9SAttilio Rao #ifdef ADAPTIVE_LOCKMGRS
655651175c9SAttilio Rao 			/*
656651175c9SAttilio Rao 			 * The current lock owner might have started executing
657651175c9SAttilio Rao 			 * on another CPU (or the lock could have changed
658651175c9SAttilio Rao 			 * owner) while we were waiting on the sleepqueue
659651175c9SAttilio Rao 			 * chain lock.  If so, drop the sleepqueue lock and try
660651175c9SAttilio Rao 			 * again.
661651175c9SAttilio Rao 			 */
662651175c9SAttilio Rao 			if (LK_CAN_ADAPT(lk, flags) && (x & LK_SHARE) == 0 &&
663651175c9SAttilio Rao 			    LK_HOLDER(x) != LK_KERNPROC) {
664651175c9SAttilio Rao 				owner = (struct thread *)LK_HOLDER(x);
665651175c9SAttilio Rao 				if (TD_IS_RUNNING(owner)) {
666651175c9SAttilio Rao 					sleepq_release(&lk->lock_object);
667651175c9SAttilio Rao 					continue;
668651175c9SAttilio Rao 				}
669651175c9SAttilio Rao 			}
670651175c9SAttilio Rao #endif
671651175c9SAttilio Rao 
672047dd67eSAttilio Rao 			/*
673047dd67eSAttilio Rao 			 * Try to set the LK_SHARED_WAITERS flag.  If we fail,
674047dd67eSAttilio Rao 			 * loop back and retry.
675047dd67eSAttilio Rao 			 */
676047dd67eSAttilio Rao 			if ((x & LK_SHARED_WAITERS) == 0) {
677047dd67eSAttilio Rao 				if (!atomic_cmpset_acq_ptr(&lk->lk_lock, x,
678047dd67eSAttilio Rao 				    x | LK_SHARED_WAITERS)) {
679047dd67eSAttilio Rao 					sleepq_release(&lk->lock_object);
680047dd67eSAttilio Rao 					continue;
681047dd67eSAttilio Rao 				}
682047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p set shared waiters flag",
683047dd67eSAttilio Rao 				    __func__, lk);
684047dd67eSAttilio Rao 			}
685047dd67eSAttilio Rao 
686047dd67eSAttilio Rao 			/*
687047dd67eSAttilio Rao 			 * As far as we have been unable to acquire the
688047dd67eSAttilio Rao 			 * shared lock and the shared waiters flag is set,
689047dd67eSAttilio Rao 			 * we will sleep.
690047dd67eSAttilio Rao 			 */
691047dd67eSAttilio Rao 			error = sleeplk(lk, flags, ilk, iwmesg, ipri, itimo,
692047dd67eSAttilio Rao 			    SQ_SHARED_QUEUE);
693047dd67eSAttilio Rao 			flags &= ~LK_INTERLOCK;
694047dd67eSAttilio Rao 			if (error) {
695047dd67eSAttilio Rao 				LOCK_LOG3(lk,
696047dd67eSAttilio Rao 				    "%s: interrupted sleep for %p with %d",
697047dd67eSAttilio Rao 				    __func__, lk, error);
698047dd67eSAttilio Rao 				break;
699047dd67eSAttilio Rao 			}
700047dd67eSAttilio Rao 			LOCK_LOG2(lk, "%s: %p resuming from the sleep queue",
701047dd67eSAttilio Rao 			    __func__, lk);
702047dd67eSAttilio Rao 		}
703047dd67eSAttilio Rao 		if (error == 0) {
704047dd67eSAttilio Rao 			lock_profile_obtain_lock_success(&lk->lock_object,
705047dd67eSAttilio Rao 			    contested, waittime, file, line);
706047dd67eSAttilio Rao 			LOCK_LOG_LOCK("SLOCK", &lk->lock_object, 0, 0, file,
707047dd67eSAttilio Rao 			    line);
708e5f94314SAttilio Rao 			WITNESS_LOCK(&lk->lock_object, LK_TRYWIT(flags), file,
709e5f94314SAttilio Rao 			    line);
710047dd67eSAttilio Rao 			TD_LOCKS_INC(curthread);
711047dd67eSAttilio Rao 			TD_SLOCKS_INC(curthread);
712047dd67eSAttilio Rao 			STACK_SAVE(lk);
713047dd67eSAttilio Rao 		}
714047dd67eSAttilio Rao 		break;
715047dd67eSAttilio Rao 	case LK_UPGRADE:
7167c6fe803SKonstantin Belousov 	case LK_TRYUPGRADE:
717047dd67eSAttilio Rao 		_lockmgr_assert(lk, KA_SLOCKED, file, line);
718651175c9SAttilio Rao 		v = lk->lk_lock;
719651175c9SAttilio Rao 		x = v & LK_ALL_WAITERS;
720651175c9SAttilio Rao 		v &= LK_EXCLUSIVE_SPINNERS;
721047dd67eSAttilio Rao 
722047dd67eSAttilio Rao 		/*
723047dd67eSAttilio Rao 		 * Try to switch from one shared lock to an exclusive one.
724047dd67eSAttilio Rao 		 * We need to preserve waiters flags during the operation.
725047dd67eSAttilio Rao 		 */
726651175c9SAttilio Rao 		if (atomic_cmpset_ptr(&lk->lk_lock, LK_SHARERS_LOCK(1) | x | v,
727047dd67eSAttilio Rao 		    tid | x)) {
728047dd67eSAttilio Rao 			LOCK_LOG_LOCK("XUPGRADE", &lk->lock_object, 0, 0, file,
729047dd67eSAttilio Rao 			    line);
730e5f94314SAttilio Rao 			WITNESS_UPGRADE(&lk->lock_object, LOP_EXCLUSIVE |
731e5f94314SAttilio Rao 			    LK_TRYWIT(flags), file, line);
732047dd67eSAttilio Rao 			TD_SLOCKS_DEC(curthread);
733047dd67eSAttilio Rao 			break;
734047dd67eSAttilio Rao 		}
735047dd67eSAttilio Rao 
736047dd67eSAttilio Rao 		/*
7377c6fe803SKonstantin Belousov 		 * In LK_TRYUPGRADE mode, do not drop the lock,
7387c6fe803SKonstantin Belousov 		 * returning EBUSY instead.
7397c6fe803SKonstantin Belousov 		 */
7407c6fe803SKonstantin Belousov 		if (op == LK_TRYUPGRADE) {
7417c6fe803SKonstantin Belousov 			LOCK_LOG2(lk, "%s: %p failed the nowait upgrade",
7427c6fe803SKonstantin Belousov 			    __func__, lk);
7437c6fe803SKonstantin Belousov 			error = EBUSY;
7447c6fe803SKonstantin Belousov 			break;
7457c6fe803SKonstantin Belousov 		}
7467c6fe803SKonstantin Belousov 
7477c6fe803SKonstantin Belousov 		/*
748047dd67eSAttilio Rao 		 * We have been unable to succeed in upgrading, so just
749047dd67eSAttilio Rao 		 * give up the shared lock.
750047dd67eSAttilio Rao 		 */
751814f26daSJohn Baldwin 		wakeup_swapper |= wakeupshlk(lk, file, line);
752047dd67eSAttilio Rao 
753047dd67eSAttilio Rao 		/* FALLTHROUGH */
754047dd67eSAttilio Rao 	case LK_EXCLUSIVE:
755e5f94314SAttilio Rao 		if (LK_CAN_WITNESS(flags))
756e5f94314SAttilio Rao 			WITNESS_CHECKORDER(&lk->lock_object, LOP_NEWORDER |
75724150d37SJohn Baldwin 			    LOP_EXCLUSIVE, file, line, flags & LK_INTERLOCK ?
75824150d37SJohn Baldwin 			    ilk : NULL);
759047dd67eSAttilio Rao 
760047dd67eSAttilio Rao 		/*
76196f1567fSKonstantin Belousov 		 * If curthread already holds the lock and this one is
762047dd67eSAttilio Rao 		 * allowed to recurse, simply recurse on it.
763047dd67eSAttilio Rao 		 */
764047dd67eSAttilio Rao 		if (lockmgr_xlocked(lk)) {
765047dd67eSAttilio Rao 			if ((flags & LK_CANRECURSE) == 0 &&
766f0830182SAttilio Rao 			    (lk->lock_object.lo_flags & LO_RECURSABLE) == 0) {
767047dd67eSAttilio Rao 
768047dd67eSAttilio Rao 				/*
769047dd67eSAttilio Rao 				 * If the lock is expected to not panic just
770047dd67eSAttilio Rao 				 * give up and return.
771047dd67eSAttilio Rao 				 */
772047dd67eSAttilio Rao 				if (LK_TRYOP(flags)) {
773047dd67eSAttilio Rao 					LOCK_LOG2(lk,
774047dd67eSAttilio Rao 					    "%s: %p fails the try operation",
775047dd67eSAttilio Rao 					    __func__, lk);
776047dd67eSAttilio Rao 					error = EBUSY;
777047dd67eSAttilio Rao 					break;
778047dd67eSAttilio Rao 				}
779047dd67eSAttilio Rao 				if (flags & LK_INTERLOCK)
780047dd67eSAttilio Rao 					class->lc_unlock(ilk);
781047dd67eSAttilio Rao 		panic("%s: recursing on non recursive lockmgr %s @ %s:%d\n",
782047dd67eSAttilio Rao 				    __func__, iwmesg, file, line);
783047dd67eSAttilio Rao 			}
784047dd67eSAttilio Rao 			lk->lk_recurse++;
785047dd67eSAttilio Rao 			LOCK_LOG2(lk, "%s: %p recursing", __func__, lk);
786047dd67eSAttilio Rao 			LOCK_LOG_LOCK("XLOCK", &lk->lock_object, 0,
787047dd67eSAttilio Rao 			    lk->lk_recurse, file, line);
788e5f94314SAttilio Rao 			WITNESS_LOCK(&lk->lock_object, LOP_EXCLUSIVE |
789e5f94314SAttilio Rao 			    LK_TRYWIT(flags), file, line);
790047dd67eSAttilio Rao 			TD_LOCKS_INC(curthread);
791047dd67eSAttilio Rao 			break;
792047dd67eSAttilio Rao 		}
793047dd67eSAttilio Rao 
794047dd67eSAttilio Rao 		while (!atomic_cmpset_acq_ptr(&lk->lk_lock, LK_UNLOCKED,
795047dd67eSAttilio Rao 		    tid)) {
796f5f9340bSFabien Thomas #ifdef HWPMC_HOOKS
797f5f9340bSFabien Thomas 			PMC_SOFT_CALL( , , lock, failed);
798f5f9340bSFabien Thomas #endif
799047dd67eSAttilio Rao 			lock_profile_obtain_lock_failed(&lk->lock_object,
800047dd67eSAttilio Rao 			    &contested, &waittime);
801047dd67eSAttilio Rao 
802047dd67eSAttilio Rao 			/*
803047dd67eSAttilio Rao 			 * If the lock is expected to not sleep just give up
804047dd67eSAttilio Rao 			 * and return.
805047dd67eSAttilio Rao 			 */
806047dd67eSAttilio Rao 			if (LK_TRYOP(flags)) {
807047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p fails the try operation",
808047dd67eSAttilio Rao 				    __func__, lk);
809047dd67eSAttilio Rao 				error = EBUSY;
810047dd67eSAttilio Rao 				break;
811047dd67eSAttilio Rao 			}
812047dd67eSAttilio Rao 
813651175c9SAttilio Rao #ifdef ADAPTIVE_LOCKMGRS
814651175c9SAttilio Rao 			/*
815651175c9SAttilio Rao 			 * If the owner is running on another CPU, spin until
816651175c9SAttilio Rao 			 * the owner stops running or the state of the lock
817651175c9SAttilio Rao 			 * changes.
818651175c9SAttilio Rao 			 */
819651175c9SAttilio Rao 			x = lk->lk_lock;
820651175c9SAttilio Rao 			if (LK_CAN_ADAPT(lk, flags) && (x & LK_SHARE) == 0 &&
821651175c9SAttilio Rao 			    LK_HOLDER(x) != LK_KERNPROC) {
822651175c9SAttilio Rao 				owner = (struct thread *)LK_HOLDER(x);
823651175c9SAttilio Rao 				if (LOCK_LOG_TEST(&lk->lock_object, 0))
824651175c9SAttilio Rao 					CTR3(KTR_LOCK,
825651175c9SAttilio Rao 					    "%s: spinning on %p held by %p",
826651175c9SAttilio Rao 					    __func__, lk, owner);
8272cba8dd3SJohn Baldwin 				KTR_STATE1(KTR_SCHED, "thread",
8282cba8dd3SJohn Baldwin 				    sched_tdname(td), "spinning",
8292cba8dd3SJohn Baldwin 				    "lockname:\"%s\"", lk->lock_object.lo_name);
830651175c9SAttilio Rao 
831651175c9SAttilio Rao 				/*
832651175c9SAttilio Rao 				 * If we are holding also an interlock drop it
833651175c9SAttilio Rao 				 * in order to avoid a deadlock if the lockmgr
834651175c9SAttilio Rao 				 * owner is adaptively spinning on the
835651175c9SAttilio Rao 				 * interlock itself.
836651175c9SAttilio Rao 				 */
837651175c9SAttilio Rao 				if (flags & LK_INTERLOCK) {
838651175c9SAttilio Rao 					class->lc_unlock(ilk);
839651175c9SAttilio Rao 					flags &= ~LK_INTERLOCK;
840651175c9SAttilio Rao 				}
841651175c9SAttilio Rao 				GIANT_SAVE();
842651175c9SAttilio Rao 				while (LK_HOLDER(lk->lk_lock) ==
843651175c9SAttilio Rao 				    (uintptr_t)owner && TD_IS_RUNNING(owner))
844651175c9SAttilio Rao 					cpu_spinwait();
8452cba8dd3SJohn Baldwin 				KTR_STATE0(KTR_SCHED, "thread",
8462cba8dd3SJohn Baldwin 				    sched_tdname(td), "running");
8478d3635c4SAttilio Rao 				GIANT_RESTORE();
8488d3635c4SAttilio Rao 				continue;
849651175c9SAttilio Rao 			} else if (LK_CAN_ADAPT(lk, flags) &&
850651175c9SAttilio Rao 			    (x & LK_SHARE) != 0 && LK_SHARERS(x) &&
851651175c9SAttilio Rao 			    spintries < alk_retries) {
852651175c9SAttilio Rao 				if ((x & LK_EXCLUSIVE_SPINNERS) == 0 &&
853651175c9SAttilio Rao 				    !atomic_cmpset_ptr(&lk->lk_lock, x,
854651175c9SAttilio Rao 				    x | LK_EXCLUSIVE_SPINNERS))
855651175c9SAttilio Rao 					continue;
8562cba8dd3SJohn Baldwin 				KTR_STATE1(KTR_SCHED, "thread",
8572cba8dd3SJohn Baldwin 				    sched_tdname(td), "spinning",
8582cba8dd3SJohn Baldwin 				    "lockname:\"%s\"", lk->lock_object.lo_name);
859651175c9SAttilio Rao 				if (flags & LK_INTERLOCK) {
860651175c9SAttilio Rao 					class->lc_unlock(ilk);
861651175c9SAttilio Rao 					flags &= ~LK_INTERLOCK;
862651175c9SAttilio Rao 				}
863651175c9SAttilio Rao 				GIANT_SAVE();
864651175c9SAttilio Rao 				spintries++;
865651175c9SAttilio Rao 				for (i = 0; i < alk_loops; i++) {
866651175c9SAttilio Rao 					if (LOCK_LOG_TEST(&lk->lock_object, 0))
867651175c9SAttilio Rao 						CTR4(KTR_LOCK,
868651175c9SAttilio Rao 				    "%s: shared spinning on %p with %u and %u",
869651175c9SAttilio Rao 						    __func__, lk, spintries, i);
870651175c9SAttilio Rao 					if ((lk->lk_lock &
871651175c9SAttilio Rao 					    LK_EXCLUSIVE_SPINNERS) == 0)
872651175c9SAttilio Rao 						break;
873651175c9SAttilio Rao 					cpu_spinwait();
874651175c9SAttilio Rao 				}
8752cba8dd3SJohn Baldwin 				KTR_STATE0(KTR_SCHED, "thread",
8762cba8dd3SJohn Baldwin 				    sched_tdname(td), "running");
8778d3635c4SAttilio Rao 				GIANT_RESTORE();
878651175c9SAttilio Rao 				if (i != alk_loops)
879651175c9SAttilio Rao 					continue;
880651175c9SAttilio Rao 			}
881651175c9SAttilio Rao #endif
882651175c9SAttilio Rao 
883047dd67eSAttilio Rao 			/*
884047dd67eSAttilio Rao 			 * Acquire the sleepqueue chain lock because we
885047dd67eSAttilio Rao 			 * probably will need to manipulate waiters flags.
886047dd67eSAttilio Rao 			 */
887047dd67eSAttilio Rao 			sleepq_lock(&lk->lock_object);
888047dd67eSAttilio Rao 			x = lk->lk_lock;
889047dd67eSAttilio Rao 
890047dd67eSAttilio Rao 			/*
891047dd67eSAttilio Rao 			 * if the lock has been released while we spun on
892047dd67eSAttilio Rao 			 * the sleepqueue chain lock just try again.
893047dd67eSAttilio Rao 			 */
894047dd67eSAttilio Rao 			if (x == LK_UNLOCKED) {
895047dd67eSAttilio Rao 				sleepq_release(&lk->lock_object);
896047dd67eSAttilio Rao 				continue;
897047dd67eSAttilio Rao 			}
898047dd67eSAttilio Rao 
899651175c9SAttilio Rao #ifdef ADAPTIVE_LOCKMGRS
900651175c9SAttilio Rao 			/*
901651175c9SAttilio Rao 			 * The current lock owner might have started executing
902651175c9SAttilio Rao 			 * on another CPU (or the lock could have changed
903651175c9SAttilio Rao 			 * owner) while we were waiting on the sleepqueue
904651175c9SAttilio Rao 			 * chain lock.  If so, drop the sleepqueue lock and try
905651175c9SAttilio Rao 			 * again.
906651175c9SAttilio Rao 			 */
907651175c9SAttilio Rao 			if (LK_CAN_ADAPT(lk, flags) && (x & LK_SHARE) == 0 &&
908651175c9SAttilio Rao 			    LK_HOLDER(x) != LK_KERNPROC) {
909651175c9SAttilio Rao 				owner = (struct thread *)LK_HOLDER(x);
910651175c9SAttilio Rao 				if (TD_IS_RUNNING(owner)) {
911651175c9SAttilio Rao 					sleepq_release(&lk->lock_object);
912651175c9SAttilio Rao 					continue;
913651175c9SAttilio Rao 				}
914651175c9SAttilio Rao 			}
915651175c9SAttilio Rao #endif
916651175c9SAttilio Rao 
917047dd67eSAttilio Rao 			/*
918047dd67eSAttilio Rao 			 * The lock can be in the state where there is a
919047dd67eSAttilio Rao 			 * pending queue of waiters, but still no owner.
920047dd67eSAttilio Rao 			 * This happens when the lock is contested and an
921047dd67eSAttilio Rao 			 * owner is going to claim the lock.
922047dd67eSAttilio Rao 			 * If curthread is the one successfully acquiring it
923047dd67eSAttilio Rao 			 * claim lock ownership and return, preserving waiters
924047dd67eSAttilio Rao 			 * flags.
925047dd67eSAttilio Rao 			 */
926651175c9SAttilio Rao 			v = x & (LK_ALL_WAITERS | LK_EXCLUSIVE_SPINNERS);
927651175c9SAttilio Rao 			if ((x & ~v) == LK_UNLOCKED) {
928651175c9SAttilio Rao 				v &= ~LK_EXCLUSIVE_SPINNERS;
929047dd67eSAttilio Rao 				if (atomic_cmpset_acq_ptr(&lk->lk_lock, x,
930047dd67eSAttilio Rao 				    tid | v)) {
931047dd67eSAttilio Rao 					sleepq_release(&lk->lock_object);
932047dd67eSAttilio Rao 					LOCK_LOG2(lk,
933047dd67eSAttilio Rao 					    "%s: %p claimed by a new writer",
934047dd67eSAttilio Rao 					    __func__, lk);
935047dd67eSAttilio Rao 					break;
936047dd67eSAttilio Rao 				}
937047dd67eSAttilio Rao 				sleepq_release(&lk->lock_object);
938047dd67eSAttilio Rao 				continue;
939047dd67eSAttilio Rao 			}
940047dd67eSAttilio Rao 
941047dd67eSAttilio Rao 			/*
942047dd67eSAttilio Rao 			 * Try to set the LK_EXCLUSIVE_WAITERS flag.  If we
943047dd67eSAttilio Rao 			 * fail, loop back and retry.
944047dd67eSAttilio Rao 			 */
945047dd67eSAttilio Rao 			if ((x & LK_EXCLUSIVE_WAITERS) == 0) {
946047dd67eSAttilio Rao 				if (!atomic_cmpset_ptr(&lk->lk_lock, x,
947047dd67eSAttilio Rao 				    x | LK_EXCLUSIVE_WAITERS)) {
948047dd67eSAttilio Rao 					sleepq_release(&lk->lock_object);
949047dd67eSAttilio Rao 					continue;
950047dd67eSAttilio Rao 				}
951047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p set excl waiters flag",
952047dd67eSAttilio Rao 				    __func__, lk);
953047dd67eSAttilio Rao 			}
954047dd67eSAttilio Rao 
955047dd67eSAttilio Rao 			/*
956047dd67eSAttilio Rao 			 * As far as we have been unable to acquire the
957047dd67eSAttilio Rao 			 * exclusive lock and the exclusive waiters flag
958047dd67eSAttilio Rao 			 * is set, we will sleep.
959047dd67eSAttilio Rao 			 */
960047dd67eSAttilio Rao 			error = sleeplk(lk, flags, ilk, iwmesg, ipri, itimo,
961047dd67eSAttilio Rao 			    SQ_EXCLUSIVE_QUEUE);
962047dd67eSAttilio Rao 			flags &= ~LK_INTERLOCK;
963047dd67eSAttilio Rao 			if (error) {
964047dd67eSAttilio Rao 				LOCK_LOG3(lk,
965047dd67eSAttilio Rao 				    "%s: interrupted sleep for %p with %d",
966047dd67eSAttilio Rao 				    __func__, lk, error);
967047dd67eSAttilio Rao 				break;
968047dd67eSAttilio Rao 			}
969047dd67eSAttilio Rao 			LOCK_LOG2(lk, "%s: %p resuming from the sleep queue",
970047dd67eSAttilio Rao 			    __func__, lk);
971047dd67eSAttilio Rao 		}
972047dd67eSAttilio Rao 		if (error == 0) {
973047dd67eSAttilio Rao 			lock_profile_obtain_lock_success(&lk->lock_object,
974047dd67eSAttilio Rao 			    contested, waittime, file, line);
975047dd67eSAttilio Rao 			LOCK_LOG_LOCK("XLOCK", &lk->lock_object, 0,
976047dd67eSAttilio Rao 			    lk->lk_recurse, file, line);
977e5f94314SAttilio Rao 			WITNESS_LOCK(&lk->lock_object, LOP_EXCLUSIVE |
978e5f94314SAttilio Rao 			    LK_TRYWIT(flags), file, line);
979047dd67eSAttilio Rao 			TD_LOCKS_INC(curthread);
980047dd67eSAttilio Rao 			STACK_SAVE(lk);
981047dd67eSAttilio Rao 		}
982047dd67eSAttilio Rao 		break;
983047dd67eSAttilio Rao 	case LK_DOWNGRADE:
9841c7d98d0SAttilio Rao 		_lockmgr_assert(lk, KA_XLOCKED, file, line);
985e5f94314SAttilio Rao 		LOCK_LOG_LOCK("XDOWNGRADE", &lk->lock_object, 0, 0, file, line);
986e5f94314SAttilio Rao 		WITNESS_DOWNGRADE(&lk->lock_object, 0, file, line);
9871c7d98d0SAttilio Rao 
9881c7d98d0SAttilio Rao 		/*
9891c7d98d0SAttilio Rao 		 * Panic if the lock is recursed.
9901c7d98d0SAttilio Rao 		 */
9911c7d98d0SAttilio Rao 		if (lockmgr_xlocked(lk) && lockmgr_recursed(lk)) {
9921c7d98d0SAttilio Rao 			if (flags & LK_INTERLOCK)
9931c7d98d0SAttilio Rao 				class->lc_unlock(ilk);
9941c7d98d0SAttilio Rao 			panic("%s: downgrade a recursed lockmgr %s @ %s:%d\n",
9951c7d98d0SAttilio Rao 			    __func__, iwmesg, file, line);
9961c7d98d0SAttilio Rao 		}
997e5f94314SAttilio Rao 		TD_SLOCKS_INC(curthread);
998047dd67eSAttilio Rao 
999047dd67eSAttilio Rao 		/*
1000047dd67eSAttilio Rao 		 * In order to preserve waiters flags, just spin.
1001047dd67eSAttilio Rao 		 */
1002047dd67eSAttilio Rao 		for (;;) {
1003651175c9SAttilio Rao 			x = lk->lk_lock;
1004651175c9SAttilio Rao 			MPASS((x & LK_EXCLUSIVE_SPINNERS) == 0);
1005651175c9SAttilio Rao 			x &= LK_ALL_WAITERS;
1006047dd67eSAttilio Rao 			if (atomic_cmpset_rel_ptr(&lk->lk_lock, tid | x,
1007e5f94314SAttilio Rao 			    LK_SHARERS_LOCK(1) | x))
1008047dd67eSAttilio Rao 				break;
1009047dd67eSAttilio Rao 			cpu_spinwait();
1010047dd67eSAttilio Rao 		}
1011047dd67eSAttilio Rao 		break;
1012047dd67eSAttilio Rao 	case LK_RELEASE:
1013047dd67eSAttilio Rao 		_lockmgr_assert(lk, KA_LOCKED, file, line);
1014047dd67eSAttilio Rao 		x = lk->lk_lock;
1015047dd67eSAttilio Rao 
1016047dd67eSAttilio Rao 		if ((x & LK_SHARE) == 0) {
1017047dd67eSAttilio Rao 
1018047dd67eSAttilio Rao 			/*
1019047dd67eSAttilio Rao 			 * As first option, treat the lock as if it has not
1020047dd67eSAttilio Rao 			 * any waiter.
1021047dd67eSAttilio Rao 			 * Fix-up the tid var if the lock has been disowned.
1022047dd67eSAttilio Rao 			 */
1023047dd67eSAttilio Rao 			if (LK_HOLDER(x) == LK_KERNPROC)
1024047dd67eSAttilio Rao 				tid = LK_KERNPROC;
1025e5f94314SAttilio Rao 			else {
1026e5f94314SAttilio Rao 				WITNESS_UNLOCK(&lk->lock_object, LOP_EXCLUSIVE,
1027e5f94314SAttilio Rao 				    file, line);
1028047dd67eSAttilio Rao 				TD_LOCKS_DEC(curthread);
1029e5f94314SAttilio Rao 			}
1030047dd67eSAttilio Rao 			LOCK_LOG_LOCK("XUNLOCK", &lk->lock_object, 0,
1031047dd67eSAttilio Rao 			    lk->lk_recurse, file, line);
1032047dd67eSAttilio Rao 
1033047dd67eSAttilio Rao 			/*
1034047dd67eSAttilio Rao 			 * The lock is held in exclusive mode.
1035047dd67eSAttilio Rao 			 * If the lock is recursed also, then unrecurse it.
1036047dd67eSAttilio Rao 			 */
1037047dd67eSAttilio Rao 			if (lockmgr_xlocked(lk) && lockmgr_recursed(lk)) {
1038047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p unrecursing", __func__,
1039047dd67eSAttilio Rao 				    lk);
1040047dd67eSAttilio Rao 				lk->lk_recurse--;
1041047dd67eSAttilio Rao 				break;
1042047dd67eSAttilio Rao 			}
104304a28689SJeff Roberson 			if (tid != LK_KERNPROC)
1044047dd67eSAttilio Rao 				lock_profile_release_lock(&lk->lock_object);
1045047dd67eSAttilio Rao 
1046047dd67eSAttilio Rao 			if (atomic_cmpset_rel_ptr(&lk->lk_lock, tid,
1047047dd67eSAttilio Rao 			    LK_UNLOCKED))
1048047dd67eSAttilio Rao 				break;
1049047dd67eSAttilio Rao 
1050047dd67eSAttilio Rao 			sleepq_lock(&lk->lock_object);
1051651175c9SAttilio Rao 			x = lk->lk_lock;
1052047dd67eSAttilio Rao 			v = LK_UNLOCKED;
1053047dd67eSAttilio Rao 
1054047dd67eSAttilio Rao 			/*
1055047dd67eSAttilio Rao 		 	 * If the lock has exclusive waiters, give them
1056047dd67eSAttilio Rao 			 * preference in order to avoid deadlock with
1057047dd67eSAttilio Rao 			 * shared runners up.
10582028867dSAttilio Rao 			 * If interruptible sleeps left the exclusive queue
10592028867dSAttilio Rao 			 * empty avoid a starvation for the threads sleeping
10602028867dSAttilio Rao 			 * on the shared queue by giving them precedence
10612028867dSAttilio Rao 			 * and cleaning up the exclusive waiters bit anyway.
1062c636ba83SAttilio Rao 			 * Please note that lk_exslpfail count may be lying
1063c636ba83SAttilio Rao 			 * about the real number of waiters with the
1064c636ba83SAttilio Rao 			 * LK_SLEEPFAIL flag on because they may be used in
1065c636ba83SAttilio Rao 			 * conjunction with interruptible sleeps so
1066aab9c8c2SAttilio Rao 			 * lk_exslpfail might be considered an 'upper limit'
1067aab9c8c2SAttilio Rao 			 * bound, including the edge cases.
1068047dd67eSAttilio Rao 			 */
1069651175c9SAttilio Rao 			MPASS((x & LK_EXCLUSIVE_SPINNERS) == 0);
10702028867dSAttilio Rao 			realexslp = sleepq_sleepcnt(&lk->lock_object,
10712028867dSAttilio Rao 			    SQ_EXCLUSIVE_QUEUE);
10722028867dSAttilio Rao 			if ((x & LK_EXCLUSIVE_WAITERS) != 0 && realexslp != 0) {
10732028867dSAttilio Rao 				if (lk->lk_exslpfail < realexslp) {
10742028867dSAttilio Rao 					lk->lk_exslpfail = 0;
1075047dd67eSAttilio Rao 					queue = SQ_EXCLUSIVE_QUEUE;
1076047dd67eSAttilio Rao 					v |= (x & LK_SHARED_WAITERS);
1077047dd67eSAttilio Rao 				} else {
10782028867dSAttilio Rao 					lk->lk_exslpfail = 0;
10792028867dSAttilio Rao 					LOCK_LOG2(lk,
10802028867dSAttilio Rao 					"%s: %p has only LK_SLEEPFAIL sleepers",
10812028867dSAttilio Rao 					    __func__, lk);
10822028867dSAttilio Rao 					LOCK_LOG2(lk,
10832028867dSAttilio Rao 			"%s: %p waking up threads on the exclusive queue",
10842028867dSAttilio Rao 					    __func__, lk);
10852028867dSAttilio Rao 					wakeup_swapper =
10862028867dSAttilio Rao 					    sleepq_broadcast(&lk->lock_object,
10872028867dSAttilio Rao 					    SLEEPQ_LK, 0, SQ_EXCLUSIVE_QUEUE);
10882028867dSAttilio Rao 					queue = SQ_SHARED_QUEUE;
10892028867dSAttilio Rao 				}
10902028867dSAttilio Rao 			} else {
10919dbf7a62SAttilio Rao 
10929dbf7a62SAttilio Rao 				/*
10939dbf7a62SAttilio Rao 				 * Exclusive waiters sleeping with LK_SLEEPFAIL
10949dbf7a62SAttilio Rao 				 * on and using interruptible sleeps/timeout
10959dbf7a62SAttilio Rao 				 * may have left spurious lk_exslpfail counts
10969dbf7a62SAttilio Rao 				 * on, so clean it up anyway.
10979dbf7a62SAttilio Rao 				 */
10989dbf7a62SAttilio Rao 				lk->lk_exslpfail = 0;
1099047dd67eSAttilio Rao 				queue = SQ_SHARED_QUEUE;
1100047dd67eSAttilio Rao 			}
1101047dd67eSAttilio Rao 
1102047dd67eSAttilio Rao 			LOCK_LOG3(lk,
1103047dd67eSAttilio Rao 			    "%s: %p waking up threads on the %s queue",
1104047dd67eSAttilio Rao 			    __func__, lk, queue == SQ_SHARED_QUEUE ? "shared" :
1105047dd67eSAttilio Rao 			    "exclusive");
1106047dd67eSAttilio Rao 			atomic_store_rel_ptr(&lk->lk_lock, v);
11072028867dSAttilio Rao 			wakeup_swapper |= sleepq_broadcast(&lk->lock_object,
1108da7bbd2cSJohn Baldwin 			    SLEEPQ_LK, 0, queue);
1109047dd67eSAttilio Rao 			sleepq_release(&lk->lock_object);
1110047dd67eSAttilio Rao 			break;
1111047dd67eSAttilio Rao 		} else
1112da7bbd2cSJohn Baldwin 			wakeup_swapper = wakeupshlk(lk, file, line);
1113047dd67eSAttilio Rao 		break;
1114047dd67eSAttilio Rao 	case LK_DRAIN:
1115e5f94314SAttilio Rao 		if (LK_CAN_WITNESS(flags))
1116e5f94314SAttilio Rao 			WITNESS_CHECKORDER(&lk->lock_object, LOP_NEWORDER |
111724150d37SJohn Baldwin 			    LOP_EXCLUSIVE, file, line, flags & LK_INTERLOCK ?
111824150d37SJohn Baldwin 			    ilk : NULL);
1119047dd67eSAttilio Rao 
1120047dd67eSAttilio Rao 		/*
112196f1567fSKonstantin Belousov 		 * Trying to drain a lock we already own will result in a
1122047dd67eSAttilio Rao 		 * deadlock.
1123047dd67eSAttilio Rao 		 */
1124047dd67eSAttilio Rao 		if (lockmgr_xlocked(lk)) {
1125047dd67eSAttilio Rao 			if (flags & LK_INTERLOCK)
1126047dd67eSAttilio Rao 				class->lc_unlock(ilk);
1127047dd67eSAttilio Rao 			panic("%s: draining %s with the lock held @ %s:%d\n",
1128047dd67eSAttilio Rao 			    __func__, iwmesg, file, line);
1129047dd67eSAttilio Rao 		}
1130047dd67eSAttilio Rao 
1131047dd67eSAttilio Rao 		while (!atomic_cmpset_acq_ptr(&lk->lk_lock, LK_UNLOCKED, tid)) {
1132f5f9340bSFabien Thomas #ifdef HWPMC_HOOKS
1133f5f9340bSFabien Thomas 			PMC_SOFT_CALL( , , lock, failed);
1134f5f9340bSFabien Thomas #endif
1135047dd67eSAttilio Rao 			lock_profile_obtain_lock_failed(&lk->lock_object,
1136047dd67eSAttilio Rao 			    &contested, &waittime);
1137047dd67eSAttilio Rao 
1138047dd67eSAttilio Rao 			/*
1139047dd67eSAttilio Rao 			 * If the lock is expected to not sleep just give up
1140047dd67eSAttilio Rao 			 * and return.
1141047dd67eSAttilio Rao 			 */
1142047dd67eSAttilio Rao 			if (LK_TRYOP(flags)) {
1143047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p fails the try operation",
1144047dd67eSAttilio Rao 				    __func__, lk);
1145047dd67eSAttilio Rao 				error = EBUSY;
1146047dd67eSAttilio Rao 				break;
1147047dd67eSAttilio Rao 			}
1148047dd67eSAttilio Rao 
1149047dd67eSAttilio Rao 			/*
1150047dd67eSAttilio Rao 			 * Acquire the sleepqueue chain lock because we
1151047dd67eSAttilio Rao 			 * probably will need to manipulate waiters flags.
1152047dd67eSAttilio Rao 			 */
1153047dd67eSAttilio Rao 			sleepq_lock(&lk->lock_object);
1154047dd67eSAttilio Rao 			x = lk->lk_lock;
1155047dd67eSAttilio Rao 
1156047dd67eSAttilio Rao 			/*
1157047dd67eSAttilio Rao 			 * if the lock has been released while we spun on
1158047dd67eSAttilio Rao 			 * the sleepqueue chain lock just try again.
1159047dd67eSAttilio Rao 			 */
1160047dd67eSAttilio Rao 			if (x == LK_UNLOCKED) {
1161047dd67eSAttilio Rao 				sleepq_release(&lk->lock_object);
1162047dd67eSAttilio Rao 				continue;
1163047dd67eSAttilio Rao 			}
1164047dd67eSAttilio Rao 
1165651175c9SAttilio Rao 			v = x & (LK_ALL_WAITERS | LK_EXCLUSIVE_SPINNERS);
1166651175c9SAttilio Rao 			if ((x & ~v) == LK_UNLOCKED) {
1167651175c9SAttilio Rao 				v = (x & ~LK_EXCLUSIVE_SPINNERS);
11682028867dSAttilio Rao 
11692028867dSAttilio Rao 				/*
11702028867dSAttilio Rao 				 * If interruptible sleeps left the exclusive
11712028867dSAttilio Rao 				 * queue empty avoid a starvation for the
11722028867dSAttilio Rao 				 * threads sleeping on the shared queue by
11732028867dSAttilio Rao 				 * giving them precedence and cleaning up the
11742028867dSAttilio Rao 				 * exclusive waiters bit anyway.
1175c636ba83SAttilio Rao 				 * Please note that lk_exslpfail count may be
1176c636ba83SAttilio Rao 				 * lying about the real number of waiters with
1177c636ba83SAttilio Rao 				 * the LK_SLEEPFAIL flag on because they may
1178c636ba83SAttilio Rao 				 * be used in conjunction with interruptible
1179aab9c8c2SAttilio Rao 				 * sleeps so lk_exslpfail might be considered
1180aab9c8c2SAttilio Rao 				 * an 'upper limit' bound, including the edge
1181c636ba83SAttilio Rao 				 * cases.
11822028867dSAttilio Rao 				 */
1183047dd67eSAttilio Rao 				if (v & LK_EXCLUSIVE_WAITERS) {
1184047dd67eSAttilio Rao 					queue = SQ_EXCLUSIVE_QUEUE;
1185047dd67eSAttilio Rao 					v &= ~LK_EXCLUSIVE_WAITERS;
1186047dd67eSAttilio Rao 				} else {
11879dbf7a62SAttilio Rao 
11889dbf7a62SAttilio Rao 					/*
11899dbf7a62SAttilio Rao 					 * Exclusive waiters sleeping with
11909dbf7a62SAttilio Rao 					 * LK_SLEEPFAIL on and using
11919dbf7a62SAttilio Rao 					 * interruptible sleeps/timeout may
11929dbf7a62SAttilio Rao 					 * have left spurious lk_exslpfail
11939dbf7a62SAttilio Rao 					 * counts on, so clean it up anyway.
11949dbf7a62SAttilio Rao 					 */
1195047dd67eSAttilio Rao 					MPASS(v & LK_SHARED_WAITERS);
11969dbf7a62SAttilio Rao 					lk->lk_exslpfail = 0;
1197047dd67eSAttilio Rao 					queue = SQ_SHARED_QUEUE;
1198047dd67eSAttilio Rao 					v &= ~LK_SHARED_WAITERS;
1199047dd67eSAttilio Rao 				}
12002028867dSAttilio Rao 				if (queue == SQ_EXCLUSIVE_QUEUE) {
12012028867dSAttilio Rao 					realexslp =
12022028867dSAttilio Rao 					    sleepq_sleepcnt(&lk->lock_object,
12032028867dSAttilio Rao 					    SQ_EXCLUSIVE_QUEUE);
12042028867dSAttilio Rao 					if (lk->lk_exslpfail >= realexslp) {
12052028867dSAttilio Rao 						lk->lk_exslpfail = 0;
12062028867dSAttilio Rao 						queue = SQ_SHARED_QUEUE;
12072028867dSAttilio Rao 						v &= ~LK_SHARED_WAITERS;
12082028867dSAttilio Rao 						if (realexslp != 0) {
12092028867dSAttilio Rao 							LOCK_LOG2(lk,
12102028867dSAttilio Rao 					"%s: %p has only LK_SLEEPFAIL sleepers",
12112028867dSAttilio Rao 							    __func__, lk);
12122028867dSAttilio Rao 							LOCK_LOG2(lk,
12132028867dSAttilio Rao 			"%s: %p waking up threads on the exclusive queue",
12142028867dSAttilio Rao 							    __func__, lk);
12152028867dSAttilio Rao 							wakeup_swapper =
12162028867dSAttilio Rao 							    sleepq_broadcast(
12172028867dSAttilio Rao 							    &lk->lock_object,
12182028867dSAttilio Rao 							    SLEEPQ_LK, 0,
12192028867dSAttilio Rao 							    SQ_EXCLUSIVE_QUEUE);
12202028867dSAttilio Rao 						}
12212028867dSAttilio Rao 					} else
12222028867dSAttilio Rao 						lk->lk_exslpfail = 0;
12232028867dSAttilio Rao 				}
1224047dd67eSAttilio Rao 				if (!atomic_cmpset_ptr(&lk->lk_lock, x, v)) {
1225047dd67eSAttilio Rao 					sleepq_release(&lk->lock_object);
1226047dd67eSAttilio Rao 					continue;
1227047dd67eSAttilio Rao 				}
1228047dd67eSAttilio Rao 				LOCK_LOG3(lk,
1229047dd67eSAttilio Rao 				"%s: %p waking up all threads on the %s queue",
1230047dd67eSAttilio Rao 				    __func__, lk, queue == SQ_SHARED_QUEUE ?
1231047dd67eSAttilio Rao 				    "shared" : "exclusive");
1232814f26daSJohn Baldwin 				wakeup_swapper |= sleepq_broadcast(
1233da7bbd2cSJohn Baldwin 				    &lk->lock_object, SLEEPQ_LK, 0, queue);
1234047dd67eSAttilio Rao 
1235047dd67eSAttilio Rao 				/*
1236047dd67eSAttilio Rao 				 * If shared waiters have been woken up we need
1237047dd67eSAttilio Rao 				 * to wait for one of them to acquire the lock
1238047dd67eSAttilio Rao 				 * before setting the exclusive waiters in
1239047dd67eSAttilio Rao 				 * order to avoid a deadlock.
1240047dd67eSAttilio Rao 				 */
1241047dd67eSAttilio Rao 				if (queue == SQ_SHARED_QUEUE) {
1242047dd67eSAttilio Rao 					for (v = lk->lk_lock;
1243047dd67eSAttilio Rao 					    (v & LK_SHARE) && !LK_SHARERS(v);
1244047dd67eSAttilio Rao 					    v = lk->lk_lock)
1245047dd67eSAttilio Rao 						cpu_spinwait();
1246047dd67eSAttilio Rao 				}
1247047dd67eSAttilio Rao 			}
1248047dd67eSAttilio Rao 
1249047dd67eSAttilio Rao 			/*
1250047dd67eSAttilio Rao 			 * Try to set the LK_EXCLUSIVE_WAITERS flag.  If we
1251047dd67eSAttilio Rao 			 * fail, loop back and retry.
1252047dd67eSAttilio Rao 			 */
1253047dd67eSAttilio Rao 			if ((x & LK_EXCLUSIVE_WAITERS) == 0) {
1254047dd67eSAttilio Rao 				if (!atomic_cmpset_ptr(&lk->lk_lock, x,
1255047dd67eSAttilio Rao 				    x | LK_EXCLUSIVE_WAITERS)) {
1256047dd67eSAttilio Rao 					sleepq_release(&lk->lock_object);
1257047dd67eSAttilio Rao 					continue;
1258047dd67eSAttilio Rao 				}
1259047dd67eSAttilio Rao 				LOCK_LOG2(lk, "%s: %p set drain waiters flag",
1260047dd67eSAttilio Rao 				    __func__, lk);
1261047dd67eSAttilio Rao 			}
1262047dd67eSAttilio Rao 
1263047dd67eSAttilio Rao 			/*
1264047dd67eSAttilio Rao 			 * As far as we have been unable to acquire the
1265047dd67eSAttilio Rao 			 * exclusive lock and the exclusive waiters flag
1266047dd67eSAttilio Rao 			 * is set, we will sleep.
1267047dd67eSAttilio Rao 			 */
1268047dd67eSAttilio Rao 			if (flags & LK_INTERLOCK) {
1269047dd67eSAttilio Rao 				class->lc_unlock(ilk);
1270047dd67eSAttilio Rao 				flags &= ~LK_INTERLOCK;
1271047dd67eSAttilio Rao 			}
1272e5f94314SAttilio Rao 			GIANT_SAVE();
1273047dd67eSAttilio Rao 			sleepq_add(&lk->lock_object, NULL, iwmesg, SLEEPQ_LK,
1274047dd67eSAttilio Rao 			    SQ_EXCLUSIVE_QUEUE);
1275047dd67eSAttilio Rao 			sleepq_wait(&lk->lock_object, ipri & PRIMASK);
1276e5f94314SAttilio Rao 			GIANT_RESTORE();
1277047dd67eSAttilio Rao 			LOCK_LOG2(lk, "%s: %p resuming from the sleep queue",
1278047dd67eSAttilio Rao 			    __func__, lk);
1279047dd67eSAttilio Rao 		}
1280047dd67eSAttilio Rao 
1281047dd67eSAttilio Rao 		if (error == 0) {
1282047dd67eSAttilio Rao 			lock_profile_obtain_lock_success(&lk->lock_object,
1283047dd67eSAttilio Rao 			    contested, waittime, file, line);
1284047dd67eSAttilio Rao 			LOCK_LOG_LOCK("DRAIN", &lk->lock_object, 0,
1285047dd67eSAttilio Rao 			    lk->lk_recurse, file, line);
1286e5f94314SAttilio Rao 			WITNESS_LOCK(&lk->lock_object, LOP_EXCLUSIVE |
1287e5f94314SAttilio Rao 			    LK_TRYWIT(flags), file, line);
1288047dd67eSAttilio Rao 			TD_LOCKS_INC(curthread);
1289047dd67eSAttilio Rao 			STACK_SAVE(lk);
1290047dd67eSAttilio Rao 		}
1291047dd67eSAttilio Rao 		break;
1292047dd67eSAttilio Rao 	default:
1293047dd67eSAttilio Rao 		if (flags & LK_INTERLOCK)
1294047dd67eSAttilio Rao 			class->lc_unlock(ilk);
1295047dd67eSAttilio Rao 		panic("%s: unknown lockmgr request 0x%x\n", __func__, op);
1296047dd67eSAttilio Rao 	}
1297047dd67eSAttilio Rao 
1298047dd67eSAttilio Rao 	if (flags & LK_INTERLOCK)
1299047dd67eSAttilio Rao 		class->lc_unlock(ilk);
1300da7bbd2cSJohn Baldwin 	if (wakeup_swapper)
1301da7bbd2cSJohn Baldwin 		kick_proc0();
1302047dd67eSAttilio Rao 
1303047dd67eSAttilio Rao 	return (error);
1304047dd67eSAttilio Rao }
1305047dd67eSAttilio Rao 
1306d7a7e179SAttilio Rao void
1307047dd67eSAttilio Rao _lockmgr_disown(struct lock *lk, const char *file, int line)
1308047dd67eSAttilio Rao {
1309047dd67eSAttilio Rao 	uintptr_t tid, x;
1310047dd67eSAttilio Rao 
131135370593SAndriy Gapon 	if (SCHEDULER_STOPPED())
131235370593SAndriy Gapon 		return;
131335370593SAndriy Gapon 
1314047dd67eSAttilio Rao 	tid = (uintptr_t)curthread;
13151c7d98d0SAttilio Rao 	_lockmgr_assert(lk, KA_XLOCKED, file, line);
13161c7d98d0SAttilio Rao 
13171c7d98d0SAttilio Rao 	/*
13181c7d98d0SAttilio Rao 	 * Panic if the lock is recursed.
13191c7d98d0SAttilio Rao 	 */
13201c7d98d0SAttilio Rao 	if (lockmgr_xlocked(lk) && lockmgr_recursed(lk))
13211c7d98d0SAttilio Rao 		panic("%s: disown a recursed lockmgr @ %s:%d\n",
13221c7d98d0SAttilio Rao 		    __func__,  file, line);
1323047dd67eSAttilio Rao 
1324047dd67eSAttilio Rao 	/*
132596f1567fSKonstantin Belousov 	 * If the owner is already LK_KERNPROC just skip the whole operation.
1326047dd67eSAttilio Rao 	 */
1327047dd67eSAttilio Rao 	if (LK_HOLDER(lk->lk_lock) != tid)
1328047dd67eSAttilio Rao 		return;
132904a28689SJeff Roberson 	lock_profile_release_lock(&lk->lock_object);
1330e5f94314SAttilio Rao 	LOCK_LOG_LOCK("XDISOWN", &lk->lock_object, 0, 0, file, line);
1331e5f94314SAttilio Rao 	WITNESS_UNLOCK(&lk->lock_object, LOP_EXCLUSIVE, file, line);
1332e5f94314SAttilio Rao 	TD_LOCKS_DEC(curthread);
1333337c5ff4SAttilio Rao 	STACK_SAVE(lk);
1334047dd67eSAttilio Rao 
1335047dd67eSAttilio Rao 	/*
1336047dd67eSAttilio Rao 	 * In order to preserve waiters flags, just spin.
1337047dd67eSAttilio Rao 	 */
1338047dd67eSAttilio Rao 	for (;;) {
1339651175c9SAttilio Rao 		x = lk->lk_lock;
1340651175c9SAttilio Rao 		MPASS((x & LK_EXCLUSIVE_SPINNERS) == 0);
1341651175c9SAttilio Rao 		x &= LK_ALL_WAITERS;
134222dd228dSAttilio Rao 		if (atomic_cmpset_rel_ptr(&lk->lk_lock, tid | x,
1343e5f94314SAttilio Rao 		    LK_KERNPROC | x))
1344047dd67eSAttilio Rao 			return;
1345047dd67eSAttilio Rao 		cpu_spinwait();
1346047dd67eSAttilio Rao 	}
1347047dd67eSAttilio Rao }
1348047dd67eSAttilio Rao 
1349047dd67eSAttilio Rao void
1350d576deedSPawel Jakub Dawidek lockmgr_printinfo(const struct lock *lk)
1351d7a7e179SAttilio Rao {
1352d7a7e179SAttilio Rao 	struct thread *td;
1353047dd67eSAttilio Rao 	uintptr_t x;
1354d7a7e179SAttilio Rao 
1355047dd67eSAttilio Rao 	if (lk->lk_lock == LK_UNLOCKED)
1356047dd67eSAttilio Rao 		printf("lock type %s: UNLOCKED\n", lk->lock_object.lo_name);
1357047dd67eSAttilio Rao 	else if (lk->lk_lock & LK_SHARE)
1358047dd67eSAttilio Rao 		printf("lock type %s: SHARED (count %ju)\n",
1359047dd67eSAttilio Rao 		    lk->lock_object.lo_name,
1360047dd67eSAttilio Rao 		    (uintmax_t)LK_SHARERS(lk->lk_lock));
1361047dd67eSAttilio Rao 	else {
1362047dd67eSAttilio Rao 		td = lockmgr_xholder(lk);
1363*e64b4fa8SKonstantin Belousov 		if (td == (struct thread *)LK_KERNPROC)
1364*e64b4fa8SKonstantin Belousov 			printf("lock type %s: EXCL by KERNPROC\n",
1365*e64b4fa8SKonstantin Belousov 			    lk->lock_object.lo_name);
1366*e64b4fa8SKonstantin Belousov 		else
13672573ea5fSIvan Voras 			printf("lock type %s: EXCL by thread %p "
1368*e64b4fa8SKonstantin Belousov 			    "(pid %d, %s, tid %d)\n", lk->lock_object.lo_name,
1369*e64b4fa8SKonstantin Belousov 			    td, td->td_proc->p_pid, td->td_proc->p_comm,
1370*e64b4fa8SKonstantin Belousov 			    td->td_tid);
1371d7a7e179SAttilio Rao 	}
1372d7a7e179SAttilio Rao 
1373047dd67eSAttilio Rao 	x = lk->lk_lock;
1374047dd67eSAttilio Rao 	if (x & LK_EXCLUSIVE_WAITERS)
1375047dd67eSAttilio Rao 		printf(" with exclusive waiters pending\n");
1376047dd67eSAttilio Rao 	if (x & LK_SHARED_WAITERS)
1377047dd67eSAttilio Rao 		printf(" with shared waiters pending\n");
1378651175c9SAttilio Rao 	if (x & LK_EXCLUSIVE_SPINNERS)
1379651175c9SAttilio Rao 		printf(" with exclusive spinners pending\n");
1380047dd67eSAttilio Rao 
1381047dd67eSAttilio Rao 	STACK_PRINT(lk);
1382047dd67eSAttilio Rao }
1383047dd67eSAttilio Rao 
138499448ed1SJohn Dyson int
1385d576deedSPawel Jakub Dawidek lockstatus(const struct lock *lk)
138699448ed1SJohn Dyson {
1387047dd67eSAttilio Rao 	uintptr_t v, x;
1388047dd67eSAttilio Rao 	int ret;
138999448ed1SJohn Dyson 
1390047dd67eSAttilio Rao 	ret = LK_SHARED;
1391047dd67eSAttilio Rao 	x = lk->lk_lock;
1392047dd67eSAttilio Rao 	v = LK_HOLDER(x);
13930e9eb108SAttilio Rao 
1394047dd67eSAttilio Rao 	if ((x & LK_SHARE) == 0) {
1395047dd67eSAttilio Rao 		if (v == (uintptr_t)curthread || v == LK_KERNPROC)
1396047dd67eSAttilio Rao 			ret = LK_EXCLUSIVE;
13976bdfe06aSEivind Eklund 		else
1398047dd67eSAttilio Rao 			ret = LK_EXCLOTHER;
1399047dd67eSAttilio Rao 	} else if (x == LK_UNLOCKED)
1400047dd67eSAttilio Rao 		ret = 0;
140199448ed1SJohn Dyson 
1402047dd67eSAttilio Rao 	return (ret);
140353bf4bb2SPeter Wemm }
1404be6847d7SJohn Baldwin 
140584887fa3SAttilio Rao #ifdef INVARIANT_SUPPORT
1406de5b1952SAlexander Leidinger 
1407de5b1952SAlexander Leidinger FEATURE(invariant_support,
1408de5b1952SAlexander Leidinger     "Support for modules compiled with INVARIANTS option");
1409de5b1952SAlexander Leidinger 
141084887fa3SAttilio Rao #ifndef INVARIANTS
141184887fa3SAttilio Rao #undef	_lockmgr_assert
141284887fa3SAttilio Rao #endif
141384887fa3SAttilio Rao 
141484887fa3SAttilio Rao void
1415d576deedSPawel Jakub Dawidek _lockmgr_assert(const struct lock *lk, int what, const char *file, int line)
141684887fa3SAttilio Rao {
141784887fa3SAttilio Rao 	int slocked = 0;
141884887fa3SAttilio Rao 
141984887fa3SAttilio Rao 	if (panicstr != NULL)
142084887fa3SAttilio Rao 		return;
142184887fa3SAttilio Rao 	switch (what) {
142284887fa3SAttilio Rao 	case KA_SLOCKED:
142384887fa3SAttilio Rao 	case KA_SLOCKED | KA_NOTRECURSED:
142484887fa3SAttilio Rao 	case KA_SLOCKED | KA_RECURSED:
142584887fa3SAttilio Rao 		slocked = 1;
142684887fa3SAttilio Rao 	case KA_LOCKED:
142784887fa3SAttilio Rao 	case KA_LOCKED | KA_NOTRECURSED:
142884887fa3SAttilio Rao 	case KA_LOCKED | KA_RECURSED:
1429e5f94314SAttilio Rao #ifdef WITNESS
1430e5f94314SAttilio Rao 
1431e5f94314SAttilio Rao 		/*
1432e5f94314SAttilio Rao 		 * We cannot trust WITNESS if the lock is held in exclusive
1433e5f94314SAttilio Rao 		 * mode and a call to lockmgr_disown() happened.
1434e5f94314SAttilio Rao 		 * Workaround this skipping the check if the lock is held in
1435e5f94314SAttilio Rao 		 * exclusive mode even for the KA_LOCKED case.
1436e5f94314SAttilio Rao 		 */
1437e5f94314SAttilio Rao 		if (slocked || (lk->lk_lock & LK_SHARE)) {
1438e5f94314SAttilio Rao 			witness_assert(&lk->lock_object, what, file, line);
1439e5f94314SAttilio Rao 			break;
1440e5f94314SAttilio Rao 		}
1441e5f94314SAttilio Rao #endif
1442047dd67eSAttilio Rao 		if (lk->lk_lock == LK_UNLOCKED ||
1443047dd67eSAttilio Rao 		    ((lk->lk_lock & LK_SHARE) == 0 && (slocked ||
1444047dd67eSAttilio Rao 		    (!lockmgr_xlocked(lk) && !lockmgr_disowned(lk)))))
144584887fa3SAttilio Rao 			panic("Lock %s not %slocked @ %s:%d\n",
1446047dd67eSAttilio Rao 			    lk->lock_object.lo_name, slocked ? "share" : "",
144784887fa3SAttilio Rao 			    file, line);
1448047dd67eSAttilio Rao 
1449047dd67eSAttilio Rao 		if ((lk->lk_lock & LK_SHARE) == 0) {
1450047dd67eSAttilio Rao 			if (lockmgr_recursed(lk)) {
145184887fa3SAttilio Rao 				if (what & KA_NOTRECURSED)
145284887fa3SAttilio Rao 					panic("Lock %s recursed @ %s:%d\n",
1453047dd67eSAttilio Rao 					    lk->lock_object.lo_name, file,
1454047dd67eSAttilio Rao 					    line);
145584887fa3SAttilio Rao 			} else if (what & KA_RECURSED)
145684887fa3SAttilio Rao 				panic("Lock %s not recursed @ %s:%d\n",
1457047dd67eSAttilio Rao 				    lk->lock_object.lo_name, file, line);
145884887fa3SAttilio Rao 		}
145984887fa3SAttilio Rao 		break;
146084887fa3SAttilio Rao 	case KA_XLOCKED:
146184887fa3SAttilio Rao 	case KA_XLOCKED | KA_NOTRECURSED:
146284887fa3SAttilio Rao 	case KA_XLOCKED | KA_RECURSED:
1463047dd67eSAttilio Rao 		if (!lockmgr_xlocked(lk) && !lockmgr_disowned(lk))
146484887fa3SAttilio Rao 			panic("Lock %s not exclusively locked @ %s:%d\n",
1465047dd67eSAttilio Rao 			    lk->lock_object.lo_name, file, line);
1466047dd67eSAttilio Rao 		if (lockmgr_recursed(lk)) {
146784887fa3SAttilio Rao 			if (what & KA_NOTRECURSED)
146884887fa3SAttilio Rao 				panic("Lock %s recursed @ %s:%d\n",
1469047dd67eSAttilio Rao 				    lk->lock_object.lo_name, file, line);
147084887fa3SAttilio Rao 		} else if (what & KA_RECURSED)
147184887fa3SAttilio Rao 			panic("Lock %s not recursed @ %s:%d\n",
1472047dd67eSAttilio Rao 			    lk->lock_object.lo_name, file, line);
147384887fa3SAttilio Rao 		break;
147484887fa3SAttilio Rao 	case KA_UNLOCKED:
1475047dd67eSAttilio Rao 		if (lockmgr_xlocked(lk) || lockmgr_disowned(lk))
147684887fa3SAttilio Rao 			panic("Lock %s exclusively locked @ %s:%d\n",
1477047dd67eSAttilio Rao 			    lk->lock_object.lo_name, file, line);
147884887fa3SAttilio Rao 		break;
147984887fa3SAttilio Rao 	default:
1480047dd67eSAttilio Rao 		panic("Unknown lockmgr assertion: %d @ %s:%d\n", what, file,
1481047dd67eSAttilio Rao 		    line);
148284887fa3SAttilio Rao 	}
148384887fa3SAttilio Rao }
1484047dd67eSAttilio Rao #endif
148584887fa3SAttilio Rao 
1486be6847d7SJohn Baldwin #ifdef DDB
1487462a7addSJohn Baldwin int
1488462a7addSJohn Baldwin lockmgr_chain(struct thread *td, struct thread **ownerp)
1489462a7addSJohn Baldwin {
1490047dd67eSAttilio Rao 	struct lock *lk;
1491462a7addSJohn Baldwin 
1492047dd67eSAttilio Rao 	lk = td->td_wchan;
1493462a7addSJohn Baldwin 
1494047dd67eSAttilio Rao 	if (LOCK_CLASS(&lk->lock_object) != &lock_class_lockmgr)
1495462a7addSJohn Baldwin 		return (0);
1496047dd67eSAttilio Rao 	db_printf("blocked on lockmgr %s", lk->lock_object.lo_name);
1497047dd67eSAttilio Rao 	if (lk->lk_lock & LK_SHARE)
1498047dd67eSAttilio Rao 		db_printf("SHARED (count %ju)\n",
1499047dd67eSAttilio Rao 		    (uintmax_t)LK_SHARERS(lk->lk_lock));
1500047dd67eSAttilio Rao 	else
1501047dd67eSAttilio Rao 		db_printf("EXCL\n");
1502047dd67eSAttilio Rao 	*ownerp = lockmgr_xholder(lk);
1503462a7addSJohn Baldwin 
1504462a7addSJohn Baldwin 	return (1);
1505462a7addSJohn Baldwin }
1506462a7addSJohn Baldwin 
1507047dd67eSAttilio Rao static void
1508d576deedSPawel Jakub Dawidek db_show_lockmgr(const struct lock_object *lock)
1509be6847d7SJohn Baldwin {
1510be6847d7SJohn Baldwin 	struct thread *td;
1511d576deedSPawel Jakub Dawidek 	const struct lock *lk;
1512be6847d7SJohn Baldwin 
1513d576deedSPawel Jakub Dawidek 	lk = (const struct lock *)lock;
1514be6847d7SJohn Baldwin 
1515be6847d7SJohn Baldwin 	db_printf(" state: ");
1516047dd67eSAttilio Rao 	if (lk->lk_lock == LK_UNLOCKED)
1517be6847d7SJohn Baldwin 		db_printf("UNLOCKED\n");
1518047dd67eSAttilio Rao 	else if (lk->lk_lock & LK_SHARE)
1519047dd67eSAttilio Rao 		db_printf("SLOCK: %ju\n", (uintmax_t)LK_SHARERS(lk->lk_lock));
1520047dd67eSAttilio Rao 	else {
1521047dd67eSAttilio Rao 		td = lockmgr_xholder(lk);
1522047dd67eSAttilio Rao 		if (td == (struct thread *)LK_KERNPROC)
1523047dd67eSAttilio Rao 			db_printf("XLOCK: LK_KERNPROC\n");
1524047dd67eSAttilio Rao 		else
1525047dd67eSAttilio Rao 			db_printf("XLOCK: %p (tid %d, pid %d, \"%s\")\n", td,
1526047dd67eSAttilio Rao 			    td->td_tid, td->td_proc->p_pid,
1527047dd67eSAttilio Rao 			    td->td_proc->p_comm);
1528047dd67eSAttilio Rao 		if (lockmgr_recursed(lk))
1529047dd67eSAttilio Rao 			db_printf(" recursed: %d\n", lk->lk_recurse);
1530047dd67eSAttilio Rao 	}
1531047dd67eSAttilio Rao 	db_printf(" waiters: ");
1532047dd67eSAttilio Rao 	switch (lk->lk_lock & LK_ALL_WAITERS) {
1533047dd67eSAttilio Rao 	case LK_SHARED_WAITERS:
1534047dd67eSAttilio Rao 		db_printf("shared\n");
1535e5023dd9SEdward Tomasz Napierala 		break;
1536047dd67eSAttilio Rao 	case LK_EXCLUSIVE_WAITERS:
1537047dd67eSAttilio Rao 		db_printf("exclusive\n");
1538047dd67eSAttilio Rao 		break;
1539047dd67eSAttilio Rao 	case LK_ALL_WAITERS:
1540047dd67eSAttilio Rao 		db_printf("shared and exclusive\n");
1541047dd67eSAttilio Rao 		break;
1542047dd67eSAttilio Rao 	default:
1543047dd67eSAttilio Rao 		db_printf("none\n");
1544047dd67eSAttilio Rao 	}
1545651175c9SAttilio Rao 	db_printf(" spinners: ");
1546651175c9SAttilio Rao 	if (lk->lk_lock & LK_EXCLUSIVE_SPINNERS)
1547651175c9SAttilio Rao 		db_printf("exclusive\n");
1548651175c9SAttilio Rao 	else
1549651175c9SAttilio Rao 		db_printf("none\n");
1550be6847d7SJohn Baldwin }
1551be6847d7SJohn Baldwin #endif
1552