/* xref: /freebsd/sys/kern/kern_condvar.c (revision 263067951a1029407b1168b41d4f5757228d22dc) */
/*-
 * Copyright (c) 2000 Jake Burkholder <jake@freebsd.org>.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $FreeBSD$
 */

#include "opt_ktrace.h"

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/lock.h>
#include <sys/mutex.h>
#include <sys/proc.h>
#include <sys/kernel.h>
#include <sys/ktr.h>
#include <sys/condvar.h>
#include <sys/sched.h>
#include <sys/signalvar.h>
#include <sys/resourcevar.h>
#ifdef KTRACE
#include <sys/uio.h>
#include <sys/ktrace.h>
#endif

/*
 * Common sanity checks for cv_wait* functions.
 *
 * Asserts that the calling thread (td) is non-NULL and running, that the
 * condition variable (cvp) and mutex (mp) are non-NULL, and that the mutex
 * is owned by the caller and not recursed.
 */
#define	CV_ASSERT(cvp, mp, td) do {					\
	KASSERT((td) != NULL, ("%s: curthread NULL", __func__));	\
	KASSERT(TD_IS_RUNNING(td), ("%s: not TDS_RUNNING", __func__));	\
	KASSERT((cvp) != NULL, ("%s: cvp NULL", __func__));		\
	KASSERT((mp) != NULL, ("%s: mp NULL", __func__));		\
	mtx_assert((mp), MA_OWNED | MA_NOTRECURSED);			\
} while (0)

/*
 * Optional consistency checks, compiled in only with INVARIANTS.
 *
 * CV_WAIT_VALIDATE(cvp, mp): when the wait queue is empty, remember mp in
 * cvp->cv_mtx; otherwise assert that mp is the mutex already recorded there,
 * i.e. that all concurrent waiters use the same mutex.
 *
 * CV_SIGNAL_VALIDATE(cvp): when the wait queue is non-empty, assert that the
 * caller owns the mutex recorded in cvp->cv_mtx.
 *
 * Without INVARIANTS both macros expand to nothing.
 */
#ifdef INVARIANTS
#define	CV_WAIT_VALIDATE(cvp, mp) do {					\
	if (TAILQ_EMPTY(&(cvp)->cv_waitq)) {				\
		/* Only waiter. */					\
		(cvp)->cv_mtx = (mp);					\
	} else {							\
		/*							\
		 * Other waiter; assert that we're using the		\
		 * same mutex.						\
		 */							\
		KASSERT((cvp)->cv_mtx == (mp),				\
		    ("%s: Multiple mutexes", __func__));		\
	}								\
} while (0)

#define	CV_SIGNAL_VALIDATE(cvp) do {					\
	if (!TAILQ_EMPTY(&(cvp)->cv_waitq)) {				\
		KASSERT(mtx_owned((cvp)->cv_mtx),			\
		    ("%s: Mutex not owned", __func__));			\
	}								\
} while (0)

#else
#define	CV_WAIT_VALIDATE(cvp, mp)
#define	CV_SIGNAL_VALIDATE(cvp)
#endif

/* Callout handler armed by cv_timedwait() and cv_timedwait_sig(). */
static void cv_timedwait_end(void *arg);

87238510fcSJason Evans /*
88238510fcSJason Evans  * Initialize a condition variable.  Must be called before use.
89238510fcSJason Evans  */
90238510fcSJason Evans void
91238510fcSJason Evans cv_init(struct cv *cvp, const char *desc)
92238510fcSJason Evans {
93238510fcSJason Evans 
94238510fcSJason Evans 	TAILQ_INIT(&cvp->cv_waitq);
95238510fcSJason Evans 	cvp->cv_mtx = NULL;
96238510fcSJason Evans 	cvp->cv_description = desc;
97238510fcSJason Evans }
98238510fcSJason Evans 
/*
 * Destroy a condition variable.  The condition variable must be re-initialized
 * in order to be re-used.
 *
 * Nothing is released here; the function only asserts that no thread is
 * still waiting on the condition variable.
 */
void
cv_destroy(struct cv *cvp)
{

	KASSERT(cv_waitq_empty(cvp), ("%s: cv_waitq non-empty", __func__));
}

/*
 * Common code for cv_wait* functions.  All of these helpers must be called
 * with sched_lock held.
 */

114238510fcSJason Evans /*
1159d102777SJulian Elischer  * Switch context.
116e602ba25SJulian Elischer  */
1179d102777SJulian Elischer static __inline void
1189d102777SJulian Elischer cv_switch(struct thread *td)
119e602ba25SJulian Elischer {
12071fad9fdSJulian Elischer 	TD_SET_SLEEPING(td);
12171fad9fdSJulian Elischer 	td->td_proc->p_stats->p_ru.ru_nvcsw++;
122238510fcSJason Evans 	mi_switch();
1239ef3a985SJohn Baldwin 	CTR3(KTR_PROC, "cv_switch: resume thread %p (pid %d, %s)", td,
1249ef3a985SJohn Baldwin 	    td->td_proc->p_pid, td->td_proc->p_comm);
125238510fcSJason Evans }
126238510fcSJason Evans 
127238510fcSJason Evans /*
128238510fcSJason Evans  * Switch context, catching signals.
129238510fcSJason Evans  */
130238510fcSJason Evans static __inline int
131b40ce416SJulian Elischer cv_switch_catch(struct thread *td)
132238510fcSJason Evans {
1339ef3a985SJohn Baldwin 	struct proc *p;
134238510fcSJason Evans 	int sig;
135238510fcSJason Evans 
136238510fcSJason Evans 	/*
137238510fcSJason Evans 	 * We put ourselves on the sleep queue and start our timeout before
138628855e7SJulian Elischer 	 * calling cursig, as we could stop there, and a wakeup or a SIGCONT (or
139238510fcSJason Evans 	 * both) could occur while we were stopped.  A SIGCONT would cause us to
140e602ba25SJulian Elischer 	 * be marked as TDS_SLP without resuming us, thus we must be ready for
141628855e7SJulian Elischer 	 * sleep when cursig is called.  If the wakeup happens while we're
14271fad9fdSJulian Elischer 	 * stopped, td->td_wchan will be 0 upon return from cursig,
14371fad9fdSJulian Elischer 	 * and TD_ON_SLEEPQ() will return false.
144238510fcSJason Evans 	 */
145b40ce416SJulian Elischer 	td->td_flags |= TDF_SINTR;
1469ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
1479ef3a985SJohn Baldwin 	p = td->td_proc;
1489ef3a985SJohn Baldwin 	PROC_LOCK(p);
14971fad9fdSJulian Elischer 	sig = cursig(td);
150e602ba25SJulian Elischer 	if (thread_suspend_check(1))
151e602ba25SJulian Elischer 		sig = SIGSTOP;
1529ed346baSBosko Milekic 	mtx_lock_spin(&sched_lock);
153c86b6ff5SJohn Baldwin 	PROC_UNLOCK(p);
154238510fcSJason Evans 	if (sig != 0) {
15571fad9fdSJulian Elischer 		if (TD_ON_SLEEPQ(td))
156b40ce416SJulian Elischer 			cv_waitq_remove(td);
15771fad9fdSJulian Elischer 		TD_SET_RUNNING(td);
15871fad9fdSJulian Elischer 	} else if (TD_ON_SLEEPQ(td)) {
159b40ce416SJulian Elischer 		cv_switch(td);
160238510fcSJason Evans 	}
161b40ce416SJulian Elischer 	td->td_flags &= ~TDF_SINTR;
162238510fcSJason Evans 
163238510fcSJason Evans 	return sig;
164238510fcSJason Evans }
165238510fcSJason Evans 
166238510fcSJason Evans /*
167b40ce416SJulian Elischer  * Add a thread to the wait queue of a condition variable.
168238510fcSJason Evans  */
169238510fcSJason Evans static __inline void
170b40ce416SJulian Elischer cv_waitq_add(struct cv *cvp, struct thread *td)
171238510fcSJason Evans {
172238510fcSJason Evans 
173b40ce416SJulian Elischer 	td->td_flags |= TDF_CVWAITQ;
17471fad9fdSJulian Elischer 	TD_SET_ON_SLEEPQ(td);
175b40ce416SJulian Elischer 	td->td_wchan = cvp;
176b40ce416SJulian Elischer 	td->td_wmesg = cvp->cv_description;
177b40ce416SJulian Elischer 	CTR3(KTR_PROC, "cv_waitq_add: thread %p (pid %d, %s)", td,
1789ef3a985SJohn Baldwin 	    td->td_proc->p_pid, td->td_proc->p_comm);
179b40ce416SJulian Elischer 	TAILQ_INSERT_TAIL(&cvp->cv_waitq, td, td_slpq);
1804e997f4bSJeff Roberson 	sched_sleep(td, td->td_priority);
181238510fcSJason Evans }
182238510fcSJason Evans 
183238510fcSJason Evans /*
184b40ce416SJulian Elischer  * Wait on a condition variable.  The current thread is placed on the condition
185238510fcSJason Evans  * variable's wait queue and suspended.  A cv_signal or cv_broadcast on the same
186b40ce416SJulian Elischer  * condition variable will resume the thread.  The mutex is released before
187238510fcSJason Evans  * sleeping and will be held on return.  It is recommended that the mutex be
188238510fcSJason Evans  * held when cv_signal or cv_broadcast are called.
189238510fcSJason Evans  */
190238510fcSJason Evans void
191238510fcSJason Evans cv_wait(struct cv *cvp, struct mtx *mp)
192238510fcSJason Evans {
193b40ce416SJulian Elischer 	struct thread *td;
194238510fcSJason Evans 	WITNESS_SAVE_DECL(mp);
195238510fcSJason Evans 
196b40ce416SJulian Elischer 	td = curthread;
197238510fcSJason Evans #ifdef KTRACE
1989ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
1999ba7fe1bSJohn Baldwin 		ktrcsw(1, 0);
200238510fcSJason Evans #endif
201b40ce416SJulian Elischer 	CV_ASSERT(cvp, mp, td);
20226306795SJohn Baldwin 	WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, &mp->mtx_object,
20326306795SJohn Baldwin 	    "Waiting on \"%s\"", cvp->cv_description);
20419284646SJohn Baldwin 	WITNESS_SAVE(&mp->mtx_object, mp);
205238510fcSJason Evans 
206fe799533SAndrew Gallatin 	if (cold ) {
207238510fcSJason Evans 		/*
208fe799533SAndrew Gallatin 		 * During autoconfiguration, just give interrupts
209fe799533SAndrew Gallatin 		 * a chance, then just return.  Don't run any other
210fe799533SAndrew Gallatin 		 * thread or panic below, in case this is the idle
211fe799533SAndrew Gallatin 		 * process and already asleep.
212238510fcSJason Evans 		 */
213238510fcSJason Evans 		return;
214238510fcSJason Evans 	}
2154bc37205SJeffrey Hsu 
2164bc37205SJeffrey Hsu 	mtx_lock_spin(&sched_lock);
2174bc37205SJeffrey Hsu 
218238510fcSJason Evans 	CV_WAIT_VALIDATE(cvp, mp);
219238510fcSJason Evans 
220c86b6ff5SJohn Baldwin 	DROP_GIANT();
221c86b6ff5SJohn Baldwin 	mtx_unlock(mp);
222238510fcSJason Evans 
223b40ce416SJulian Elischer 	cv_waitq_add(cvp, td);
224b40ce416SJulian Elischer 	cv_switch(td);
225238510fcSJason Evans 
2269ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
227238510fcSJason Evans #ifdef KTRACE
2289ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
2299ba7fe1bSJohn Baldwin 		ktrcsw(0, 0);
230238510fcSJason Evans #endif
231238510fcSJason Evans 	PICKUP_GIANT();
2329ed346baSBosko Milekic 	mtx_lock(mp);
23319284646SJohn Baldwin 	WITNESS_RESTORE(&mp->mtx_object, mp);
234238510fcSJason Evans }
235238510fcSJason Evans 
236238510fcSJason Evans /*
237238510fcSJason Evans  * Wait on a condition variable, allowing interruption by signals.  Return 0 if
238b40ce416SJulian Elischer  * the thread was resumed with cv_signal or cv_broadcast, EINTR or ERESTART if
239238510fcSJason Evans  * a signal was caught.  If ERESTART is returned the system call should be
240238510fcSJason Evans  * restarted if possible.
241238510fcSJason Evans  */
242238510fcSJason Evans int
243238510fcSJason Evans cv_wait_sig(struct cv *cvp, struct mtx *mp)
244238510fcSJason Evans {
245b40ce416SJulian Elischer 	struct thread *td;
24666f769feSPeter Wemm 	struct proc *p;
247238510fcSJason Evans 	int rval;
248238510fcSJason Evans 	int sig;
249238510fcSJason Evans 	WITNESS_SAVE_DECL(mp);
250238510fcSJason Evans 
251b40ce416SJulian Elischer 	td = curthread;
2529ef3a985SJohn Baldwin 	p = td->td_proc;
253238510fcSJason Evans 	rval = 0;
254238510fcSJason Evans #ifdef KTRACE
2559ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
2569ba7fe1bSJohn Baldwin 		ktrcsw(1, 0);
257238510fcSJason Evans #endif
258b40ce416SJulian Elischer 	CV_ASSERT(cvp, mp, td);
25926306795SJohn Baldwin 	WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, &mp->mtx_object,
26026306795SJohn Baldwin 	    "Waiting on \"%s\"", cvp->cv_description);
26119284646SJohn Baldwin 	WITNESS_SAVE(&mp->mtx_object, mp);
262238510fcSJason Evans 
263238510fcSJason Evans 	if (cold || panicstr) {
264238510fcSJason Evans 		/*
265238510fcSJason Evans 		 * After a panic, or during autoconfiguration, just give
266238510fcSJason Evans 		 * interrupts a chance, then just return; don't run any other
267238510fcSJason Evans 		 * procs or panic below, in case this is the idle process and
268238510fcSJason Evans 		 * already asleep.
269238510fcSJason Evans 		 */
270238510fcSJason Evans 		return 0;
271238510fcSJason Evans 	}
2724bc37205SJeffrey Hsu 
2734bc37205SJeffrey Hsu 	mtx_lock_spin(&sched_lock);
2744bc37205SJeffrey Hsu 
275238510fcSJason Evans 	CV_WAIT_VALIDATE(cvp, mp);
276238510fcSJason Evans 
277c86b6ff5SJohn Baldwin 	DROP_GIANT();
278c86b6ff5SJohn Baldwin 	mtx_unlock(mp);
279238510fcSJason Evans 
280b40ce416SJulian Elischer 	cv_waitq_add(cvp, td);
281b40ce416SJulian Elischer 	sig = cv_switch_catch(td);
282238510fcSJason Evans 
2839ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
284238510fcSJason Evans 
2859ef3a985SJohn Baldwin 	PROC_LOCK(p);
286238510fcSJason Evans 	if (sig == 0)
287e602ba25SJulian Elischer 		sig = cursig(td);	/* XXXKSE */
288238510fcSJason Evans 	if (sig != 0) {
2899ef3a985SJohn Baldwin 		if (SIGISMEMBER(p->p_sigacts->ps_sigintr, sig))
290238510fcSJason Evans 			rval = EINTR;
291238510fcSJason Evans 		else
292238510fcSJason Evans 			rval = ERESTART;
293238510fcSJason Evans 	}
2949ef3a985SJohn Baldwin 	PROC_UNLOCK(p);
295e602ba25SJulian Elischer 	if (p->p_flag & P_WEXIT)
296e602ba25SJulian Elischer 		rval = EINTR;
297238510fcSJason Evans 
298238510fcSJason Evans #ifdef KTRACE
2999ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
3009ba7fe1bSJohn Baldwin 		ktrcsw(0, 0);
301238510fcSJason Evans #endif
3029ba7fe1bSJohn Baldwin 	PICKUP_GIANT();
3039ed346baSBosko Milekic 	mtx_lock(mp);
30419284646SJohn Baldwin 	WITNESS_RESTORE(&mp->mtx_object, mp);
305238510fcSJason Evans 
306238510fcSJason Evans 	return (rval);
307238510fcSJason Evans }
308238510fcSJason Evans 
309238510fcSJason Evans /*
310238510fcSJason Evans  * Wait on a condition variable for at most timo/hz seconds.  Returns 0 if the
311238510fcSJason Evans  * process was resumed by cv_signal or cv_broadcast, EWOULDBLOCK if the timeout
312238510fcSJason Evans  * expires.
313238510fcSJason Evans  */
314238510fcSJason Evans int
315238510fcSJason Evans cv_timedwait(struct cv *cvp, struct mtx *mp, int timo)
316238510fcSJason Evans {
317b40ce416SJulian Elischer 	struct thread *td;
318238510fcSJason Evans 	int rval;
319238510fcSJason Evans 	WITNESS_SAVE_DECL(mp);
320238510fcSJason Evans 
321b40ce416SJulian Elischer 	td = curthread;
322238510fcSJason Evans 	rval = 0;
323238510fcSJason Evans #ifdef KTRACE
3249ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
3259ba7fe1bSJohn Baldwin 		ktrcsw(1, 0);
326238510fcSJason Evans #endif
327b40ce416SJulian Elischer 	CV_ASSERT(cvp, mp, td);
32826306795SJohn Baldwin 	WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, &mp->mtx_object,
32926306795SJohn Baldwin 	    "Waiting on \"%s\"", cvp->cv_description);
33019284646SJohn Baldwin 	WITNESS_SAVE(&mp->mtx_object, mp);
331238510fcSJason Evans 
332238510fcSJason Evans 	if (cold || panicstr) {
333238510fcSJason Evans 		/*
334238510fcSJason Evans 		 * After a panic, or during autoconfiguration, just give
335238510fcSJason Evans 		 * interrupts a chance, then just return; don't run any other
336b40ce416SJulian Elischer 		 * thread or panic below, in case this is the idle process and
337238510fcSJason Evans 		 * already asleep.
338238510fcSJason Evans 		 */
339238510fcSJason Evans 		return 0;
340238510fcSJason Evans 	}
3414bc37205SJeffrey Hsu 
3424bc37205SJeffrey Hsu 	mtx_lock_spin(&sched_lock);
3434bc37205SJeffrey Hsu 
344238510fcSJason Evans 	CV_WAIT_VALIDATE(cvp, mp);
345238510fcSJason Evans 
346c86b6ff5SJohn Baldwin 	DROP_GIANT();
347c86b6ff5SJohn Baldwin 	mtx_unlock(mp);
348238510fcSJason Evans 
349b40ce416SJulian Elischer 	cv_waitq_add(cvp, td);
350b40ce416SJulian Elischer 	callout_reset(&td->td_slpcallout, timo, cv_timedwait_end, td);
351b40ce416SJulian Elischer 	cv_switch(td);
352238510fcSJason Evans 
353b40ce416SJulian Elischer 	if (td->td_flags & TDF_TIMEOUT) {
354b40ce416SJulian Elischer 		td->td_flags &= ~TDF_TIMEOUT;
355238510fcSJason Evans 		rval = EWOULDBLOCK;
356b40ce416SJulian Elischer 	} else if (td->td_flags & TDF_TIMOFAIL)
357b40ce416SJulian Elischer 		td->td_flags &= ~TDF_TIMOFAIL;
358b40ce416SJulian Elischer 	else if (callout_stop(&td->td_slpcallout) == 0) {
35991a4536fSJohn Baldwin 		/*
36091a4536fSJohn Baldwin 		 * Work around race with cv_timedwait_end similar to that
36191a4536fSJohn Baldwin 		 * between msleep and endtsleep.
362d5cb7e14SJulian Elischer 		 * Go back to sleep.
36391a4536fSJohn Baldwin 		 */
36471fad9fdSJulian Elischer 		TD_SET_SLEEPING(td);
365b40ce416SJulian Elischer 		td->td_proc->p_stats->p_ru.ru_nivcsw++;
36691a4536fSJohn Baldwin 		mi_switch();
36771fad9fdSJulian Elischer 		td->td_flags &= ~TDF_TIMOFAIL;
36891a4536fSJohn Baldwin 	}
369238510fcSJason Evans 
370e602ba25SJulian Elischer 	if (td->td_proc->p_flag & P_WEXIT)
371e602ba25SJulian Elischer 		rval = EWOULDBLOCK;
3729ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
373238510fcSJason Evans #ifdef KTRACE
3749ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
3759ba7fe1bSJohn Baldwin 		ktrcsw(0, 0);
376238510fcSJason Evans #endif
377238510fcSJason Evans 	PICKUP_GIANT();
3789ed346baSBosko Milekic 	mtx_lock(mp);
37919284646SJohn Baldwin 	WITNESS_RESTORE(&mp->mtx_object, mp);
380238510fcSJason Evans 
381238510fcSJason Evans 	return (rval);
382238510fcSJason Evans }
383238510fcSJason Evans 
384238510fcSJason Evans /*
385238510fcSJason Evans  * Wait on a condition variable for at most timo/hz seconds, allowing
386b40ce416SJulian Elischer  * interruption by signals.  Returns 0 if the thread was resumed by cv_signal
387238510fcSJason Evans  * or cv_broadcast, EWOULDBLOCK if the timeout expires, and EINTR or ERESTART if
388238510fcSJason Evans  * a signal was caught.
389238510fcSJason Evans  */
390238510fcSJason Evans int
391238510fcSJason Evans cv_timedwait_sig(struct cv *cvp, struct mtx *mp, int timo)
392238510fcSJason Evans {
393b40ce416SJulian Elischer 	struct thread *td;
3949ef3a985SJohn Baldwin 	struct proc *p;
395238510fcSJason Evans 	int rval;
396238510fcSJason Evans 	int sig;
397238510fcSJason Evans 	WITNESS_SAVE_DECL(mp);
398238510fcSJason Evans 
399b40ce416SJulian Elischer 	td = curthread;
4009ef3a985SJohn Baldwin 	p = td->td_proc;
401238510fcSJason Evans 	rval = 0;
402238510fcSJason Evans #ifdef KTRACE
4039ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
4049ba7fe1bSJohn Baldwin 		ktrcsw(1, 0);
405238510fcSJason Evans #endif
406b40ce416SJulian Elischer 	CV_ASSERT(cvp, mp, td);
40726306795SJohn Baldwin 	WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, &mp->mtx_object,
40826306795SJohn Baldwin 	    "Waiting on \"%s\"", cvp->cv_description);
40919284646SJohn Baldwin 	WITNESS_SAVE(&mp->mtx_object, mp);
410238510fcSJason Evans 
411238510fcSJason Evans 	if (cold || panicstr) {
412238510fcSJason Evans 		/*
413238510fcSJason Evans 		 * After a panic, or during autoconfiguration, just give
414238510fcSJason Evans 		 * interrupts a chance, then just return; don't run any other
415b40ce416SJulian Elischer 		 * thread or panic below, in case this is the idle process and
416238510fcSJason Evans 		 * already asleep.
417238510fcSJason Evans 		 */
418238510fcSJason Evans 		return 0;
419238510fcSJason Evans 	}
4204bc37205SJeffrey Hsu 
4214bc37205SJeffrey Hsu 	mtx_lock_spin(&sched_lock);
4224bc37205SJeffrey Hsu 
423238510fcSJason Evans 	CV_WAIT_VALIDATE(cvp, mp);
424238510fcSJason Evans 
425c86b6ff5SJohn Baldwin 	DROP_GIANT();
426c86b6ff5SJohn Baldwin 	mtx_unlock(mp);
427238510fcSJason Evans 
428b40ce416SJulian Elischer 	cv_waitq_add(cvp, td);
429b40ce416SJulian Elischer 	callout_reset(&td->td_slpcallout, timo, cv_timedwait_end, td);
430b40ce416SJulian Elischer 	sig = cv_switch_catch(td);
431238510fcSJason Evans 
432b40ce416SJulian Elischer 	if (td->td_flags & TDF_TIMEOUT) {
433b40ce416SJulian Elischer 		td->td_flags &= ~TDF_TIMEOUT;
434238510fcSJason Evans 		rval = EWOULDBLOCK;
435b40ce416SJulian Elischer 	} else if (td->td_flags & TDF_TIMOFAIL)
436b40ce416SJulian Elischer 		td->td_flags &= ~TDF_TIMOFAIL;
437b40ce416SJulian Elischer 	else if (callout_stop(&td->td_slpcallout) == 0) {
43891a4536fSJohn Baldwin 		/*
43991a4536fSJohn Baldwin 		 * Work around race with cv_timedwait_end similar to that
44091a4536fSJohn Baldwin 		 * between msleep and endtsleep.
441d5cb7e14SJulian Elischer 		 * Go back to sleep.
44291a4536fSJohn Baldwin 		 */
44371fad9fdSJulian Elischer 		TD_SET_SLEEPING(td);
444b40ce416SJulian Elischer 		td->td_proc->p_stats->p_ru.ru_nivcsw++;
44591a4536fSJohn Baldwin 		mi_switch();
44671fad9fdSJulian Elischer 		td->td_flags &= ~TDF_TIMOFAIL;
44791a4536fSJohn Baldwin 	}
4489ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
449238510fcSJason Evans 
4509ef3a985SJohn Baldwin 	PROC_LOCK(p);
451238510fcSJason Evans 	if (sig == 0)
452e602ba25SJulian Elischer 		sig = cursig(td);
453238510fcSJason Evans 	if (sig != 0) {
4549ef3a985SJohn Baldwin 		if (SIGISMEMBER(p->p_sigacts->ps_sigintr, sig))
455238510fcSJason Evans 			rval = EINTR;
456238510fcSJason Evans 		else
457238510fcSJason Evans 			rval = ERESTART;
458238510fcSJason Evans 	}
4599ef3a985SJohn Baldwin 	PROC_UNLOCK(p);
460238510fcSJason Evans 
461e602ba25SJulian Elischer 	if (p->p_flag & P_WEXIT)
462e602ba25SJulian Elischer 		rval = EINTR;
463e602ba25SJulian Elischer 
464238510fcSJason Evans #ifdef KTRACE
4659ba7fe1bSJohn Baldwin 	if (KTRPOINT(td, KTR_CSW))
4669ba7fe1bSJohn Baldwin 		ktrcsw(0, 0);
467238510fcSJason Evans #endif
4689ba7fe1bSJohn Baldwin 	PICKUP_GIANT();
4699ed346baSBosko Milekic 	mtx_lock(mp);
47019284646SJohn Baldwin 	WITNESS_RESTORE(&mp->mtx_object, mp);
471238510fcSJason Evans 
472238510fcSJason Evans 	return (rval);
473238510fcSJason Evans }
474238510fcSJason Evans 
475238510fcSJason Evans /*
476238510fcSJason Evans  * Common code for signal and broadcast.  Assumes waitq is not empty.  Must be
477238510fcSJason Evans  * called with sched_lock held.
478238510fcSJason Evans  */
479238510fcSJason Evans static __inline void
480238510fcSJason Evans cv_wakeup(struct cv *cvp)
481238510fcSJason Evans {
482b40ce416SJulian Elischer 	struct thread *td;
483238510fcSJason Evans 
484981808d1SJohn Baldwin 	mtx_assert(&sched_lock, MA_OWNED);
485b40ce416SJulian Elischer 	td = TAILQ_FIRST(&cvp->cv_waitq);
486a48740b6SDavid E. O'Brien 	KASSERT(td->td_wchan == cvp, ("%s: bogus wchan", __func__));
487a48740b6SDavid E. O'Brien 	KASSERT(td->td_flags & TDF_CVWAITQ, ("%s: not on waitq", __func__));
48871fad9fdSJulian Elischer 	cv_waitq_remove(td);
48971fad9fdSJulian Elischer 	TD_CLR_SLEEPING(td);
49071fad9fdSJulian Elischer 	setrunnable(td);
491238510fcSJason Evans }
492238510fcSJason Evans 
493238510fcSJason Evans /*
494b40ce416SJulian Elischer  * Signal a condition variable, wakes up one waiting thread.  Will also wakeup
495238510fcSJason Evans  * the swapper if the process is not in memory, so that it can bring the
496b40ce416SJulian Elischer  * sleeping process in.  Note that this may also result in additional threads
497238510fcSJason Evans  * being made runnable.  Should be called with the same mutex as was passed to
498238510fcSJason Evans  * cv_wait held.
499238510fcSJason Evans  */
500238510fcSJason Evans void
501238510fcSJason Evans cv_signal(struct cv *cvp)
502238510fcSJason Evans {
503238510fcSJason Evans 
504a48740b6SDavid E. O'Brien 	KASSERT(cvp != NULL, ("%s: cvp NULL", __func__));
5059ed346baSBosko Milekic 	mtx_lock_spin(&sched_lock);
506238510fcSJason Evans 	if (!TAILQ_EMPTY(&cvp->cv_waitq)) {
507238510fcSJason Evans 		CV_SIGNAL_VALIDATE(cvp);
508238510fcSJason Evans 		cv_wakeup(cvp);
509238510fcSJason Evans 	}
5109ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
511238510fcSJason Evans }
512238510fcSJason Evans 
513238510fcSJason Evans /*
514b40ce416SJulian Elischer  * Broadcast a signal to a condition variable.  Wakes up all waiting threads.
515238510fcSJason Evans  * Should be called with the same mutex as was passed to cv_wait held.
516238510fcSJason Evans  */
517238510fcSJason Evans void
518238510fcSJason Evans cv_broadcast(struct cv *cvp)
519238510fcSJason Evans {
520238510fcSJason Evans 
521a48740b6SDavid E. O'Brien 	KASSERT(cvp != NULL, ("%s: cvp NULL", __func__));
5229ed346baSBosko Milekic 	mtx_lock_spin(&sched_lock);
523238510fcSJason Evans 	CV_SIGNAL_VALIDATE(cvp);
524238510fcSJason Evans 	while (!TAILQ_EMPTY(&cvp->cv_waitq))
525238510fcSJason Evans 		cv_wakeup(cvp);
5269ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
527238510fcSJason Evans }
528238510fcSJason Evans 
529238510fcSJason Evans /*
530b40ce416SJulian Elischer  * Remove a thread from the wait queue of its condition variable.  This may be
531238510fcSJason Evans  * called externally.
532238510fcSJason Evans  */
533238510fcSJason Evans void
534b40ce416SJulian Elischer cv_waitq_remove(struct thread *td)
535238510fcSJason Evans {
536238510fcSJason Evans 	struct cv *cvp;
537238510fcSJason Evans 
53871fad9fdSJulian Elischer 	mtx_assert(&sched_lock, MA_OWNED);
539b40ce416SJulian Elischer 	if ((cvp = td->td_wchan) != NULL && td->td_flags & TDF_CVWAITQ) {
540b40ce416SJulian Elischer 		TAILQ_REMOVE(&cvp->cv_waitq, td, td_slpq);
541b40ce416SJulian Elischer 		td->td_flags &= ~TDF_CVWAITQ;
542b89bc9e6SHartmut Brandt 		td->td_wmesg = NULL;
54371fad9fdSJulian Elischer 		TD_CLR_ON_SLEEPQ(td);
544238510fcSJason Evans 	}
545238510fcSJason Evans }
546238510fcSJason Evans 
547238510fcSJason Evans /*
548b40ce416SJulian Elischer  * Timeout function for cv_timedwait.  Put the thread on the runqueue and set
549238510fcSJason Evans  * its timeout flag.
550238510fcSJason Evans  */
551238510fcSJason Evans static void
552238510fcSJason Evans cv_timedwait_end(void *arg)
553238510fcSJason Evans {
554b40ce416SJulian Elischer 	struct thread *td;
555238510fcSJason Evans 
556b40ce416SJulian Elischer 	td = arg;
55771fad9fdSJulian Elischer 	CTR3(KTR_PROC, "cv_timedwait_end: thread %p (pid %d, %s)",
55871fad9fdSJulian Elischer 	    td, td->td_proc->p_pid, td->td_proc->p_comm);
5599ed346baSBosko Milekic 	mtx_lock_spin(&sched_lock);
56071fad9fdSJulian Elischer 	if (TD_ON_SLEEPQ(td)) {
561b40ce416SJulian Elischer 		cv_waitq_remove(td);
562b40ce416SJulian Elischer 		td->td_flags |= TDF_TIMEOUT;
56371fad9fdSJulian Elischer 	} else {
564b40ce416SJulian Elischer 		td->td_flags |= TDF_TIMOFAIL;
56571fad9fdSJulian Elischer 	}
56671fad9fdSJulian Elischer 	TD_CLR_SLEEPING(td);
56771fad9fdSJulian Elischer 	setrunnable(td);
5689ed346baSBosko Milekic 	mtx_unlock_spin(&sched_lock);
569238510fcSJason Evans }
570e602ba25SJulian Elischer 
571e602ba25SJulian Elischer /*
572e602ba25SJulian Elischer  * For now only abort interruptable waits.
573e602ba25SJulian Elischer  * The others will have to either complete on their own or have a timeout.
574e602ba25SJulian Elischer  */
575e602ba25SJulian Elischer void
576e602ba25SJulian Elischer cv_abort(struct thread *td)
577e602ba25SJulian Elischer {
578e602ba25SJulian Elischer 
579e602ba25SJulian Elischer 	CTR3(KTR_PROC, "cv_abort: thread %p (pid %d, %s)", td,
58071fad9fdSJulian Elischer 	    td->td_proc->p_pid, td->td_proc->p_comm);
581e602ba25SJulian Elischer 	mtx_lock_spin(&sched_lock);
582e602ba25SJulian Elischer 	if ((td->td_flags & (TDF_SINTR|TDF_TIMEOUT)) == TDF_SINTR) {
58371fad9fdSJulian Elischer 		if (TD_ON_SLEEPQ(td)) {
584e602ba25SJulian Elischer 			cv_waitq_remove(td);
585e602ba25SJulian Elischer 		}
58671fad9fdSJulian Elischer 		TD_CLR_SLEEPING(td);
58771fad9fdSJulian Elischer 		setrunnable(td);
588e602ba25SJulian Elischer 	}
589e602ba25SJulian Elischer 	mtx_unlock_spin(&sched_lock);
590e602ba25SJulian Elischer }
591e602ba25SJulian Elischer 
592