xref: /freebsd/sys/kern/kern_switch.c (revision d74ac6819b2cc8e5c18a099a97ffc16616b4e94d)
1dba6c5a6SPeter Wemm /*
2d5a08a60SJake Burkholder  * Copyright (c) 2001 Jake Burkholder <jake@FreeBSD.org>
3d5a08a60SJake Burkholder  * All rights reserved.
4dba6c5a6SPeter Wemm  *
5dba6c5a6SPeter Wemm  * Redistribution and use in source and binary forms, with or without
6dba6c5a6SPeter Wemm  * modification, are permitted provided that the following conditions
7dba6c5a6SPeter Wemm  * are met:
8dba6c5a6SPeter Wemm  * 1. Redistributions of source code must retain the above copyright
9dba6c5a6SPeter Wemm  *    notice, this list of conditions and the following disclaimer.
10dba6c5a6SPeter Wemm  * 2. Redistributions in binary form must reproduce the above copyright
11dba6c5a6SPeter Wemm  *    notice, this list of conditions and the following disclaimer in the
12dba6c5a6SPeter Wemm  *    documentation and/or other materials provided with the distribution.
13dba6c5a6SPeter Wemm  *
14dba6c5a6SPeter Wemm  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15dba6c5a6SPeter Wemm  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16dba6c5a6SPeter Wemm  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17dba6c5a6SPeter Wemm  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18dba6c5a6SPeter Wemm  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19dba6c5a6SPeter Wemm  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20dba6c5a6SPeter Wemm  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21dba6c5a6SPeter Wemm  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22dba6c5a6SPeter Wemm  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23dba6c5a6SPeter Wemm  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24dba6c5a6SPeter Wemm  * SUCH DAMAGE.
25dba6c5a6SPeter Wemm  *
26dba6c5a6SPeter Wemm  * $FreeBSD$
27dba6c5a6SPeter Wemm  */
28dba6c5a6SPeter Wemm 
29dba6c5a6SPeter Wemm #include <sys/param.h>
30dba6c5a6SPeter Wemm #include <sys/systm.h>
31dba6c5a6SPeter Wemm #include <sys/kernel.h>
320384fff8SJason Evans #include <sys/ktr.h>
33f34fa851SJohn Baldwin #include <sys/lock.h>
3435e0e5b3SJohn Baldwin #include <sys/mutex.h>
35dba6c5a6SPeter Wemm #include <sys/proc.h>
36dba6c5a6SPeter Wemm #include <sys/queue.h>
37dba6c5a6SPeter Wemm 
38dba6c5a6SPeter Wemm /*
39d5a08a60SJake Burkholder  * Global run queue.
40dba6c5a6SPeter Wemm  */
41d5a08a60SJake Burkholder static struct runq runq;
42d5a08a60SJake Burkholder SYSINIT(runq, SI_SUB_RUN_QUEUE, SI_ORDER_FIRST, runq_init, &runq)
43dba6c5a6SPeter Wemm 
44dba6c5a6SPeter Wemm /*
45d5a08a60SJake Burkholder  * Wrappers which implement old interface; act on global run queue.
46dba6c5a6SPeter Wemm  */
47dba6c5a6SPeter Wemm 
48b40ce416SJulian Elischer struct thread *
49b40ce416SJulian Elischer choosethread(void)
50dba6c5a6SPeter Wemm {
51b40ce416SJulian Elischer 	return (runq_choose(&runq)->ke_thread);
52d5a08a60SJake Burkholder }
53d5a08a60SJake Burkholder 
54d5a08a60SJake Burkholder int
55d5a08a60SJake Burkholder procrunnable(void)
56d5a08a60SJake Burkholder {
57d5a08a60SJake Burkholder 	return runq_check(&runq);
58d5a08a60SJake Burkholder }
59d5a08a60SJake Burkholder 
60d5a08a60SJake Burkholder void
61b40ce416SJulian Elischer remrunqueue(struct thread *td)
62d5a08a60SJake Burkholder {
63b40ce416SJulian Elischer 	runq_remove(&runq, td->td_kse);
64d5a08a60SJake Burkholder }
65d5a08a60SJake Burkholder 
66d5a08a60SJake Burkholder void
67b40ce416SJulian Elischer setrunqueue(struct thread *td)
68d5a08a60SJake Burkholder {
69b40ce416SJulian Elischer 	runq_add(&runq, td->td_kse);
70d5a08a60SJake Burkholder }
71d5a08a60SJake Burkholder 
727e1f6dfeSJohn Baldwin /* Critical sections that prevent preemption. */
737e1f6dfeSJohn Baldwin void
747e1f6dfeSJohn Baldwin critical_enter(void)
757e1f6dfeSJohn Baldwin {
767e1f6dfeSJohn Baldwin 	struct thread *td;
777e1f6dfeSJohn Baldwin 
787e1f6dfeSJohn Baldwin 	td = curthread;
797e1f6dfeSJohn Baldwin 	if (td->td_critnest == 0)
80d74ac681SMatthew Dillon 		cpu_critical_enter();
817e1f6dfeSJohn Baldwin 	td->td_critnest++;
827e1f6dfeSJohn Baldwin }
837e1f6dfeSJohn Baldwin 
847e1f6dfeSJohn Baldwin void
857e1f6dfeSJohn Baldwin critical_exit(void)
867e1f6dfeSJohn Baldwin {
877e1f6dfeSJohn Baldwin 	struct thread *td;
887e1f6dfeSJohn Baldwin 
897e1f6dfeSJohn Baldwin 	td = curthread;
907e1f6dfeSJohn Baldwin 	if (td->td_critnest == 1) {
917e1f6dfeSJohn Baldwin 		td->td_critnest = 0;
92d74ac681SMatthew Dillon 		cpu_critical_exit();
93d74ac681SMatthew Dillon 	} else {
947e1f6dfeSJohn Baldwin 		td->td_critnest--;
957e1f6dfeSJohn Baldwin 	}
96d74ac681SMatthew Dillon }
977e1f6dfeSJohn Baldwin 
98d5a08a60SJake Burkholder /*
99d5a08a60SJake Burkholder  * Clear the status bit of the queue corresponding to priority level pri,
100d5a08a60SJake Burkholder  * indicating that it is empty.
101d5a08a60SJake Burkholder  */
102d5a08a60SJake Burkholder static __inline void
103d5a08a60SJake Burkholder runq_clrbit(struct runq *rq, int pri)
104d5a08a60SJake Burkholder {
105d5a08a60SJake Burkholder 	struct rqbits *rqb;
106d5a08a60SJake Burkholder 
107d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
108d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_clrbit: bits=%#x %#x bit=%#x word=%d",
109d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)],
110d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)] & ~RQB_BIT(pri),
111d5a08a60SJake Burkholder 	    RQB_BIT(pri), RQB_WORD(pri));
112d5a08a60SJake Burkholder 	rqb->rqb_bits[RQB_WORD(pri)] &= ~RQB_BIT(pri);
113d5a08a60SJake Burkholder }
114d5a08a60SJake Burkholder 
115d5a08a60SJake Burkholder /*
116d5a08a60SJake Burkholder  * Find the index of the first non-empty run queue.  This is done by
117d5a08a60SJake Burkholder  * scanning the status bits, a set bit indicates a non-empty queue.
118d5a08a60SJake Burkholder  */
119d5a08a60SJake Burkholder static __inline int
120d5a08a60SJake Burkholder runq_findbit(struct runq *rq)
121d5a08a60SJake Burkholder {
122d5a08a60SJake Burkholder 	struct rqbits *rqb;
123d5a08a60SJake Burkholder 	int pri;
124d5a08a60SJake Burkholder 	int i;
125d5a08a60SJake Burkholder 
126d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
127d5a08a60SJake Burkholder 	for (i = 0; i < RQB_LEN; i++)
128d5a08a60SJake Burkholder 		if (rqb->rqb_bits[i]) {
129d5a08a60SJake Burkholder 			pri = (RQB_FFS(rqb->rqb_bits[i]) - 1) +
130d5a08a60SJake Burkholder 			    (i << RQB_L2BPW);
131d5a08a60SJake Burkholder 			CTR3(KTR_RUNQ, "runq_findbit: bits=%#x i=%d pri=%d",
132d5a08a60SJake Burkholder 			    rqb->rqb_bits[i], i, pri);
133d5a08a60SJake Burkholder 			return (pri);
134d5a08a60SJake Burkholder 		}
135d5a08a60SJake Burkholder 
136d5a08a60SJake Burkholder 	return (-1);
137d5a08a60SJake Burkholder }
138d5a08a60SJake Burkholder 
139d5a08a60SJake Burkholder /*
140d5a08a60SJake Burkholder  * Set the status bit of the queue corresponding to priority level pri,
141d5a08a60SJake Burkholder  * indicating that it is non-empty.
142d5a08a60SJake Burkholder  */
143d5a08a60SJake Burkholder static __inline void
144d5a08a60SJake Burkholder runq_setbit(struct runq *rq, int pri)
145d5a08a60SJake Burkholder {
146d5a08a60SJake Burkholder 	struct rqbits *rqb;
147d5a08a60SJake Burkholder 
148d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
149d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_setbit: bits=%#x %#x bit=%#x word=%d",
150d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)],
151d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)] | RQB_BIT(pri),
152d5a08a60SJake Burkholder 	    RQB_BIT(pri), RQB_WORD(pri));
153d5a08a60SJake Burkholder 	rqb->rqb_bits[RQB_WORD(pri)] |= RQB_BIT(pri);
154d5a08a60SJake Burkholder }
155d5a08a60SJake Burkholder 
#if defined(INVARIANT_SUPPORT) && defined(DIAGNOSTIC)
/*
 * Return true (1) if the specified KSE is already linked on one of the
 * queues of rq, false (0) otherwise.  Asserts that sched_lock is owned.
 */
static __inline int
runq_findproc(struct runq *rq, struct kse *ke)
{
	struct kse *ke2;
	int i;

	mtx_assert(&sched_lock, MA_OWNED);
	/*
	 * Walk every priority queue.  rq_queues[] has RQ_NQS entries (see
	 * runq_init()); RQB_LEN is only the number of words in the status
	 * bitmap, so using it as the bound would leave most queues
	 * unsearched.
	 */
	for (i = 0; i < RQ_NQS; i++) {
		TAILQ_FOREACH(ke2, &rq->rq_queues[i], ke_procq) {
			if (ke2 == ke)
				return (1);
		}
	}
	return (0);
}
#endif
1749cbd0393SDag-Erling Smørgrav 
175d5a08a60SJake Burkholder /*
176d5a08a60SJake Burkholder  * Add the process to the queue specified by its priority, and set the
177d5a08a60SJake Burkholder  * corresponding status bit.
178d5a08a60SJake Burkholder  */
179d5a08a60SJake Burkholder void
180b40ce416SJulian Elischer runq_add(struct runq *rq, struct kse *ke)
181d5a08a60SJake Burkholder {
182d5a08a60SJake Burkholder 	struct rqhead *rqh;
183d5a08a60SJake Burkholder 	int pri;
184dba6c5a6SPeter Wemm 
185b40ce416SJulian Elischer #ifdef INVARIANTS
186b40ce416SJulian Elischer 	struct proc *p = ke->ke_proc;
187b40ce416SJulian Elischer #endif
188b40ce416SJulian Elischer 	if (ke->ke_flags & KEF_ONRUNQ)
189b40ce416SJulian Elischer 		return;
1900384fff8SJason Evans 	mtx_assert(&sched_lock, MA_OWNED);
191d5a08a60SJake Burkholder 	KASSERT(p->p_stat == SRUN, ("runq_add: proc %p (%s) not SRUN",
192d5a08a60SJake Burkholder 	    p, p->p_comm));
193e97c3e3dSDag-Erling Smørgrav #if defined(INVARIANTS) && defined(DIAGNOSTIC)
194e97c3e3dSDag-Erling Smørgrav 	KASSERT(runq_findproc(rq, ke) == 0,
195b40ce416SJulian Elischer 	    ("runq_add: proc %p (%s) already in run queue", ke, p->p_comm));
196e97c3e3dSDag-Erling Smørgrav #endif
1972c100766SJulian Elischer 	pri = ke->ke_thread->td_priority / RQ_PPQ;
198b40ce416SJulian Elischer 	ke->ke_rqindex = pri;
199d5a08a60SJake Burkholder 	runq_setbit(rq, pri);
200d5a08a60SJake Burkholder 	rqh = &rq->rq_queues[pri];
201d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_add: p=%p pri=%d %d rqh=%p",
2022c100766SJulian Elischer 	    ke->ke_proc, ke->ke_thread->td_priority, pri, rqh);
203b40ce416SJulian Elischer 	TAILQ_INSERT_TAIL(rqh, ke, ke_procq);
204b40ce416SJulian Elischer 	ke->ke_flags |= KEF_ONRUNQ;
205dba6c5a6SPeter Wemm }
206d5a08a60SJake Burkholder 
207d5a08a60SJake Burkholder /*
208d5a08a60SJake Burkholder  * Return true if there are runnable processes of any priority on the run
209d5a08a60SJake Burkholder  * queue, false otherwise.  Has no side effects, does not modify the run
210d5a08a60SJake Burkholder  * queue structure.
211d5a08a60SJake Burkholder  */
212d5a08a60SJake Burkholder int
213d5a08a60SJake Burkholder runq_check(struct runq *rq)
214d5a08a60SJake Burkholder {
215d5a08a60SJake Burkholder 	struct rqbits *rqb;
216d5a08a60SJake Burkholder 	int i;
217d5a08a60SJake Burkholder 
218d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
219d5a08a60SJake Burkholder 	for (i = 0; i < RQB_LEN; i++)
220d5a08a60SJake Burkholder 		if (rqb->rqb_bits[i]) {
221d5a08a60SJake Burkholder 			CTR2(KTR_RUNQ, "runq_check: bits=%#x i=%d",
222d5a08a60SJake Burkholder 			    rqb->rqb_bits[i], i);
223d5a08a60SJake Burkholder 			return (1);
224dba6c5a6SPeter Wemm 		}
225d5a08a60SJake Burkholder 	CTR0(KTR_RUNQ, "runq_check: empty");
226d5a08a60SJake Burkholder 
227d5a08a60SJake Burkholder 	return (0);
228dba6c5a6SPeter Wemm }
229d5a08a60SJake Burkholder 
230d5a08a60SJake Burkholder /*
231d5a08a60SJake Burkholder  * Find and remove the highest priority process from the run queue.
232d5a08a60SJake Burkholder  * If there are no runnable processes, the per-cpu idle process is
233d5a08a60SJake Burkholder  * returned.  Will not return NULL under any circumstances.
234d5a08a60SJake Burkholder  */
235b40ce416SJulian Elischer struct kse *
236d5a08a60SJake Burkholder runq_choose(struct runq *rq)
237d5a08a60SJake Burkholder {
238d5a08a60SJake Burkholder 	struct rqhead *rqh;
239b40ce416SJulian Elischer 	struct kse *ke;
240d5a08a60SJake Burkholder 	int pri;
241d5a08a60SJake Burkholder 
242d5a08a60SJake Burkholder 	mtx_assert(&sched_lock, MA_OWNED);
243d5a08a60SJake Burkholder 	if ((pri = runq_findbit(rq)) != -1) {
244d5a08a60SJake Burkholder 		rqh = &rq->rq_queues[pri];
245b40ce416SJulian Elischer 		ke = TAILQ_FIRST(rqh);
246b40ce416SJulian Elischer 		KASSERT(ke != NULL, ("runq_choose: no proc on busy queue"));
247b40ce416SJulian Elischer 		KASSERT(ke->ke_proc->p_stat == SRUN,
248b40ce416SJulian Elischer 		    ("runq_choose: process %d(%s) in state %d", ke->ke_proc->p_pid,
249b40ce416SJulian Elischer 		    ke->ke_proc->p_comm, ke->ke_proc->p_stat));
250b40ce416SJulian Elischer 		CTR3(KTR_RUNQ, "runq_choose: pri=%d kse=%p rqh=%p", pri, ke, rqh);
251b40ce416SJulian Elischer 		TAILQ_REMOVE(rqh, ke, ke_procq);
252d5a08a60SJake Burkholder 		if (TAILQ_EMPTY(rqh)) {
253d5a08a60SJake Burkholder 			CTR0(KTR_RUNQ, "runq_choose: empty");
254d5a08a60SJake Burkholder 			runq_clrbit(rq, pri);
255d5a08a60SJake Burkholder 		}
256b40ce416SJulian Elischer 		ke->ke_flags &= ~KEF_ONRUNQ;
257b40ce416SJulian Elischer 		return (ke);
258d5a08a60SJake Burkholder 	}
259d5a08a60SJake Burkholder 	CTR1(KTR_RUNQ, "runq_choose: idleproc pri=%d", pri);
260d5a08a60SJake Burkholder 
261b40ce416SJulian Elischer 	return (PCPU_GET(idlethread)->td_kse);
262d5a08a60SJake Burkholder }
263d5a08a60SJake Burkholder 
264d5a08a60SJake Burkholder /*
265d5a08a60SJake Burkholder  * Initialize a run structure.
266d5a08a60SJake Burkholder  */
267d5a08a60SJake Burkholder void
268d5a08a60SJake Burkholder runq_init(struct runq *rq)
269d5a08a60SJake Burkholder {
270d5a08a60SJake Burkholder 	int i;
271d5a08a60SJake Burkholder 
272f32ded2fSJake Burkholder 	bzero(rq, sizeof *rq);
273d5a08a60SJake Burkholder 	for (i = 0; i < RQ_NQS; i++)
274d5a08a60SJake Burkholder 		TAILQ_INIT(&rq->rq_queues[i]);
275d5a08a60SJake Burkholder }
276d5a08a60SJake Burkholder 
277d5a08a60SJake Burkholder /*
278d5a08a60SJake Burkholder  * Remove the process from the queue specified by its priority, and clear the
279d5a08a60SJake Burkholder  * corresponding status bit if the queue becomes empty.
280d5a08a60SJake Burkholder  */
281d5a08a60SJake Burkholder void
282b40ce416SJulian Elischer runq_remove(struct runq *rq, struct kse *ke)
283d5a08a60SJake Burkholder {
284d5a08a60SJake Burkholder 	struct rqhead *rqh;
285d5a08a60SJake Burkholder 	int pri;
286d5a08a60SJake Burkholder 
287b40ce416SJulian Elischer 	if (!(ke->ke_flags & KEF_ONRUNQ))
288b40ce416SJulian Elischer 		return;
289d5a08a60SJake Burkholder 	mtx_assert(&sched_lock, MA_OWNED);
290b40ce416SJulian Elischer 	pri = ke->ke_rqindex;
291d5a08a60SJake Burkholder 	rqh = &rq->rq_queues[pri];
292d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_remove: p=%p pri=%d %d rqh=%p",
2932c100766SJulian Elischer 	    ke, ke->ke_thread->td_priority, pri, rqh);
294b40ce416SJulian Elischer 	KASSERT(ke != NULL, ("runq_remove: no proc on busy queue"));
295b40ce416SJulian Elischer 	TAILQ_REMOVE(rqh, ke, ke_procq);
296d5a08a60SJake Burkholder 	if (TAILQ_EMPTY(rqh)) {
297d5a08a60SJake Burkholder 		CTR0(KTR_RUNQ, "runq_remove: empty");
298d5a08a60SJake Burkholder 		runq_clrbit(rq, pri);
299d5a08a60SJake Burkholder 	}
300b40ce416SJulian Elischer 	ke->ke_flags &= ~KEF_ONRUNQ;
301dba6c5a6SPeter Wemm }
302