xref: /freebsd/sys/kern/kern_switch.c (revision 7e1f6dfe9d7ac65419d57b36dee19cd1a3e996f5)
1dba6c5a6SPeter Wemm /*
2d5a08a60SJake Burkholder  * Copyright (c) 2001 Jake Burkholder <jake@FreeBSD.org>
3d5a08a60SJake Burkholder  * All rights reserved.
4dba6c5a6SPeter Wemm  *
5dba6c5a6SPeter Wemm  * Redistribution and use in source and binary forms, with or without
6dba6c5a6SPeter Wemm  * modification, are permitted provided that the following conditions
7dba6c5a6SPeter Wemm  * are met:
8dba6c5a6SPeter Wemm  * 1. Redistributions of source code must retain the above copyright
9dba6c5a6SPeter Wemm  *    notice, this list of conditions and the following disclaimer.
10dba6c5a6SPeter Wemm  * 2. Redistributions in binary form must reproduce the above copyright
11dba6c5a6SPeter Wemm  *    notice, this list of conditions and the following disclaimer in the
12dba6c5a6SPeter Wemm  *    documentation and/or other materials provided with the distribution.
13dba6c5a6SPeter Wemm  *
14dba6c5a6SPeter Wemm  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15dba6c5a6SPeter Wemm  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16dba6c5a6SPeter Wemm  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17dba6c5a6SPeter Wemm  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18dba6c5a6SPeter Wemm  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19dba6c5a6SPeter Wemm  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20dba6c5a6SPeter Wemm  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21dba6c5a6SPeter Wemm  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22dba6c5a6SPeter Wemm  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23dba6c5a6SPeter Wemm  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24dba6c5a6SPeter Wemm  * SUCH DAMAGE.
25dba6c5a6SPeter Wemm  *
26dba6c5a6SPeter Wemm  * $FreeBSD$
27dba6c5a6SPeter Wemm  */
28dba6c5a6SPeter Wemm 
29dba6c5a6SPeter Wemm #include <sys/param.h>
30dba6c5a6SPeter Wemm #include <sys/systm.h>
31dba6c5a6SPeter Wemm #include <sys/kernel.h>
320384fff8SJason Evans #include <sys/ktr.h>
33f34fa851SJohn Baldwin #include <sys/lock.h>
3435e0e5b3SJohn Baldwin #include <sys/mutex.h>
35dba6c5a6SPeter Wemm #include <sys/proc.h>
36dba6c5a6SPeter Wemm #include <sys/queue.h>
37dba6c5a6SPeter Wemm 
38dba6c5a6SPeter Wemm /*
39d5a08a60SJake Burkholder  * Global run queue.
40dba6c5a6SPeter Wemm  */
41d5a08a60SJake Burkholder static struct runq runq;
42d5a08a60SJake Burkholder SYSINIT(runq, SI_SUB_RUN_QUEUE, SI_ORDER_FIRST, runq_init, &runq)
43dba6c5a6SPeter Wemm 
44dba6c5a6SPeter Wemm /*
45d5a08a60SJake Burkholder  * Wrappers which implement old interface; act on global run queue.
46dba6c5a6SPeter Wemm  */
47dba6c5a6SPeter Wemm 
48b40ce416SJulian Elischer struct thread *
49b40ce416SJulian Elischer choosethread(void)
50dba6c5a6SPeter Wemm {
51b40ce416SJulian Elischer 	return (runq_choose(&runq)->ke_thread);
52d5a08a60SJake Burkholder }
53d5a08a60SJake Burkholder 
54d5a08a60SJake Burkholder int
55d5a08a60SJake Burkholder procrunnable(void)
56d5a08a60SJake Burkholder {
57d5a08a60SJake Burkholder 	return runq_check(&runq);
58d5a08a60SJake Burkholder }
59d5a08a60SJake Burkholder 
60d5a08a60SJake Burkholder void
61b40ce416SJulian Elischer remrunqueue(struct thread *td)
62d5a08a60SJake Burkholder {
63b40ce416SJulian Elischer 	runq_remove(&runq, td->td_kse);
64d5a08a60SJake Burkholder }
65d5a08a60SJake Burkholder 
66d5a08a60SJake Burkholder void
67b40ce416SJulian Elischer setrunqueue(struct thread *td)
68d5a08a60SJake Burkholder {
69b40ce416SJulian Elischer 	runq_add(&runq, td->td_kse);
70d5a08a60SJake Burkholder }
71d5a08a60SJake Burkholder 
727e1f6dfeSJohn Baldwin /* Critical sections that prevent preemption. */
737e1f6dfeSJohn Baldwin void
747e1f6dfeSJohn Baldwin critical_enter(void)
757e1f6dfeSJohn Baldwin {
767e1f6dfeSJohn Baldwin 	struct thread *td;
777e1f6dfeSJohn Baldwin 
787e1f6dfeSJohn Baldwin 	td = curthread;
797e1f6dfeSJohn Baldwin 	if (td->td_critnest == 0)
807e1f6dfeSJohn Baldwin 		td->td_savecrit = cpu_critical_enter();
817e1f6dfeSJohn Baldwin 	td->td_critnest++;
827e1f6dfeSJohn Baldwin }
837e1f6dfeSJohn Baldwin 
847e1f6dfeSJohn Baldwin void
857e1f6dfeSJohn Baldwin critical_exit(void)
867e1f6dfeSJohn Baldwin {
877e1f6dfeSJohn Baldwin 	struct thread *td;
887e1f6dfeSJohn Baldwin 
897e1f6dfeSJohn Baldwin 	td = curthread;
907e1f6dfeSJohn Baldwin 	if (td->td_critnest == 1) {
917e1f6dfeSJohn Baldwin 		td->td_critnest = 0;
927e1f6dfeSJohn Baldwin 		cpu_critical_exit(td->td_savecrit);
937e1f6dfeSJohn Baldwin 	} else
947e1f6dfeSJohn Baldwin 		td->td_critnest--;
957e1f6dfeSJohn Baldwin }
967e1f6dfeSJohn Baldwin 
97d5a08a60SJake Burkholder /*
98d5a08a60SJake Burkholder  * Clear the status bit of the queue corresponding to priority level pri,
99d5a08a60SJake Burkholder  * indicating that it is empty.
100d5a08a60SJake Burkholder  */
101d5a08a60SJake Burkholder static __inline void
102d5a08a60SJake Burkholder runq_clrbit(struct runq *rq, int pri)
103d5a08a60SJake Burkholder {
104d5a08a60SJake Burkholder 	struct rqbits *rqb;
105d5a08a60SJake Burkholder 
106d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
107d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_clrbit: bits=%#x %#x bit=%#x word=%d",
108d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)],
109d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)] & ~RQB_BIT(pri),
110d5a08a60SJake Burkholder 	    RQB_BIT(pri), RQB_WORD(pri));
111d5a08a60SJake Burkholder 	rqb->rqb_bits[RQB_WORD(pri)] &= ~RQB_BIT(pri);
112d5a08a60SJake Burkholder }
113d5a08a60SJake Burkholder 
114d5a08a60SJake Burkholder /*
115d5a08a60SJake Burkholder  * Find the index of the first non-empty run queue.  This is done by
116d5a08a60SJake Burkholder  * scanning the status bits, a set bit indicates a non-empty queue.
117d5a08a60SJake Burkholder  */
118d5a08a60SJake Burkholder static __inline int
119d5a08a60SJake Burkholder runq_findbit(struct runq *rq)
120d5a08a60SJake Burkholder {
121d5a08a60SJake Burkholder 	struct rqbits *rqb;
122d5a08a60SJake Burkholder 	int pri;
123d5a08a60SJake Burkholder 	int i;
124d5a08a60SJake Burkholder 
125d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
126d5a08a60SJake Burkholder 	for (i = 0; i < RQB_LEN; i++)
127d5a08a60SJake Burkholder 		if (rqb->rqb_bits[i]) {
128d5a08a60SJake Burkholder 			pri = (RQB_FFS(rqb->rqb_bits[i]) - 1) +
129d5a08a60SJake Burkholder 			    (i << RQB_L2BPW);
130d5a08a60SJake Burkholder 			CTR3(KTR_RUNQ, "runq_findbit: bits=%#x i=%d pri=%d",
131d5a08a60SJake Burkholder 			    rqb->rqb_bits[i], i, pri);
132d5a08a60SJake Burkholder 			return (pri);
133d5a08a60SJake Burkholder 		}
134d5a08a60SJake Burkholder 
135d5a08a60SJake Burkholder 	return (-1);
136d5a08a60SJake Burkholder }
137d5a08a60SJake Burkholder 
138d5a08a60SJake Burkholder /*
139d5a08a60SJake Burkholder  * Set the status bit of the queue corresponding to priority level pri,
140d5a08a60SJake Burkholder  * indicating that it is non-empty.
141d5a08a60SJake Burkholder  */
142d5a08a60SJake Burkholder static __inline void
143d5a08a60SJake Burkholder runq_setbit(struct runq *rq, int pri)
144d5a08a60SJake Burkholder {
145d5a08a60SJake Burkholder 	struct rqbits *rqb;
146d5a08a60SJake Burkholder 
147d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
148d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_setbit: bits=%#x %#x bit=%#x word=%d",
149d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)],
150d5a08a60SJake Burkholder 	    rqb->rqb_bits[RQB_WORD(pri)] | RQB_BIT(pri),
151d5a08a60SJake Burkholder 	    RQB_BIT(pri), RQB_WORD(pri));
152d5a08a60SJake Burkholder 	rqb->rqb_bits[RQB_WORD(pri)] |= RQB_BIT(pri);
153d5a08a60SJake Burkholder }
154d5a08a60SJake Burkholder 
#ifdef INVARIANT_SUPPORT
/*
 * Return 1 if the given KSE is linked on any of the run queue's
 * per-priority lists, 0 otherwise.  sched_lock must be held.
 */
static __inline int
runq_find(struct runq *rq, struct kse *ke)
{
	struct kse *ke2;
	int i;

	mtx_assert(&sched_lock, MA_OWNED);
	/*
	 * Walk every queue.  rq_queues[] holds RQ_NQS lists (runq_init()
	 * initializes that many); RQB_LEN is the number of words in the
	 * status bitmap and is not a valid bound for this array.
	 */
	for (i = 0; i < RQ_NQS; i++)
		TAILQ_FOREACH(ke2, &rq->rq_queues[i], ke_procq)
			if (ke2 == ke)
				return (1);
	return (0);
}
#endif
1739cbd0393SDag-Erling Smørgrav 
174d5a08a60SJake Burkholder /*
175d5a08a60SJake Burkholder  * Add the process to the queue specified by its priority, and set the
176d5a08a60SJake Burkholder  * corresponding status bit.
177d5a08a60SJake Burkholder  */
178d5a08a60SJake Burkholder void
179b40ce416SJulian Elischer runq_add(struct runq *rq, struct kse *ke)
180d5a08a60SJake Burkholder {
181d5a08a60SJake Burkholder 	struct rqhead *rqh;
182d5a08a60SJake Burkholder 	int pri;
183dba6c5a6SPeter Wemm 
184b40ce416SJulian Elischer 	struct ksegrp *kg = ke->ke_ksegrp;
185b40ce416SJulian Elischer #ifdef INVARIANTS
186b40ce416SJulian Elischer 	struct proc *p = ke->ke_proc;
187b40ce416SJulian Elischer #endif
188b40ce416SJulian Elischer 	if (ke->ke_flags & KEF_ONRUNQ)
189b40ce416SJulian Elischer 		return;
1900384fff8SJason Evans 	mtx_assert(&sched_lock, MA_OWNED);
191d5a08a60SJake Burkholder 	KASSERT(p->p_stat == SRUN, ("runq_add: proc %p (%s) not SRUN",
192d5a08a60SJake Burkholder 	    p, p->p_comm));
193b40ce416SJulian Elischer 	KASSERT(runq_find(rq, ke) == 0,
194b40ce416SJulian Elischer 	    ("runq_add: proc %p (%s) already in run queue", ke, p->p_comm));
195b40ce416SJulian Elischer 	pri = kg->kg_pri.pri_level / RQ_PPQ;
196b40ce416SJulian Elischer 	ke->ke_rqindex = pri;
197d5a08a60SJake Burkholder 	runq_setbit(rq, pri);
198d5a08a60SJake Burkholder 	rqh = &rq->rq_queues[pri];
199d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_add: p=%p pri=%d %d rqh=%p",
2006a494eebSJonathan Lemon 	    ke->ke_proc, kg->kg_pri.pri_level, pri, rqh);
201b40ce416SJulian Elischer 	TAILQ_INSERT_TAIL(rqh, ke, ke_procq);
202b40ce416SJulian Elischer 	ke->ke_flags |= KEF_ONRUNQ;
203dba6c5a6SPeter Wemm }
204d5a08a60SJake Burkholder 
205d5a08a60SJake Burkholder /*
206d5a08a60SJake Burkholder  * Return true if there are runnable processes of any priority on the run
207d5a08a60SJake Burkholder  * queue, false otherwise.  Has no side effects, does not modify the run
208d5a08a60SJake Burkholder  * queue structure.
209d5a08a60SJake Burkholder  */
210d5a08a60SJake Burkholder int
211d5a08a60SJake Burkholder runq_check(struct runq *rq)
212d5a08a60SJake Burkholder {
213d5a08a60SJake Burkholder 	struct rqbits *rqb;
214d5a08a60SJake Burkholder 	int i;
215d5a08a60SJake Burkholder 
216d5a08a60SJake Burkholder 	rqb = &rq->rq_status;
217d5a08a60SJake Burkholder 	for (i = 0; i < RQB_LEN; i++)
218d5a08a60SJake Burkholder 		if (rqb->rqb_bits[i]) {
219d5a08a60SJake Burkholder 			CTR2(KTR_RUNQ, "runq_check: bits=%#x i=%d",
220d5a08a60SJake Burkholder 			    rqb->rqb_bits[i], i);
221d5a08a60SJake Burkholder 			return (1);
222dba6c5a6SPeter Wemm 		}
223d5a08a60SJake Burkholder 	CTR0(KTR_RUNQ, "runq_check: empty");
224d5a08a60SJake Burkholder 
225d5a08a60SJake Burkholder 	return (0);
226dba6c5a6SPeter Wemm }
227d5a08a60SJake Burkholder 
228d5a08a60SJake Burkholder /*
229d5a08a60SJake Burkholder  * Find and remove the highest priority process from the run queue.
230d5a08a60SJake Burkholder  * If there are no runnable processes, the per-cpu idle process is
231d5a08a60SJake Burkholder  * returned.  Will not return NULL under any circumstances.
232d5a08a60SJake Burkholder  */
233b40ce416SJulian Elischer struct kse *
234d5a08a60SJake Burkholder runq_choose(struct runq *rq)
235d5a08a60SJake Burkholder {
236d5a08a60SJake Burkholder 	struct rqhead *rqh;
237b40ce416SJulian Elischer 	struct kse *ke;
238d5a08a60SJake Burkholder 	int pri;
239d5a08a60SJake Burkholder 
240d5a08a60SJake Burkholder 	mtx_assert(&sched_lock, MA_OWNED);
241d5a08a60SJake Burkholder 	if ((pri = runq_findbit(rq)) != -1) {
242d5a08a60SJake Burkholder 		rqh = &rq->rq_queues[pri];
243b40ce416SJulian Elischer 		ke = TAILQ_FIRST(rqh);
244b40ce416SJulian Elischer 		KASSERT(ke != NULL, ("runq_choose: no proc on busy queue"));
245b40ce416SJulian Elischer 		KASSERT(ke->ke_proc->p_stat == SRUN,
246b40ce416SJulian Elischer 		    ("runq_choose: process %d(%s) in state %d", ke->ke_proc->p_pid,
247b40ce416SJulian Elischer 		    ke->ke_proc->p_comm, ke->ke_proc->p_stat));
248b40ce416SJulian Elischer 		CTR3(KTR_RUNQ, "runq_choose: pri=%d kse=%p rqh=%p", pri, ke, rqh);
249b40ce416SJulian Elischer 		TAILQ_REMOVE(rqh, ke, ke_procq);
250d5a08a60SJake Burkholder 		if (TAILQ_EMPTY(rqh)) {
251d5a08a60SJake Burkholder 			CTR0(KTR_RUNQ, "runq_choose: empty");
252d5a08a60SJake Burkholder 			runq_clrbit(rq, pri);
253d5a08a60SJake Burkholder 		}
254b40ce416SJulian Elischer 		ke->ke_flags &= ~KEF_ONRUNQ;
255b40ce416SJulian Elischer 		return (ke);
256d5a08a60SJake Burkholder 	}
257d5a08a60SJake Burkholder 	CTR1(KTR_RUNQ, "runq_choose: idleproc pri=%d", pri);
258d5a08a60SJake Burkholder 
259b40ce416SJulian Elischer 	return (PCPU_GET(idlethread)->td_kse);
260d5a08a60SJake Burkholder }
261d5a08a60SJake Burkholder 
262d5a08a60SJake Burkholder /*
263d5a08a60SJake Burkholder  * Initialize a run structure.
264d5a08a60SJake Burkholder  */
265d5a08a60SJake Burkholder void
266d5a08a60SJake Burkholder runq_init(struct runq *rq)
267d5a08a60SJake Burkholder {
268d5a08a60SJake Burkholder 	int i;
269d5a08a60SJake Burkholder 
270f32ded2fSJake Burkholder 	bzero(rq, sizeof *rq);
271d5a08a60SJake Burkholder 	for (i = 0; i < RQ_NQS; i++)
272d5a08a60SJake Burkholder 		TAILQ_INIT(&rq->rq_queues[i]);
273d5a08a60SJake Burkholder }
274d5a08a60SJake Burkholder 
275d5a08a60SJake Burkholder /*
276d5a08a60SJake Burkholder  * Remove the process from the queue specified by its priority, and clear the
277d5a08a60SJake Burkholder  * corresponding status bit if the queue becomes empty.
278d5a08a60SJake Burkholder  */
279d5a08a60SJake Burkholder void
280b40ce416SJulian Elischer runq_remove(struct runq *rq, struct kse *ke)
281d5a08a60SJake Burkholder {
282b40ce416SJulian Elischer #ifdef KTR
283b40ce416SJulian Elischer 	struct ksegrp *kg = ke->ke_ksegrp;
284b40ce416SJulian Elischer #endif
285d5a08a60SJake Burkholder 	struct rqhead *rqh;
286d5a08a60SJake Burkholder 	int pri;
287d5a08a60SJake Burkholder 
288b40ce416SJulian Elischer 	if (!(ke->ke_flags & KEF_ONRUNQ))
289b40ce416SJulian Elischer 		return;
290d5a08a60SJake Burkholder 	mtx_assert(&sched_lock, MA_OWNED);
291b40ce416SJulian Elischer 	pri = ke->ke_rqindex;
292d5a08a60SJake Burkholder 	rqh = &rq->rq_queues[pri];
293d5a08a60SJake Burkholder 	CTR4(KTR_RUNQ, "runq_remove: p=%p pri=%d %d rqh=%p",
294b40ce416SJulian Elischer 	    ke, kg->kg_pri.pri_level, pri, rqh);
295b40ce416SJulian Elischer 	KASSERT(ke != NULL, ("runq_remove: no proc on busy queue"));
296b40ce416SJulian Elischer 	TAILQ_REMOVE(rqh, ke, ke_procq);
297d5a08a60SJake Burkholder 	if (TAILQ_EMPTY(rqh)) {
298d5a08a60SJake Burkholder 		CTR0(KTR_RUNQ, "runq_remove: empty");
299d5a08a60SJake Burkholder 		runq_clrbit(rq, pri);
300d5a08a60SJake Burkholder 	}
301b40ce416SJulian Elischer 	ke->ke_flags &= ~KEF_ONRUNQ;
302dba6c5a6SPeter Wemm }
303