1dba6c5a6SPeter Wemm /* 2d5a08a60SJake Burkholder * Copyright (c) 2001 Jake Burkholder <jake@FreeBSD.org> 3d5a08a60SJake Burkholder * All rights reserved. 4dba6c5a6SPeter Wemm * 5dba6c5a6SPeter Wemm * Redistribution and use in source and binary forms, with or without 6dba6c5a6SPeter Wemm * modification, are permitted provided that the following conditions 7dba6c5a6SPeter Wemm * are met: 8dba6c5a6SPeter Wemm * 1. Redistributions of source code must retain the above copyright 9dba6c5a6SPeter Wemm * notice, this list of conditions and the following disclaimer. 10dba6c5a6SPeter Wemm * 2. Redistributions in binary form must reproduce the above copyright 11dba6c5a6SPeter Wemm * notice, this list of conditions and the following disclaimer in the 12dba6c5a6SPeter Wemm * documentation and/or other materials provided with the distribution. 13dba6c5a6SPeter Wemm * 14dba6c5a6SPeter Wemm * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15dba6c5a6SPeter Wemm * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16dba6c5a6SPeter Wemm * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17dba6c5a6SPeter Wemm * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18dba6c5a6SPeter Wemm * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19dba6c5a6SPeter Wemm * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20dba6c5a6SPeter Wemm * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21dba6c5a6SPeter Wemm * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22dba6c5a6SPeter Wemm * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23dba6c5a6SPeter Wemm * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24dba6c5a6SPeter Wemm * SUCH DAMAGE. 25dba6c5a6SPeter Wemm * 26dba6c5a6SPeter Wemm * $FreeBSD$ 27dba6c5a6SPeter Wemm */ 28dba6c5a6SPeter Wemm 29dba6c5a6SPeter Wemm #include <sys/param.h> 30dba6c5a6SPeter Wemm #include <sys/systm.h> 31dba6c5a6SPeter Wemm #include <sys/kernel.h> 320384fff8SJason Evans #include <sys/ktr.h> 33f34fa851SJohn Baldwin #include <sys/lock.h> 3435e0e5b3SJohn Baldwin #include <sys/mutex.h> 35dba6c5a6SPeter Wemm #include <sys/proc.h> 36dba6c5a6SPeter Wemm #include <sys/queue.h> 37dba6c5a6SPeter Wemm 38dba6c5a6SPeter Wemm /* 39d5a08a60SJake Burkholder * Global run queue. 40dba6c5a6SPeter Wemm */ 41d5a08a60SJake Burkholder static struct runq runq; 42d5a08a60SJake Burkholder SYSINIT(runq, SI_SUB_RUN_QUEUE, SI_ORDER_FIRST, runq_init, &runq) 43dba6c5a6SPeter Wemm 44dba6c5a6SPeter Wemm /* 45d5a08a60SJake Burkholder * Wrappers which implement old interface; act on global run queue. 46dba6c5a6SPeter Wemm */ 47dba6c5a6SPeter Wemm 48b40ce416SJulian Elischer struct thread * 49b40ce416SJulian Elischer choosethread(void) 50dba6c5a6SPeter Wemm { 51b40ce416SJulian Elischer return (runq_choose(&runq)->ke_thread); 52d5a08a60SJake Burkholder } 53d5a08a60SJake Burkholder 54d5a08a60SJake Burkholder int 55d5a08a60SJake Burkholder procrunnable(void) 56d5a08a60SJake Burkholder { 57d5a08a60SJake Burkholder return runq_check(&runq); 58d5a08a60SJake Burkholder } 59d5a08a60SJake Burkholder 60d5a08a60SJake Burkholder void 61b40ce416SJulian Elischer remrunqueue(struct thread *td) 62d5a08a60SJake Burkholder { 63b40ce416SJulian Elischer runq_remove(&runq, td->td_kse); 64d5a08a60SJake Burkholder } 65d5a08a60SJake Burkholder 66d5a08a60SJake Burkholder void 67b40ce416SJulian Elischer setrunqueue(struct thread *td) 68d5a08a60SJake Burkholder { 69b40ce416SJulian Elischer runq_add(&runq, td->td_kse); 70d5a08a60SJake Burkholder } 71d5a08a60SJake Burkholder 727e1f6dfeSJohn Baldwin /* Critical sections that prevent preemption. */ 737e1f6dfeSJohn Baldwin void 747e1f6dfeSJohn Baldwin critical_enter(void) 757e1f6dfeSJohn Baldwin { 767e1f6dfeSJohn Baldwin struct thread *td; 777e1f6dfeSJohn Baldwin 787e1f6dfeSJohn Baldwin td = curthread; 797e1f6dfeSJohn Baldwin if (td->td_critnest == 0) 807e1f6dfeSJohn Baldwin td->td_savecrit = cpu_critical_enter(); 817e1f6dfeSJohn Baldwin td->td_critnest++; 827e1f6dfeSJohn Baldwin } 837e1f6dfeSJohn Baldwin 847e1f6dfeSJohn Baldwin void 857e1f6dfeSJohn Baldwin critical_exit(void) 867e1f6dfeSJohn Baldwin { 877e1f6dfeSJohn Baldwin struct thread *td; 887e1f6dfeSJohn Baldwin 897e1f6dfeSJohn Baldwin td = curthread; 907e1f6dfeSJohn Baldwin if (td->td_critnest == 1) { 917e1f6dfeSJohn Baldwin td->td_critnest = 0; 927e1f6dfeSJohn Baldwin cpu_critical_exit(td->td_savecrit); 937e1f6dfeSJohn Baldwin } else 947e1f6dfeSJohn Baldwin td->td_critnest--; 957e1f6dfeSJohn Baldwin } 967e1f6dfeSJohn Baldwin 97d5a08a60SJake Burkholder /* 98d5a08a60SJake Burkholder * Clear the status bit of the queue corresponding to priority level pri, 99d5a08a60SJake Burkholder * indicating that it is empty. 100d5a08a60SJake Burkholder */ 101d5a08a60SJake Burkholder static __inline void 102d5a08a60SJake Burkholder runq_clrbit(struct runq *rq, int pri) 103d5a08a60SJake Burkholder { 104d5a08a60SJake Burkholder struct rqbits *rqb; 105d5a08a60SJake Burkholder 106d5a08a60SJake Burkholder rqb = &rq->rq_status; 107d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_clrbit: bits=%#x %#x bit=%#x word=%d", 108d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)], 109d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] & ~RQB_BIT(pri), 110d5a08a60SJake Burkholder RQB_BIT(pri), RQB_WORD(pri)); 111d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] &= ~RQB_BIT(pri); 112d5a08a60SJake Burkholder } 113d5a08a60SJake Burkholder 114d5a08a60SJake Burkholder /* 115d5a08a60SJake Burkholder * Find the index of the first non-empty run queue. This is done by 116d5a08a60SJake Burkholder * scanning the status bits, a set bit indicates a non-empty queue. 117d5a08a60SJake Burkholder */ 118d5a08a60SJake Burkholder static __inline int 119d5a08a60SJake Burkholder runq_findbit(struct runq *rq) 120d5a08a60SJake Burkholder { 121d5a08a60SJake Burkholder struct rqbits *rqb; 122d5a08a60SJake Burkholder int pri; 123d5a08a60SJake Burkholder int i; 124d5a08a60SJake Burkholder 125d5a08a60SJake Burkholder rqb = &rq->rq_status; 126d5a08a60SJake Burkholder for (i = 0; i < RQB_LEN; i++) 127d5a08a60SJake Burkholder if (rqb->rqb_bits[i]) { 128d5a08a60SJake Burkholder pri = (RQB_FFS(rqb->rqb_bits[i]) - 1) + 129d5a08a60SJake Burkholder (i << RQB_L2BPW); 130d5a08a60SJake Burkholder CTR3(KTR_RUNQ, "runq_findbit: bits=%#x i=%d pri=%d", 131d5a08a60SJake Burkholder rqb->rqb_bits[i], i, pri); 132d5a08a60SJake Burkholder return (pri); 133d5a08a60SJake Burkholder } 134d5a08a60SJake Burkholder 135d5a08a60SJake Burkholder return (-1); 136d5a08a60SJake Burkholder } 137d5a08a60SJake Burkholder 138d5a08a60SJake Burkholder /* 139d5a08a60SJake Burkholder * Set the status bit of the queue corresponding to priority level pri, 140d5a08a60SJake Burkholder * indicating that it is non-empty. 141d5a08a60SJake Burkholder */ 142d5a08a60SJake Burkholder static __inline void 143d5a08a60SJake Burkholder runq_setbit(struct runq *rq, int pri) 144d5a08a60SJake Burkholder { 145d5a08a60SJake Burkholder struct rqbits *rqb; 146d5a08a60SJake Burkholder 147d5a08a60SJake Burkholder rqb = &rq->rq_status; 148d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_setbit: bits=%#x %#x bit=%#x word=%d", 149d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)], 150d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] | RQB_BIT(pri), 151d5a08a60SJake Burkholder RQB_BIT(pri), RQB_WORD(pri)); 152d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] |= RQB_BIT(pri); 153d5a08a60SJake Burkholder } 154d5a08a60SJake Burkholder 1559cbd0393SDag-Erling Smørgrav #ifdef INVARIANT_SUPPORT 1569cbd0393SDag-Erling Smørgrav /* 1579cbd0393SDag-Erling Smørgrav * Return true if the specified process is already in the run queue. 1589cbd0393SDag-Erling Smørgrav */ 1599cbd0393SDag-Erling Smørgrav static __inline int 160b40ce416SJulian Elischer runq_find(struct runq *rq, struct kse *ke) 1619cbd0393SDag-Erling Smørgrav { 162b40ce416SJulian Elischer struct kse *ke2; 1639cbd0393SDag-Erling Smørgrav int i; 1649cbd0393SDag-Erling Smørgrav 1659cbd0393SDag-Erling Smørgrav mtx_assert(&sched_lock, MA_OWNED); 1669cbd0393SDag-Erling Smørgrav for (i = 0; i < RQB_LEN; i++) 167b40ce416SJulian Elischer TAILQ_FOREACH(ke2, &rq->rq_queues[i], ke_procq) 168b40ce416SJulian Elischer if (ke2 == ke) 1699cbd0393SDag-Erling Smørgrav return 1; 1709cbd0393SDag-Erling Smørgrav return 0; 1719cbd0393SDag-Erling Smørgrav } 1729cbd0393SDag-Erling Smørgrav #endif 1739cbd0393SDag-Erling Smørgrav 174d5a08a60SJake Burkholder /* 175d5a08a60SJake Burkholder * Add the process to the queue specified by its priority, and set the 176d5a08a60SJake Burkholder * corresponding status bit. 177d5a08a60SJake Burkholder */ 178d5a08a60SJake Burkholder void 179b40ce416SJulian Elischer runq_add(struct runq *rq, struct kse *ke) 180d5a08a60SJake Burkholder { 181d5a08a60SJake Burkholder struct rqhead *rqh; 182d5a08a60SJake Burkholder int pri; 183dba6c5a6SPeter Wemm 184b40ce416SJulian Elischer struct ksegrp *kg = ke->ke_ksegrp; 185b40ce416SJulian Elischer #ifdef INVARIANTS 186b40ce416SJulian Elischer struct proc *p = ke->ke_proc; 187b40ce416SJulian Elischer #endif 188b40ce416SJulian Elischer if (ke->ke_flags & KEF_ONRUNQ) 189b40ce416SJulian Elischer return; 1900384fff8SJason Evans mtx_assert(&sched_lock, MA_OWNED); 191d5a08a60SJake Burkholder KASSERT(p->p_stat == SRUN, ("runq_add: proc %p (%s) not SRUN", 192d5a08a60SJake Burkholder p, p->p_comm)); 193b40ce416SJulian Elischer KASSERT(runq_find(rq, ke) == 0, 194b40ce416SJulian Elischer ("runq_add: proc %p (%s) already in run queue", ke, p->p_comm)); 195b40ce416SJulian Elischer pri = kg->kg_pri.pri_level / RQ_PPQ; 196b40ce416SJulian Elischer ke->ke_rqindex = pri; 197d5a08a60SJake Burkholder runq_setbit(rq, pri); 198d5a08a60SJake Burkholder rqh = &rq->rq_queues[pri]; 199d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_add: p=%p pri=%d %d rqh=%p", 2006a494eebSJonathan Lemon ke->ke_proc, kg->kg_pri.pri_level, pri, rqh); 201b40ce416SJulian Elischer TAILQ_INSERT_TAIL(rqh, ke, ke_procq); 202b40ce416SJulian Elischer ke->ke_flags |= KEF_ONRUNQ; 203dba6c5a6SPeter Wemm } 204d5a08a60SJake Burkholder 205d5a08a60SJake Burkholder /* 206d5a08a60SJake Burkholder * Return true if there are runnable processes of any priority on the run 207d5a08a60SJake Burkholder * queue, false otherwise. Has no side effects, does not modify the run 208d5a08a60SJake Burkholder * queue structure. 209d5a08a60SJake Burkholder */ 210d5a08a60SJake Burkholder int 211d5a08a60SJake Burkholder runq_check(struct runq *rq) 212d5a08a60SJake Burkholder { 213d5a08a60SJake Burkholder struct rqbits *rqb; 214d5a08a60SJake Burkholder int i; 215d5a08a60SJake Burkholder 216d5a08a60SJake Burkholder rqb = &rq->rq_status; 217d5a08a60SJake Burkholder for (i = 0; i < RQB_LEN; i++) 218d5a08a60SJake Burkholder if (rqb->rqb_bits[i]) { 219d5a08a60SJake Burkholder CTR2(KTR_RUNQ, "runq_check: bits=%#x i=%d", 220d5a08a60SJake Burkholder rqb->rqb_bits[i], i); 221d5a08a60SJake Burkholder return (1); 222dba6c5a6SPeter Wemm } 223d5a08a60SJake Burkholder CTR0(KTR_RUNQ, "runq_check: empty"); 224d5a08a60SJake Burkholder 225d5a08a60SJake Burkholder return (0); 226dba6c5a6SPeter Wemm } 227d5a08a60SJake Burkholder 228d5a08a60SJake Burkholder /* 229d5a08a60SJake Burkholder * Find and remove the highest priority process from the run queue. 230d5a08a60SJake Burkholder * If there are no runnable processes, the per-cpu idle process is 231d5a08a60SJake Burkholder * returned. Will not return NULL under any circumstances. 232d5a08a60SJake Burkholder */ 233b40ce416SJulian Elischer struct kse * 234d5a08a60SJake Burkholder runq_choose(struct runq *rq) 235d5a08a60SJake Burkholder { 236d5a08a60SJake Burkholder struct rqhead *rqh; 237b40ce416SJulian Elischer struct kse *ke; 238d5a08a60SJake Burkholder int pri; 239d5a08a60SJake Burkholder 240d5a08a60SJake Burkholder mtx_assert(&sched_lock, MA_OWNED); 241d5a08a60SJake Burkholder if ((pri = runq_findbit(rq)) != -1) { 242d5a08a60SJake Burkholder rqh = &rq->rq_queues[pri]; 243b40ce416SJulian Elischer ke = TAILQ_FIRST(rqh); 244b40ce416SJulian Elischer KASSERT(ke != NULL, ("runq_choose: no proc on busy queue")); 245b40ce416SJulian Elischer KASSERT(ke->ke_proc->p_stat == SRUN, 246b40ce416SJulian Elischer ("runq_choose: process %d(%s) in state %d", ke->ke_proc->p_pid, 247b40ce416SJulian Elischer ke->ke_proc->p_comm, ke->ke_proc->p_stat)); 248b40ce416SJulian Elischer CTR3(KTR_RUNQ, "runq_choose: pri=%d kse=%p rqh=%p", pri, ke, rqh); 249b40ce416SJulian Elischer TAILQ_REMOVE(rqh, ke, ke_procq); 250d5a08a60SJake Burkholder if (TAILQ_EMPTY(rqh)) { 251d5a08a60SJake Burkholder CTR0(KTR_RUNQ, "runq_choose: empty"); 252d5a08a60SJake Burkholder runq_clrbit(rq, pri); 253d5a08a60SJake Burkholder } 254b40ce416SJulian Elischer ke->ke_flags &= ~KEF_ONRUNQ; 255b40ce416SJulian Elischer return (ke); 256d5a08a60SJake Burkholder } 257d5a08a60SJake Burkholder CTR1(KTR_RUNQ, "runq_choose: idleproc pri=%d", pri); 258d5a08a60SJake Burkholder 259b40ce416SJulian Elischer return (PCPU_GET(idlethread)->td_kse); 260d5a08a60SJake Burkholder } 261d5a08a60SJake Burkholder 262d5a08a60SJake Burkholder /* 263d5a08a60SJake Burkholder * Initialize a run structure. 264d5a08a60SJake Burkholder */ 265d5a08a60SJake Burkholder void 266d5a08a60SJake Burkholder runq_init(struct runq *rq) 267d5a08a60SJake Burkholder { 268d5a08a60SJake Burkholder int i; 269d5a08a60SJake Burkholder 270f32ded2fSJake Burkholder bzero(rq, sizeof *rq); 271d5a08a60SJake Burkholder for (i = 0; i < RQ_NQS; i++) 272d5a08a60SJake Burkholder TAILQ_INIT(&rq->rq_queues[i]); 273d5a08a60SJake Burkholder } 274d5a08a60SJake Burkholder 275d5a08a60SJake Burkholder /* 276d5a08a60SJake Burkholder * Remove the process from the queue specified by its priority, and clear the 277d5a08a60SJake Burkholder * corresponding status bit if the queue becomes empty. 278d5a08a60SJake Burkholder */ 279d5a08a60SJake Burkholder void 280b40ce416SJulian Elischer runq_remove(struct runq *rq, struct kse *ke) 281d5a08a60SJake Burkholder { 282b40ce416SJulian Elischer #ifdef KTR 283b40ce416SJulian Elischer struct ksegrp *kg = ke->ke_ksegrp; 284b40ce416SJulian Elischer #endif 285d5a08a60SJake Burkholder struct rqhead *rqh; 286d5a08a60SJake Burkholder int pri; 287d5a08a60SJake Burkholder 288b40ce416SJulian Elischer if (!(ke->ke_flags & KEF_ONRUNQ)) 289b40ce416SJulian Elischer return; 290d5a08a60SJake Burkholder mtx_assert(&sched_lock, MA_OWNED); 291b40ce416SJulian Elischer pri = ke->ke_rqindex; 292d5a08a60SJake Burkholder rqh = &rq->rq_queues[pri]; 293d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_remove: p=%p pri=%d %d rqh=%p", 294b40ce416SJulian Elischer ke, kg->kg_pri.pri_level, pri, rqh); 295b40ce416SJulian Elischer KASSERT(ke != NULL, ("runq_remove: no proc on busy queue")); 296b40ce416SJulian Elischer TAILQ_REMOVE(rqh, ke, ke_procq); 297d5a08a60SJake Burkholder if (TAILQ_EMPTY(rqh)) { 298d5a08a60SJake Burkholder CTR0(KTR_RUNQ, "runq_remove: empty"); 299d5a08a60SJake Burkholder runq_clrbit(rq, pri); 300d5a08a60SJake Burkholder } 301b40ce416SJulian Elischer ke->ke_flags &= ~KEF_ONRUNQ; 302dba6c5a6SPeter Wemm } 303