/*
 * Copyright (c) 2001 Jake Burkholder <jake@FreeBSD.org>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
25dba6c5a6SPeter Wemm * 26dba6c5a6SPeter Wemm * $FreeBSD$ 27dba6c5a6SPeter Wemm */ 28dba6c5a6SPeter Wemm 29dba6c5a6SPeter Wemm #include <sys/param.h> 30dba6c5a6SPeter Wemm #include <sys/systm.h> 31dba6c5a6SPeter Wemm #include <sys/kernel.h> 320384fff8SJason Evans #include <sys/ktr.h> 33f34fa851SJohn Baldwin #include <sys/lock.h> 3435e0e5b3SJohn Baldwin #include <sys/mutex.h> 35dba6c5a6SPeter Wemm #include <sys/proc.h> 36dba6c5a6SPeter Wemm #include <sys/queue.h> 37dba6c5a6SPeter Wemm 38dba6c5a6SPeter Wemm /* 39d5a08a60SJake Burkholder * Global run queue. 40dba6c5a6SPeter Wemm */ 41d5a08a60SJake Burkholder static struct runq runq; 42d5a08a60SJake Burkholder SYSINIT(runq, SI_SUB_RUN_QUEUE, SI_ORDER_FIRST, runq_init, &runq) 43dba6c5a6SPeter Wemm 44dba6c5a6SPeter Wemm /* 45d5a08a60SJake Burkholder * Wrappers which implement old interface; act on global run queue. 46dba6c5a6SPeter Wemm */ 47dba6c5a6SPeter Wemm 48b40ce416SJulian Elischer struct thread * 49b40ce416SJulian Elischer choosethread(void) 50dba6c5a6SPeter Wemm { 51b40ce416SJulian Elischer return (runq_choose(&runq)->ke_thread); 52d5a08a60SJake Burkholder } 53d5a08a60SJake Burkholder 54d5a08a60SJake Burkholder int 55d5a08a60SJake Burkholder procrunnable(void) 56d5a08a60SJake Burkholder { 57d5a08a60SJake Burkholder return runq_check(&runq); 58d5a08a60SJake Burkholder } 59d5a08a60SJake Burkholder 60d5a08a60SJake Burkholder void 61b40ce416SJulian Elischer remrunqueue(struct thread *td) 62d5a08a60SJake Burkholder { 63b40ce416SJulian Elischer runq_remove(&runq, td->td_kse); 64d5a08a60SJake Burkholder } 65d5a08a60SJake Burkholder 66d5a08a60SJake Burkholder void 67b40ce416SJulian Elischer setrunqueue(struct thread *td) 68d5a08a60SJake Burkholder { 69b40ce416SJulian Elischer runq_add(&runq, td->td_kse); 70d5a08a60SJake Burkholder } 71d5a08a60SJake Burkholder 727e1f6dfeSJohn Baldwin /* Critical sections that prevent preemption. 
*/ 737e1f6dfeSJohn Baldwin void 747e1f6dfeSJohn Baldwin critical_enter(void) 757e1f6dfeSJohn Baldwin { 767e1f6dfeSJohn Baldwin struct thread *td; 777e1f6dfeSJohn Baldwin 787e1f6dfeSJohn Baldwin td = curthread; 797e1f6dfeSJohn Baldwin if (td->td_critnest == 0) 80d74ac681SMatthew Dillon cpu_critical_enter(); 817e1f6dfeSJohn Baldwin td->td_critnest++; 827e1f6dfeSJohn Baldwin } 837e1f6dfeSJohn Baldwin 847e1f6dfeSJohn Baldwin void 857e1f6dfeSJohn Baldwin critical_exit(void) 867e1f6dfeSJohn Baldwin { 877e1f6dfeSJohn Baldwin struct thread *td; 887e1f6dfeSJohn Baldwin 897e1f6dfeSJohn Baldwin td = curthread; 907e1f6dfeSJohn Baldwin if (td->td_critnest == 1) { 917e1f6dfeSJohn Baldwin td->td_critnest = 0; 92d74ac681SMatthew Dillon cpu_critical_exit(); 93d74ac681SMatthew Dillon } else { 947e1f6dfeSJohn Baldwin td->td_critnest--; 957e1f6dfeSJohn Baldwin } 96d74ac681SMatthew Dillon } 977e1f6dfeSJohn Baldwin 98d5a08a60SJake Burkholder /* 99d5a08a60SJake Burkholder * Clear the status bit of the queue corresponding to priority level pri, 100d5a08a60SJake Burkholder * indicating that it is empty. 101d5a08a60SJake Burkholder */ 102d5a08a60SJake Burkholder static __inline void 103d5a08a60SJake Burkholder runq_clrbit(struct runq *rq, int pri) 104d5a08a60SJake Burkholder { 105d5a08a60SJake Burkholder struct rqbits *rqb; 106d5a08a60SJake Burkholder 107d5a08a60SJake Burkholder rqb = &rq->rq_status; 108d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_clrbit: bits=%#x %#x bit=%#x word=%d", 109d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)], 110d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] & ~RQB_BIT(pri), 111d5a08a60SJake Burkholder RQB_BIT(pri), RQB_WORD(pri)); 112d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] &= ~RQB_BIT(pri); 113d5a08a60SJake Burkholder } 114d5a08a60SJake Burkholder 115d5a08a60SJake Burkholder /* 116d5a08a60SJake Burkholder * Find the index of the first non-empty run queue. 
This is done by 117d5a08a60SJake Burkholder * scanning the status bits, a set bit indicates a non-empty queue. 118d5a08a60SJake Burkholder */ 119d5a08a60SJake Burkholder static __inline int 120d5a08a60SJake Burkholder runq_findbit(struct runq *rq) 121d5a08a60SJake Burkholder { 122d5a08a60SJake Burkholder struct rqbits *rqb; 123d5a08a60SJake Burkholder int pri; 124d5a08a60SJake Burkholder int i; 125d5a08a60SJake Burkholder 126d5a08a60SJake Burkholder rqb = &rq->rq_status; 127d5a08a60SJake Burkholder for (i = 0; i < RQB_LEN; i++) 128d5a08a60SJake Burkholder if (rqb->rqb_bits[i]) { 129d5a08a60SJake Burkholder pri = (RQB_FFS(rqb->rqb_bits[i]) - 1) + 130d5a08a60SJake Burkholder (i << RQB_L2BPW); 131d5a08a60SJake Burkholder CTR3(KTR_RUNQ, "runq_findbit: bits=%#x i=%d pri=%d", 132d5a08a60SJake Burkholder rqb->rqb_bits[i], i, pri); 133d5a08a60SJake Burkholder return (pri); 134d5a08a60SJake Burkholder } 135d5a08a60SJake Burkholder 136d5a08a60SJake Burkholder return (-1); 137d5a08a60SJake Burkholder } 138d5a08a60SJake Burkholder 139d5a08a60SJake Burkholder /* 140d5a08a60SJake Burkholder * Set the status bit of the queue corresponding to priority level pri, 141d5a08a60SJake Burkholder * indicating that it is non-empty. 
142d5a08a60SJake Burkholder */ 143d5a08a60SJake Burkholder static __inline void 144d5a08a60SJake Burkholder runq_setbit(struct runq *rq, int pri) 145d5a08a60SJake Burkholder { 146d5a08a60SJake Burkholder struct rqbits *rqb; 147d5a08a60SJake Burkholder 148d5a08a60SJake Burkholder rqb = &rq->rq_status; 149d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_setbit: bits=%#x %#x bit=%#x word=%d", 150d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)], 151d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] | RQB_BIT(pri), 152d5a08a60SJake Burkholder RQB_BIT(pri), RQB_WORD(pri)); 153d5a08a60SJake Burkholder rqb->rqb_bits[RQB_WORD(pri)] |= RQB_BIT(pri); 154d5a08a60SJake Burkholder } 155d5a08a60SJake Burkholder 156e97c3e3dSDag-Erling Smørgrav #if defined(INVARIANT_SUPPORT) && defined(DIAGNOSTIC) 1579cbd0393SDag-Erling Smørgrav /* 1589cbd0393SDag-Erling Smørgrav * Return true if the specified process is already in the run queue. 1599cbd0393SDag-Erling Smørgrav */ 1609cbd0393SDag-Erling Smørgrav static __inline int 161e97c3e3dSDag-Erling Smørgrav runq_findproc(struct runq *rq, struct kse *ke) 1629cbd0393SDag-Erling Smørgrav { 163b40ce416SJulian Elischer struct kse *ke2; 1649cbd0393SDag-Erling Smørgrav int i; 1659cbd0393SDag-Erling Smørgrav 1669cbd0393SDag-Erling Smørgrav mtx_assert(&sched_lock, MA_OWNED); 1679cbd0393SDag-Erling Smørgrav for (i = 0; i < RQB_LEN; i++) 168b40ce416SJulian Elischer TAILQ_FOREACH(ke2, &rq->rq_queues[i], ke_procq) 169b40ce416SJulian Elischer if (ke2 == ke) 1709cbd0393SDag-Erling Smørgrav return 1; 1719cbd0393SDag-Erling Smørgrav return 0; 1729cbd0393SDag-Erling Smørgrav } 1739cbd0393SDag-Erling Smørgrav #endif 1749cbd0393SDag-Erling Smørgrav 175d5a08a60SJake Burkholder /* 176d5a08a60SJake Burkholder * Add the process to the queue specified by its priority, and set the 177d5a08a60SJake Burkholder * corresponding status bit. 
178d5a08a60SJake Burkholder */ 179d5a08a60SJake Burkholder void 180b40ce416SJulian Elischer runq_add(struct runq *rq, struct kse *ke) 181d5a08a60SJake Burkholder { 182d5a08a60SJake Burkholder struct rqhead *rqh; 183d5a08a60SJake Burkholder int pri; 184dba6c5a6SPeter Wemm 185b40ce416SJulian Elischer #ifdef INVARIANTS 186b40ce416SJulian Elischer struct proc *p = ke->ke_proc; 187b40ce416SJulian Elischer #endif 188b40ce416SJulian Elischer if (ke->ke_flags & KEF_ONRUNQ) 189b40ce416SJulian Elischer return; 1900384fff8SJason Evans mtx_assert(&sched_lock, MA_OWNED); 191d5a08a60SJake Burkholder KASSERT(p->p_stat == SRUN, ("runq_add: proc %p (%s) not SRUN", 192d5a08a60SJake Burkholder p, p->p_comm)); 193e97c3e3dSDag-Erling Smørgrav #if defined(INVARIANTS) && defined(DIAGNOSTIC) 194e97c3e3dSDag-Erling Smørgrav KASSERT(runq_findproc(rq, ke) == 0, 195b40ce416SJulian Elischer ("runq_add: proc %p (%s) already in run queue", ke, p->p_comm)); 196e97c3e3dSDag-Erling Smørgrav #endif 1972c100766SJulian Elischer pri = ke->ke_thread->td_priority / RQ_PPQ; 198b40ce416SJulian Elischer ke->ke_rqindex = pri; 199d5a08a60SJake Burkholder runq_setbit(rq, pri); 200d5a08a60SJake Burkholder rqh = &rq->rq_queues[pri]; 201d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_add: p=%p pri=%d %d rqh=%p", 2022c100766SJulian Elischer ke->ke_proc, ke->ke_thread->td_priority, pri, rqh); 203b40ce416SJulian Elischer TAILQ_INSERT_TAIL(rqh, ke, ke_procq); 204b40ce416SJulian Elischer ke->ke_flags |= KEF_ONRUNQ; 205dba6c5a6SPeter Wemm } 206d5a08a60SJake Burkholder 207d5a08a60SJake Burkholder /* 208d5a08a60SJake Burkholder * Return true if there are runnable processes of any priority on the run 209d5a08a60SJake Burkholder * queue, false otherwise. Has no side effects, does not modify the run 210d5a08a60SJake Burkholder * queue structure. 
211d5a08a60SJake Burkholder */ 212d5a08a60SJake Burkholder int 213d5a08a60SJake Burkholder runq_check(struct runq *rq) 214d5a08a60SJake Burkholder { 215d5a08a60SJake Burkholder struct rqbits *rqb; 216d5a08a60SJake Burkholder int i; 217d5a08a60SJake Burkholder 218d5a08a60SJake Burkholder rqb = &rq->rq_status; 219d5a08a60SJake Burkholder for (i = 0; i < RQB_LEN; i++) 220d5a08a60SJake Burkholder if (rqb->rqb_bits[i]) { 221d5a08a60SJake Burkholder CTR2(KTR_RUNQ, "runq_check: bits=%#x i=%d", 222d5a08a60SJake Burkholder rqb->rqb_bits[i], i); 223d5a08a60SJake Burkholder return (1); 224dba6c5a6SPeter Wemm } 225d5a08a60SJake Burkholder CTR0(KTR_RUNQ, "runq_check: empty"); 226d5a08a60SJake Burkholder 227d5a08a60SJake Burkholder return (0); 228dba6c5a6SPeter Wemm } 229d5a08a60SJake Burkholder 230d5a08a60SJake Burkholder /* 231d5a08a60SJake Burkholder * Find and remove the highest priority process from the run queue. 232d5a08a60SJake Burkholder * If there are no runnable processes, the per-cpu idle process is 233d5a08a60SJake Burkholder * returned. Will not return NULL under any circumstances. 
234d5a08a60SJake Burkholder */ 235b40ce416SJulian Elischer struct kse * 236d5a08a60SJake Burkholder runq_choose(struct runq *rq) 237d5a08a60SJake Burkholder { 238d5a08a60SJake Burkholder struct rqhead *rqh; 239b40ce416SJulian Elischer struct kse *ke; 240d5a08a60SJake Burkholder int pri; 241d5a08a60SJake Burkholder 242d5a08a60SJake Burkholder mtx_assert(&sched_lock, MA_OWNED); 243d5a08a60SJake Burkholder if ((pri = runq_findbit(rq)) != -1) { 244d5a08a60SJake Burkholder rqh = &rq->rq_queues[pri]; 245b40ce416SJulian Elischer ke = TAILQ_FIRST(rqh); 246b40ce416SJulian Elischer KASSERT(ke != NULL, ("runq_choose: no proc on busy queue")); 247b40ce416SJulian Elischer KASSERT(ke->ke_proc->p_stat == SRUN, 248b40ce416SJulian Elischer ("runq_choose: process %d(%s) in state %d", ke->ke_proc->p_pid, 249b40ce416SJulian Elischer ke->ke_proc->p_comm, ke->ke_proc->p_stat)); 250b40ce416SJulian Elischer CTR3(KTR_RUNQ, "runq_choose: pri=%d kse=%p rqh=%p", pri, ke, rqh); 251b40ce416SJulian Elischer TAILQ_REMOVE(rqh, ke, ke_procq); 252d5a08a60SJake Burkholder if (TAILQ_EMPTY(rqh)) { 253d5a08a60SJake Burkholder CTR0(KTR_RUNQ, "runq_choose: empty"); 254d5a08a60SJake Burkholder runq_clrbit(rq, pri); 255d5a08a60SJake Burkholder } 256b40ce416SJulian Elischer ke->ke_flags &= ~KEF_ONRUNQ; 257b40ce416SJulian Elischer return (ke); 258d5a08a60SJake Burkholder } 259d5a08a60SJake Burkholder CTR1(KTR_RUNQ, "runq_choose: idleproc pri=%d", pri); 260d5a08a60SJake Burkholder 261b40ce416SJulian Elischer return (PCPU_GET(idlethread)->td_kse); 262d5a08a60SJake Burkholder } 263d5a08a60SJake Burkholder 264d5a08a60SJake Burkholder /* 265d5a08a60SJake Burkholder * Initialize a run structure. 
266d5a08a60SJake Burkholder */ 267d5a08a60SJake Burkholder void 268d5a08a60SJake Burkholder runq_init(struct runq *rq) 269d5a08a60SJake Burkholder { 270d5a08a60SJake Burkholder int i; 271d5a08a60SJake Burkholder 272f32ded2fSJake Burkholder bzero(rq, sizeof *rq); 273d5a08a60SJake Burkholder for (i = 0; i < RQ_NQS; i++) 274d5a08a60SJake Burkholder TAILQ_INIT(&rq->rq_queues[i]); 275d5a08a60SJake Burkholder } 276d5a08a60SJake Burkholder 277d5a08a60SJake Burkholder /* 278d5a08a60SJake Burkholder * Remove the process from the queue specified by its priority, and clear the 279d5a08a60SJake Burkholder * corresponding status bit if the queue becomes empty. 280d5a08a60SJake Burkholder */ 281d5a08a60SJake Burkholder void 282b40ce416SJulian Elischer runq_remove(struct runq *rq, struct kse *ke) 283d5a08a60SJake Burkholder { 284d5a08a60SJake Burkholder struct rqhead *rqh; 285d5a08a60SJake Burkholder int pri; 286d5a08a60SJake Burkholder 287b40ce416SJulian Elischer if (!(ke->ke_flags & KEF_ONRUNQ)) 288b40ce416SJulian Elischer return; 289d5a08a60SJake Burkholder mtx_assert(&sched_lock, MA_OWNED); 290b40ce416SJulian Elischer pri = ke->ke_rqindex; 291d5a08a60SJake Burkholder rqh = &rq->rq_queues[pri]; 292d5a08a60SJake Burkholder CTR4(KTR_RUNQ, "runq_remove: p=%p pri=%d %d rqh=%p", 2932c100766SJulian Elischer ke, ke->ke_thread->td_priority, pri, rqh); 294b40ce416SJulian Elischer KASSERT(ke != NULL, ("runq_remove: no proc on busy queue")); 295b40ce416SJulian Elischer TAILQ_REMOVE(rqh, ke, ke_procq); 296d5a08a60SJake Burkholder if (TAILQ_EMPTY(rqh)) { 297d5a08a60SJake Burkholder CTR0(KTR_RUNQ, "runq_remove: empty"); 298d5a08a60SJake Burkholder runq_clrbit(rq, pri); 299d5a08a60SJake Burkholder } 300b40ce416SJulian Elischer ke->ke_flags &= ~KEF_ONRUNQ; 301dba6c5a6SPeter Wemm } 302