144990b8cSJulian Elischer /* 244990b8cSJulian Elischer * Copyright (C) 2001 Julian Elischer <julian@freebsd.org>. 344990b8cSJulian Elischer * All rights reserved. 444990b8cSJulian Elischer * 544990b8cSJulian Elischer * Redistribution and use in source and binary forms, with or without 644990b8cSJulian Elischer * modification, are permitted provided that the following conditions 744990b8cSJulian Elischer * are met: 844990b8cSJulian Elischer * 1. Redistributions of source code must retain the above copyright 944990b8cSJulian Elischer * notice(s), this list of conditions and the following disclaimer as 1044990b8cSJulian Elischer * the first lines of this file unmodified other than the possible 1144990b8cSJulian Elischer * addition of one or more copyright notices. 1244990b8cSJulian Elischer * 2. Redistributions in binary form must reproduce the above copyright 1344990b8cSJulian Elischer * notice(s), this list of conditions and the following disclaimer in the 1444990b8cSJulian Elischer * documentation and/or other materials provided with the distribution. 1544990b8cSJulian Elischer * 1644990b8cSJulian Elischer * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) ``AS IS'' AND ANY 1744990b8cSJulian Elischer * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED 1844990b8cSJulian Elischer * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 1944990b8cSJulian Elischer * DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY 2044990b8cSJulian Elischer * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES 2144990b8cSJulian Elischer * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 2244990b8cSJulian Elischer * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 2344990b8cSJulian Elischer * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 2444990b8cSJulian Elischer * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 2544990b8cSJulian Elischer * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH 2644990b8cSJulian Elischer * DAMAGE. 2744990b8cSJulian Elischer */ 2844990b8cSJulian Elischer 29677b542eSDavid E. O'Brien #include <sys/cdefs.h> 30677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 31677b542eSDavid E. O'Brien 3244990b8cSJulian Elischer #include <sys/param.h> 3344990b8cSJulian Elischer #include <sys/systm.h> 3444990b8cSJulian Elischer #include <sys/kernel.h> 3544990b8cSJulian Elischer #include <sys/lock.h> 3644990b8cSJulian Elischer #include <sys/mutex.h> 3744990b8cSJulian Elischer #include <sys/proc.h> 3894e0a4cdSJulian Elischer #include <sys/smp.h> 3944990b8cSJulian Elischer #include <sys/sysctl.h> 40de028f5aSJeff Roberson #include <sys/sched.h> 4144f3b092SJohn Baldwin #include <sys/sleepqueue.h> 42961a7b24SJohn Baldwin #include <sys/turnstile.h> 4344990b8cSJulian Elischer #include <sys/ktr.h> 4444990b8cSJulian Elischer 4544990b8cSJulian Elischer #include <vm/vm.h> 4649a2507bSAlan Cox #include <vm/vm_extern.h> 4744990b8cSJulian Elischer #include <vm/uma.h> 4802fb42b0SPeter Wemm 4944990b8cSJulian Elischer /* 504f0db5e0SJulian Elischer * KSEGRP related storage. 
5144990b8cSJulian Elischer */ 524f0db5e0SJulian Elischer static uma_zone_t ksegrp_zone; 5344990b8cSJulian Elischer static uma_zone_t thread_zone; 5444990b8cSJulian Elischer 554f0db5e0SJulian Elischer /* DEBUG ONLY */ 5644990b8cSJulian Elischer SYSCTL_NODE(_kern, OID_AUTO, threads, CTLFLAG_RW, 0, "thread allocation"); 57696058c3SJulian Elischer static int thread_debug = 0; 58696058c3SJulian Elischer SYSCTL_INT(_kern_threads, OID_AUTO, debug, CTLFLAG_RW, 59696058c3SJulian Elischer &thread_debug, 0, "thread debug"); 60fdc5ecd2SDavid Xu 61345ad866SJulian Elischer int max_threads_per_proc = 1500; 62fdc5ecd2SDavid Xu SYSCTL_INT(_kern_threads, OID_AUTO, max_threads_per_proc, CTLFLAG_RW, 634f0db5e0SJulian Elischer &max_threads_per_proc, 0, "Limit on threads per proc"); 644f0db5e0SJulian Elischer 65ed062c8dSJulian Elischer int max_groups_per_proc = 1500; 66fdc5ecd2SDavid Xu SYSCTL_INT(_kern_threads, OID_AUTO, max_groups_per_proc, CTLFLAG_RW, 67fdc5ecd2SDavid Xu &max_groups_per_proc, 0, "Limit on thread groups per proc"); 68fdc5ecd2SDavid Xu 69345ad866SJulian Elischer int max_threads_hits; 700252d203SDavid Xu SYSCTL_INT(_kern_threads, OID_AUTO, max_threads_hits, CTLFLAG_RD, 710252d203SDavid Xu &max_threads_hits, 0, ""); 720252d203SDavid Xu 7394e0a4cdSJulian Elischer int virtual_cpu; 7494e0a4cdSJulian Elischer 7594e0a4cdSJulian Elischer #define RANGEOF(type, start, end) (offsetof(type, end) - offsetof(type, start)) 7644990b8cSJulian Elischer 775215b187SJeff Roberson TAILQ_HEAD(, thread) zombie_threads = TAILQ_HEAD_INITIALIZER(zombie_threads); 785c8329edSJulian Elischer TAILQ_HEAD(, ksegrp) zombie_ksegrps = TAILQ_HEAD_INITIALIZER(zombie_ksegrps); 795215b187SJeff Roberson struct mtx kse_zombie_lock; 805215b187SJeff Roberson MTX_SYSINIT(kse_zombie_lock, &kse_zombie_lock, "kse zombie lock", MTX_SPIN); 8144990b8cSJulian Elischer 8294e0a4cdSJulian Elischer static int 8394e0a4cdSJulian Elischer sysctl_kse_virtual_cpu(SYSCTL_HANDLER_ARGS) 8494e0a4cdSJulian Elischer { 
8594e0a4cdSJulian Elischer int error, new_val; 8694e0a4cdSJulian Elischer int def_val; 8794e0a4cdSJulian Elischer 8894e0a4cdSJulian Elischer def_val = mp_ncpus; 8994e0a4cdSJulian Elischer if (virtual_cpu == 0) 9094e0a4cdSJulian Elischer new_val = def_val; 9194e0a4cdSJulian Elischer else 9294e0a4cdSJulian Elischer new_val = virtual_cpu; 9394e0a4cdSJulian Elischer error = sysctl_handle_int(oidp, &new_val, 0, req); 9494e0a4cdSJulian Elischer if (error != 0 || req->newptr == NULL) 9594e0a4cdSJulian Elischer return (error); 9694e0a4cdSJulian Elischer if (new_val < 0) 9794e0a4cdSJulian Elischer return (EINVAL); 9894e0a4cdSJulian Elischer virtual_cpu = new_val; 9994e0a4cdSJulian Elischer return (0); 10094e0a4cdSJulian Elischer } 10194e0a4cdSJulian Elischer 10294e0a4cdSJulian Elischer /* DEBUG ONLY */ 10394e0a4cdSJulian Elischer SYSCTL_PROC(_kern_threads, OID_AUTO, virtual_cpu, CTLTYPE_INT|CTLFLAG_RW, 10494e0a4cdSJulian Elischer 0, sizeof(virtual_cpu), sysctl_kse_virtual_cpu, "I", 10594e0a4cdSJulian Elischer "debug virtual cpus"); 1065c8329edSJulian Elischer 10744990b8cSJulian Elischer /* 108fdcac928SMarcel Moolenaar * Thread ID allocator. The allocator keeps track of assigned IDs by 109fdcac928SMarcel Moolenaar * using a bitmap. The bitmap is created in parts. The parts are linked 110fdcac928SMarcel Moolenaar * together. 
*/
typedef u_long tid_bitmap_word;

#define	TID_IDS_PER_PART	1024	/* IDs tracked by one bitmap part */
#define	TID_IDS_PER_IDX		(sizeof(tid_bitmap_word) << 3)	/* bits per word */
#define	TID_BITMAP_SIZE		(TID_IDS_PER_PART / TID_IDS_PER_IDX)	/* words per part */
#define	TID_MIN			(PID_MAX + 1)	/* base ID of the first part */

/* One part of the TID bitmap; in bmp_bitmap a set bit means "free". */
struct tid_bitmap_part {
	STAILQ_ENTRY(tid_bitmap_part) bmp_next;
	tid_bitmap_word	bmp_bitmap[TID_BITMAP_SIZE];
	lwpid_t		bmp_base;	/* ID represented by bit 0 of word 0 */
	int		bmp_free;	/* count of free IDs in this part */
};

static STAILQ_HEAD(, tid_bitmap_part) tid_bitmap =
    STAILQ_HEAD_INITIALIZER(tid_bitmap);
static uma_zone_t tid_zone;

struct mtx tid_lock;
MTX_SYSINIT(tid_lock, &tid_lock, "TID lock", MTX_DEF);

/*
 * Prepare a thread for use.
 *
 * Zone constructor: marks the thread inactive, not on any CPU, and
 * starts it inside a critical section.  Always returns 0.
 */
static int
thread_ctor(void *mem, int size, void *arg, int flags)
{
	struct thread	*td;

	td = (struct thread *)mem;
	td->td_state = TDS_INACTIVE;
	td->td_oncpu = NOCPU;

	/*
	 * Note that td_critnest begins life as 1 because the thread is not
	 * running and is thereby implicitly waiting to be on the receiving
	 * end of a context switch.  A context switch must occur inside a
	 * critical section, and in fact, includes hand-off of the sched_lock.
	 * After a context switch to a newly created thread, it will release
	 * sched_lock for the first time, and its td_critnest will hit 0 for
	 * the first time.  This happens on the far end of a context switch,
	 * and when it context switches away from itself, it will in fact go
	 * back into a critical section, and hand off the sched lock to the
	 * next thread.
	 */
	td->td_critnest = 1;
	return (0);
}

/*
 * Reclaim a thread after use.
 *
 * Zone destructor.  With INVARIANTS, panics unless the thread is in
 * TDS_INACTIVE; afterwards the thread is passed to sched_newthread().
 */
static void
thread_dtor(void *mem, int size, void *arg)
{
	struct thread *td;

	td = (struct thread *)mem;

#ifdef INVARIANTS
	/* Verify that this thread is in a safe state to free. */
	switch (td->td_state) {
	case TDS_INHIBITED:
	case TDS_RUNNING:
	case TDS_CAN_RUN:
	case TDS_RUNQ:
		/*
		 * We must never unlink a thread that is in one of
		 * these states, because it is currently active.
		 */
		panic("bad state for thread unlinking");
		/* NOTREACHED */
	case TDS_INACTIVE:
		break;
	default:
		panic("bad thread state");
		/* NOTREACHED */
	}
#endif
	/*
	 * NOTE(review): presumably this resets the scheduler-private state
	 * so the cached item is ready for reuse -- confirm in the scheduler.
	 */
	sched_newthread(td);
}

/*
 * Initialize type-stable parts of a thread (when newly created).
 *
 * Assigns td_tid from the TID bitmap (appending a new bitmap part when
 * needed), then sets up the thread's VM resources, machine-dependent
 * state, sleep queue, turnstile and scheduler area.  Always returns 0.
 */
static int
thread_init(void *mem, int size, int flags)
{
	struct thread *td;
	struct tid_bitmap_part *bmp, *new;
	int bit, idx;

	td = (struct thread *)mem;

	/* Look for the first part that still has a free ID. */
	mtx_lock(&tid_lock);
	STAILQ_FOREACH(bmp, &tid_bitmap, bmp_next) {
		if (bmp->bmp_free)
			break;
	}
	/* Create a new bitmap if we run out of free bits. */
	if (bmp == NULL) {
		/*
		 * The lock is released around the M_WAITOK allocation
		 * (presumably because it may sleep), so the list is
		 * re-examined once the lock is held again.
		 */
		mtx_unlock(&tid_lock);
		new = uma_zalloc(tid_zone, M_WAITOK);
		mtx_lock(&tid_lock);
		bmp = STAILQ_LAST(&tid_bitmap, tid_bitmap_part, bmp_next);
		/*
		 * Append the new part only if the list is empty or the last
		 * part is less than half free; otherwise use the last part
		 * and release the unused allocation below.
		 */
		if (bmp == NULL || bmp->bmp_free < TID_IDS_PER_PART/2) {
			/* 1=free, 0=assigned. This way we can use ffsl(). */
			memset(new->bmp_bitmap, ~0U, sizeof(new->bmp_bitmap));
			new->bmp_base = (bmp == NULL) ? TID_MIN :
			    bmp->bmp_base + TID_IDS_PER_PART;
			new->bmp_free = TID_IDS_PER_PART;
			STAILQ_INSERT_TAIL(&tid_bitmap, new, bmp_next);
			bmp = new;
			new = NULL;	/* now owned by the list */
		}
	} else
		new = NULL;
	/* We have a bitmap with available IDs. */
	idx = 0;
	while (idx < TID_BITMAP_SIZE && bmp->bmp_bitmap[idx] == 0UL)
		idx++;
	/* ffsl() is 1-based; convert to a 0-based bit position. */
	bit = ffsl(bmp->bmp_bitmap[idx]) - 1;
	td->td_tid = bmp->bmp_base + idx * TID_IDS_PER_IDX + bit;
	/* Clear the bit: the ID is now assigned. */
	bmp->bmp_bitmap[idx] &= ~(1UL << bit);
	bmp->bmp_free--;
	mtx_unlock(&tid_lock);
	/* Release the spare part if it was not linked into the list. */
	if (new != NULL)
		uma_zfree(tid_zone, new);

	vm_thread_new(td, 0);
	cpu_thread_setup(td);
	td->td_sleepqueue = sleepq_alloc();
	td->td_turnstile = turnstile_alloc();
	/* The scheduler's per-thread area sits directly after the thread. */
	td->td_sched = (struct td_sched *)&td[1];
	sched_newthread(td);
	return (0);
}

/*
 * Tear down type-stable parts of a thread (just before being discarded).
25244990b8cSJulian Elischer */ 25344990b8cSJulian Elischer static void 25444990b8cSJulian Elischer thread_fini(void *mem, int size) 25544990b8cSJulian Elischer { 25644990b8cSJulian Elischer struct thread *td; 257247aba24SMarcel Moolenaar struct tid_bitmap_part *bmp; 258247aba24SMarcel Moolenaar lwpid_t tid; 259247aba24SMarcel Moolenaar int bit, idx; 26044990b8cSJulian Elischer 26144990b8cSJulian Elischer td = (struct thread *)mem; 262961a7b24SJohn Baldwin turnstile_free(td->td_turnstile); 26344f3b092SJohn Baldwin sleepq_free(td->td_sleepqueue); 26449a2507bSAlan Cox vm_thread_dispose(td); 265247aba24SMarcel Moolenaar 266247aba24SMarcel Moolenaar STAILQ_FOREACH(bmp, &tid_bitmap, bmp_next) { 267247aba24SMarcel Moolenaar if (td->td_tid >= bmp->bmp_base && 268247aba24SMarcel Moolenaar td->td_tid < bmp->bmp_base + TID_IDS_PER_PART) 269247aba24SMarcel Moolenaar break; 270247aba24SMarcel Moolenaar } 271247aba24SMarcel Moolenaar KASSERT(bmp != NULL, ("No TID bitmap?")); 272247aba24SMarcel Moolenaar mtx_lock(&tid_lock); 273247aba24SMarcel Moolenaar tid = td->td_tid - bmp->bmp_base; 274247aba24SMarcel Moolenaar idx = tid / TID_IDS_PER_IDX; 275247aba24SMarcel Moolenaar bit = 1UL << (tid % TID_IDS_PER_IDX); 276247aba24SMarcel Moolenaar bmp->bmp_bitmap[idx] |= bit; 277247aba24SMarcel Moolenaar bmp->bmp_free++; 278247aba24SMarcel Moolenaar mtx_unlock(&tid_lock); 27944990b8cSJulian Elischer } 2805215b187SJeff Roberson 281de028f5aSJeff Roberson /* 282de028f5aSJeff Roberson * Initialize type-stable parts of a ksegrp (when newly created). 
283de028f5aSJeff Roberson */ 284b23f72e9SBrian Feldman static int 285a9b5dc7dSJulian Elischer ksegrp_ctor(void *mem, int size, void *arg, int flags) 286de028f5aSJeff Roberson { 287de028f5aSJeff Roberson struct ksegrp *kg; 288de028f5aSJeff Roberson 289de028f5aSJeff Roberson kg = (struct ksegrp *)mem; 290a9b5dc7dSJulian Elischer bzero(mem, size); 291de028f5aSJeff Roberson kg->kg_sched = (struct kg_sched *)&kg[1]; 292b23f72e9SBrian Feldman return (0); 293de028f5aSJeff Roberson } 29444990b8cSJulian Elischer 2955c8329edSJulian Elischer void 2965c8329edSJulian Elischer ksegrp_link(struct ksegrp *kg, struct proc *p) 2975c8329edSJulian Elischer { 2985c8329edSJulian Elischer 2995c8329edSJulian Elischer TAILQ_INIT(&kg->kg_threads); 3005c8329edSJulian Elischer TAILQ_INIT(&kg->kg_runq); /* links with td_runq */ 3015c8329edSJulian Elischer TAILQ_INIT(&kg->kg_slpq); /* links with td_runq */ 3025215b187SJeff Roberson TAILQ_INIT(&kg->kg_upcalls); /* all upcall structure in ksegrp */ 3035c8329edSJulian Elischer kg->kg_proc = p; 3045215b187SJeff Roberson /* 3055215b187SJeff Roberson * the following counters are in the -zero- section 3065215b187SJeff Roberson * and may not need clearing 3075215b187SJeff Roberson */ 3085c8329edSJulian Elischer kg->kg_numthreads = 0; 3095c8329edSJulian Elischer kg->kg_runnable = 0; 3105215b187SJeff Roberson kg->kg_numupcalls = 0; 3115c8329edSJulian Elischer /* link it in now that it's consistent */ 3125c8329edSJulian Elischer p->p_numksegrps++; 3135c8329edSJulian Elischer TAILQ_INSERT_HEAD(&p->p_ksegrps, kg, kg_ksegrp); 3145c8329edSJulian Elischer } 3155c8329edSJulian Elischer 316ed062c8dSJulian Elischer /* 317ed062c8dSJulian Elischer * Called from: 318ed062c8dSJulian Elischer * thread-exit() 319ed062c8dSJulian Elischer */ 3205c8329edSJulian Elischer void 3215c8329edSJulian Elischer ksegrp_unlink(struct ksegrp *kg) 3225c8329edSJulian Elischer { 3235c8329edSJulian Elischer struct proc *p; 3245c8329edSJulian Elischer 3255c8329edSJulian Elischer 
mtx_assert(&sched_lock, MA_OWNED); 3265215b187SJeff Roberson KASSERT((kg->kg_numthreads == 0), ("ksegrp_unlink: residual threads")); 3275215b187SJeff Roberson KASSERT((kg->kg_numupcalls == 0), ("ksegrp_unlink: residual upcalls")); 3285215b187SJeff Roberson 3295c8329edSJulian Elischer p = kg->kg_proc; 3305c8329edSJulian Elischer TAILQ_REMOVE(&p->p_ksegrps, kg, kg_ksegrp); 3315c8329edSJulian Elischer p->p_numksegrps--; 3325c8329edSJulian Elischer /* 3335c8329edSJulian Elischer * Aggregate stats from the KSE 3345c8329edSJulian Elischer */ 3355c8329edSJulian Elischer } 3365c8329edSJulian Elischer 3375c8329edSJulian Elischer /* 3385215b187SJeff Roberson * For a newly created process, 3395215b187SJeff Roberson * link up all the structures and its initial threads etc. 340ed062c8dSJulian Elischer * called from: 341ed062c8dSJulian Elischer * {arch}/{arch}/machdep.c ia64_init(), init386() etc. 342ed062c8dSJulian Elischer * proc_dtor() (should go away) 343ed062c8dSJulian Elischer * proc_init() 3445c8329edSJulian Elischer */ 3455c8329edSJulian Elischer void 346ed062c8dSJulian Elischer proc_linkup(struct proc *p, struct ksegrp *kg, struct thread *td) 3475c8329edSJulian Elischer { 3485c8329edSJulian Elischer 3495c8329edSJulian Elischer TAILQ_INIT(&p->p_ksegrps); /* all ksegrps in proc */ 3505c8329edSJulian Elischer TAILQ_INIT(&p->p_threads); /* all threads in proc */ 3515c8329edSJulian Elischer TAILQ_INIT(&p->p_suspended); /* Threads suspended */ 3525c8329edSJulian Elischer p->p_numksegrps = 0; 3535c8329edSJulian Elischer p->p_numthreads = 0; 3545c8329edSJulian Elischer 3555c8329edSJulian Elischer ksegrp_link(kg, p); 3565c8329edSJulian Elischer thread_link(td, kg); 3575c8329edSJulian Elischer } 3585c8329edSJulian Elischer 3595c8329edSJulian Elischer /* 36044990b8cSJulian Elischer * Initialize global thread allocation resources. 
*/
void
threadinit(void)
{

	/* Thread items use all four zone hooks defined in this file. */
	thread_zone = uma_zcreate("THREAD", sched_sizeof_thread(),
	    thread_ctor, thread_dtor, thread_init, thread_fini,
	    UMA_ALIGN_CACHE, 0);
	/* Backing store for the parts of the thread ID bitmap. */
	tid_zone = uma_zcreate("TID", sizeof(struct tid_bitmap_part),
	    NULL, NULL, NULL, NULL, UMA_ALIGN_CACHE, 0);
	/* Ksegrp items only need a constructor. */
	ksegrp_zone = uma_zcreate("KSEGRP", sched_sizeof_ksegrp(),
	    ksegrp_ctor, NULL, NULL, NULL,
	    UMA_ALIGN_CACHE, 0);
	kseinit();	/* set up kse specific stuff  e.g. upcall zone*/
}

/*
 * Stash an embarrassingly extra thread into the zombie thread queue.
 * The thread is queued through its td_runq linkage under kse_zombie_lock.
 */
void
thread_stash(struct thread *td)
{
	mtx_lock_spin(&kse_zombie_lock);
	TAILQ_INSERT_HEAD(&zombie_threads, td, td_runq);
	mtx_unlock_spin(&kse_zombie_lock);
}

/*
 * Stash an embarrassingly extra ksegrp into the zombie ksegrp queue.
3905c8329edSJulian Elischer */ 3915c8329edSJulian Elischer void 3925c8329edSJulian Elischer ksegrp_stash(struct ksegrp *kg) 3935c8329edSJulian Elischer { 3945215b187SJeff Roberson mtx_lock_spin(&kse_zombie_lock); 3955c8329edSJulian Elischer TAILQ_INSERT_HEAD(&zombie_ksegrps, kg, kg_ksegrp); 3965215b187SJeff Roberson mtx_unlock_spin(&kse_zombie_lock); 3975c8329edSJulian Elischer } 3985c8329edSJulian Elischer 3995c8329edSJulian Elischer /* 4005215b187SJeff Roberson * Reap zombie kse resource. 40144990b8cSJulian Elischer */ 40244990b8cSJulian Elischer void 40344990b8cSJulian Elischer thread_reap(void) 40444990b8cSJulian Elischer { 4055c8329edSJulian Elischer struct thread *td_first, *td_next; 4065c8329edSJulian Elischer struct ksegrp *kg_first, * kg_next; 40744990b8cSJulian Elischer 40844990b8cSJulian Elischer /* 4095215b187SJeff Roberson * Don't even bother to lock if none at this instant, 4105215b187SJeff Roberson * we really don't care about the next instant.. 41144990b8cSJulian Elischer */ 4125c8329edSJulian Elischer if ((!TAILQ_EMPTY(&zombie_threads)) 413345ad866SJulian Elischer || (!TAILQ_EMPTY(&zombie_ksegrps))) { 4145215b187SJeff Roberson mtx_lock_spin(&kse_zombie_lock); 4155c8329edSJulian Elischer td_first = TAILQ_FIRST(&zombie_threads); 4165c8329edSJulian Elischer kg_first = TAILQ_FIRST(&zombie_ksegrps); 4175c8329edSJulian Elischer if (td_first) 4185c8329edSJulian Elischer TAILQ_INIT(&zombie_threads); 4195c8329edSJulian Elischer if (kg_first) 4205c8329edSJulian Elischer TAILQ_INIT(&zombie_ksegrps); 4215215b187SJeff Roberson mtx_unlock_spin(&kse_zombie_lock); 4225c8329edSJulian Elischer while (td_first) { 4235c8329edSJulian Elischer td_next = TAILQ_NEXT(td_first, td_runq); 4245215b187SJeff Roberson if (td_first->td_ucred) 4255215b187SJeff Roberson crfree(td_first->td_ucred); 4265c8329edSJulian Elischer thread_free(td_first); 4275c8329edSJulian Elischer td_first = td_next; 42844990b8cSJulian Elischer } 4295c8329edSJulian Elischer while (kg_first) { 
4305c8329edSJulian Elischer kg_next = TAILQ_NEXT(kg_first, kg_ksegrp); 4315c8329edSJulian Elischer ksegrp_free(kg_first); 4325c8329edSJulian Elischer kg_first = kg_next; 4335c8329edSJulian Elischer } 434ed062c8dSJulian Elischer /* 435ed062c8dSJulian Elischer * there will always be a thread on the list if one of these 436ed062c8dSJulian Elischer * is there. 437ed062c8dSJulian Elischer */ 438345ad866SJulian Elischer kse_GC(); 43944990b8cSJulian Elischer } 440ed062c8dSJulian Elischer } 44144990b8cSJulian Elischer 44244990b8cSJulian Elischer /* 4434f0db5e0SJulian Elischer * Allocate a ksegrp. 4444f0db5e0SJulian Elischer */ 4454f0db5e0SJulian Elischer struct ksegrp * 4464f0db5e0SJulian Elischer ksegrp_alloc(void) 4474f0db5e0SJulian Elischer { 448a163d034SWarner Losh return (uma_zalloc(ksegrp_zone, M_WAITOK)); 4494f0db5e0SJulian Elischer } 4504f0db5e0SJulian Elischer 4514f0db5e0SJulian Elischer /* 45244990b8cSJulian Elischer * Allocate a thread. 45344990b8cSJulian Elischer */ 45444990b8cSJulian Elischer struct thread * 45544990b8cSJulian Elischer thread_alloc(void) 45644990b8cSJulian Elischer { 45744990b8cSJulian Elischer thread_reap(); /* check if any zombies to get */ 458a163d034SWarner Losh return (uma_zalloc(thread_zone, M_WAITOK)); 45944990b8cSJulian Elischer } 46044990b8cSJulian Elischer 46144990b8cSJulian Elischer /* 4624f0db5e0SJulian Elischer * Deallocate a ksegrp. 4634f0db5e0SJulian Elischer */ 4644f0db5e0SJulian Elischer void 4654f0db5e0SJulian Elischer ksegrp_free(struct ksegrp *td) 4664f0db5e0SJulian Elischer { 4674f0db5e0SJulian Elischer uma_zfree(ksegrp_zone, td); 4684f0db5e0SJulian Elischer } 4694f0db5e0SJulian Elischer 4704f0db5e0SJulian Elischer /* 47144990b8cSJulian Elischer * Deallocate a thread. 
*/
void
thread_free(struct thread *td)
{

	/* Machine-dependent cleanup first, then return the item to its zone. */
	cpu_thread_clean(td);
	uma_zfree(thread_zone, td);
}

/*
 * Discard the current thread and exit from its context.
 * Always called with scheduler locked.
 *
 * Because we can't free a thread while we're operating under its context,
 * push the current thread into our CPU's deadthread holder. This means
 * we needn't worry about someone else grabbing our context before we
 * do a cpu_throw().  This may not be needed now as we are under schedlock.
 * Maybe we can just do a thread_stash() as thr_exit1 does.
 */
/*  XXX
 * libthr expects its thread exit to return for the last
 * thread, meaning that the program is back to non-threaded
 * mode I guess. Because we do this (cpu_throw) unconditionally
 * here, they have their own version of it. (thr_exit1())
 * that doesn't do it all if this was the last thread.
 * It is also called from thread_suspend_check().
 * Of course in the end, they end up coming here through exit1
 * anyhow..  After fixing 'thr' to play by the rules we should be able
 * to merge these two functions together.
 *
 * called from:
 * exit1()
 * kse_exit()
 * thr_exit()
 * thread_user_enter()
 * thread_userret()
 * thread_suspend_check()
 */
void
thread_exit(void)
{
	struct thread *td;
	struct proc *p;
	struct ksegrp	*kg;

	td = curthread;
	kg = td->td_ksegrp;
	p = td->td_proc;

	/* Entry contract: sched_lock and the proc lock held, Giant not held. */
	mtx_assert(&sched_lock, MA_OWNED);
	mtx_assert(&Giant, MA_NOTOWNED);
	PROC_LOCK_ASSERT(p, MA_OWNED);
	KASSERT(p != NULL, ("thread exiting without a process"));
	KASSERT(kg != NULL, ("thread exiting without a kse group"));
	CTR3(KTR_PROC, "thread_exit: thread %p (pid %ld, %s)", td,
	    (long)p->p_pid, p->p_comm);

	if (td->td_standin != NULL) {
		/*
		 * Note that we don't need to free the cred here as it
		 * is done in thread_reap().
		 */
		thread_stash(td->td_standin);
		td->td_standin = NULL;
	}

	/*
	 * drop FPU & debug register state storage, or any other
	 * architecture specific resources that
	 * would not be on a new untouched process.
	 */
	cpu_thread_exit(td);	/* XXXSMP */

	/*
	 * The thread is exiting. scheduler can release its stuff
	 * and collect stats etc.
	 */
	sched_thread_exit(td);

	/*
	 * The last thread is left attached to the process
	 * So that the whole bundle gets recycled. Skip
	 * all this stuff if we never had threads.
	 * EXIT clears all sign of other threads when
	 * it goes to single threading, so the last thread always
	 * takes the short path.
	 */
	if (p->p_flag & P_HADTHREADS) {
		if (p->p_numthreads > 1) {
			thread_unlink(td);

			/* XXX first arg not used in 4BSD or ULE */
			sched_exit_thread(FIRST_THREAD_IN_PROC(p), td);

			/*
			 * as we are exiting there is room for another
			 * to be created.
			 */
			if (p->p_maxthrwaits)
				wakeup(&p->p_numthreads);

			/*
			 * The test below is NOT true if we are the
			 * sole exiting thread. P_STOPPED_SINGLE is unset
			 * in exit1() after it is the only survivor.
			 */
			if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) {
				if (p->p_numthreads == p->p_suspcount) {
					thread_unsuspend_one(p->p_singlethread);
				}
			}

			/*
			 * Because each upcall structure has an owner thread,
			 * owner thread exits only when process is in exiting
			 * state, so upcall to userland is no longer needed,
			 * deleting upcall structure is safe here.
			 * So when all threads in a group have exited, all
			 * upcalls in the group should be automatically freed.
			 *  XXXKSE This is a KSE thing and should be exported
			 * there somehow.
			 */
			upcall_remove(td);

			/*
			 * If the thread we unlinked above was the last one,
			 * then this ksegrp should go away too.
			 */
			if (kg->kg_numthreads == 0) {
				/*
				 * let the scheduler know about this in case
				 * it needs to recover stats or resources.
				 * Theoretically we could let
				 * sched_exit_ksegrp() do the equivalent of
				 * setting the concurrency to 0
				 * but don't do it yet to avoid changing
				 * the existing scheduler code until we
				 * are ready.
				 * We supply a random other ksegrp
				 * as the recipient of any built up
				 * cpu usage etc. (If the scheduler wants it).
				 * XXXKSE
				 * This is probably not fair so think of
				 * a better answer.
				 */
				sched_exit_ksegrp(FIRST_KSEGRP_IN_PROC(p), td);
				sched_set_concurrency(kg, 0); /* XXX TEMP */
				ksegrp_unlink(kg);
				ksegrp_stash(kg);
			}
			PROC_UNLOCK(p);
			td->td_ksegrp	= NULL;
			/* Park ourselves in this CPU's deadthread slot. */
			PCPU_SET(deadthread, td);
		} else {
			/*
			 * The last thread is exiting.. but not through exit()
			 * what should we do?
			 * Theoretically this can't happen
			 * exit1() - clears threading flags before coming here
			 * kse_exit() - treats last thread specially
			 * thr_exit() - treats last thread specially
			 * thread_user_enter() - only if more exist
			 * thread_userret() - only if more exist
			 * thread_suspend_check() - only if more exist
			 */
			panic ("thread_exit: Last thread exiting on its own");
		}
	} else {
		/*
		 * non threaded process comes here.
		 * This includes an EX threaded process that is coming
		 * here via exit1(). (exit1 dethreads the proc first).
		 */
		PROC_UNLOCK(p);
	}
	td->td_state = TDS_INACTIVE;
	CTR1(KTR_PROC, "thread_exit: cpu_throw() thread %p", td);
	/* Switch away for good; control is not expected to come back. */
	cpu_throw(td, choosethread());
	panic("I'm a teapot!");
	/* NOTREACHED */
}

/*
 * Do any thread specific cleanups that may be needed in wait()
 * called with Giant, proc and schedlock not held.
657696058c3SJulian Elischer */ 658696058c3SJulian Elischer void 659696058c3SJulian Elischer thread_wait(struct proc *p) 660696058c3SJulian Elischer { 661696058c3SJulian Elischer struct thread *td; 662696058c3SJulian Elischer 66337814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 66485495c72SJens Schweikhardt KASSERT((p->p_numthreads == 1), ("Multiple threads in wait1()")); 66585495c72SJens Schweikhardt KASSERT((p->p_numksegrps == 1), ("Multiple ksegrps in wait1()")); 666696058c3SJulian Elischer FOREACH_THREAD_IN_PROC(p, td) { 667696058c3SJulian Elischer if (td->td_standin != NULL) { 668ed062c8dSJulian Elischer crfree(td->td_ucred); 669ed062c8dSJulian Elischer td->td_ucred = NULL; 670696058c3SJulian Elischer thread_free(td->td_standin); 671696058c3SJulian Elischer td->td_standin = NULL; 672696058c3SJulian Elischer } 673696058c3SJulian Elischer cpu_thread_clean(td); 674ed062c8dSJulian Elischer crfree(td->td_ucred); 675696058c3SJulian Elischer } 676696058c3SJulian Elischer thread_reap(); /* check for zombie threads etc. */ 677696058c3SJulian Elischer } 678696058c3SJulian Elischer 679696058c3SJulian Elischer /* 68044990b8cSJulian Elischer * Link a thread to a process. 6811faf202eSJulian Elischer * set up anything that needs to be initialized for it to 6821faf202eSJulian Elischer * be used by the process. 68344990b8cSJulian Elischer * 68444990b8cSJulian Elischer * Note that we do not link to the proc's ucred here. 68544990b8cSJulian Elischer * The thread is linked as if running but no KSE assigned. 
686ed062c8dSJulian Elischer * Called from: 687ed062c8dSJulian Elischer * proc_linkup() 688ed062c8dSJulian Elischer * thread_schedule_upcall() 689ed062c8dSJulian Elischer * thr_create() 69044990b8cSJulian Elischer */ 69144990b8cSJulian Elischer void 69244990b8cSJulian Elischer thread_link(struct thread *td, struct ksegrp *kg) 69344990b8cSJulian Elischer { 69444990b8cSJulian Elischer struct proc *p; 69544990b8cSJulian Elischer 69644990b8cSJulian Elischer p = kg->kg_proc; 69771fad9fdSJulian Elischer td->td_state = TDS_INACTIVE; 69844990b8cSJulian Elischer td->td_proc = p; 69944990b8cSJulian Elischer td->td_ksegrp = kg; 7005215b187SJeff Roberson td->td_flags = 0; 7014fc21c09SDaniel Eischen td->td_kflags = 0; 70244990b8cSJulian Elischer 7031faf202eSJulian Elischer LIST_INIT(&td->td_contested); 704c06eb4e2SSam Leffler callout_init(&td->td_slpcallout, CALLOUT_MPSAFE); 70544990b8cSJulian Elischer TAILQ_INSERT_HEAD(&p->p_threads, td, td_plist); 70644990b8cSJulian Elischer TAILQ_INSERT_HEAD(&kg->kg_threads, td, td_kglist); 70744990b8cSJulian Elischer p->p_numthreads++; 70844990b8cSJulian Elischer kg->kg_numthreads++; 70944990b8cSJulian Elischer } 71044990b8cSJulian Elischer 711ed062c8dSJulian Elischer /* 712e5bedcefSJulian Elischer * Convert a process with one thread to an unthreaded process. 
713e5bedcefSJulian Elischer * Called from: 714e5bedcefSJulian Elischer * thread_single(exit) (called from execve and exit) 715e5bedcefSJulian Elischer * kse_exit() XXX may need cleaning up wrt KSE stuff 716e5bedcefSJulian Elischer */ 717e5bedcefSJulian Elischer void 718e5bedcefSJulian Elischer thread_unthread(struct thread *td) 719e5bedcefSJulian Elischer { 720e5bedcefSJulian Elischer struct proc *p = td->td_proc; 721e5bedcefSJulian Elischer 722e5bedcefSJulian Elischer KASSERT((p->p_numthreads == 1), ("Unthreading with >1 threads")); 723e5bedcefSJulian Elischer upcall_remove(td); 724e5bedcefSJulian Elischer p->p_flag &= ~(P_SA|P_HADTHREADS); 725e5bedcefSJulian Elischer td->td_mailbox = NULL; 726e5bedcefSJulian Elischer td->td_pflags &= ~(TDP_SA | TDP_CAN_UNBIND); 727e5bedcefSJulian Elischer if (td->td_standin != NULL) { 728e5bedcefSJulian Elischer thread_stash(td->td_standin); 729e5bedcefSJulian Elischer td->td_standin = NULL; 730e5bedcefSJulian Elischer } 731e5bedcefSJulian Elischer sched_set_concurrency(td->td_ksegrp, 1); 732e5bedcefSJulian Elischer } 733e5bedcefSJulian Elischer 734e5bedcefSJulian Elischer /* 735ed062c8dSJulian Elischer * Called from: 736ed062c8dSJulian Elischer * thread_exit() 737ed062c8dSJulian Elischer */ 738d3a0bd78SJulian Elischer void 739d3a0bd78SJulian Elischer thread_unlink(struct thread *td) 740d3a0bd78SJulian Elischer { 741d3a0bd78SJulian Elischer struct proc *p = td->td_proc; 742d3a0bd78SJulian Elischer struct ksegrp *kg = td->td_ksegrp; 743d3a0bd78SJulian Elischer 744112afcb2SJohn Baldwin mtx_assert(&sched_lock, MA_OWNED); 745d3a0bd78SJulian Elischer TAILQ_REMOVE(&p->p_threads, td, td_plist); 746d3a0bd78SJulian Elischer p->p_numthreads--; 747d3a0bd78SJulian Elischer TAILQ_REMOVE(&kg->kg_threads, td, td_kglist); 748d3a0bd78SJulian Elischer kg->kg_numthreads--; 749d3a0bd78SJulian Elischer /* could clear a few other things here */ 750ed062c8dSJulian Elischer /* Must NOT clear links to proc and ksegrp! 
*/ 7515c8329edSJulian Elischer } 7525c8329edSJulian Elischer 7535215b187SJeff Roberson /* 75444990b8cSJulian Elischer * Enforce single-threading. 75544990b8cSJulian Elischer * 75644990b8cSJulian Elischer * Returns 1 if the caller must abort (another thread is waiting to 75744990b8cSJulian Elischer * exit the process or similar). Process is locked! 75844990b8cSJulian Elischer * Returns 0 when you are successfully the only thread running. 75944990b8cSJulian Elischer * A process has successfully single threaded in the suspend mode when 76044990b8cSJulian Elischer * There are no threads in user mode. Threads in the kernel must be 76144990b8cSJulian Elischer * allowed to continue until they get to the user boundary. They may even 76244990b8cSJulian Elischer * copy out their return values and data before suspending. They may however be 76344990b8cSJulian Elischer * accellerated in reaching the user boundary as we will wake up 76444990b8cSJulian Elischer * any sleeping threads that are interruptable. (PCATCH). 76544990b8cSJulian Elischer */ 76644990b8cSJulian Elischer int 767906ac69dSDavid Xu thread_single(int mode) 76844990b8cSJulian Elischer { 76944990b8cSJulian Elischer struct thread *td; 77044990b8cSJulian Elischer struct thread *td2; 77144990b8cSJulian Elischer struct proc *p; 772ec008e96SDavid Xu int remaining; 77344990b8cSJulian Elischer 77444990b8cSJulian Elischer td = curthread; 77544990b8cSJulian Elischer p = td->td_proc; 77637814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 77744990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 77844990b8cSJulian Elischer KASSERT((td != NULL), ("curthread is NULL")); 77944990b8cSJulian Elischer 780ed062c8dSJulian Elischer if ((p->p_flag & P_HADTHREADS) == 0) 78144990b8cSJulian Elischer return (0); 78244990b8cSJulian Elischer 783e3b9bf71SJulian Elischer /* Is someone already single threading? 
*/ 784906ac69dSDavid Xu if (p->p_singlethread != NULL && p->p_singlethread != td) 78544990b8cSJulian Elischer return (1); 78644990b8cSJulian Elischer 787906ac69dSDavid Xu if (mode == SINGLE_EXIT) { 788906ac69dSDavid Xu p->p_flag |= P_SINGLE_EXIT; 789906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_BOUNDARY; 790906ac69dSDavid Xu } else { 791906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_EXIT; 792906ac69dSDavid Xu if (mode == SINGLE_BOUNDARY) 793906ac69dSDavid Xu p->p_flag |= P_SINGLE_BOUNDARY; 794906ac69dSDavid Xu else 795906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_BOUNDARY; 796906ac69dSDavid Xu } 7971279572aSDavid Xu p->p_flag |= P_STOPPED_SINGLE; 79871fad9fdSJulian Elischer mtx_lock_spin(&sched_lock); 799112afcb2SJohn Baldwin p->p_singlethread = td; 800906ac69dSDavid Xu if (mode == SINGLE_EXIT) 801ec008e96SDavid Xu remaining = p->p_numthreads; 802906ac69dSDavid Xu else if (mode == SINGLE_BOUNDARY) 803906ac69dSDavid Xu remaining = p->p_numthreads - p->p_boundary_count; 804906ac69dSDavid Xu else 805ec008e96SDavid Xu remaining = p->p_numthreads - p->p_suspcount; 806ec008e96SDavid Xu while (remaining != 1) { 80744990b8cSJulian Elischer FOREACH_THREAD_IN_PROC(p, td2) { 80844990b8cSJulian Elischer if (td2 == td) 80944990b8cSJulian Elischer continue; 810588257e8SDavid Xu td2->td_flags |= TDF_ASTPENDING; 81171fad9fdSJulian Elischer if (TD_IS_INHIBITED(td2)) { 812906ac69dSDavid Xu switch (mode) { 813906ac69dSDavid Xu case SINGLE_EXIT: 814cbf4e354SDavid Xu if (td->td_flags & TDF_DBSUSPEND) 815cbf4e354SDavid Xu td->td_flags &= ~TDF_DBSUSPEND; 816906ac69dSDavid Xu if (TD_IS_SUSPENDED(td2)) 81771fad9fdSJulian Elischer thread_unsuspend_one(td2); 81833862f40SDavid Xu if (TD_ON_SLEEPQ(td2) && 819906ac69dSDavid Xu (td2->td_flags & TDF_SINTR)) 82044f3b092SJohn Baldwin sleepq_abort(td2); 821906ac69dSDavid Xu break; 822906ac69dSDavid Xu case SINGLE_BOUNDARY: 823906ac69dSDavid Xu if (TD_IS_SUSPENDED(td2) && 824906ac69dSDavid Xu !(td2->td_flags & TDF_BOUNDARY)) 825906ac69dSDavid Xu 
thread_unsuspend_one(td2); 826906ac69dSDavid Xu if (TD_ON_SLEEPQ(td2) && 827906ac69dSDavid Xu (td2->td_flags & TDF_SINTR)) 828906ac69dSDavid Xu sleepq_abort(td2); 829906ac69dSDavid Xu break; 830906ac69dSDavid Xu default: 8319d102777SJulian Elischer if (TD_IS_SUSPENDED(td2)) 8329d102777SJulian Elischer continue; 8335215b187SJeff Roberson /* 8345215b187SJeff Roberson * maybe other inhibitted states too? 8355215b187SJeff Roberson * XXXKSE Is it totally safe to 8365215b187SJeff Roberson * suspend a non-interruptable thread? 8375215b187SJeff Roberson */ 83893a7aa79SJulian Elischer if (td2->td_inhibitors & 8395215b187SJeff Roberson (TDI_SLEEPING | TDI_SWAPPED)) 8409d102777SJulian Elischer thread_suspend_one(td2); 841906ac69dSDavid Xu break; 84244990b8cSJulian Elischer } 84344990b8cSJulian Elischer } 8449d102777SJulian Elischer } 845906ac69dSDavid Xu if (mode == SINGLE_EXIT) 846ec008e96SDavid Xu remaining = p->p_numthreads; 847906ac69dSDavid Xu else if (mode == SINGLE_BOUNDARY) 848906ac69dSDavid Xu remaining = p->p_numthreads - p->p_boundary_count; 849ec008e96SDavid Xu else 850ec008e96SDavid Xu remaining = p->p_numthreads - p->p_suspcount; 851ec008e96SDavid Xu 8529d102777SJulian Elischer /* 8539d102777SJulian Elischer * Maybe we suspended some threads.. was it enough? 8549d102777SJulian Elischer */ 855ec008e96SDavid Xu if (remaining == 1) 8569d102777SJulian Elischer break; 8579d102777SJulian Elischer 85844990b8cSJulian Elischer /* 85944990b8cSJulian Elischer * Wake us up when everyone else has suspended. 860e3b9bf71SJulian Elischer * In the mean time we suspend as well. 
86144990b8cSJulian Elischer */ 86271fad9fdSJulian Elischer thread_suspend_one(td); 86344990b8cSJulian Elischer PROC_UNLOCK(p); 864bf0acc27SJohn Baldwin mi_switch(SW_VOL, NULL); 86544990b8cSJulian Elischer mtx_unlock_spin(&sched_lock); 86644990b8cSJulian Elischer PROC_LOCK(p); 867112afcb2SJohn Baldwin mtx_lock_spin(&sched_lock); 868906ac69dSDavid Xu if (mode == SINGLE_EXIT) 869ec008e96SDavid Xu remaining = p->p_numthreads; 870906ac69dSDavid Xu else if (mode == SINGLE_BOUNDARY) 871906ac69dSDavid Xu remaining = p->p_numthreads - p->p_boundary_count; 872ec008e96SDavid Xu else 873ec008e96SDavid Xu remaining = p->p_numthreads - p->p_suspcount; 87444990b8cSJulian Elischer } 875906ac69dSDavid Xu if (mode == SINGLE_EXIT) { 87691599697SJulian Elischer /* 87791599697SJulian Elischer * We have gotten rid of all the other threads and we 87891599697SJulian Elischer * are about to either exit or exec. In either case, 87991599697SJulian Elischer * we try our utmost to revert to being a non-threaded 88091599697SJulian Elischer * process. 88191599697SJulian Elischer */ 882ed062c8dSJulian Elischer p->p_singlethread = NULL; 883e5bedcefSJulian Elischer p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT); 884e5bedcefSJulian Elischer thread_unthread(td); 88591599697SJulian Elischer } 886112afcb2SJohn Baldwin mtx_unlock_spin(&sched_lock); 88744990b8cSJulian Elischer return (0); 88844990b8cSJulian Elischer } 88944990b8cSJulian Elischer 89044990b8cSJulian Elischer /* 89144990b8cSJulian Elischer * Called in from locations that can safely check to see 89244990b8cSJulian Elischer * whether we have to suspend or at least throttle for a 89344990b8cSJulian Elischer * single-thread event (e.g. fork). 89444990b8cSJulian Elischer * 89544990b8cSJulian Elischer * Such locations include userret(). 89644990b8cSJulian Elischer * If the "return_instead" argument is non zero, the thread must be able to 89744990b8cSJulian Elischer * accept 0 (caller may continue), or 1 (caller must abort) as a result. 
89844990b8cSJulian Elischer * 89944990b8cSJulian Elischer * The 'return_instead' argument tells the function if it may do a 90044990b8cSJulian Elischer * thread_exit() or suspend, or whether the caller must abort and back 90144990b8cSJulian Elischer * out instead. 90244990b8cSJulian Elischer * 90344990b8cSJulian Elischer * If the thread that set the single_threading request has set the 90444990b8cSJulian Elischer * P_SINGLE_EXIT bit in the process flags then this call will never return 90544990b8cSJulian Elischer * if 'return_instead' is false, but will exit. 90644990b8cSJulian Elischer * 90744990b8cSJulian Elischer * P_SINGLE_EXIT | return_instead == 0| return_instead != 0 90844990b8cSJulian Elischer *---------------+--------------------+--------------------- 90944990b8cSJulian Elischer * 0 | returns 0 | returns 0 or 1 91044990b8cSJulian Elischer * | when ST ends | immediatly 91144990b8cSJulian Elischer *---------------+--------------------+--------------------- 91244990b8cSJulian Elischer * 1 | thread exits | returns 1 91344990b8cSJulian Elischer * | | immediatly 91444990b8cSJulian Elischer * 0 = thread_exit() or suspension ok, 91544990b8cSJulian Elischer * other = return error instead of stopping the thread. 91644990b8cSJulian Elischer * 91744990b8cSJulian Elischer * While a full suspension is under effect, even a single threading 91844990b8cSJulian Elischer * thread would be suspended if it made this call (but it shouldn't). 91944990b8cSJulian Elischer * This call should only be made from places where 92044990b8cSJulian Elischer * thread_exit() would be safe as that may be the outcome unless 92144990b8cSJulian Elischer * return_instead is set. 
92244990b8cSJulian Elischer */ 92344990b8cSJulian Elischer int 92444990b8cSJulian Elischer thread_suspend_check(int return_instead) 92544990b8cSJulian Elischer { 926ecafb24bSJuli Mallett struct thread *td; 927ecafb24bSJuli Mallett struct proc *p; 92844990b8cSJulian Elischer 92944990b8cSJulian Elischer td = curthread; 93044990b8cSJulian Elischer p = td->td_proc; 93137814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 93244990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 933cbf4e354SDavid Xu while (P_SHOULDSTOP(p) || 934cbf4e354SDavid Xu ((p->p_flag & P_TRACED) && (td->td_flags & TDF_DBSUSPEND))) { 9351279572aSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 93644990b8cSJulian Elischer KASSERT(p->p_singlethread != NULL, 93744990b8cSJulian Elischer ("singlethread not set")); 93844990b8cSJulian Elischer /* 939e3b9bf71SJulian Elischer * The only suspension in action is a 940e3b9bf71SJulian Elischer * single-threading. Single threader need not stop. 941b6d5995eSJulian Elischer * XXX Should be safe to access unlocked 942b6d5995eSJulian Elischer * as it can only be set to be true by us. 94344990b8cSJulian Elischer */ 944e3b9bf71SJulian Elischer if (p->p_singlethread == td) 94544990b8cSJulian Elischer return (0); /* Exempt from stopping. */ 94644990b8cSJulian Elischer } 94745a4bfa1SDavid Xu if ((p->p_flag & P_SINGLE_EXIT) && return_instead) 94844990b8cSJulian Elischer return (1); 94944990b8cSJulian Elischer 950906ac69dSDavid Xu /* Should we goto user boundary if we didn't come from there? */ 951906ac69dSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE && 952906ac69dSDavid Xu (p->p_flag & P_SINGLE_BOUNDARY) && return_instead) 953906ac69dSDavid Xu return (1); 954906ac69dSDavid Xu 955e574e444SDavid Xu mtx_lock_spin(&sched_lock); 956e574e444SDavid Xu thread_stopped(p); 95744990b8cSJulian Elischer /* 95844990b8cSJulian Elischer * If the process is waiting for us to exit, 95944990b8cSJulian Elischer * this thread should just suicide. 
9601279572aSDavid Xu * Assumes that P_SINGLE_EXIT implies P_STOPPED_SINGLE. 96144990b8cSJulian Elischer */ 962906ac69dSDavid Xu if ((p->p_flag & P_SINGLE_EXIT) && (p->p_singlethread != td)) 96344990b8cSJulian Elischer thread_exit(); 96444990b8cSJulian Elischer 96544990b8cSJulian Elischer /* 96644990b8cSJulian Elischer * When a thread suspends, it just 96744990b8cSJulian Elischer * moves to the processes's suspend queue 96844990b8cSJulian Elischer * and stays there. 96944990b8cSJulian Elischer */ 97071fad9fdSJulian Elischer thread_suspend_one(td); 971906ac69dSDavid Xu if (return_instead == 0) { 972906ac69dSDavid Xu p->p_boundary_count++; 973906ac69dSDavid Xu td->td_flags |= TDF_BOUNDARY; 974cf19bf91SJulian Elischer } 975906ac69dSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 976906ac69dSDavid Xu if (p->p_numthreads == p->p_suspcount) 977906ac69dSDavid Xu thread_unsuspend_one(p->p_singlethread); 978cf19bf91SJulian Elischer } 979a6f37ac9SJohn Baldwin PROC_UNLOCK(p); 980bf0acc27SJohn Baldwin mi_switch(SW_INVOL, NULL); 981906ac69dSDavid Xu if (return_instead == 0) { 982906ac69dSDavid Xu p->p_boundary_count--; 983906ac69dSDavid Xu td->td_flags &= ~TDF_BOUNDARY; 984906ac69dSDavid Xu } 98544990b8cSJulian Elischer mtx_unlock_spin(&sched_lock); 98644990b8cSJulian Elischer PROC_LOCK(p); 98744990b8cSJulian Elischer } 98844990b8cSJulian Elischer return (0); 98944990b8cSJulian Elischer } 99044990b8cSJulian Elischer 99135c32a76SDavid Xu void 99235c32a76SDavid Xu thread_suspend_one(struct thread *td) 99335c32a76SDavid Xu { 99435c32a76SDavid Xu struct proc *p = td->td_proc; 99535c32a76SDavid Xu 99635c32a76SDavid Xu mtx_assert(&sched_lock, MA_OWNED); 997112afcb2SJohn Baldwin PROC_LOCK_ASSERT(p, MA_OWNED); 998e574e444SDavid Xu KASSERT(!TD_IS_SUSPENDED(td), ("already suspended")); 99935c32a76SDavid Xu p->p_suspcount++; 100071fad9fdSJulian Elischer TD_SET_SUSPENDED(td); 100135c32a76SDavid Xu TAILQ_INSERT_TAIL(&p->p_suspended, td, td_runq); 100271fad9fdSJulian Elischer /* 
100371fad9fdSJulian Elischer * Hack: If we are suspending but are on the sleep queue 100471fad9fdSJulian Elischer * then we are in msleep or the cv equivalent. We 100571fad9fdSJulian Elischer * want to look like we have two Inhibitors. 10069d102777SJulian Elischer * May already be set.. doesn't matter. 100771fad9fdSJulian Elischer */ 100871fad9fdSJulian Elischer if (TD_ON_SLEEPQ(td)) 100971fad9fdSJulian Elischer TD_SET_SLEEPING(td); 101035c32a76SDavid Xu } 101135c32a76SDavid Xu 101235c32a76SDavid Xu void 101335c32a76SDavid Xu thread_unsuspend_one(struct thread *td) 101435c32a76SDavid Xu { 101535c32a76SDavid Xu struct proc *p = td->td_proc; 101635c32a76SDavid Xu 101735c32a76SDavid Xu mtx_assert(&sched_lock, MA_OWNED); 1018112afcb2SJohn Baldwin PROC_LOCK_ASSERT(p, MA_OWNED); 101935c32a76SDavid Xu TAILQ_REMOVE(&p->p_suspended, td, td_runq); 102071fad9fdSJulian Elischer TD_CLR_SUSPENDED(td); 102135c32a76SDavid Xu p->p_suspcount--; 102271fad9fdSJulian Elischer setrunnable(td); 102335c32a76SDavid Xu } 102435c32a76SDavid Xu 102544990b8cSJulian Elischer /* 102644990b8cSJulian Elischer * Allow all threads blocked by single threading to continue running. 
102744990b8cSJulian Elischer */ 102844990b8cSJulian Elischer void 102944990b8cSJulian Elischer thread_unsuspend(struct proc *p) 103044990b8cSJulian Elischer { 103144990b8cSJulian Elischer struct thread *td; 103244990b8cSJulian Elischer 1033b6d5995eSJulian Elischer mtx_assert(&sched_lock, MA_OWNED); 103444990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 103544990b8cSJulian Elischer if (!P_SHOULDSTOP(p)) { 103644990b8cSJulian Elischer while ((td = TAILQ_FIRST(&p->p_suspended))) { 103735c32a76SDavid Xu thread_unsuspend_one(td); 103844990b8cSJulian Elischer } 10391279572aSDavid Xu } else if ((P_SHOULDSTOP(p) == P_STOPPED_SINGLE) && 104044990b8cSJulian Elischer (p->p_numthreads == p->p_suspcount)) { 104144990b8cSJulian Elischer /* 104244990b8cSJulian Elischer * Stopping everything also did the job for the single 104344990b8cSJulian Elischer * threading request. Now we've downgraded to single-threaded, 104444990b8cSJulian Elischer * let it continue. 104544990b8cSJulian Elischer */ 104635c32a76SDavid Xu thread_unsuspend_one(p->p_singlethread); 104744990b8cSJulian Elischer } 104844990b8cSJulian Elischer } 104944990b8cSJulian Elischer 1050ed062c8dSJulian Elischer /* 1051ed062c8dSJulian Elischer * End the single threading mode.. 
1052ed062c8dSJulian Elischer */ 105344990b8cSJulian Elischer void 105444990b8cSJulian Elischer thread_single_end(void) 105544990b8cSJulian Elischer { 105644990b8cSJulian Elischer struct thread *td; 105744990b8cSJulian Elischer struct proc *p; 105844990b8cSJulian Elischer 105944990b8cSJulian Elischer td = curthread; 106044990b8cSJulian Elischer p = td->td_proc; 106144990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 1062906ac69dSDavid Xu p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT | P_SINGLE_BOUNDARY); 1063112afcb2SJohn Baldwin mtx_lock_spin(&sched_lock); 106444990b8cSJulian Elischer p->p_singlethread = NULL; 106549539972SJulian Elischer /* 106649539972SJulian Elischer * If there are other threads they mey now run, 106749539972SJulian Elischer * unless of course there is a blanket 'stop order' 106849539972SJulian Elischer * on the process. The single threader must be allowed 106949539972SJulian Elischer * to continue however as this is a bad place to stop. 107049539972SJulian Elischer */ 107149539972SJulian Elischer if ((p->p_numthreads != 1) && (!P_SHOULDSTOP(p))) { 107249539972SJulian Elischer while (( td = TAILQ_FIRST(&p->p_suspended))) { 107371fad9fdSJulian Elischer thread_unsuspend_one(td); 107444990b8cSJulian Elischer } 107549539972SJulian Elischer } 1076112afcb2SJohn Baldwin mtx_unlock_spin(&sched_lock); 107749539972SJulian Elischer } 10784fc21c09SDaniel Eischen 1079007ddf7eSJohn Baldwin /* 1080007ddf7eSJohn Baldwin * Called before going into an interruptible sleep to see if we have been 1081007ddf7eSJohn Baldwin * interrupted or requested to exit. 
1082007ddf7eSJohn Baldwin */ 1083007ddf7eSJohn Baldwin int 1084007ddf7eSJohn Baldwin thread_sleep_check(struct thread *td) 1085007ddf7eSJohn Baldwin { 1086007ddf7eSJohn Baldwin struct proc *p; 1087007ddf7eSJohn Baldwin 1088007ddf7eSJohn Baldwin p = td->td_proc; 1089007ddf7eSJohn Baldwin mtx_assert(&sched_lock, MA_OWNED); 10902179a22cSJulian Elischer if (p->p_flag & P_HADTHREADS) { 1091906ac69dSDavid Xu if (p->p_singlethread != td) { 1092906ac69dSDavid Xu if (p->p_flag & P_SINGLE_EXIT) 1093007ddf7eSJohn Baldwin return (EINTR); 1094906ac69dSDavid Xu if (p->p_flag & P_SINGLE_BOUNDARY) 1095906ac69dSDavid Xu return (ERESTART); 1096906ac69dSDavid Xu } 1097007ddf7eSJohn Baldwin if (td->td_flags & TDF_INTERRUPT) 1098007ddf7eSJohn Baldwin return (td->td_intrval); 1099007ddf7eSJohn Baldwin } 1100007ddf7eSJohn Baldwin return (0); 1101007ddf7eSJohn Baldwin } 1102