19454b2d8SWarner Losh /*- 24d846d26SWarner Losh * SPDX-License-Identifier: BSD-2-Clause 38a36da99SPedro F. Giffuni * 444990b8cSJulian Elischer * Copyright (C) 2001 Julian Elischer <julian@freebsd.org>. 544990b8cSJulian Elischer * All rights reserved. 644990b8cSJulian Elischer * 744990b8cSJulian Elischer * Redistribution and use in source and binary forms, with or without 844990b8cSJulian Elischer * modification, are permitted provided that the following conditions 944990b8cSJulian Elischer * are met: 1044990b8cSJulian Elischer * 1. Redistributions of source code must retain the above copyright 1144990b8cSJulian Elischer * notice(s), this list of conditions and the following disclaimer as 1244990b8cSJulian Elischer * the first lines of this file unmodified other than the possible 1344990b8cSJulian Elischer * addition of one or more copyright notices. 1444990b8cSJulian Elischer * 2. Redistributions in binary form must reproduce the above copyright 1544990b8cSJulian Elischer * notice(s), this list of conditions and the following disclaimer in the 1644990b8cSJulian Elischer * documentation and/or other materials provided with the distribution. 1744990b8cSJulian Elischer * 1844990b8cSJulian Elischer * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) ``AS IS'' AND ANY 1944990b8cSJulian Elischer * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED 2044990b8cSJulian Elischer * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 2144990b8cSJulian Elischer * DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY 2244990b8cSJulian Elischer * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES 2344990b8cSJulian Elischer * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 2444990b8cSJulian Elischer * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 2544990b8cSJulian Elischer * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 2644990b8cSJulian Elischer * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 2744990b8cSJulian Elischer * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH 2844990b8cSJulian Elischer * DAMAGE. 2944990b8cSJulian Elischer */ 3044990b8cSJulian Elischer 313d06b4b3SAttilio Rao #include "opt_witness.h" 3216d95d4fSJoseph Koshy #include "opt_hwpmc_hooks.h" 333d06b4b3SAttilio Rao 3444990b8cSJulian Elischer #include <sys/param.h> 3544990b8cSJulian Elischer #include <sys/systm.h> 3644990b8cSJulian Elischer #include <sys/kernel.h> 3744990b8cSJulian Elischer #include <sys/lock.h> 385dda15adSMark Johnston #include <sys/msan.h> 3944990b8cSJulian Elischer #include <sys/mutex.h> 4044990b8cSJulian Elischer #include <sys/proc.h> 4135bb59edSMateusz Guzik #include <sys/bitstring.h> 426febf180SGleb Smirnoff #include <sys/epoch.h> 438f0e9130SKonstantin Belousov #include <sys/rangelock.h> 44e170bfdaSDavid Xu #include <sys/resourcevar.h> 45b3e9e682SRyan Stone #include <sys/sdt.h> 4694e0a4cdSJulian Elischer #include <sys/smp.h> 47de028f5aSJeff Roberson #include <sys/sched.h> 4844f3b092SJohn Baldwin #include <sys/sleepqueue.h> 49ace8398dSJeff Roberson #include <sys/selinfo.h> 50d1e7a4a5SJohn Baldwin #include <sys/syscallsubr.h> 51598f2b81SMateusz Guzik #include <sys/dtrace_bsd.h> 5291d1786fSDmitry Chagin #include <sys/sysent.h> 53961a7b24SJohn Baldwin #include <sys/turnstile.h> 54d116b9f1SMateusz Guzik #include <sys/taskqueue.h> 5544990b8cSJulian Elischer #include <sys/ktr.h> 
56cf7d9a8cSDavid Xu #include <sys/rwlock.h> 57af29f399SDmitry Chagin #include <sys/umtxvar.h> 589ed01c32SGleb Smirnoff #include <sys/vmmeter.h> 59d7f687fcSJeff Roberson #include <sys/cpuset.h> 6016d95d4fSJoseph Koshy #ifdef HWPMC_HOOKS 6116d95d4fSJoseph Koshy #include <sys/pmckern.h> 6216d95d4fSJoseph Koshy #endif 631bd3cf5dSMateusz Guzik #include <sys/priv.h> 6444990b8cSJulian Elischer 65911b84b0SRobert Watson #include <security/audit/audit.h> 66911b84b0SRobert Watson 67d116b9f1SMateusz Guzik #include <vm/pmap.h> 6844990b8cSJulian Elischer #include <vm/vm.h> 6949a2507bSAlan Cox #include <vm/vm_extern.h> 7044990b8cSJulian Elischer #include <vm/uma.h> 71d116b9f1SMateusz Guzik #include <vm/vm_phys.h> 72b209f889SRandall Stewart #include <sys/eventhandler.h> 7302fb42b0SPeter Wemm 74acd9f517SKonstantin Belousov /* 75acd9f517SKonstantin Belousov * Asserts below verify the stability of struct thread and struct proc 76acd9f517SKonstantin Belousov * layout, as exposed by KBI to modules. On head, the KBI is allowed 77acd9f517SKonstantin Belousov * to drift, change to the structures must be accompanied by the 78acd9f517SKonstantin Belousov * assert update. 79acd9f517SKonstantin Belousov * 80acd9f517SKonstantin Belousov * On the stable branches after KBI freeze, conditions must not be 81acd9f517SKonstantin Belousov * violated. Typically new fields are moved to the end of the 82acd9f517SKonstantin Belousov * structures. 
83acd9f517SKonstantin Belousov */ 84acd9f517SKonstantin Belousov #ifdef __amd64__ 85a422084aSMark Johnston _Static_assert(offsetof(struct thread, td_flags) == 0x108, 86acd9f517SKonstantin Belousov "struct thread KBI td_flags"); 87c6d31b83SKonstantin Belousov _Static_assert(offsetof(struct thread, td_pflags) == 0x114, 88acd9f517SKonstantin Belousov "struct thread KBI td_pflags"); 897530de77SMateusz Guzik _Static_assert(offsetof(struct thread, td_frame) == 0x4b8, 90acd9f517SKonstantin Belousov "struct thread KBI td_frame"); 91c6d31b83SKonstantin Belousov _Static_assert(offsetof(struct thread, td_emuldata) == 0x6c0, 92acd9f517SKonstantin Belousov "struct thread KBI td_emuldata"); 9385078b85SConrad Meyer _Static_assert(offsetof(struct proc, p_flag) == 0xb8, 94acd9f517SKonstantin Belousov "struct proc KBI p_flag"); 9585078b85SConrad Meyer _Static_assert(offsetof(struct proc, p_pid) == 0xc4, 96acd9f517SKonstantin Belousov "struct proc KBI p_pid"); 97351d5f7fSKonstantin Belousov _Static_assert(offsetof(struct proc, p_filemon) == 0x3c8, 98acd9f517SKonstantin Belousov "struct proc KBI p_filemon"); 99aaa92413SKonstantin Belousov _Static_assert(offsetof(struct proc, p_comm) == 0x3e0, 100acd9f517SKonstantin Belousov "struct proc KBI p_comm"); 10193ca6ff2SKonstantin Belousov _Static_assert(offsetof(struct proc, p_emuldata) == 0x4d0, 102acd9f517SKonstantin Belousov "struct proc KBI p_emuldata"); 103acd9f517SKonstantin Belousov #endif 104acd9f517SKonstantin Belousov #ifdef __i386__ 105a422084aSMark Johnston _Static_assert(offsetof(struct thread, td_flags) == 0x9c, 106acd9f517SKonstantin Belousov "struct thread KBI td_flags"); 107c6d31b83SKonstantin Belousov _Static_assert(offsetof(struct thread, td_pflags) == 0xa8, 108acd9f517SKonstantin Belousov "struct thread KBI td_pflags"); 1097530de77SMateusz Guzik _Static_assert(offsetof(struct thread, td_frame) == 0x318, 110acd9f517SKonstantin Belousov "struct thread KBI td_frame"); 1117530de77SMateusz Guzik _Static_assert(offsetof(struct 
thread, td_emuldata) == 0x35c, 112acd9f517SKonstantin Belousov "struct thread KBI td_emuldata"); 11385078b85SConrad Meyer _Static_assert(offsetof(struct proc, p_flag) == 0x6c, 114acd9f517SKonstantin Belousov "struct proc KBI p_flag"); 11585078b85SConrad Meyer _Static_assert(offsetof(struct proc, p_pid) == 0x78, 116acd9f517SKonstantin Belousov "struct proc KBI p_pid"); 1174d675b80SKonstantin Belousov _Static_assert(offsetof(struct proc, p_filemon) == 0x270, 118acd9f517SKonstantin Belousov "struct proc KBI p_filemon"); 119aaa92413SKonstantin Belousov _Static_assert(offsetof(struct proc, p_comm) == 0x284, 120acd9f517SKonstantin Belousov "struct proc KBI p_comm"); 121aaa92413SKonstantin Belousov _Static_assert(offsetof(struct proc, p_emuldata) == 0x318, 122acd9f517SKonstantin Belousov "struct proc KBI p_emuldata"); 123acd9f517SKonstantin Belousov #endif 124acd9f517SKonstantin Belousov 125b3e9e682SRyan Stone SDT_PROVIDER_DECLARE(proc); 126d9fae5abSAndriy Gapon SDT_PROBE_DEFINE(proc, , , lwp__exit); 127b3e9e682SRyan Stone 1288460a577SJohn Birrell /* 1298460a577SJohn Birrell * thread related storage. 
1308460a577SJohn Birrell */ 13144990b8cSJulian Elischer static uma_zone_t thread_zone; 13244990b8cSJulian Elischer 133d116b9f1SMateusz Guzik struct thread_domain_data { 134d116b9f1SMateusz Guzik struct thread *tdd_zombies; 135d116b9f1SMateusz Guzik int tdd_reapticks; 136d116b9f1SMateusz Guzik } __aligned(CACHE_LINE_SIZE); 137d116b9f1SMateusz Guzik 138d116b9f1SMateusz Guzik static struct thread_domain_data thread_domain_data[MAXMEMDOM]; 139d116b9f1SMateusz Guzik 140d116b9f1SMateusz Guzik static struct task thread_reap_task; 141d116b9f1SMateusz Guzik static struct callout thread_reap_callout; 14244990b8cSJulian Elischer 143ff8fbcffSJeff Roberson static void thread_zombie(struct thread *); 144b83e94beSMateusz Guzik static void thread_reap(void); 145d116b9f1SMateusz Guzik static void thread_reap_all(void); 146d116b9f1SMateusz Guzik static void thread_reap_task_cb(void *, int); 147d116b9f1SMateusz Guzik static void thread_reap_callout_cb(void *); 14884cdea97SKonstantin Belousov static int thread_unsuspend_one(struct thread *td, struct proc *p, 14984cdea97SKonstantin Belousov bool boundary); 150755341dfSMateusz Guzik static void thread_free_batched(struct thread *td); 151ff8fbcffSJeff Roberson 152d1ca25beSMateusz Guzik static __exclusive_cache_line struct mtx tid_lock; 153934e7e5eSMateusz Guzik static bitstr_t *tid_bitmap; 15435bb59edSMateusz Guzik 155cf7d9a8cSDavid Xu static MALLOC_DEFINE(M_TIDHASH, "tidhash", "thread hash"); 156cf7d9a8cSDavid Xu 1571bd3cf5dSMateusz Guzik static int maxthread; 1581bd3cf5dSMateusz Guzik SYSCTL_INT(_kern, OID_AUTO, maxthread, CTLFLAG_RDTUN, 1591bd3cf5dSMateusz Guzik &maxthread, 0, "Maximum number of threads"); 1601bd3cf5dSMateusz Guzik 16162dbc992SMateusz Guzik static __exclusive_cache_line int nthreads; 1621bd3cf5dSMateusz Guzik 163aae3547bSMateusz Guzik static LIST_HEAD(tidhashhead, thread) *tidhashtbl; 164aae3547bSMateusz Guzik static u_long tidhash; 16526007fe3SMateusz Guzik static u_long tidhashlock; 16626007fe3SMateusz Guzik static 
struct rwlock *tidhashtbl_lock; 167aae3547bSMateusz Guzik #define TIDHASH(tid) (&tidhashtbl[(tid) & tidhash]) 16826007fe3SMateusz Guzik #define TIDHASHLOCK(tid) (&tidhashtbl_lock[(tid) & tidhashlock]) 169cf7d9a8cSDavid Xu 1702ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_ctor); 1712ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_dtor); 1722ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_init); 1732ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_fini); 1742ca45184SMatt Joras 17562dbc992SMateusz Guzik static bool 176d116b9f1SMateusz Guzik thread_count_inc_try(void) 177ec6ea5e8SDavid Xu { 17862dbc992SMateusz Guzik int nthreads_new; 179ec6ea5e8SDavid Xu 18062dbc992SMateusz Guzik nthreads_new = atomic_fetchadd_int(&nthreads, 1) + 1; 18162dbc992SMateusz Guzik if (nthreads_new >= maxthread - 100) { 1821bd3cf5dSMateusz Guzik if (priv_check_cred(curthread->td_ucred, PRIV_MAXPROC) != 0 || 18362dbc992SMateusz Guzik nthreads_new >= maxthread) { 18462dbc992SMateusz Guzik atomic_subtract_int(&nthreads, 1); 185d116b9f1SMateusz Guzik return (false); 186d116b9f1SMateusz Guzik } 187d116b9f1SMateusz Guzik } 188d116b9f1SMateusz Guzik return (true); 189d116b9f1SMateusz Guzik } 190d116b9f1SMateusz Guzik 191d116b9f1SMateusz Guzik static bool 192d116b9f1SMateusz Guzik thread_count_inc(void) 193d116b9f1SMateusz Guzik { 194d116b9f1SMateusz Guzik static struct timeval lastfail; 195d116b9f1SMateusz Guzik static int curfail; 196d116b9f1SMateusz Guzik 197d116b9f1SMateusz Guzik thread_reap(); 198d116b9f1SMateusz Guzik if (thread_count_inc_try()) { 199d116b9f1SMateusz Guzik return (true); 200d116b9f1SMateusz Guzik } 201d116b9f1SMateusz Guzik 202d116b9f1SMateusz Guzik thread_reap_all(); 203d116b9f1SMateusz Guzik if (thread_count_inc_try()) { 204d116b9f1SMateusz Guzik return (true); 205d116b9f1SMateusz Guzik } 206d116b9f1SMateusz Guzik 2071bd3cf5dSMateusz Guzik if (ppsratecheck(&lastfail, &curfail, 1)) { 2081bd3cf5dSMateusz Guzik printf("maxthread limit exceeded by uid %u " 
2091bd3cf5dSMateusz Guzik "(pid %d); consider increasing kern.maxthread\n", 2101bd3cf5dSMateusz Guzik curthread->td_ucred->cr_ruid, curproc->p_pid); 2111bd3cf5dSMateusz Guzik } 21262dbc992SMateusz Guzik return (false); 2131bd3cf5dSMateusz Guzik } 2141bd3cf5dSMateusz Guzik 21562dbc992SMateusz Guzik static void 21662dbc992SMateusz Guzik thread_count_sub(int n) 21762dbc992SMateusz Guzik { 21862dbc992SMateusz Guzik 21962dbc992SMateusz Guzik atomic_subtract_int(&nthreads, n); 22062dbc992SMateusz Guzik } 22162dbc992SMateusz Guzik 22262dbc992SMateusz Guzik static void 22362dbc992SMateusz Guzik thread_count_dec(void) 22462dbc992SMateusz Guzik { 22562dbc992SMateusz Guzik 22662dbc992SMateusz Guzik thread_count_sub(1); 22762dbc992SMateusz Guzik } 22862dbc992SMateusz Guzik 22962dbc992SMateusz Guzik static lwpid_t 23062dbc992SMateusz Guzik tid_alloc(void) 23162dbc992SMateusz Guzik { 23262dbc992SMateusz Guzik static lwpid_t trytid; 23362dbc992SMateusz Guzik lwpid_t tid; 23462dbc992SMateusz Guzik 23562dbc992SMateusz Guzik mtx_lock(&tid_lock); 23635bb59edSMateusz Guzik /* 23735bb59edSMateusz Guzik * It is an invariant that the bitmap is big enough to hold maxthread 23835bb59edSMateusz Guzik * IDs. If we got to this point there has to be at least one free. 
23935bb59edSMateusz Guzik */ 24035bb59edSMateusz Guzik if (trytid >= maxthread) 24135bb59edSMateusz Guzik trytid = 0; 24235bb59edSMateusz Guzik bit_ffc_at(tid_bitmap, trytid, maxthread, &tid); 24335bb59edSMateusz Guzik if (tid == -1) { 24435bb59edSMateusz Guzik KASSERT(trytid != 0, ("unexpectedly ran out of IDs")); 24535bb59edSMateusz Guzik trytid = 0; 24635bb59edSMateusz Guzik bit_ffc_at(tid_bitmap, trytid, maxthread, &tid); 24735bb59edSMateusz Guzik KASSERT(tid != -1, ("unexpectedly ran out of IDs")); 248ec6ea5e8SDavid Xu } 24935bb59edSMateusz Guzik bit_set(tid_bitmap, tid); 250934e7e5eSMateusz Guzik trytid = tid + 1; 251ec6ea5e8SDavid Xu mtx_unlock(&tid_lock); 25235bb59edSMateusz Guzik return (tid + NO_PID); 253ec6ea5e8SDavid Xu } 254ec6ea5e8SDavid Xu 255ec6ea5e8SDavid Xu static void 256755341dfSMateusz Guzik tid_free_locked(lwpid_t rtid) 257ec6ea5e8SDavid Xu { 25835bb59edSMateusz Guzik lwpid_t tid; 259ec6ea5e8SDavid Xu 260755341dfSMateusz Guzik mtx_assert(&tid_lock, MA_OWNED); 26135bb59edSMateusz Guzik KASSERT(rtid >= NO_PID, 26235bb59edSMateusz Guzik ("%s: invalid tid %d\n", __func__, rtid)); 26335bb59edSMateusz Guzik tid = rtid - NO_PID; 26435bb59edSMateusz Guzik KASSERT(bit_test(tid_bitmap, tid) != 0, 26535bb59edSMateusz Guzik ("thread ID %d not allocated\n", rtid)); 26635bb59edSMateusz Guzik bit_clear(tid_bitmap, tid); 267755341dfSMateusz Guzik } 268755341dfSMateusz Guzik 269755341dfSMateusz Guzik static void 270755341dfSMateusz Guzik tid_free(lwpid_t rtid) 271755341dfSMateusz Guzik { 272755341dfSMateusz Guzik 273755341dfSMateusz Guzik mtx_lock(&tid_lock); 274755341dfSMateusz Guzik tid_free_locked(rtid); 275755341dfSMateusz Guzik mtx_unlock(&tid_lock); 276755341dfSMateusz Guzik } 277755341dfSMateusz Guzik 278755341dfSMateusz Guzik static void 279755341dfSMateusz Guzik tid_free_batch(lwpid_t *batch, int n) 280755341dfSMateusz Guzik { 281755341dfSMateusz Guzik int i; 282755341dfSMateusz Guzik 283755341dfSMateusz Guzik mtx_lock(&tid_lock); 284755341dfSMateusz 
Guzik for (i = 0; i < n; i++) { 285755341dfSMateusz Guzik tid_free_locked(batch[i]); 286755341dfSMateusz Guzik } 287ec6ea5e8SDavid Xu mtx_unlock(&tid_lock); 288ec6ea5e8SDavid Xu } 289ec6ea5e8SDavid Xu 290fdcac928SMarcel Moolenaar /* 2915ef7b7a0SMateusz Guzik * Batching for thread reapping. 2925ef7b7a0SMateusz Guzik */ 2935ef7b7a0SMateusz Guzik struct tidbatch { 2945ef7b7a0SMateusz Guzik lwpid_t tab[16]; 2955ef7b7a0SMateusz Guzik int n; 2965ef7b7a0SMateusz Guzik }; 2975ef7b7a0SMateusz Guzik 2985ef7b7a0SMateusz Guzik static void 2995ef7b7a0SMateusz Guzik tidbatch_prep(struct tidbatch *tb) 3005ef7b7a0SMateusz Guzik { 3015ef7b7a0SMateusz Guzik 3025ef7b7a0SMateusz Guzik tb->n = 0; 3035ef7b7a0SMateusz Guzik } 3045ef7b7a0SMateusz Guzik 3055ef7b7a0SMateusz Guzik static void 3065ef7b7a0SMateusz Guzik tidbatch_add(struct tidbatch *tb, struct thread *td) 3075ef7b7a0SMateusz Guzik { 3085ef7b7a0SMateusz Guzik 3095ef7b7a0SMateusz Guzik KASSERT(tb->n < nitems(tb->tab), 3105ef7b7a0SMateusz Guzik ("%s: count too high %d", __func__, tb->n)); 3115ef7b7a0SMateusz Guzik tb->tab[tb->n] = td->td_tid; 3125ef7b7a0SMateusz Guzik tb->n++; 3135ef7b7a0SMateusz Guzik } 3145ef7b7a0SMateusz Guzik 3155ef7b7a0SMateusz Guzik static void 3165ef7b7a0SMateusz Guzik tidbatch_process(struct tidbatch *tb) 3175ef7b7a0SMateusz Guzik { 3185ef7b7a0SMateusz Guzik 3195ef7b7a0SMateusz Guzik KASSERT(tb->n <= nitems(tb->tab), 3205ef7b7a0SMateusz Guzik ("%s: count too high %d", __func__, tb->n)); 3215ef7b7a0SMateusz Guzik if (tb->n == nitems(tb->tab)) { 3225ef7b7a0SMateusz Guzik tid_free_batch(tb->tab, tb->n); 3235ef7b7a0SMateusz Guzik tb->n = 0; 3245ef7b7a0SMateusz Guzik } 3255ef7b7a0SMateusz Guzik } 3265ef7b7a0SMateusz Guzik 3275ef7b7a0SMateusz Guzik static void 3285ef7b7a0SMateusz Guzik tidbatch_final(struct tidbatch *tb) 3295ef7b7a0SMateusz Guzik { 3305ef7b7a0SMateusz Guzik 3315ef7b7a0SMateusz Guzik KASSERT(tb->n <= nitems(tb->tab), 3325ef7b7a0SMateusz Guzik ("%s: count too high %d", __func__, tb->n)); 
3335ef7b7a0SMateusz Guzik if (tb->n != 0) { 3345ef7b7a0SMateusz Guzik tid_free_batch(tb->tab, tb->n); 3355ef7b7a0SMateusz Guzik } 3365ef7b7a0SMateusz Guzik } 3375ef7b7a0SMateusz Guzik 3385ef7b7a0SMateusz Guzik /* 339e0c86f5cSMateusz Guzik * Batching thread count free, for consistency 340e0c86f5cSMateusz Guzik */ 341e0c86f5cSMateusz Guzik struct tdcountbatch { 342e0c86f5cSMateusz Guzik int n; 343e0c86f5cSMateusz Guzik }; 344e0c86f5cSMateusz Guzik 345e0c86f5cSMateusz Guzik static void 346e0c86f5cSMateusz Guzik tdcountbatch_prep(struct tdcountbatch *tb) 347e0c86f5cSMateusz Guzik { 348e0c86f5cSMateusz Guzik 349e0c86f5cSMateusz Guzik tb->n = 0; 350e0c86f5cSMateusz Guzik } 351e0c86f5cSMateusz Guzik 352e0c86f5cSMateusz Guzik static void 353e0c86f5cSMateusz Guzik tdcountbatch_add(struct tdcountbatch *tb, struct thread *td __unused) 354e0c86f5cSMateusz Guzik { 355e0c86f5cSMateusz Guzik 356e0c86f5cSMateusz Guzik tb->n++; 357e0c86f5cSMateusz Guzik } 358e0c86f5cSMateusz Guzik 359e0c86f5cSMateusz Guzik static void 360e0c86f5cSMateusz Guzik tdcountbatch_process(struct tdcountbatch *tb) 361e0c86f5cSMateusz Guzik { 362e0c86f5cSMateusz Guzik 363e0c86f5cSMateusz Guzik if (tb->n == 32) { 364e0c86f5cSMateusz Guzik thread_count_sub(tb->n); 365e0c86f5cSMateusz Guzik tb->n = 0; 366e0c86f5cSMateusz Guzik } 367e0c86f5cSMateusz Guzik } 368e0c86f5cSMateusz Guzik 369e0c86f5cSMateusz Guzik static void 370e0c86f5cSMateusz Guzik tdcountbatch_final(struct tdcountbatch *tb) 371e0c86f5cSMateusz Guzik { 372e0c86f5cSMateusz Guzik 373e0c86f5cSMateusz Guzik if (tb->n != 0) { 374e0c86f5cSMateusz Guzik thread_count_sub(tb->n); 375e0c86f5cSMateusz Guzik } 376e0c86f5cSMateusz Guzik } 377e0c86f5cSMateusz Guzik 378e0c86f5cSMateusz Guzik /* 379696058c3SJulian Elischer * Prepare a thread for use. 
38044990b8cSJulian Elischer */ 381b23f72e9SBrian Feldman static int 382b23f72e9SBrian Feldman thread_ctor(void *mem, int size, void *arg, int flags) 38344990b8cSJulian Elischer { 38444990b8cSJulian Elischer struct thread *td; 38544990b8cSJulian Elischer 38644990b8cSJulian Elischer td = (struct thread *)mem; 387fa2528acSAlex Richardson TD_SET_STATE(td, TDS_INACTIVE); 38894dd54b9SKonstantin Belousov td->td_lastcpu = td->td_oncpu = NOCPU; 3896c27c603SJuli Mallett 3906c27c603SJuli Mallett /* 3916c27c603SJuli Mallett * Note that td_critnest begins life as 1 because the thread is not 3926c27c603SJuli Mallett * running and is thereby implicitly waiting to be on the receiving 393a54e85fdSJeff Roberson * end of a context switch. 3946c27c603SJuli Mallett */ 395139b7550SJohn Baldwin td->td_critnest = 1; 396acbe332aSDavid Xu td->td_lend_user_pri = PRI_MAX; 397911b84b0SRobert Watson #ifdef AUDIT 398911b84b0SRobert Watson audit_thread_alloc(td); 399911b84b0SRobert Watson #endif 400598f2b81SMateusz Guzik #ifdef KDTRACE_HOOKS 401598f2b81SMateusz Guzik kdtrace_thread_ctor(td); 402598f2b81SMateusz Guzik #endif 403d10183d9SDavid Xu umtx_thread_alloc(td); 40419d3e47dSMateusz Guzik MPASS(td->td_sel == NULL); 405b23f72e9SBrian Feldman return (0); 40644990b8cSJulian Elischer } 40744990b8cSJulian Elischer 40844990b8cSJulian Elischer /* 40944990b8cSJulian Elischer * Reclaim a thread after use. 41044990b8cSJulian Elischer */ 41144990b8cSJulian Elischer static void 41244990b8cSJulian Elischer thread_dtor(void *mem, int size, void *arg) 41344990b8cSJulian Elischer { 41444990b8cSJulian Elischer struct thread *td; 41544990b8cSJulian Elischer 41644990b8cSJulian Elischer td = (struct thread *)mem; 41744990b8cSJulian Elischer 41844990b8cSJulian Elischer #ifdef INVARIANTS 41944990b8cSJulian Elischer /* Verify that this thread is in a safe state to free. 
*/ 420fa2528acSAlex Richardson switch (TD_GET_STATE(td)) { 42171fad9fdSJulian Elischer case TDS_INHIBITED: 42271fad9fdSJulian Elischer case TDS_RUNNING: 42371fad9fdSJulian Elischer case TDS_CAN_RUN: 42444990b8cSJulian Elischer case TDS_RUNQ: 42544990b8cSJulian Elischer /* 42644990b8cSJulian Elischer * We must never unlink a thread that is in one of 42744990b8cSJulian Elischer * these states, because it is currently active. 42844990b8cSJulian Elischer */ 42944990b8cSJulian Elischer panic("bad state for thread unlinking"); 43044990b8cSJulian Elischer /* NOTREACHED */ 43171fad9fdSJulian Elischer case TDS_INACTIVE: 43244990b8cSJulian Elischer break; 43344990b8cSJulian Elischer default: 43444990b8cSJulian Elischer panic("bad thread state"); 43544990b8cSJulian Elischer /* NOTREACHED */ 43644990b8cSJulian Elischer } 43744990b8cSJulian Elischer #endif 4386e8525ceSRobert Watson #ifdef AUDIT 4396e8525ceSRobert Watson audit_thread_free(td); 4406e8525ceSRobert Watson #endif 441598f2b81SMateusz Guzik #ifdef KDTRACE_HOOKS 442598f2b81SMateusz Guzik kdtrace_thread_dtor(td); 443598f2b81SMateusz Guzik #endif 4441ba4a712SPawel Jakub Dawidek /* Free all OSD associated to this thread. */ 4451ba4a712SPawel Jakub Dawidek osd_thread_exit(td); 446c6d31b83SKonstantin Belousov ast_kclear(td); 44719d3e47dSMateusz Guzik seltdfini(td); 44844990b8cSJulian Elischer } 44944990b8cSJulian Elischer 45044990b8cSJulian Elischer /* 45144990b8cSJulian Elischer * Initialize type-stable parts of a thread (when newly created). 
45244990b8cSJulian Elischer */ 453b23f72e9SBrian Feldman static int 454b23f72e9SBrian Feldman thread_init(void *mem, int size, int flags) 45544990b8cSJulian Elischer { 45644990b8cSJulian Elischer struct thread *td; 45744990b8cSJulian Elischer 45844990b8cSJulian Elischer td = (struct thread *)mem; 459247aba24SMarcel Moolenaar 460b83e94beSMateusz Guzik td->td_allocdomain = vm_phys_domain(vtophys(td)); 46144f3b092SJohn Baldwin td->td_sleepqueue = sleepq_alloc(); 462961a7b24SJohn Baldwin td->td_turnstile = turnstile_alloc(); 4638f0e9130SKonstantin Belousov td->td_rlqe = NULL; 4642ca45184SMatt Joras EVENTHANDLER_DIRECT_INVOKE(thread_init, td); 465d10183d9SDavid Xu umtx_thread_init(td); 46689b57fcfSKonstantin Belousov td->td_kstack = 0; 467ad8b1d85SKonstantin Belousov td->td_sel = NULL; 468b23f72e9SBrian Feldman return (0); 46944990b8cSJulian Elischer } 47044990b8cSJulian Elischer 47144990b8cSJulian Elischer /* 47244990b8cSJulian Elischer * Tear down type-stable parts of a thread (just before being discarded). 47344990b8cSJulian Elischer */ 47444990b8cSJulian Elischer static void 47544990b8cSJulian Elischer thread_fini(void *mem, int size) 47644990b8cSJulian Elischer { 47744990b8cSJulian Elischer struct thread *td; 47844990b8cSJulian Elischer 47944990b8cSJulian Elischer td = (struct thread *)mem; 4802ca45184SMatt Joras EVENTHANDLER_DIRECT_INVOKE(thread_fini, td); 4818f0e9130SKonstantin Belousov rlqentry_free(td->td_rlqe); 482961a7b24SJohn Baldwin turnstile_free(td->td_turnstile); 48344f3b092SJohn Baldwin sleepq_free(td->td_sleepqueue); 484d10183d9SDavid Xu umtx_thread_fini(td); 48519d3e47dSMateusz Guzik MPASS(td->td_sel == NULL); 48644990b8cSJulian Elischer } 4875215b187SJeff Roberson 4885c8329edSJulian Elischer /* 4895215b187SJeff Roberson * For a newly created process, 4905215b187SJeff Roberson * link up all the structures and its initial threads etc. 
491ed062c8dSJulian Elischer * called from: 492e7d939bdSMarcel Moolenaar * {arch}/{arch}/machdep.c {arch}_init(), init386() etc. 493ed062c8dSJulian Elischer * proc_dtor() (should go away) 494ed062c8dSJulian Elischer * proc_init() 4955c8329edSJulian Elischer */ 4965c8329edSJulian Elischer void 49789b57fcfSKonstantin Belousov proc_linkup0(struct proc *p, struct thread *td) 49889b57fcfSKonstantin Belousov { 49989b57fcfSKonstantin Belousov TAILQ_INIT(&p->p_threads); /* all threads in proc */ 50089b57fcfSKonstantin Belousov proc_linkup(p, td); 50189b57fcfSKonstantin Belousov } 50289b57fcfSKonstantin Belousov 50389b57fcfSKonstantin Belousov void 5048460a577SJohn Birrell proc_linkup(struct proc *p, struct thread *td) 5055c8329edSJulian Elischer { 506a54e85fdSJeff Roberson 5079104847fSDavid Xu sigqueue_init(&p->p_sigqueue, p); 508cc29f221SKonstantin Belousov p->p_ksi = ksiginfo_alloc(M_WAITOK); 509ebceaf6dSDavid Xu if (p->p_ksi != NULL) { 5105c474517SDavid Xu /* XXX p_ksi may be null if ksiginfo zone is not ready */ 511ebceaf6dSDavid Xu p->p_ksi->ksi_flags = KSI_EXT | KSI_INS; 512ebceaf6dSDavid Xu } 513b2f92ef9SDavid Xu LIST_INIT(&p->p_mqnotifier); 5145c8329edSJulian Elischer p->p_numthreads = 0; 5158460a577SJohn Birrell thread_link(td, p); 5165c8329edSJulian Elischer } 5175c8329edSJulian Elischer 518c6d31b83SKonstantin Belousov static void 519c6d31b83SKonstantin Belousov ast_suspend(struct thread *td, int tda __unused) 520c6d31b83SKonstantin Belousov { 521c6d31b83SKonstantin Belousov struct proc *p; 522c6d31b83SKonstantin Belousov 523c6d31b83SKonstantin Belousov p = td->td_proc; 524c6d31b83SKonstantin Belousov /* 525c6d31b83SKonstantin Belousov * We need to check to see if we have to exit or wait due to a 526c6d31b83SKonstantin Belousov * single threading requirement or some other STOP condition. 
527c6d31b83SKonstantin Belousov */ 528c6d31b83SKonstantin Belousov PROC_LOCK(p); 529c6d31b83SKonstantin Belousov thread_suspend_check(0); 530c6d31b83SKonstantin Belousov PROC_UNLOCK(p); 531c6d31b83SKonstantin Belousov } 532c6d31b83SKonstantin Belousov 5331bd3cf5dSMateusz Guzik extern int max_threads_per_proc; 5341bd3cf5dSMateusz Guzik 5355c8329edSJulian Elischer /* 53644990b8cSJulian Elischer * Initialize global thread allocation resources. 53744990b8cSJulian Elischer */ 53844990b8cSJulian Elischer void 53944990b8cSJulian Elischer threadinit(void) 54044990b8cSJulian Elischer { 54126007fe3SMateusz Guzik u_long i; 542cf31cadeSMateusz Guzik lwpid_t tid0; 54344990b8cSJulian Elischer 5441bd3cf5dSMateusz Guzik /* 5451bd3cf5dSMateusz Guzik * Place an upper limit on threads which can be allocated. 5461bd3cf5dSMateusz Guzik * 5471bd3cf5dSMateusz Guzik * Note that other factors may make the de facto limit much lower. 5481bd3cf5dSMateusz Guzik * 5491bd3cf5dSMateusz Guzik * Platform limits are somewhat arbitrary but deemed "more than good 5501bd3cf5dSMateusz Guzik * enough" for the foreseable future. 5511bd3cf5dSMateusz Guzik */ 5521bd3cf5dSMateusz Guzik if (maxthread == 0) { 5531bd3cf5dSMateusz Guzik #ifdef _LP64 5541bd3cf5dSMateusz Guzik maxthread = MIN(maxproc * max_threads_per_proc, 1000000); 5551bd3cf5dSMateusz Guzik #else 5561bd3cf5dSMateusz Guzik maxthread = MIN(maxproc * max_threads_per_proc, 100000); 5571bd3cf5dSMateusz Guzik #endif 5581bd3cf5dSMateusz Guzik } 5591bd3cf5dSMateusz Guzik 5601ea7a6f8SPoul-Henning Kamp mtx_init(&tid_lock, "TID lock", NULL, MTX_DEF); 56135bb59edSMateusz Guzik tid_bitmap = bit_alloc(maxthread, M_TIDHASH, M_WAITOK); 56262dbc992SMateusz Guzik /* 56362dbc992SMateusz Guzik * Handle thread0. 
56462dbc992SMateusz Guzik */ 56562dbc992SMateusz Guzik thread_count_inc(); 566cf31cadeSMateusz Guzik tid0 = tid_alloc(); 567cf31cadeSMateusz Guzik if (tid0 != THREAD0_TID) 568cf31cadeSMateusz Guzik panic("tid0 %d != %d\n", tid0, THREAD0_TID); 5691ea7a6f8SPoul-Henning Kamp 5707d1469e5SOlivier Certner /* 5717d1469e5SOlivier Certner * Thread structures are specially aligned so that (at least) the 5727d1469e5SOlivier Certner * 5 lower bits of a pointer to 'struct thead' must be 0. These bits 5737d1469e5SOlivier Certner * are used by synchronization primitives to store flags in pointers to 5747d1469e5SOlivier Certner * such structures. 5757d1469e5SOlivier Certner */ 576de028f5aSJeff Roberson thread_zone = uma_zcreate("THREAD", sched_sizeof_thread(), 57744990b8cSJulian Elischer thread_ctor, thread_dtor, thread_init, thread_fini, 5787d1469e5SOlivier Certner UMA_ALIGN_CACHE_AND_MASK(32 - 1), UMA_ZONE_NOFREE); 579cf7d9a8cSDavid Xu tidhashtbl = hashinit(maxproc / 2, M_TIDHASH, &tidhash); 58026007fe3SMateusz Guzik tidhashlock = (tidhash + 1) / 64; 58126007fe3SMateusz Guzik if (tidhashlock > 0) 58226007fe3SMateusz Guzik tidhashlock--; 58326007fe3SMateusz Guzik tidhashtbl_lock = malloc(sizeof(*tidhashtbl_lock) * (tidhashlock + 1), 58426007fe3SMateusz Guzik M_TIDHASH, M_WAITOK | M_ZERO); 58526007fe3SMateusz Guzik for (i = 0; i < tidhashlock + 1; i++) 58626007fe3SMateusz Guzik rw_init(&tidhashtbl_lock[i], "tidhash"); 587d116b9f1SMateusz Guzik 588d116b9f1SMateusz Guzik TASK_INIT(&thread_reap_task, 0, thread_reap_task_cb, NULL); 589d116b9f1SMateusz Guzik callout_init(&thread_reap_callout, 1); 590845d7797SKonstantin Belousov callout_reset(&thread_reap_callout, 5 * hz, 591845d7797SKonstantin Belousov thread_reap_callout_cb, NULL); 592c6d31b83SKonstantin Belousov ast_register(TDA_SUSPEND, ASTR_ASTF_REQUIRED, 0, ast_suspend); 59344990b8cSJulian Elischer } 59444990b8cSJulian Elischer 59544990b8cSJulian Elischer /* 596ff8fbcffSJeff Roberson * Place an unused thread on the zombie list. 
59744990b8cSJulian Elischer */ 59844990b8cSJulian Elischer void 599ff8fbcffSJeff Roberson thread_zombie(struct thread *td) 60044990b8cSJulian Elischer { 601d116b9f1SMateusz Guzik struct thread_domain_data *tdd; 602c5315f51SMateusz Guzik struct thread *ztd; 603c5315f51SMateusz Guzik 604a9568cd2SMateusz Guzik tdd = &thread_domain_data[td->td_allocdomain]; 605d116b9f1SMateusz Guzik ztd = atomic_load_ptr(&tdd->tdd_zombies); 606c5315f51SMateusz Guzik for (;;) { 607c5315f51SMateusz Guzik td->td_zombie = ztd; 608d116b9f1SMateusz Guzik if (atomic_fcmpset_rel_ptr((uintptr_t *)&tdd->tdd_zombies, 609c5315f51SMateusz Guzik (uintptr_t *)&ztd, (uintptr_t)td)) 610c5315f51SMateusz Guzik break; 611c5315f51SMateusz Guzik continue; 612c5315f51SMateusz Guzik } 61344990b8cSJulian Elischer } 61444990b8cSJulian Elischer 6155c8329edSJulian Elischer /* 616ff8fbcffSJeff Roberson * Release a thread that has exited after cpu_throw(). 617ff8fbcffSJeff Roberson */ 618ff8fbcffSJeff Roberson void 619ff8fbcffSJeff Roberson thread_stash(struct thread *td) 620ff8fbcffSJeff Roberson { 621ff8fbcffSJeff Roberson atomic_subtract_rel_int(&td->td_proc->p_exitthreads, 1); 622ff8fbcffSJeff Roberson thread_zombie(td); 623ff8fbcffSJeff Roberson } 624ff8fbcffSJeff Roberson 625ff8fbcffSJeff Roberson /* 626d116b9f1SMateusz Guzik * Reap zombies from passed domain. 
62744990b8cSJulian Elischer */ 628d116b9f1SMateusz Guzik static void 629d116b9f1SMateusz Guzik thread_reap_domain(struct thread_domain_data *tdd) 63044990b8cSJulian Elischer { 631c5315f51SMateusz Guzik struct thread *itd, *ntd; 6325ef7b7a0SMateusz Guzik struct tidbatch tidbatch; 633f34a2f56SMateusz Guzik struct credbatch credbatch; 634bbe62559SMateusz Guzik struct limbatch limbatch; 635e0c86f5cSMateusz Guzik struct tdcountbatch tdcountbatch; 63644990b8cSJulian Elischer 63744990b8cSJulian Elischer /* 638c5315f51SMateusz Guzik * Reading upfront is pessimal if followed by concurrent atomic_swap, 639c5315f51SMateusz Guzik * but most of the time the list is empty. 64044990b8cSJulian Elischer */ 641d116b9f1SMateusz Guzik if (tdd->tdd_zombies == NULL) 642c5315f51SMateusz Guzik return; 643c5315f51SMateusz Guzik 644d116b9f1SMateusz Guzik itd = (struct thread *)atomic_swap_ptr((uintptr_t *)&tdd->tdd_zombies, 645c5315f51SMateusz Guzik (uintptr_t)NULL); 6465ef7b7a0SMateusz Guzik if (itd == NULL) 6475ef7b7a0SMateusz Guzik return; 6485ef7b7a0SMateusz Guzik 649d116b9f1SMateusz Guzik /* 650d116b9f1SMateusz Guzik * Multiple CPUs can get here, the race is fine as ticks is only 651d116b9f1SMateusz Guzik * advisory. 
652d116b9f1SMateusz Guzik */ 653d116b9f1SMateusz Guzik tdd->tdd_reapticks = ticks; 654d116b9f1SMateusz Guzik 6555ef7b7a0SMateusz Guzik tidbatch_prep(&tidbatch); 656f34a2f56SMateusz Guzik credbatch_prep(&credbatch); 657bbe62559SMateusz Guzik limbatch_prep(&limbatch); 658e0c86f5cSMateusz Guzik tdcountbatch_prep(&tdcountbatch); 659d116b9f1SMateusz Guzik 660c5315f51SMateusz Guzik while (itd != NULL) { 661c5315f51SMateusz Guzik ntd = itd->td_zombie; 6625ef7b7a0SMateusz Guzik EVENTHANDLER_DIRECT_INVOKE(thread_dtor, itd); 663bbe62559SMateusz Guzik 6645ef7b7a0SMateusz Guzik tidbatch_add(&tidbatch, itd); 665f34a2f56SMateusz Guzik credbatch_add(&credbatch, itd); 666bbe62559SMateusz Guzik limbatch_add(&limbatch, itd); 667e0c86f5cSMateusz Guzik tdcountbatch_add(&tdcountbatch, itd); 668bbe62559SMateusz Guzik 669755341dfSMateusz Guzik thread_free_batched(itd); 670bbe62559SMateusz Guzik 6715ef7b7a0SMateusz Guzik tidbatch_process(&tidbatch); 672f34a2f56SMateusz Guzik credbatch_process(&credbatch); 673bbe62559SMateusz Guzik limbatch_process(&limbatch); 674e0c86f5cSMateusz Guzik tdcountbatch_process(&tdcountbatch); 675bbe62559SMateusz Guzik 676c5315f51SMateusz Guzik itd = ntd; 67744990b8cSJulian Elischer } 678755341dfSMateusz Guzik 6795ef7b7a0SMateusz Guzik tidbatch_final(&tidbatch); 680f34a2f56SMateusz Guzik credbatch_final(&credbatch); 681bbe62559SMateusz Guzik limbatch_final(&limbatch); 682e0c86f5cSMateusz Guzik tdcountbatch_final(&tdcountbatch); 683ed062c8dSJulian Elischer } 68444990b8cSJulian Elischer 6854f0db5e0SJulian Elischer /* 686d116b9f1SMateusz Guzik * Reap zombies from all domains. 
687d116b9f1SMateusz Guzik */ 688d116b9f1SMateusz Guzik static void 689d116b9f1SMateusz Guzik thread_reap_all(void) 690d116b9f1SMateusz Guzik { 691d116b9f1SMateusz Guzik struct thread_domain_data *tdd; 692d116b9f1SMateusz Guzik int i, domain; 693d116b9f1SMateusz Guzik 694d116b9f1SMateusz Guzik domain = PCPU_GET(domain); 695d116b9f1SMateusz Guzik for (i = 0; i < vm_ndomains; i++) { 696d116b9f1SMateusz Guzik tdd = &thread_domain_data[(i + domain) % vm_ndomains]; 697d116b9f1SMateusz Guzik thread_reap_domain(tdd); 698d116b9f1SMateusz Guzik } 699d116b9f1SMateusz Guzik } 700d116b9f1SMateusz Guzik 701d116b9f1SMateusz Guzik /* 702d116b9f1SMateusz Guzik * Reap zombies from local domain. 703d116b9f1SMateusz Guzik */ 704b83e94beSMateusz Guzik static void 705d116b9f1SMateusz Guzik thread_reap(void) 706d116b9f1SMateusz Guzik { 707d116b9f1SMateusz Guzik struct thread_domain_data *tdd; 708d116b9f1SMateusz Guzik int domain; 709d116b9f1SMateusz Guzik 710d116b9f1SMateusz Guzik domain = PCPU_GET(domain); 711d116b9f1SMateusz Guzik tdd = &thread_domain_data[domain]; 712d116b9f1SMateusz Guzik 713d116b9f1SMateusz Guzik thread_reap_domain(tdd); 714d116b9f1SMateusz Guzik } 715d116b9f1SMateusz Guzik 716d116b9f1SMateusz Guzik static void 717d116b9f1SMateusz Guzik thread_reap_task_cb(void *arg __unused, int pending __unused) 718d116b9f1SMateusz Guzik { 719d116b9f1SMateusz Guzik 720d116b9f1SMateusz Guzik thread_reap_all(); 721d116b9f1SMateusz Guzik } 722d116b9f1SMateusz Guzik 723d116b9f1SMateusz Guzik static void 724d116b9f1SMateusz Guzik thread_reap_callout_cb(void *arg __unused) 725d116b9f1SMateusz Guzik { 726d116b9f1SMateusz Guzik struct thread_domain_data *tdd; 727d116b9f1SMateusz Guzik int i, cticks, lticks; 728d116b9f1SMateusz Guzik bool wantreap; 729d116b9f1SMateusz Guzik 730d116b9f1SMateusz Guzik wantreap = false; 731d116b9f1SMateusz Guzik cticks = atomic_load_int(&ticks); 732d116b9f1SMateusz Guzik for (i = 0; i < vm_ndomains; i++) { 733d116b9f1SMateusz Guzik tdd = 
&thread_domain_data[i]; 734d116b9f1SMateusz Guzik lticks = tdd->tdd_reapticks; 735d116b9f1SMateusz Guzik if (tdd->tdd_zombies != NULL && 736d116b9f1SMateusz Guzik (u_int)(cticks - lticks) > 5 * hz) { 737d116b9f1SMateusz Guzik wantreap = true; 738d116b9f1SMateusz Guzik break; 739d116b9f1SMateusz Guzik } 740d116b9f1SMateusz Guzik } 741d116b9f1SMateusz Guzik 742d116b9f1SMateusz Guzik if (wantreap) 743d116b9f1SMateusz Guzik taskqueue_enqueue(taskqueue_thread, &thread_reap_task); 744845d7797SKonstantin Belousov callout_reset(&thread_reap_callout, 5 * hz, 745845d7797SKonstantin Belousov thread_reap_callout_cb, NULL); 746d116b9f1SMateusz Guzik } 747d116b9f1SMateusz Guzik 748d116b9f1SMateusz Guzik /* 749f62c7e54SKonstantin Belousov * Calling this function guarantees that any thread that exited before 750f62c7e54SKonstantin Belousov * the call is reaped when the function returns. By 'exited' we mean 751f62c7e54SKonstantin Belousov * a thread removed from the process linkage with thread_unlink(). 752f62c7e54SKonstantin Belousov * Practically this means that caller must lock/unlock corresponding 753f62c7e54SKonstantin Belousov * process lock before the call, to synchronize with thread_exit(). 754f62c7e54SKonstantin Belousov */ 755f62c7e54SKonstantin Belousov void 756f62c7e54SKonstantin Belousov thread_reap_barrier(void) 757f62c7e54SKonstantin Belousov { 758f62c7e54SKonstantin Belousov struct task *t; 759f62c7e54SKonstantin Belousov 760f62c7e54SKonstantin Belousov /* 761f62c7e54SKonstantin Belousov * First do context switches to each CPU to ensure that all 762f62c7e54SKonstantin Belousov * PCPU pc_deadthreads are moved to zombie list. 763f62c7e54SKonstantin Belousov */ 764f62c7e54SKonstantin Belousov quiesce_all_cpus("", PDROP); 765f62c7e54SKonstantin Belousov 766f62c7e54SKonstantin Belousov /* 767f62c7e54SKonstantin Belousov * Second, fire the task in the same thread as normal 768f62c7e54SKonstantin Belousov * thread_reap() is done, to serialize reaping. 
769f62c7e54SKonstantin Belousov */ 770f62c7e54SKonstantin Belousov t = malloc(sizeof(*t), M_TEMP, M_WAITOK); 771f62c7e54SKonstantin Belousov TASK_INIT(t, 0, thread_reap_task_cb, t); 772f62c7e54SKonstantin Belousov taskqueue_enqueue(taskqueue_thread, t); 773f62c7e54SKonstantin Belousov taskqueue_drain(taskqueue_thread, t); 774f62c7e54SKonstantin Belousov free(t, M_TEMP); 775f62c7e54SKonstantin Belousov } 776f62c7e54SKonstantin Belousov 777f62c7e54SKonstantin Belousov /* 77844990b8cSJulian Elischer * Allocate a thread. 77944990b8cSJulian Elischer */ 78044990b8cSJulian Elischer struct thread * 7818a945d10SKonstantin Belousov thread_alloc(int pages) 78244990b8cSJulian Elischer { 78389b57fcfSKonstantin Belousov struct thread *td; 7841bd3cf5dSMateusz Guzik lwpid_t tid; 7858460a577SJohn Birrell 78662dbc992SMateusz Guzik if (!thread_count_inc()) { 7871bd3cf5dSMateusz Guzik return (NULL); 7881bd3cf5dSMateusz Guzik } 7891bd3cf5dSMateusz Guzik 79062dbc992SMateusz Guzik tid = tid_alloc(); 7911bd3cf5dSMateusz Guzik td = uma_zalloc(thread_zone, M_WAITOK); 79289b57fcfSKonstantin Belousov KASSERT(td->td_kstack == 0, ("thread_alloc got thread with kstack")); 7938a945d10SKonstantin Belousov if (!vm_thread_new(td, pages)) { 79489b57fcfSKonstantin Belousov uma_zfree(thread_zone, td); 7951bd3cf5dSMateusz Guzik tid_free(tid); 79662dbc992SMateusz Guzik thread_count_dec(); 79789b57fcfSKonstantin Belousov return (NULL); 79889b57fcfSKonstantin Belousov } 7991bd3cf5dSMateusz Guzik td->td_tid = tid; 800f575573cSKonstantin Belousov bzero(&td->td_sa.args, sizeof(td->td_sa.args)); 801*800da341SMark Johnston kasan_thread_alloc(td); 8025dda15adSMark Johnston kmsan_thread_alloc(td); 8030c3967e7SMarcel Moolenaar cpu_thread_alloc(td); 8041bd3cf5dSMateusz Guzik EVENTHANDLER_DIRECT_INVOKE(thread_ctor, td); 80589b57fcfSKonstantin Belousov return (td); 80644990b8cSJulian Elischer } 80744990b8cSJulian Elischer 8088a945d10SKonstantin Belousov int 809*800da341SMark Johnston thread_recycle(struct thread *td, 
int pages) 8108a945d10SKonstantin Belousov { 811*800da341SMark Johnston if (td->td_kstack == 0 || td->td_kstack_pages != pages) { 812*800da341SMark Johnston if (td->td_kstack != 0) 813*800da341SMark Johnston vm_thread_dispose(td); 8148a945d10SKonstantin Belousov if (!vm_thread_new(td, pages)) 815*800da341SMark Johnston return (ENOMEM); 8168a945d10SKonstantin Belousov cpu_thread_alloc(td); 817*800da341SMark Johnston } 818*800da341SMark Johnston kasan_thread_alloc(td); 819*800da341SMark Johnston kmsan_thread_alloc(td); 820*800da341SMark Johnston return (0); 8218a945d10SKonstantin Belousov } 8224f0db5e0SJulian Elischer 8234f0db5e0SJulian Elischer /* 82444990b8cSJulian Elischer * Deallocate a thread. 82544990b8cSJulian Elischer */ 826755341dfSMateusz Guzik static void 827755341dfSMateusz Guzik thread_free_batched(struct thread *td) 82844990b8cSJulian Elischer { 8292e6b8de4SJeff Roberson 8302e6b8de4SJeff Roberson lock_profile_thread_exit(td); 83145aea8deSJeff Roberson if (td->td_cpuset) 832d7f687fcSJeff Roberson cpuset_rel(td->td_cpuset); 833d7f687fcSJeff Roberson td->td_cpuset = NULL; 8340c3967e7SMarcel Moolenaar cpu_thread_free(td); 83589b57fcfSKonstantin Belousov if (td->td_kstack != 0) 83689b57fcfSKonstantin Belousov vm_thread_dispose(td); 8372d19b736SKonstantin Belousov callout_drain(&td->td_slpcallout); 838755341dfSMateusz Guzik /* 839755341dfSMateusz Guzik * Freeing handled by the caller. 
840755341dfSMateusz Guzik */ 8411bd3cf5dSMateusz Guzik td->td_tid = -1; 8425dda15adSMark Johnston kmsan_thread_free(td); 84344990b8cSJulian Elischer uma_zfree(thread_zone, td); 84444990b8cSJulian Elischer } 84544990b8cSJulian Elischer 8464ea6a9a2SMateusz Guzik void 847755341dfSMateusz Guzik thread_free(struct thread *td) 848755341dfSMateusz Guzik { 849755341dfSMateusz Guzik lwpid_t tid; 850755341dfSMateusz Guzik 8515ef7b7a0SMateusz Guzik EVENTHANDLER_DIRECT_INVOKE(thread_dtor, td); 852755341dfSMateusz Guzik tid = td->td_tid; 853755341dfSMateusz Guzik thread_free_batched(td); 854755341dfSMateusz Guzik tid_free(tid); 85562dbc992SMateusz Guzik thread_count_dec(); 856755341dfSMateusz Guzik } 857755341dfSMateusz Guzik 858755341dfSMateusz Guzik void 8594ea6a9a2SMateusz Guzik thread_cow_get_proc(struct thread *newtd, struct proc *p) 8604ea6a9a2SMateusz Guzik { 8614ea6a9a2SMateusz Guzik 8624ea6a9a2SMateusz Guzik PROC_LOCK_ASSERT(p, MA_OWNED); 8631724c563SMateusz Guzik newtd->td_realucred = crcowget(p->p_ucred); 8641724c563SMateusz Guzik newtd->td_ucred = newtd->td_realucred; 865f6f6d240SMateusz Guzik newtd->td_limit = lim_hold(p->p_limit); 8664ea6a9a2SMateusz Guzik newtd->td_cowgen = p->p_cowgen; 8674ea6a9a2SMateusz Guzik } 8684ea6a9a2SMateusz Guzik 8694ea6a9a2SMateusz Guzik void 8704ea6a9a2SMateusz Guzik thread_cow_get(struct thread *newtd, struct thread *td) 8714ea6a9a2SMateusz Guzik { 8724ea6a9a2SMateusz Guzik 8731724c563SMateusz Guzik MPASS(td->td_realucred == td->td_ucred); 8741724c563SMateusz Guzik newtd->td_realucred = crcowget(td->td_realucred); 8751724c563SMateusz Guzik newtd->td_ucred = newtd->td_realucred; 876f6f6d240SMateusz Guzik newtd->td_limit = lim_hold(td->td_limit); 8774ea6a9a2SMateusz Guzik newtd->td_cowgen = td->td_cowgen; 8784ea6a9a2SMateusz Guzik } 8794ea6a9a2SMateusz Guzik 8804ea6a9a2SMateusz Guzik void 8814ea6a9a2SMateusz Guzik thread_cow_free(struct thread *td) 8824ea6a9a2SMateusz Guzik { 8834ea6a9a2SMateusz Guzik 8841724c563SMateusz Guzik if 
(td->td_realucred != NULL) 8851724c563SMateusz Guzik crcowfree(td); 886cd672ca6SMateusz Guzik if (td->td_limit != NULL) 887f6f6d240SMateusz Guzik lim_free(td->td_limit); 8884ea6a9a2SMateusz Guzik } 8894ea6a9a2SMateusz Guzik 8904ea6a9a2SMateusz Guzik void 8914ea6a9a2SMateusz Guzik thread_cow_update(struct thread *td) 8924ea6a9a2SMateusz Guzik { 8934ea6a9a2SMateusz Guzik struct proc *p; 894cd672ca6SMateusz Guzik struct ucred *oldcred; 895cd672ca6SMateusz Guzik struct plimit *oldlimit; 8964ea6a9a2SMateusz Guzik 8974ea6a9a2SMateusz Guzik p = td->td_proc; 8984ea6a9a2SMateusz Guzik PROC_LOCK(p); 8991724c563SMateusz Guzik oldcred = crcowsync(); 9008a0cb04dSMateusz Guzik oldlimit = lim_cowsync(); 9014ea6a9a2SMateusz Guzik td->td_cowgen = p->p_cowgen; 9024ea6a9a2SMateusz Guzik PROC_UNLOCK(p); 903cd672ca6SMateusz Guzik if (oldcred != NULL) 904cd672ca6SMateusz Guzik crfree(oldcred); 905cd672ca6SMateusz Guzik if (oldlimit != NULL) 906cd672ca6SMateusz Guzik lim_free(oldlimit); 9074ea6a9a2SMateusz Guzik } 9084ea6a9a2SMateusz Guzik 90932114b63SMateusz Guzik void 91032114b63SMateusz Guzik thread_cow_synced(struct thread *td) 91132114b63SMateusz Guzik { 91232114b63SMateusz Guzik struct proc *p; 91332114b63SMateusz Guzik 91432114b63SMateusz Guzik p = td->td_proc; 91532114b63SMateusz Guzik PROC_LOCK_ASSERT(p, MA_OWNED); 91632114b63SMateusz Guzik MPASS(td->td_cowgen != p->p_cowgen); 91732114b63SMateusz Guzik MPASS(td->td_ucred == p->p_ucred); 91832114b63SMateusz Guzik MPASS(td->td_limit == p->p_limit); 91932114b63SMateusz Guzik td->td_cowgen = p->p_cowgen; 92032114b63SMateusz Guzik } 92132114b63SMateusz Guzik 92244990b8cSJulian Elischer /* 92344990b8cSJulian Elischer * Discard the current thread and exit from its context. 92494e0a4cdSJulian Elischer * Always called with scheduler locked. 
92544990b8cSJulian Elischer * 92644990b8cSJulian Elischer * Because we can't free a thread while we're operating under its context, 927696058c3SJulian Elischer * push the current thread into our CPU's deadthread holder. This means 928696058c3SJulian Elischer * we needn't worry about someone else grabbing our context before we 9296617724cSJeff Roberson * do a cpu_throw(). 93044990b8cSJulian Elischer */ 93144990b8cSJulian Elischer void 93244990b8cSJulian Elischer thread_exit(void) 93344990b8cSJulian Elischer { 9347e3a96eaSJohn Baldwin uint64_t runtime, new_switchtime; 93544990b8cSJulian Elischer struct thread *td; 9361c4bcd05SJeff Roberson struct thread *td2; 93744990b8cSJulian Elischer struct proc *p; 9387847a9daSJohn Baldwin int wakeup_swapper; 93944990b8cSJulian Elischer 94044990b8cSJulian Elischer td = curthread; 94144990b8cSJulian Elischer p = td->td_proc; 94244990b8cSJulian Elischer 943a54e85fdSJeff Roberson PROC_SLOCK_ASSERT(p, MA_OWNED); 944ed062c8dSJulian Elischer mtx_assert(&Giant, MA_NOTOWNED); 945a54e85fdSJeff Roberson 94644990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 947ed062c8dSJulian Elischer KASSERT(p != NULL, ("thread exiting without a process")); 948cc701b73SRobert Watson CTR3(KTR_PROC, "thread_exit: thread %p (pid %ld, %s)", td, 949e01eafefSJulian Elischer (long)p->p_pid, td->td_name); 9506c9271a9SAndriy Gapon SDT_PROBE0(proc, , , lwp__exit); 9519104847fSDavid Xu KASSERT(TAILQ_EMPTY(&td->td_sigqueue.sq_list), ("signal pending")); 952936c24faSMateusz Guzik MPASS(td->td_realucred == td->td_ucred); 95344990b8cSJulian Elischer 954ed062c8dSJulian Elischer /* 955ed062c8dSJulian Elischer * drop FPU & debug register state storage, or any other 956ed062c8dSJulian Elischer * architecture specific resources that 957ed062c8dSJulian Elischer * would not be on a new untouched process. 
958ed062c8dSJulian Elischer */ 959bd07998eSKonstantin Belousov cpu_thread_exit(td); 96044990b8cSJulian Elischer 961ed062c8dSJulian Elischer /* 9621faf202eSJulian Elischer * The last thread is left attached to the process 9631faf202eSJulian Elischer * So that the whole bundle gets recycled. Skip 964ed062c8dSJulian Elischer * all this stuff if we never had threads. 965ed062c8dSJulian Elischer * EXIT clears all sign of other threads when 966ed062c8dSJulian Elischer * it goes to single threading, so the last thread always 967ed062c8dSJulian Elischer * takes the short path. 9681faf202eSJulian Elischer */ 969ed062c8dSJulian Elischer if (p->p_flag & P_HADTHREADS) { 9701faf202eSJulian Elischer if (p->p_numthreads > 1) { 971fd229b5bSKonstantin Belousov atomic_add_int(&td->td_proc->p_exitthreads, 1); 972d3a0bd78SJulian Elischer thread_unlink(td); 9731c4bcd05SJeff Roberson td2 = FIRST_THREAD_IN_PROC(p); 9741c4bcd05SJeff Roberson sched_exit_thread(td2, td); 975ed062c8dSJulian Elischer 976ed062c8dSJulian Elischer /* 97744990b8cSJulian Elischer * The test below is NOT true if we are the 9789182554aSKonstantin Belousov * sole exiting thread. P_STOPPED_SINGLE is unset 97944990b8cSJulian Elischer * in exit1() after it is the only survivor. 98044990b8cSJulian Elischer */ 9811279572aSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 98244990b8cSJulian Elischer if (p->p_numthreads == p->p_suspcount) { 983a54e85fdSJeff Roberson thread_lock(p->p_singlethread); 9847847a9daSJohn Baldwin wakeup_swapper = thread_unsuspend_one( 98584cdea97SKonstantin Belousov p->p_singlethread, p, false); 9867847a9daSJohn Baldwin if (wakeup_swapper) 9877847a9daSJohn Baldwin kick_proc0(); 98844990b8cSJulian Elischer } 98944990b8cSJulian Elischer } 99048bfcdddSJulian Elischer 991696058c3SJulian Elischer PCPU_SET(deadthread, td); 9921faf202eSJulian Elischer } else { 993ed062c8dSJulian Elischer /* 994ed062c8dSJulian Elischer * The last thread is exiting.. 
but not through exit() 995ed062c8dSJulian Elischer */ 996ed062c8dSJulian Elischer panic ("thread_exit: Last thread exiting on its own"); 997ed062c8dSJulian Elischer } 9981faf202eSJulian Elischer } 99916d95d4fSJoseph Koshy #ifdef HWPMC_HOOKS 100016d95d4fSJoseph Koshy /* 100116d95d4fSJoseph Koshy * If this thread is part of a process that is being tracked by hwpmc(4), 100216d95d4fSJoseph Koshy * inform the module of the thread's impending exit. 100316d95d4fSJoseph Koshy */ 10046161b98cSMatt Macy if (PMC_PROC_IS_USING_PMCS(td->td_proc)) { 100516d95d4fSJoseph Koshy PMC_SWITCH_CONTEXT(td, PMC_FN_CSW_OUT); 10066161b98cSMatt Macy PMC_CALL_HOOK_UNLOCKED(td, PMC_FN_THR_EXIT, NULL); 1007ebfaf69cSMatt Macy } else if (PMC_SYSTEM_SAMPLING_ACTIVE()) 1008ebfaf69cSMatt Macy PMC_CALL_HOOK_UNLOCKED(td, PMC_FN_THR_EXIT_LOG, NULL); 100916d95d4fSJoseph Koshy #endif 1010a54e85fdSJeff Roberson PROC_UNLOCK(p); 10115c7bebf9SKonstantin Belousov PROC_STATLOCK(p); 10125c7bebf9SKonstantin Belousov thread_lock(td); 10135c7bebf9SKonstantin Belousov PROC_SUNLOCK(p); 10147e3a96eaSJohn Baldwin 10157e3a96eaSJohn Baldwin /* Do the same timestamp bookkeeping that mi_switch() would do. */ 10167e3a96eaSJohn Baldwin new_switchtime = cpu_ticks(); 10177e3a96eaSJohn Baldwin runtime = new_switchtime - PCPU_GET(switchtime); 10187e3a96eaSJohn Baldwin td->td_runtime += runtime; 10197e3a96eaSJohn Baldwin td->td_incruntime += runtime; 10207e3a96eaSJohn Baldwin PCPU_SET(switchtime, new_switchtime); 10217e3a96eaSJohn Baldwin PCPU_SET(switchticks, ticks); 102283c9dea1SGleb Smirnoff VM_CNT_INC(v_swtch); 10237e3a96eaSJohn Baldwin 10247e3a96eaSJohn Baldwin /* Save our resource usage in our process. 
*/ 10257e3a96eaSJohn Baldwin td->td_ru.ru_nvcsw++; 102661a74c5cSJeff Roberson ruxagg_locked(p, td); 10277e3a96eaSJohn Baldwin rucollect(&p->p_ru, &td->td_ru); 10285c7bebf9SKonstantin Belousov PROC_STATUNLOCK(p); 10297e3a96eaSJohn Baldwin 1030fa2528acSAlex Richardson TD_SET_STATE(td, TDS_INACTIVE); 10313d06b4b3SAttilio Rao #ifdef WITNESS 10323d06b4b3SAttilio Rao witness_thread_exit(td); 10333d06b4b3SAttilio Rao #endif 1034732d9528SJulian Elischer CTR1(KTR_PROC, "thread_exit: cpu_throw() thread %p", td); 1035a54e85fdSJeff Roberson sched_throw(td); 1036cc66ebe2SPeter Wemm panic("I'm a teapot!"); 103744990b8cSJulian Elischer /* NOTREACHED */ 103844990b8cSJulian Elischer } 103944990b8cSJulian Elischer 104044990b8cSJulian Elischer /* 1041696058c3SJulian Elischer * Do any thread specific cleanups that may be needed in wait() 104237814395SPeter Wemm * called with Giant, proc and schedlock not held. 1043696058c3SJulian Elischer */ 1044696058c3SJulian Elischer void 1045696058c3SJulian Elischer thread_wait(struct proc *p) 1046696058c3SJulian Elischer { 1047696058c3SJulian Elischer struct thread *td; 1048696058c3SJulian Elischer 104937814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 1050624bf9e1SKonstantin Belousov KASSERT(p->p_numthreads == 1, ("multiple threads in thread_wait()")); 1051624bf9e1SKonstantin Belousov KASSERT(p->p_exitthreads == 0, ("p_exitthreads leaking")); 1052ff8fbcffSJeff Roberson td = FIRST_THREAD_IN_PROC(p); 1053ff8fbcffSJeff Roberson /* Lock the last thread so we spin until it exits cpu_throw(). 
*/ 1054ff8fbcffSJeff Roberson thread_lock(td); 1055ff8fbcffSJeff Roberson thread_unlock(td); 10562e6b8de4SJeff Roberson lock_profile_thread_exit(td); 1057d7f687fcSJeff Roberson cpuset_rel(td->td_cpuset); 1058d7f687fcSJeff Roberson td->td_cpuset = NULL; 1059696058c3SJulian Elischer cpu_thread_clean(td); 10604ea6a9a2SMateusz Guzik thread_cow_free(td); 10612d19b736SKonstantin Belousov callout_drain(&td->td_slpcallout); 1062696058c3SJulian Elischer thread_reap(); /* check for zombie threads etc. */ 1063696058c3SJulian Elischer } 1064696058c3SJulian Elischer 1065696058c3SJulian Elischer /* 106644990b8cSJulian Elischer * Link a thread to a process. 10671faf202eSJulian Elischer * set up anything that needs to be initialized for it to 10681faf202eSJulian Elischer * be used by the process. 106944990b8cSJulian Elischer */ 107044990b8cSJulian Elischer void 10718460a577SJohn Birrell thread_link(struct thread *td, struct proc *p) 107244990b8cSJulian Elischer { 107344990b8cSJulian Elischer 1074a54e85fdSJeff Roberson /* 1075a54e85fdSJeff Roberson * XXX This can't be enabled because it's called for proc0 before 1076374ae2a3SJeff Roberson * its lock has been created. 
1077374ae2a3SJeff Roberson * PROC_LOCK_ASSERT(p, MA_OWNED); 1078a54e85fdSJeff Roberson */ 1079fa2528acSAlex Richardson TD_SET_STATE(td, TDS_INACTIVE); 108044990b8cSJulian Elischer td->td_proc = p; 1081b61ce5b0SJeff Roberson td->td_flags = TDF_INMEM; 108244990b8cSJulian Elischer 10831faf202eSJulian Elischer LIST_INIT(&td->td_contested); 1084eea4f254SJeff Roberson LIST_INIT(&td->td_lprof[0]); 1085eea4f254SJeff Roberson LIST_INIT(&td->td_lprof[1]); 1086f6eccf96SGleb Smirnoff #ifdef EPOCH_TRACE 1087dd902d01SGleb Smirnoff SLIST_INIT(&td->td_epochs); 1088f6eccf96SGleb Smirnoff #endif 10899104847fSDavid Xu sigqueue_init(&td->td_sigqueue, p); 1090fd90e2edSJung-uk Kim callout_init(&td->td_slpcallout, 1); 109166d8df9dSDaniel Eischen TAILQ_INSERT_TAIL(&p->p_threads, td, td_plist); 109244990b8cSJulian Elischer p->p_numthreads++; 109344990b8cSJulian Elischer } 109444990b8cSJulian Elischer 1095ed062c8dSJulian Elischer /* 1096ed062c8dSJulian Elischer * Called from: 1097ed062c8dSJulian Elischer * thread_exit() 1098ed062c8dSJulian Elischer */ 1099d3a0bd78SJulian Elischer void 1100d3a0bd78SJulian Elischer thread_unlink(struct thread *td) 1101d3a0bd78SJulian Elischer { 1102d3a0bd78SJulian Elischer struct proc *p = td->td_proc; 1103d3a0bd78SJulian Elischer 1104374ae2a3SJeff Roberson PROC_LOCK_ASSERT(p, MA_OWNED); 1105f6eccf96SGleb Smirnoff #ifdef EPOCH_TRACE 1106dd902d01SGleb Smirnoff MPASS(SLIST_EMPTY(&td->td_epochs)); 1107f6eccf96SGleb Smirnoff #endif 1108dd902d01SGleb Smirnoff 1109d3a0bd78SJulian Elischer TAILQ_REMOVE(&p->p_threads, td, td_plist); 1110d3a0bd78SJulian Elischer p->p_numthreads--; 1111d3a0bd78SJulian Elischer /* could clear a few other things here */ 11128460a577SJohn Birrell /* Must NOT clear links to proc! 
*/ 11135c8329edSJulian Elischer } 11145c8329edSJulian Elischer 111579799053SKonstantin Belousov static int 111679799053SKonstantin Belousov calc_remaining(struct proc *p, int mode) 111779799053SKonstantin Belousov { 111879799053SKonstantin Belousov int remaining; 111979799053SKonstantin Belousov 11207b519077SKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 11217b519077SKonstantin Belousov PROC_SLOCK_ASSERT(p, MA_OWNED); 112279799053SKonstantin Belousov if (mode == SINGLE_EXIT) 112379799053SKonstantin Belousov remaining = p->p_numthreads; 112479799053SKonstantin Belousov else if (mode == SINGLE_BOUNDARY) 112579799053SKonstantin Belousov remaining = p->p_numthreads - p->p_boundary_count; 11266ddcc233SKonstantin Belousov else if (mode == SINGLE_NO_EXIT || mode == SINGLE_ALLPROC) 112779799053SKonstantin Belousov remaining = p->p_numthreads - p->p_suspcount; 112879799053SKonstantin Belousov else 112979799053SKonstantin Belousov panic("calc_remaining: wrong mode %d", mode); 113079799053SKonstantin Belousov return (remaining); 113179799053SKonstantin Belousov } 113279799053SKonstantin Belousov 113307a9368aSKonstantin Belousov static int 113407a9368aSKonstantin Belousov remain_for_mode(int mode) 113507a9368aSKonstantin Belousov { 113607a9368aSKonstantin Belousov 11376ddcc233SKonstantin Belousov return (mode == SINGLE_ALLPROC ? 
0 : 1); 113807a9368aSKonstantin Belousov } 113907a9368aSKonstantin Belousov 114007a9368aSKonstantin Belousov static int 114107a9368aSKonstantin Belousov weed_inhib(int mode, struct thread *td2, struct proc *p) 114207a9368aSKonstantin Belousov { 114307a9368aSKonstantin Belousov int wakeup_swapper; 114407a9368aSKonstantin Belousov 114507a9368aSKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 114607a9368aSKonstantin Belousov PROC_SLOCK_ASSERT(p, MA_OWNED); 114707a9368aSKonstantin Belousov THREAD_LOCK_ASSERT(td2, MA_OWNED); 114807a9368aSKonstantin Belousov 114907a9368aSKonstantin Belousov wakeup_swapper = 0; 115061a74c5cSJeff Roberson 115161a74c5cSJeff Roberson /* 115261a74c5cSJeff Roberson * Since the thread lock is dropped by the scheduler we have 115361a74c5cSJeff Roberson * to retry to check for races. 115461a74c5cSJeff Roberson */ 115561a74c5cSJeff Roberson restart: 115607a9368aSKonstantin Belousov switch (mode) { 115707a9368aSKonstantin Belousov case SINGLE_EXIT: 115861a74c5cSJeff Roberson if (TD_IS_SUSPENDED(td2)) { 115984cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td2, p, true); 116061a74c5cSJeff Roberson thread_lock(td2); 116161a74c5cSJeff Roberson goto restart; 116261a74c5cSJeff Roberson } 116361a74c5cSJeff Roberson if (TD_CAN_ABORT(td2)) { 116407a9368aSKonstantin Belousov wakeup_swapper |= sleepq_abort(td2, EINTR); 116561a74c5cSJeff Roberson return (wakeup_swapper); 116661a74c5cSJeff Roberson } 116707a9368aSKonstantin Belousov break; 116807a9368aSKonstantin Belousov case SINGLE_BOUNDARY: 116907a9368aSKonstantin Belousov case SINGLE_NO_EXIT: 117061a74c5cSJeff Roberson if (TD_IS_SUSPENDED(td2) && 117161a74c5cSJeff Roberson (td2->td_flags & TDF_BOUNDARY) == 0) { 117284cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td2, p, false); 117361a74c5cSJeff Roberson thread_lock(td2); 117461a74c5cSJeff Roberson goto restart; 117561a74c5cSJeff Roberson } 117661a74c5cSJeff Roberson if (TD_CAN_ABORT(td2)) { 117707a9368aSKonstantin 
Belousov wakeup_swapper |= sleepq_abort(td2, ERESTART); 117861a74c5cSJeff Roberson return (wakeup_swapper); 117961a74c5cSJeff Roberson } 1180917dd390SKonstantin Belousov break; 11816ddcc233SKonstantin Belousov case SINGLE_ALLPROC: 11826ddcc233SKonstantin Belousov /* 11836ddcc233SKonstantin Belousov * ALLPROC suspend tries to avoid spurious EINTR for 11846ddcc233SKonstantin Belousov * threads sleeping interruptable, by suspending the 11856ddcc233SKonstantin Belousov * thread directly, similarly to sig_suspend_threads(). 1186dd883e9aSKonstantin Belousov * Since such sleep is not neccessary performed at the user 1187dd883e9aSKonstantin Belousov * boundary, TDF_ALLPROCSUSP is used to avoid immediate 1188dd883e9aSKonstantin Belousov * un-suspend. 11896ddcc233SKonstantin Belousov */ 11905c274b36SBrooks Davis if (TD_IS_SUSPENDED(td2) && 11915c274b36SBrooks Davis (td2->td_flags & TDF_ALLPROCSUSP) == 0) { 119284cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td2, p, false); 119361a74c5cSJeff Roberson thread_lock(td2); 119461a74c5cSJeff Roberson goto restart; 119561a74c5cSJeff Roberson } 119661a74c5cSJeff Roberson if (TD_CAN_ABORT(td2)) { 11976ddcc233SKonstantin Belousov td2->td_flags |= TDF_ALLPROCSUSP; 11986ddcc233SKonstantin Belousov wakeup_swapper |= sleepq_abort(td2, ERESTART); 119961a74c5cSJeff Roberson return (wakeup_swapper); 12006ddcc233SKonstantin Belousov } 120107a9368aSKonstantin Belousov break; 120261a74c5cSJeff Roberson default: 120361a74c5cSJeff Roberson break; 120407a9368aSKonstantin Belousov } 120561a74c5cSJeff Roberson thread_unlock(td2); 120607a9368aSKonstantin Belousov return (wakeup_swapper); 120707a9368aSKonstantin Belousov } 120807a9368aSKonstantin Belousov 12095215b187SJeff Roberson /* 121044990b8cSJulian Elischer * Enforce single-threading. 121144990b8cSJulian Elischer * 121244990b8cSJulian Elischer * Returns 1 if the caller must abort (another thread is waiting to 121344990b8cSJulian Elischer * exit the process or similar). 
Process is locked! 121444990b8cSJulian Elischer * Returns 0 when you are successfully the only thread running. 121544990b8cSJulian Elischer * A process has successfully single threaded in the suspend mode when 121644990b8cSJulian Elischer * There are no threads in user mode. Threads in the kernel must be 121744990b8cSJulian Elischer * allowed to continue until they get to the user boundary. They may even 121844990b8cSJulian Elischer * copy out their return values and data before suspending. They may however be 1219e2668f55SMaxim Konovalov * accelerated in reaching the user boundary as we will wake up 122044990b8cSJulian Elischer * any sleeping threads that are interruptable. (PCATCH). 122144990b8cSJulian Elischer */ 122244990b8cSJulian Elischer int 12236ddcc233SKonstantin Belousov thread_single(struct proc *p, int mode) 122444990b8cSJulian Elischer { 122544990b8cSJulian Elischer struct thread *td; 122644990b8cSJulian Elischer struct thread *td2; 1227da7bbd2cSJohn Baldwin int remaining, wakeup_swapper; 122844990b8cSJulian Elischer 122944990b8cSJulian Elischer td = curthread; 12306ddcc233SKonstantin Belousov KASSERT(mode == SINGLE_EXIT || mode == SINGLE_BOUNDARY || 12316ddcc233SKonstantin Belousov mode == SINGLE_ALLPROC || mode == SINGLE_NO_EXIT, 12326ddcc233SKonstantin Belousov ("invalid mode %d", mode)); 12336ddcc233SKonstantin Belousov /* 12346ddcc233SKonstantin Belousov * If allowing non-ALLPROC singlethreading for non-curproc 12356ddcc233SKonstantin Belousov * callers, calc_remaining() and remain_for_mode() should be 12366ddcc233SKonstantin Belousov * adjusted to also account for td->td_proc != p. For now 12376ddcc233SKonstantin Belousov * this is not implemented because it is not used. 
12386ddcc233SKonstantin Belousov */ 12396ddcc233SKonstantin Belousov KASSERT((mode == SINGLE_ALLPROC && td->td_proc != p) || 12406ddcc233SKonstantin Belousov (mode != SINGLE_ALLPROC && td->td_proc == p), 12416ddcc233SKonstantin Belousov ("mode %d proc %p curproc %p", mode, p, td->td_proc)); 124237814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 124344990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 124444990b8cSJulian Elischer 1245d7a9e6e7SKonstantin Belousov /* 1246d7a9e6e7SKonstantin Belousov * Is someone already single threading? 1247d7a9e6e7SKonstantin Belousov * Or may be singlethreading is not needed at all. 1248d7a9e6e7SKonstantin Belousov */ 1249d7a9e6e7SKonstantin Belousov if (mode == SINGLE_ALLPROC) { 1250d7a9e6e7SKonstantin Belousov while ((p->p_flag & P_STOPPED_SINGLE) != 0) { 1251d7a9e6e7SKonstantin Belousov if ((p->p_flag2 & P2_WEXIT) != 0) 1252d7a9e6e7SKonstantin Belousov return (1); 1253d7a9e6e7SKonstantin Belousov msleep(&p->p_flag, &p->p_mtx, PCATCH, "thrsgl", 0); 1254d7a9e6e7SKonstantin Belousov } 12559241ebc7SKonstantin Belousov if ((p->p_flag & (P_STOPPED_SIG | P_TRACED)) != 0 || 12569241ebc7SKonstantin Belousov (p->p_flag2 & P2_WEXIT) != 0) 12579241ebc7SKonstantin Belousov return (1); 1258d7a9e6e7SKonstantin Belousov } else if ((p->p_flag & P_HADTHREADS) == 0) 125944990b8cSJulian Elischer return (0); 1260906ac69dSDavid Xu if (p->p_singlethread != NULL && p->p_singlethread != td) 126144990b8cSJulian Elischer return (1); 126244990b8cSJulian Elischer 1263906ac69dSDavid Xu if (mode == SINGLE_EXIT) { 1264906ac69dSDavid Xu p->p_flag |= P_SINGLE_EXIT; 1265906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_BOUNDARY; 1266906ac69dSDavid Xu } else { 1267906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_EXIT; 1268906ac69dSDavid Xu if (mode == SINGLE_BOUNDARY) 1269906ac69dSDavid Xu p->p_flag |= P_SINGLE_BOUNDARY; 1270906ac69dSDavid Xu else 1271906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_BOUNDARY; 1272906ac69dSDavid Xu } 1273f829268bSKonstantin Belousov if (mode == 
SINGLE_ALLPROC) 12746ddcc233SKonstantin Belousov p->p_flag |= P_TOTAL_STOP; 12751279572aSDavid Xu p->p_flag |= P_STOPPED_SINGLE; 12767b4a950aSDavid Xu PROC_SLOCK(p); 1277112afcb2SJohn Baldwin p->p_singlethread = td; 127879799053SKonstantin Belousov remaining = calc_remaining(p, mode); 127907a9368aSKonstantin Belousov while (remaining != remain_for_mode(mode)) { 1280bf1a3220SDavid Xu if (P_SHOULDSTOP(p) != P_STOPPED_SINGLE) 1281bf1a3220SDavid Xu goto stopme; 1282da7bbd2cSJohn Baldwin wakeup_swapper = 0; 128344990b8cSJulian Elischer FOREACH_THREAD_IN_PROC(p, td2) { 128444990b8cSJulian Elischer if (td2 == td) 128544990b8cSJulian Elischer continue; 1286a54e85fdSJeff Roberson thread_lock(td2); 1287c6d31b83SKonstantin Belousov ast_sched_locked(td2, TDA_SUSPEND); 12886ddcc233SKonstantin Belousov if (TD_IS_INHIBITED(td2)) { 128907a9368aSKonstantin Belousov wakeup_swapper |= weed_inhib(mode, td2, p); 1290d8267df7SDavid Xu #ifdef SMP 1291b9009b17SKonstantin Belousov } else if (TD_IS_RUNNING(td2)) { 1292d8267df7SDavid Xu forward_signal(td2); 129361a74c5cSJeff Roberson thread_unlock(td2); 1294d8267df7SDavid Xu #endif 129561a74c5cSJeff Roberson } else 1296a54e85fdSJeff Roberson thread_unlock(td2); 12979d102777SJulian Elischer } 1298da7bbd2cSJohn Baldwin if (wakeup_swapper) 1299da7bbd2cSJohn Baldwin kick_proc0(); 130079799053SKonstantin Belousov remaining = calc_remaining(p, mode); 1301ec008e96SDavid Xu 13029d102777SJulian Elischer /* 13039d102777SJulian Elischer * Maybe we suspended some threads.. was it enough? 13049d102777SJulian Elischer */ 130507a9368aSKonstantin Belousov if (remaining == remain_for_mode(mode)) 13069d102777SJulian Elischer break; 13079d102777SJulian Elischer 1308bf1a3220SDavid Xu stopme: 130944990b8cSJulian Elischer /* 131044990b8cSJulian Elischer * Wake us up when everyone else has suspended. 1311e3b9bf71SJulian Elischer * In the mean time we suspend as well. 
131244990b8cSJulian Elischer */ 13136ddcc233SKonstantin Belousov thread_suspend_switch(td, p); 131479799053SKonstantin Belousov remaining = calc_remaining(p, mode); 131544990b8cSJulian Elischer } 1316906ac69dSDavid Xu if (mode == SINGLE_EXIT) { 131791599697SJulian Elischer /* 13188626a0ddSKonstantin Belousov * Convert the process to an unthreaded process. The 13198626a0ddSKonstantin Belousov * SINGLE_EXIT is called by exit1() or execve(), in 13208626a0ddSKonstantin Belousov * both cases other threads must be retired. 132191599697SJulian Elischer */ 13228626a0ddSKonstantin Belousov KASSERT(p->p_numthreads == 1, ("Unthreading with >1 threads")); 1323ed062c8dSJulian Elischer p->p_singlethread = NULL; 13248626a0ddSKonstantin Belousov p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT | P_HADTHREADS); 1325fd229b5bSKonstantin Belousov 1326fd229b5bSKonstantin Belousov /* 1327fd229b5bSKonstantin Belousov * Wait for any remaining threads to exit cpu_throw(). 1328fd229b5bSKonstantin Belousov */ 1329fd229b5bSKonstantin Belousov while (p->p_exitthreads != 0) { 1330fd229b5bSKonstantin Belousov PROC_SUNLOCK(p); 1331fd229b5bSKonstantin Belousov PROC_UNLOCK(p); 1332fd229b5bSKonstantin Belousov sched_relinquish(td); 1333fd229b5bSKonstantin Belousov PROC_LOCK(p); 1334fd229b5bSKonstantin Belousov PROC_SLOCK(p); 1335fd229b5bSKonstantin Belousov } 1336ac437c07SKonstantin Belousov } else if (mode == SINGLE_BOUNDARY) { 1337ac437c07SKonstantin Belousov /* 1338ac437c07SKonstantin Belousov * Wait until all suspended threads are removed from 1339ac437c07SKonstantin Belousov * the processors. The thread_suspend_check() 1340ac437c07SKonstantin Belousov * increments p_boundary_count while it is still 1341ac437c07SKonstantin Belousov * running, which makes it possible for the execve() 1342ac437c07SKonstantin Belousov * to destroy vmspace while our other threads are 1343ac437c07SKonstantin Belousov * still using the address space. 
1344ac437c07SKonstantin Belousov * 1345ac437c07SKonstantin Belousov * We lock the thread, which is only allowed to 1346ac437c07SKonstantin Belousov * succeed after context switch code finished using 1347ac437c07SKonstantin Belousov * the address space. 1348ac437c07SKonstantin Belousov */ 1349ac437c07SKonstantin Belousov FOREACH_THREAD_IN_PROC(p, td2) { 1350ac437c07SKonstantin Belousov if (td2 == td) 1351ac437c07SKonstantin Belousov continue; 1352ac437c07SKonstantin Belousov thread_lock(td2); 1353ac437c07SKonstantin Belousov KASSERT((td2->td_flags & TDF_BOUNDARY) != 0, 1354ac437c07SKonstantin Belousov ("td %p not on boundary", td2)); 1355ac437c07SKonstantin Belousov KASSERT(TD_IS_SUSPENDED(td2), 1356ac437c07SKonstantin Belousov ("td %p is not suspended", td2)); 1357ac437c07SKonstantin Belousov thread_unlock(td2); 1358ac437c07SKonstantin Belousov } 135991599697SJulian Elischer } 13607b4a950aSDavid Xu PROC_SUNLOCK(p); 136144990b8cSJulian Elischer return (0); 136244990b8cSJulian Elischer } 136344990b8cSJulian Elischer 13648638fe7bSKonstantin Belousov bool 13658638fe7bSKonstantin Belousov thread_suspend_check_needed(void) 13668638fe7bSKonstantin Belousov { 13678638fe7bSKonstantin Belousov struct proc *p; 13688638fe7bSKonstantin Belousov struct thread *td; 13698638fe7bSKonstantin Belousov 13708638fe7bSKonstantin Belousov td = curthread; 13718638fe7bSKonstantin Belousov p = td->td_proc; 13728638fe7bSKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 13738638fe7bSKonstantin Belousov return (P_SHOULDSTOP(p) || ((p->p_flag & P_TRACED) != 0 && 13748638fe7bSKonstantin Belousov (td->td_dbgflags & TDB_SUSPEND) != 0)); 13758638fe7bSKonstantin Belousov } 13768638fe7bSKonstantin Belousov 137744990b8cSJulian Elischer /* 137844990b8cSJulian Elischer * Called in from locations that can safely check to see 137944990b8cSJulian Elischer * whether we have to suspend or at least throttle for a 138044990b8cSJulian Elischer * single-thread event (e.g. fork). 
 *
 * Such locations include userret().
 * If the "return_instead" argument is non-zero, the caller must be able to
 * accept either 0 (caller may continue) or a non-zero errno value such as
 * EINTR or ERESTART (caller must abort) as a result.
 *
 * The 'return_instead' argument tells the function if it may do a
 * thread_exit() or suspend, or whether the caller must abort and back
 * out instead.
 *
 * If the thread that set the single_threading request has set the
 * P_SINGLE_EXIT bit in the process flags then this call will never return
 * if 'return_instead' is false, but will exit.
 *
 * P_SINGLE_EXIT | return_instead == 0 | return_instead != 0
 *---------------+---------------------+------------------------
 *       0       | returns 0           | returns 0 or an errno
 *               | when ST ends        | immediately
 *---------------+---------------------+------------------------
 *       1       | thread exits        | returns EINTR
 *               |                     | immediately
 *
 * return_instead:
 *	0 = thread_exit() or suspension ok,
 *	other = return error instead of stopping the thread.
 *
 * While a full suspension is under effect, even a single threading
 * thread would be suspended if it made this call (but it shouldn't).
 * This call should only be made from places where
 * thread_exit() would be safe as that may be the outcome unless
 * return_instead is set.
140944990b8cSJulian Elischer */ 141044990b8cSJulian Elischer int 141144990b8cSJulian Elischer thread_suspend_check(int return_instead) 141244990b8cSJulian Elischer { 1413ecafb24bSJuli Mallett struct thread *td; 1414ecafb24bSJuli Mallett struct proc *p; 141546e47c4fSKonstantin Belousov int wakeup_swapper; 141644990b8cSJulian Elischer 141744990b8cSJulian Elischer td = curthread; 141844990b8cSJulian Elischer p = td->td_proc; 141937814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 142044990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 14218638fe7bSKonstantin Belousov while (thread_suspend_check_needed()) { 14221279572aSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 142344990b8cSJulian Elischer KASSERT(p->p_singlethread != NULL, 142444990b8cSJulian Elischer ("singlethread not set")); 142544990b8cSJulian Elischer /* 1426e3b9bf71SJulian Elischer * The only suspension in action is a 1427e3b9bf71SJulian Elischer * single-threading. Single threader need not stop. 1428bd07998eSKonstantin Belousov * It is safe to access p->p_singlethread unlocked 1429bd07998eSKonstantin Belousov * because it can only be set to our address by us. 143044990b8cSJulian Elischer */ 1431e3b9bf71SJulian Elischer if (p->p_singlethread == td) 143244990b8cSJulian Elischer return (0); /* Exempt from stopping. */ 143344990b8cSJulian Elischer } 143445a4bfa1SDavid Xu if ((p->p_flag & P_SINGLE_EXIT) && return_instead) 143594f0972bSDavid Xu return (EINTR); 143644990b8cSJulian Elischer 1437906ac69dSDavid Xu /* Should we goto user boundary if we didn't come from there? */ 1438906ac69dSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE && 1439906ac69dSDavid Xu (p->p_flag & P_SINGLE_BOUNDARY) && return_instead) 144094f0972bSDavid Xu return (ERESTART); 1441906ac69dSDavid Xu 144244990b8cSJulian Elischer /* 14433077f938SKonstantin Belousov * Ignore suspend requests if they are deferred. 
1444d071a6faSJohn Baldwin */ 14453077f938SKonstantin Belousov if ((td->td_flags & TDF_SBDRY) != 0) { 1446d071a6faSJohn Baldwin KASSERT(return_instead, 1447d071a6faSJohn Baldwin ("TDF_SBDRY set for unsafe thread_suspend_check")); 144846e47c4fSKonstantin Belousov KASSERT((td->td_flags & (TDF_SEINTR | TDF_SERESTART)) != 144946e47c4fSKonstantin Belousov (TDF_SEINTR | TDF_SERESTART), 145046e47c4fSKonstantin Belousov ("both TDF_SEINTR and TDF_SERESTART")); 145146e47c4fSKonstantin Belousov return (TD_SBDRY_INTR(td) ? TD_SBDRY_ERRNO(td) : 0); 1452d071a6faSJohn Baldwin } 1453d071a6faSJohn Baldwin 1454d071a6faSJohn Baldwin /* 145544990b8cSJulian Elischer * If the process is waiting for us to exit, 145644990b8cSJulian Elischer * this thread should just suicide. 14571279572aSDavid Xu * Assumes that P_SINGLE_EXIT implies P_STOPPED_SINGLE. 145844990b8cSJulian Elischer */ 1459cf7d9a8cSDavid Xu if ((p->p_flag & P_SINGLE_EXIT) && (p->p_singlethread != td)) { 1460cf7d9a8cSDavid Xu PROC_UNLOCK(p); 146191d1786fSDmitry Chagin 146291d1786fSDmitry Chagin /* 146391d1786fSDmitry Chagin * Allow Linux emulation layer to do some work 146491d1786fSDmitry Chagin * before thread suicide. 
146591d1786fSDmitry Chagin */ 146691d1786fSDmitry Chagin if (__predict_false(p->p_sysent->sv_thread_detach != NULL)) 146791d1786fSDmitry Chagin (p->p_sysent->sv_thread_detach)(td); 14682a339d9eSKonstantin Belousov umtx_thread_exit(td); 1469d1e7a4a5SJohn Baldwin kern_thr_exit(td); 1470d1e7a4a5SJohn Baldwin panic("stopped thread did not exit"); 1471cf7d9a8cSDavid Xu } 147221ecd1e9SDavid Xu 147321ecd1e9SDavid Xu PROC_SLOCK(p); 147421ecd1e9SDavid Xu thread_stopped(p); 1475a54e85fdSJeff Roberson if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 1476a54e85fdSJeff Roberson if (p->p_numthreads == p->p_suspcount + 1) { 1477a54e85fdSJeff Roberson thread_lock(p->p_singlethread); 147884cdea97SKonstantin Belousov wakeup_swapper = thread_unsuspend_one( 147984cdea97SKonstantin Belousov p->p_singlethread, p, false); 14807847a9daSJohn Baldwin if (wakeup_swapper) 14817847a9daSJohn Baldwin kick_proc0(); 1482a54e85fdSJeff Roberson } 1483a54e85fdSJeff Roberson } 14843f9be10eSDavid Xu PROC_UNLOCK(p); 14857b4a950aSDavid Xu thread_lock(td); 148644990b8cSJulian Elischer /* 148744990b8cSJulian Elischer * When a thread suspends, it just 1488ad1e7d28SJulian Elischer * gets taken off all queues. 148944990b8cSJulian Elischer */ 149071fad9fdSJulian Elischer thread_suspend_one(td); 1491906ac69dSDavid Xu if (return_instead == 0) { 1492906ac69dSDavid Xu p->p_boundary_count++; 1493906ac69dSDavid Xu td->td_flags |= TDF_BOUNDARY; 1494cf19bf91SJulian Elischer } 14957b4a950aSDavid Xu PROC_SUNLOCK(p); 1496686bcb5cSJeff Roberson mi_switch(SW_INVOL | SWT_SUSPEND); 149744990b8cSJulian Elischer PROC_LOCK(p); 149844990b8cSJulian Elischer } 149944990b8cSJulian Elischer return (0); 150044990b8cSJulian Elischer } 150144990b8cSJulian Elischer 1502478ca4b0SKonstantin Belousov /* 1503478ca4b0SKonstantin Belousov * Check for possible stops and suspensions while executing a 1504478ca4b0SKonstantin Belousov * casueword or similar transiently failing operation. 
1505478ca4b0SKonstantin Belousov * 1506478ca4b0SKonstantin Belousov * The sleep argument controls whether the function can handle a stop 1507478ca4b0SKonstantin Belousov * request itself or it should return ERESTART and the request is 1508478ca4b0SKonstantin Belousov * proceed at the kernel/user boundary in ast. 1509478ca4b0SKonstantin Belousov * 1510478ca4b0SKonstantin Belousov * Typically, when retrying due to casueword(9) failure (rv == 1), we 1511478ca4b0SKonstantin Belousov * should handle the stop requests there, with exception of cases when 1512478ca4b0SKonstantin Belousov * the thread owns a kernel resource, for instance busied the umtx 1513300b525dSKonstantin Belousov * key, or when functions return immediately if thread_check_susp() 1514478ca4b0SKonstantin Belousov * returned non-zero. On the other hand, retrying the whole lock 1515478ca4b0SKonstantin Belousov * operation, we better not stop there but delegate the handling to 1516478ca4b0SKonstantin Belousov * ast. 1517478ca4b0SKonstantin Belousov * 1518478ca4b0SKonstantin Belousov * If the request is for thread termination P_SINGLE_EXIT, we cannot 1519478ca4b0SKonstantin Belousov * handle it at all, and simply return EINTR. 1520478ca4b0SKonstantin Belousov */ 1521478ca4b0SKonstantin Belousov int 1522478ca4b0SKonstantin Belousov thread_check_susp(struct thread *td, bool sleep) 1523478ca4b0SKonstantin Belousov { 1524478ca4b0SKonstantin Belousov struct proc *p; 1525478ca4b0SKonstantin Belousov int error; 1526478ca4b0SKonstantin Belousov 1527478ca4b0SKonstantin Belousov /* 1528c6d31b83SKonstantin Belousov * The check for TDA_SUSPEND is racy, but it is enough to 1529478ca4b0SKonstantin Belousov * eventually break the lockstep loop. 
1530478ca4b0SKonstantin Belousov */ 1531c6d31b83SKonstantin Belousov if (!td_ast_pending(td, TDA_SUSPEND)) 1532478ca4b0SKonstantin Belousov return (0); 1533478ca4b0SKonstantin Belousov error = 0; 1534478ca4b0SKonstantin Belousov p = td->td_proc; 1535478ca4b0SKonstantin Belousov PROC_LOCK(p); 1536478ca4b0SKonstantin Belousov if (p->p_flag & P_SINGLE_EXIT) 1537478ca4b0SKonstantin Belousov error = EINTR; 1538478ca4b0SKonstantin Belousov else if (P_SHOULDSTOP(p) || 1539478ca4b0SKonstantin Belousov ((p->p_flag & P_TRACED) && (td->td_dbgflags & TDB_SUSPEND))) 1540478ca4b0SKonstantin Belousov error = sleep ? thread_suspend_check(0) : ERESTART; 1541478ca4b0SKonstantin Belousov PROC_UNLOCK(p); 1542478ca4b0SKonstantin Belousov return (error); 1543478ca4b0SKonstantin Belousov } 1544478ca4b0SKonstantin Belousov 154535c32a76SDavid Xu void 15466ddcc233SKonstantin Belousov thread_suspend_switch(struct thread *td, struct proc *p) 1547a54e85fdSJeff Roberson { 1548a54e85fdSJeff Roberson 1549a54e85fdSJeff Roberson KASSERT(!TD_IS_SUSPENDED(td), ("already suspended")); 1550a54e85fdSJeff Roberson PROC_LOCK_ASSERT(p, MA_OWNED); 15517b4a950aSDavid Xu PROC_SLOCK_ASSERT(p, MA_OWNED); 1552a54e85fdSJeff Roberson /* 1553a54e85fdSJeff Roberson * We implement thread_suspend_one in stages here to avoid 1554a54e85fdSJeff Roberson * dropping the proc lock while the thread lock is owned. 
1555a54e85fdSJeff Roberson */ 15566ddcc233SKonstantin Belousov if (p == td->td_proc) { 1557a54e85fdSJeff Roberson thread_stopped(p); 1558a54e85fdSJeff Roberson p->p_suspcount++; 15596ddcc233SKonstantin Belousov } 15603f9be10eSDavid Xu PROC_UNLOCK(p); 15617b4a950aSDavid Xu thread_lock(td); 1562c6d31b83SKonstantin Belousov ast_unsched_locked(td, TDA_SUSPEND); 1563a54e85fdSJeff Roberson TD_SET_SUSPENDED(td); 1564c5aa6b58SJeff Roberson sched_sleep(td, 0); 15657b4a950aSDavid Xu PROC_SUNLOCK(p); 1566a54e85fdSJeff Roberson DROP_GIANT(); 1567686bcb5cSJeff Roberson mi_switch(SW_VOL | SWT_SUSPEND); 1568a54e85fdSJeff Roberson PICKUP_GIANT(); 1569a54e85fdSJeff Roberson PROC_LOCK(p); 15707b4a950aSDavid Xu PROC_SLOCK(p); 1571a54e85fdSJeff Roberson } 1572a54e85fdSJeff Roberson 1573a54e85fdSJeff Roberson void 157435c32a76SDavid Xu thread_suspend_one(struct thread *td) 157535c32a76SDavid Xu { 15766ddcc233SKonstantin Belousov struct proc *p; 157735c32a76SDavid Xu 15786ddcc233SKonstantin Belousov p = td->td_proc; 15797b4a950aSDavid Xu PROC_SLOCK_ASSERT(p, MA_OWNED); 1580a54e85fdSJeff Roberson THREAD_LOCK_ASSERT(td, MA_OWNED); 1581e574e444SDavid Xu KASSERT(!TD_IS_SUSPENDED(td), ("already suspended")); 158235c32a76SDavid Xu p->p_suspcount++; 1583c6d31b83SKonstantin Belousov ast_unsched_locked(td, TDA_SUSPEND); 158471fad9fdSJulian Elischer TD_SET_SUSPENDED(td); 1585c5aa6b58SJeff Roberson sched_sleep(td, 0); 158635c32a76SDavid Xu } 158735c32a76SDavid Xu 158884cdea97SKonstantin Belousov static int 158984cdea97SKonstantin Belousov thread_unsuspend_one(struct thread *td, struct proc *p, bool boundary) 159035c32a76SDavid Xu { 159135c32a76SDavid Xu 1592a54e85fdSJeff Roberson THREAD_LOCK_ASSERT(td, MA_OWNED); 1593ad1e7d28SJulian Elischer KASSERT(TD_IS_SUSPENDED(td), ("Thread not suspended")); 159471fad9fdSJulian Elischer TD_CLR_SUSPENDED(td); 15956ddcc233SKonstantin Belousov td->td_flags &= ~TDF_ALLPROCSUSP; 15966ddcc233SKonstantin Belousov if (td->td_proc == p) { 15976ddcc233SKonstantin 
Belousov PROC_SLOCK_ASSERT(p, MA_OWNED); 159835c32a76SDavid Xu p->p_suspcount--; 159984cdea97SKonstantin Belousov if (boundary && (td->td_flags & TDF_BOUNDARY) != 0) { 160084cdea97SKonstantin Belousov td->td_flags &= ~TDF_BOUNDARY; 160184cdea97SKonstantin Belousov p->p_boundary_count--; 160284cdea97SKonstantin Belousov } 16036ddcc233SKonstantin Belousov } 160461a74c5cSJeff Roberson return (setrunnable(td, 0)); 160535c32a76SDavid Xu } 160635c32a76SDavid Xu 1607af928fdeSKonstantin Belousov void 1608af928fdeSKonstantin Belousov thread_run_flash(struct thread *td) 1609af928fdeSKonstantin Belousov { 1610af928fdeSKonstantin Belousov struct proc *p; 1611af928fdeSKonstantin Belousov 1612af928fdeSKonstantin Belousov p = td->td_proc; 1613af928fdeSKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 1614af928fdeSKonstantin Belousov 1615af928fdeSKonstantin Belousov if (TD_ON_SLEEPQ(td)) 1616af928fdeSKonstantin Belousov sleepq_remove_nested(td); 1617af928fdeSKonstantin Belousov else 1618af928fdeSKonstantin Belousov thread_lock(td); 1619af928fdeSKonstantin Belousov 1620af928fdeSKonstantin Belousov THREAD_LOCK_ASSERT(td, MA_OWNED); 1621af928fdeSKonstantin Belousov KASSERT(TD_IS_SUSPENDED(td), ("Thread not suspended")); 1622af928fdeSKonstantin Belousov 1623af928fdeSKonstantin Belousov TD_CLR_SUSPENDED(td); 1624af928fdeSKonstantin Belousov PROC_SLOCK(p); 1625af928fdeSKonstantin Belousov MPASS(p->p_suspcount > 0); 1626af928fdeSKonstantin Belousov p->p_suspcount--; 1627af928fdeSKonstantin Belousov PROC_SUNLOCK(p); 1628af928fdeSKonstantin Belousov if (setrunnable(td, 0)) 1629af928fdeSKonstantin Belousov kick_proc0(); 1630af928fdeSKonstantin Belousov } 1631af928fdeSKonstantin Belousov 163244990b8cSJulian Elischer /* 163344990b8cSJulian Elischer * Allow all threads blocked by single threading to continue running. 
163444990b8cSJulian Elischer */ 163544990b8cSJulian Elischer void 163644990b8cSJulian Elischer thread_unsuspend(struct proc *p) 163744990b8cSJulian Elischer { 163844990b8cSJulian Elischer struct thread *td; 16397847a9daSJohn Baldwin int wakeup_swapper; 164044990b8cSJulian Elischer 164144990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 16427b4a950aSDavid Xu PROC_SLOCK_ASSERT(p, MA_OWNED); 16437847a9daSJohn Baldwin wakeup_swapper = 0; 164444990b8cSJulian Elischer if (!P_SHOULDSTOP(p)) { 1645ad1e7d28SJulian Elischer FOREACH_THREAD_IN_PROC(p, td) { 1646a54e85fdSJeff Roberson thread_lock(td); 1647f829268bSKonstantin Belousov if (TD_IS_SUSPENDED(td)) 164884cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td, p, 164984cdea97SKonstantin Belousov true); 1650f829268bSKonstantin Belousov else 1651a54e85fdSJeff Roberson thread_unlock(td); 1652ad1e7d28SJulian Elischer } 165384cdea97SKonstantin Belousov } else if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE && 165484cdea97SKonstantin Belousov p->p_numthreads == p->p_suspcount) { 165544990b8cSJulian Elischer /* 165644990b8cSJulian Elischer * Stopping everything also did the job for the single 165744990b8cSJulian Elischer * threading request. Now we've downgraded to single-threaded, 165844990b8cSJulian Elischer * let it continue. 165944990b8cSJulian Elischer */ 16606ddcc233SKonstantin Belousov if (p->p_singlethread->td_proc == p) { 1661a54e85fdSJeff Roberson thread_lock(p->p_singlethread); 16626ddcc233SKonstantin Belousov wakeup_swapper = thread_unsuspend_one( 166384cdea97SKonstantin Belousov p->p_singlethread, p, false); 166444990b8cSJulian Elischer } 16656ddcc233SKonstantin Belousov } 16667847a9daSJohn Baldwin if (wakeup_swapper) 16677847a9daSJohn Baldwin kick_proc0(); 166844990b8cSJulian Elischer } 166944990b8cSJulian Elischer 1670ed062c8dSJulian Elischer /* 1671ed062c8dSJulian Elischer * End the single threading mode.. 
1672ed062c8dSJulian Elischer */ 167344990b8cSJulian Elischer void 16746ddcc233SKonstantin Belousov thread_single_end(struct proc *p, int mode) 167544990b8cSJulian Elischer { 167644990b8cSJulian Elischer struct thread *td; 16777847a9daSJohn Baldwin int wakeup_swapper; 167844990b8cSJulian Elischer 16796ddcc233SKonstantin Belousov KASSERT(mode == SINGLE_EXIT || mode == SINGLE_BOUNDARY || 16806ddcc233SKonstantin Belousov mode == SINGLE_ALLPROC || mode == SINGLE_NO_EXIT, 16816ddcc233SKonstantin Belousov ("invalid mode %d", mode)); 168244990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 16836ddcc233SKonstantin Belousov KASSERT((mode == SINGLE_ALLPROC && (p->p_flag & P_TOTAL_STOP) != 0) || 16846ddcc233SKonstantin Belousov (mode != SINGLE_ALLPROC && (p->p_flag & P_TOTAL_STOP) == 0), 16856ddcc233SKonstantin Belousov ("mode %d does not match P_TOTAL_STOP", mode)); 168684cdea97SKonstantin Belousov KASSERT(mode == SINGLE_ALLPROC || p->p_singlethread == curthread, 168784cdea97SKonstantin Belousov ("thread_single_end from other thread %p %p", 168884cdea97SKonstantin Belousov curthread, p->p_singlethread)); 168984cdea97SKonstantin Belousov KASSERT(mode != SINGLE_BOUNDARY || 169084cdea97SKonstantin Belousov (p->p_flag & P_SINGLE_BOUNDARY) != 0, 169184cdea97SKonstantin Belousov ("mis-matched SINGLE_BOUNDARY flags %x", p->p_flag)); 16926ddcc233SKonstantin Belousov p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT | P_SINGLE_BOUNDARY | 16936ddcc233SKonstantin Belousov P_TOTAL_STOP); 16947b4a950aSDavid Xu PROC_SLOCK(p); 169544990b8cSJulian Elischer p->p_singlethread = NULL; 16967847a9daSJohn Baldwin wakeup_swapper = 0; 169749539972SJulian Elischer /* 16987847a9daSJohn Baldwin * If there are other threads they may now run, 169949539972SJulian Elischer * unless of course there is a blanket 'stop order' 170049539972SJulian Elischer * on the process. The single threader must be allowed 170149539972SJulian Elischer * to continue however as this is a bad place to stop. 
170249539972SJulian Elischer */ 17036ddcc233SKonstantin Belousov if (p->p_numthreads != remain_for_mode(mode) && !P_SHOULDSTOP(p)) { 1704ad1e7d28SJulian Elischer FOREACH_THREAD_IN_PROC(p, td) { 1705a54e85fdSJeff Roberson thread_lock(td); 1706ad1e7d28SJulian Elischer if (TD_IS_SUSPENDED(td)) { 170784cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td, p, 17082d5ef216SMark Johnston true); 170961a74c5cSJeff Roberson } else 1710a54e85fdSJeff Roberson thread_unlock(td); 171149539972SJulian Elischer } 1712ad1e7d28SJulian Elischer } 171384cdea97SKonstantin Belousov KASSERT(mode != SINGLE_BOUNDARY || p->p_boundary_count == 0, 171484cdea97SKonstantin Belousov ("inconsistent boundary count %d", p->p_boundary_count)); 17157b4a950aSDavid Xu PROC_SUNLOCK(p); 17167847a9daSJohn Baldwin if (wakeup_swapper) 17177847a9daSJohn Baldwin kick_proc0(); 1718d7a9e6e7SKonstantin Belousov wakeup(&p->p_flag); 171949539972SJulian Elischer } 17204fc21c09SDaniel Eischen 1721aae3547bSMateusz Guzik /* 1722aae3547bSMateusz Guzik * Locate a thread by number and return with proc lock held. 1723aae3547bSMateusz Guzik * 1724aae3547bSMateusz Guzik * thread exit establishes proc -> tidhash lock ordering, but lookup 1725aae3547bSMateusz Guzik * takes tidhash first and needs to return locked proc. 
1726aae3547bSMateusz Guzik * 1727aae3547bSMateusz Guzik * The problem is worked around by relying on type-safety of both 1728aae3547bSMateusz Guzik * structures and doing the work in 2 steps: 1729aae3547bSMateusz Guzik * - tidhash-locked lookup which saves both thread and proc pointers 1730aae3547bSMateusz Guzik * - proc-locked verification that the found thread still matches 1731aae3547bSMateusz Guzik */ 1732aae3547bSMateusz Guzik static bool 1733aae3547bSMateusz Guzik tdfind_hash(lwpid_t tid, pid_t pid, struct proc **pp, struct thread **tdp) 1734cf7d9a8cSDavid Xu { 1735cf7d9a8cSDavid Xu #define RUN_THRESH 16 1736aae3547bSMateusz Guzik struct proc *p; 1737cf7d9a8cSDavid Xu struct thread *td; 1738aae3547bSMateusz Guzik int run; 1739aae3547bSMateusz Guzik bool locked; 1740cf7d9a8cSDavid Xu 1741aae3547bSMateusz Guzik run = 0; 174226007fe3SMateusz Guzik rw_rlock(TIDHASHLOCK(tid)); 1743aae3547bSMateusz Guzik locked = true; 1744cf7d9a8cSDavid Xu LIST_FOREACH(td, TIDHASH(tid), td_hash) { 1745aae3547bSMateusz Guzik if (td->td_tid != tid) { 1746aae3547bSMateusz Guzik run++; 1747aae3547bSMateusz Guzik continue; 1748cf7d9a8cSDavid Xu } 1749aae3547bSMateusz Guzik p = td->td_proc; 1750aae3547bSMateusz Guzik if (pid != -1 && p->p_pid != pid) { 1751cf7d9a8cSDavid Xu td = NULL; 1752cf7d9a8cSDavid Xu break; 1753cf7d9a8cSDavid Xu } 1754cf7d9a8cSDavid Xu if (run > RUN_THRESH) { 175526007fe3SMateusz Guzik if (rw_try_upgrade(TIDHASHLOCK(tid))) { 1756cf7d9a8cSDavid Xu LIST_REMOVE(td, td_hash); 1757cf7d9a8cSDavid Xu LIST_INSERT_HEAD(TIDHASH(td->td_tid), 1758cf7d9a8cSDavid Xu td, td_hash); 175926007fe3SMateusz Guzik rw_wunlock(TIDHASHLOCK(tid)); 1760aae3547bSMateusz Guzik locked = false; 1761aae3547bSMateusz Guzik break; 1762cf7d9a8cSDavid Xu } 1763cf7d9a8cSDavid Xu } 1764cf7d9a8cSDavid Xu break; 1765cf7d9a8cSDavid Xu } 1766aae3547bSMateusz Guzik if (locked) 176726007fe3SMateusz Guzik rw_runlock(TIDHASHLOCK(tid)); 1768aae3547bSMateusz Guzik if (td == NULL) 1769aae3547bSMateusz Guzik 
return (false); 1770aae3547bSMateusz Guzik *pp = p; 1771aae3547bSMateusz Guzik *tdp = td; 1772aae3547bSMateusz Guzik return (true); 1773aae3547bSMateusz Guzik } 1774aae3547bSMateusz Guzik 1775aae3547bSMateusz Guzik struct thread * 1776aae3547bSMateusz Guzik tdfind(lwpid_t tid, pid_t pid) 1777aae3547bSMateusz Guzik { 1778aae3547bSMateusz Guzik struct proc *p; 1779aae3547bSMateusz Guzik struct thread *td; 1780aae3547bSMateusz Guzik 1781aae3547bSMateusz Guzik td = curthread; 1782aae3547bSMateusz Guzik if (td->td_tid == tid) { 1783aae3547bSMateusz Guzik if (pid != -1 && td->td_proc->p_pid != pid) 1784aae3547bSMateusz Guzik return (NULL); 1785aae3547bSMateusz Guzik PROC_LOCK(td->td_proc); 1786cf7d9a8cSDavid Xu return (td); 1787cf7d9a8cSDavid Xu } 1788cf7d9a8cSDavid Xu 1789aae3547bSMateusz Guzik for (;;) { 1790aae3547bSMateusz Guzik if (!tdfind_hash(tid, pid, &p, &td)) 1791aae3547bSMateusz Guzik return (NULL); 1792aae3547bSMateusz Guzik PROC_LOCK(p); 1793aae3547bSMateusz Guzik if (td->td_tid != tid) { 1794aae3547bSMateusz Guzik PROC_UNLOCK(p); 1795aae3547bSMateusz Guzik continue; 1796aae3547bSMateusz Guzik } 1797aae3547bSMateusz Guzik if (td->td_proc != p) { 1798aae3547bSMateusz Guzik PROC_UNLOCK(p); 1799aae3547bSMateusz Guzik continue; 1800aae3547bSMateusz Guzik } 1801aae3547bSMateusz Guzik if (p->p_state == PRS_NEW) { 1802aae3547bSMateusz Guzik PROC_UNLOCK(p); 1803aae3547bSMateusz Guzik return (NULL); 1804aae3547bSMateusz Guzik } 1805aae3547bSMateusz Guzik return (td); 1806aae3547bSMateusz Guzik } 1807aae3547bSMateusz Guzik } 1808aae3547bSMateusz Guzik 1809cf7d9a8cSDavid Xu void 1810cf7d9a8cSDavid Xu tidhash_add(struct thread *td) 1811cf7d9a8cSDavid Xu { 181226007fe3SMateusz Guzik rw_wlock(TIDHASHLOCK(td->td_tid)); 1813cf7d9a8cSDavid Xu LIST_INSERT_HEAD(TIDHASH(td->td_tid), td, td_hash); 181426007fe3SMateusz Guzik rw_wunlock(TIDHASHLOCK(td->td_tid)); 1815cf7d9a8cSDavid Xu } 1816cf7d9a8cSDavid Xu 1817cf7d9a8cSDavid Xu void 1818cf7d9a8cSDavid Xu tidhash_remove(struct 
thread *td) 1819cf7d9a8cSDavid Xu { 182026007fe3SMateusz Guzik 182126007fe3SMateusz Guzik rw_wlock(TIDHASHLOCK(td->td_tid)); 1822cf7d9a8cSDavid Xu LIST_REMOVE(td, td_hash); 182326007fe3SMateusz Guzik rw_wunlock(TIDHASHLOCK(td->td_tid)); 1824cf7d9a8cSDavid Xu } 1825