19454b2d8SWarner Losh /*- 28a36da99SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 38a36da99SPedro F. Giffuni * 444990b8cSJulian Elischer * Copyright (C) 2001 Julian Elischer <julian@freebsd.org>. 544990b8cSJulian Elischer * All rights reserved. 644990b8cSJulian Elischer * 744990b8cSJulian Elischer * Redistribution and use in source and binary forms, with or without 844990b8cSJulian Elischer * modification, are permitted provided that the following conditions 944990b8cSJulian Elischer * are met: 1044990b8cSJulian Elischer * 1. Redistributions of source code must retain the above copyright 1144990b8cSJulian Elischer * notice(s), this list of conditions and the following disclaimer as 1244990b8cSJulian Elischer * the first lines of this file unmodified other than the possible 1344990b8cSJulian Elischer * addition of one or more copyright notices. 1444990b8cSJulian Elischer * 2. Redistributions in binary form must reproduce the above copyright 1544990b8cSJulian Elischer * notice(s), this list of conditions and the following disclaimer in the 1644990b8cSJulian Elischer * documentation and/or other materials provided with the distribution. 1744990b8cSJulian Elischer * 1844990b8cSJulian Elischer * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) ``AS IS'' AND ANY 1944990b8cSJulian Elischer * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED 2044990b8cSJulian Elischer * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 2144990b8cSJulian Elischer * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY 2244990b8cSJulian Elischer * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES 2344990b8cSJulian Elischer * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 2444990b8cSJulian Elischer * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 2544990b8cSJulian Elischer * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 2644990b8cSJulian Elischer * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 2744990b8cSJulian Elischer * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH 2844990b8cSJulian Elischer * DAMAGE. 2944990b8cSJulian Elischer */ 3044990b8cSJulian Elischer 313d06b4b3SAttilio Rao #include "opt_witness.h" 3216d95d4fSJoseph Koshy #include "opt_hwpmc_hooks.h" 333d06b4b3SAttilio Rao 34677b542eSDavid E. O'Brien #include <sys/cdefs.h> 35677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 36677b542eSDavid E. O'Brien 3744990b8cSJulian Elischer #include <sys/param.h> 3844990b8cSJulian Elischer #include <sys/systm.h> 3944990b8cSJulian Elischer #include <sys/kernel.h> 4044990b8cSJulian Elischer #include <sys/lock.h> 4144990b8cSJulian Elischer #include <sys/mutex.h> 4244990b8cSJulian Elischer #include <sys/proc.h> 4335bb59edSMateusz Guzik #include <sys/bitstring.h> 446febf180SGleb Smirnoff #include <sys/epoch.h> 458f0e9130SKonstantin Belousov #include <sys/rangelock.h> 46e170bfdaSDavid Xu #include <sys/resourcevar.h> 47b3e9e682SRyan Stone #include <sys/sdt.h> 4894e0a4cdSJulian Elischer #include <sys/smp.h> 49de028f5aSJeff Roberson #include <sys/sched.h> 5044f3b092SJohn Baldwin #include <sys/sleepqueue.h> 51ace8398dSJeff Roberson #include <sys/selinfo.h> 52d1e7a4a5SJohn Baldwin #include <sys/syscallsubr.h> 5391d1786fSDmitry Chagin #include <sys/sysent.h> 54961a7b24SJohn Baldwin #include <sys/turnstile.h> 5544990b8cSJulian Elischer #include <sys/ktr.h> 56cf7d9a8cSDavid Xu #include <sys/rwlock.h> 57bc8e6d81SDavid Xu #include <sys/umtx.h> 589ed01c32SGleb Smirnoff #include <sys/vmmeter.h> 59d7f687fcSJeff Roberson #include <sys/cpuset.h> 6016d95d4fSJoseph Koshy #ifdef HWPMC_HOOKS 6116d95d4fSJoseph Koshy #include <sys/pmckern.h> 6216d95d4fSJoseph Koshy #endif 631bd3cf5dSMateusz Guzik #include <sys/priv.h> 6444990b8cSJulian Elischer 65911b84b0SRobert Watson #include <security/audit/audit.h> 66911b84b0SRobert Watson 6744990b8cSJulian Elischer #include <vm/vm.h> 6849a2507bSAlan Cox #include <vm/vm_extern.h> 6944990b8cSJulian Elischer #include <vm/uma.h> 70b209f889SRandall Stewart #include <sys/eventhandler.h> 7102fb42b0SPeter Wemm 72acd9f517SKonstantin Belousov /* 73acd9f517SKonstantin Belousov * Asserts below verify the stability of struct thread and struct proc 74acd9f517SKonstantin Belousov * layout, as exposed by KBI to modules. On head, the KBI is allowed 75acd9f517SKonstantin Belousov * to drift, change to the structures must be accompanied by the 76acd9f517SKonstantin Belousov * assert update. 77acd9f517SKonstantin Belousov * 78acd9f517SKonstantin Belousov * On the stable branches after KBI freeze, conditions must not be 79acd9f517SKonstantin Belousov * violated. Typically new fields are moved to the end of the 80acd9f517SKonstantin Belousov * structures. 81acd9f517SKonstantin Belousov */ 82acd9f517SKonstantin Belousov #ifdef __amd64__ 833f289c3fSJeff Roberson _Static_assert(offsetof(struct thread, td_flags) == 0xfc, 84acd9f517SKonstantin Belousov "struct thread KBI td_flags"); 853f289c3fSJeff Roberson _Static_assert(offsetof(struct thread, td_pflags) == 0x104, 86acd9f517SKonstantin Belousov "struct thread KBI td_pflags"); 871e2521ffSEdward Tomasz Napierala _Static_assert(offsetof(struct thread, td_frame) == 0x4a0, 88acd9f517SKonstantin Belousov "struct thread KBI td_frame"); 891724c563SMateusz Guzik _Static_assert(offsetof(struct thread, td_emuldata) == 0x6b0, 90acd9f517SKonstantin Belousov "struct thread KBI td_emuldata"); 91acd9f517SKonstantin Belousov _Static_assert(offsetof(struct proc, p_flag) == 0xb0, 92acd9f517SKonstantin Belousov "struct proc KBI p_flag"); 93acd9f517SKonstantin Belousov _Static_assert(offsetof(struct proc, p_pid) == 0xbc, 94acd9f517SKonstantin Belousov "struct proc KBI p_pid"); 958de97f39SRick Macklem _Static_assert(offsetof(struct proc, p_filemon) == 0x3b8, 96acd9f517SKonstantin Belousov "struct proc KBI p_filemon"); 978de97f39SRick Macklem _Static_assert(offsetof(struct proc, p_comm) == 0x3d0, 98acd9f517SKonstantin Belousov "struct proc KBI p_comm"); 998de97f39SRick Macklem _Static_assert(offsetof(struct proc, p_emuldata) == 0x4b0, 100acd9f517SKonstantin Belousov "struct proc KBI p_emuldata"); 101acd9f517SKonstantin Belousov #endif 102acd9f517SKonstantin Belousov #ifdef __i386__ 1033f289c3fSJeff Roberson _Static_assert(offsetof(struct thread, td_flags) == 0x98, 104acd9f517SKonstantin Belousov "struct thread KBI td_flags"); 1053f289c3fSJeff Roberson _Static_assert(offsetof(struct thread, td_pflags) == 0xa0, 106acd9f517SKonstantin Belousov "struct thread KBI td_pflags"); 1071e2521ffSEdward Tomasz Napierala _Static_assert(offsetof(struct thread, td_frame) == 0x300, 108acd9f517SKonstantin Belousov "struct thread KBI td_frame"); 1091e2521ffSEdward Tomasz Napierala _Static_assert(offsetof(struct thread, td_emuldata) == 0x344, 110acd9f517SKonstantin Belousov "struct thread KBI td_emuldata"); 111acd9f517SKonstantin Belousov _Static_assert(offsetof(struct proc, p_flag) == 0x68, 112acd9f517SKonstantin Belousov "struct proc KBI p_flag"); 113acd9f517SKonstantin Belousov _Static_assert(offsetof(struct proc, p_pid) == 0x74, 114acd9f517SKonstantin Belousov "struct proc KBI p_pid"); 1158de97f39SRick Macklem _Static_assert(offsetof(struct proc, p_filemon) == 0x268, 116acd9f517SKonstantin Belousov "struct proc KBI p_filemon"); 1178de97f39SRick Macklem _Static_assert(offsetof(struct proc, p_comm) == 0x27c, 118acd9f517SKonstantin Belousov "struct proc KBI p_comm"); 1198de97f39SRick Macklem _Static_assert(offsetof(struct proc, p_emuldata) == 0x308, 120acd9f517SKonstantin Belousov "struct proc KBI p_emuldata"); 121acd9f517SKonstantin Belousov #endif 122acd9f517SKonstantin Belousov 123b3e9e682SRyan Stone SDT_PROVIDER_DECLARE(proc); 124d9fae5abSAndriy Gapon SDT_PROBE_DEFINE(proc, , , lwp__exit); 125b3e9e682SRyan Stone 1268460a577SJohn Birrell /* 1278460a577SJohn Birrell * thread related storage. 1288460a577SJohn Birrell */ 12944990b8cSJulian Elischer static uma_zone_t thread_zone; 13044990b8cSJulian Elischer 1315215b187SJeff Roberson TAILQ_HEAD(, thread) zombie_threads = TAILQ_HEAD_INITIALIZER(zombie_threads); 132c8790f5dSAttilio Rao static struct mtx zombie_lock; 133a54e85fdSJeff Roberson MTX_SYSINIT(zombie_lock, &zombie_lock, "zombie lock", MTX_SPIN); 13444990b8cSJulian Elischer 135ff8fbcffSJeff Roberson static void thread_zombie(struct thread *); 13684cdea97SKonstantin Belousov static int thread_unsuspend_one(struct thread *td, struct proc *p, 13784cdea97SKonstantin Belousov bool boundary); 138ff8fbcffSJeff Roberson 139ec6ea5e8SDavid Xu #define TID_BUFFER_SIZE 1024 140ec6ea5e8SDavid Xu 141*934e7e5eSMateusz Guzik static struct mtx tid_lock; 142*934e7e5eSMateusz Guzik static bitstr_t *tid_bitmap; 14335bb59edSMateusz Guzik 144cf7d9a8cSDavid Xu static MALLOC_DEFINE(M_TIDHASH, "tidhash", "thread hash"); 145cf7d9a8cSDavid Xu 1461bd3cf5dSMateusz Guzik static int maxthread; 1471bd3cf5dSMateusz Guzik SYSCTL_INT(_kern, OID_AUTO, maxthread, CTLFLAG_RDTUN, 1481bd3cf5dSMateusz Guzik &maxthread, 0, "Maximum number of threads"); 1491bd3cf5dSMateusz Guzik 1501bd3cf5dSMateusz Guzik static int nthreads; 1511bd3cf5dSMateusz Guzik 152cf7d9a8cSDavid Xu struct tidhashhead *tidhashtbl; 153cf7d9a8cSDavid Xu u_long tidhash; 154cf7d9a8cSDavid Xu struct rwlock tidhash_lock; 155cf7d9a8cSDavid Xu 1562ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_ctor); 1572ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_dtor); 1582ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_init); 1592ca45184SMatt Joras EVENTHANDLER_LIST_DEFINE(thread_fini); 1602ca45184SMatt Joras 161ec6ea5e8SDavid Xu static lwpid_t 162ec6ea5e8SDavid Xu tid_alloc(void) 163ec6ea5e8SDavid Xu { 1641bd3cf5dSMateusz Guzik static struct timeval lastfail; 1651bd3cf5dSMateusz Guzik static int curfail; 16635bb59edSMateusz Guzik static lwpid_t trytid; 167ec6ea5e8SDavid Xu lwpid_t tid; 168ec6ea5e8SDavid Xu 16935bb59edSMateusz Guzik mtx_lock(&tid_lock); 17035bb59edSMateusz Guzik if (nthreads + 1 >= maxthread - 100) { 1711bd3cf5dSMateusz Guzik if (priv_check_cred(curthread->td_ucred, PRIV_MAXPROC) != 0 || 17235bb59edSMateusz Guzik nthreads + 1 >= maxthread) { 17335bb59edSMateusz Guzik mtx_unlock(&tid_lock); 1741bd3cf5dSMateusz Guzik if (ppsratecheck(&lastfail, &curfail, 1)) { 1751bd3cf5dSMateusz Guzik printf("maxthread limit exceeded by uid %u " 1761bd3cf5dSMateusz Guzik "(pid %d); consider increasing kern.maxthread\n", 1771bd3cf5dSMateusz Guzik curthread->td_ucred->cr_ruid, curproc->p_pid); 1781bd3cf5dSMateusz Guzik } 1791bd3cf5dSMateusz Guzik return (-1); 1801bd3cf5dSMateusz Guzik } 1811bd3cf5dSMateusz Guzik } 1821bd3cf5dSMateusz Guzik 18335bb59edSMateusz Guzik nthreads++; 18435bb59edSMateusz Guzik /* 18535bb59edSMateusz Guzik * It is an invariant that the bitmap is big enough to hold maxthread 18635bb59edSMateusz Guzik * IDs. If we got to this point there has to be at least one free. 18735bb59edSMateusz Guzik */ 18835bb59edSMateusz Guzik if (trytid >= maxthread) 18935bb59edSMateusz Guzik trytid = 0; 19035bb59edSMateusz Guzik bit_ffc_at(tid_bitmap, trytid, maxthread, &tid); 19135bb59edSMateusz Guzik if (tid == -1) { 19235bb59edSMateusz Guzik KASSERT(trytid != 0, ("unexpectedly ran out of IDs")); 19335bb59edSMateusz Guzik trytid = 0; 19435bb59edSMateusz Guzik bit_ffc_at(tid_bitmap, trytid, maxthread, &tid); 19535bb59edSMateusz Guzik KASSERT(tid != -1, ("unexpectedly ran out of IDs")); 196ec6ea5e8SDavid Xu } 19735bb59edSMateusz Guzik bit_set(tid_bitmap, tid); 198*934e7e5eSMateusz Guzik trytid = tid + 1; 199ec6ea5e8SDavid Xu mtx_unlock(&tid_lock); 20035bb59edSMateusz Guzik return (tid + NO_PID); 201ec6ea5e8SDavid Xu } 202ec6ea5e8SDavid Xu 203ec6ea5e8SDavid Xu static void 20435bb59edSMateusz Guzik tid_free(lwpid_t rtid) 205ec6ea5e8SDavid Xu { 20635bb59edSMateusz Guzik lwpid_t tid; 207ec6ea5e8SDavid Xu 20835bb59edSMateusz Guzik KASSERT(rtid >= NO_PID, 20935bb59edSMateusz Guzik ("%s: invalid tid %d\n", __func__, rtid)); 21035bb59edSMateusz Guzik tid = rtid - NO_PID; 211ec6ea5e8SDavid Xu mtx_lock(&tid_lock); 21235bb59edSMateusz Guzik KASSERT(bit_test(tid_bitmap, tid) != 0, 21335bb59edSMateusz Guzik ("thread ID %d not allocated\n", rtid)); 21435bb59edSMateusz Guzik bit_clear(tid_bitmap, tid); 21535bb59edSMateusz Guzik nthreads--; 216ec6ea5e8SDavid Xu mtx_unlock(&tid_lock); 217ec6ea5e8SDavid Xu } 218ec6ea5e8SDavid Xu 219fdcac928SMarcel Moolenaar /* 220696058c3SJulian Elischer * Prepare a thread for use. 22144990b8cSJulian Elischer */ 222b23f72e9SBrian Feldman static int 223b23f72e9SBrian Feldman thread_ctor(void *mem, int size, void *arg, int flags) 22444990b8cSJulian Elischer { 22544990b8cSJulian Elischer struct thread *td; 22644990b8cSJulian Elischer 22744990b8cSJulian Elischer td = (struct thread *)mem; 22871fad9fdSJulian Elischer td->td_state = TDS_INACTIVE; 22994dd54b9SKonstantin Belousov td->td_lastcpu = td->td_oncpu = NOCPU; 2306c27c603SJuli Mallett 2316c27c603SJuli Mallett /* 2326c27c603SJuli Mallett * Note that td_critnest begins life as 1 because the thread is not 2336c27c603SJuli Mallett * running and is thereby implicitly waiting to be on the receiving 234a54e85fdSJeff Roberson * end of a context switch. 2356c27c603SJuli Mallett */ 236139b7550SJohn Baldwin td->td_critnest = 1; 237acbe332aSDavid Xu td->td_lend_user_pri = PRI_MAX; 238911b84b0SRobert Watson #ifdef AUDIT 239911b84b0SRobert Watson audit_thread_alloc(td); 240911b84b0SRobert Watson #endif 241d10183d9SDavid Xu umtx_thread_alloc(td); 242b23f72e9SBrian Feldman return (0); 24344990b8cSJulian Elischer } 24444990b8cSJulian Elischer 24544990b8cSJulian Elischer /* 24644990b8cSJulian Elischer * Reclaim a thread after use. 24744990b8cSJulian Elischer */ 24844990b8cSJulian Elischer static void 24944990b8cSJulian Elischer thread_dtor(void *mem, int size, void *arg) 25044990b8cSJulian Elischer { 25144990b8cSJulian Elischer struct thread *td; 25244990b8cSJulian Elischer 25344990b8cSJulian Elischer td = (struct thread *)mem; 25444990b8cSJulian Elischer 25544990b8cSJulian Elischer #ifdef INVARIANTS 25644990b8cSJulian Elischer /* Verify that this thread is in a safe state to free. */ 25744990b8cSJulian Elischer switch (td->td_state) { 25871fad9fdSJulian Elischer case TDS_INHIBITED: 25971fad9fdSJulian Elischer case TDS_RUNNING: 26071fad9fdSJulian Elischer case TDS_CAN_RUN: 26144990b8cSJulian Elischer case TDS_RUNQ: 26244990b8cSJulian Elischer /* 26344990b8cSJulian Elischer * We must never unlink a thread that is in one of 26444990b8cSJulian Elischer * these states, because it is currently active. 26544990b8cSJulian Elischer */ 26644990b8cSJulian Elischer panic("bad state for thread unlinking"); 26744990b8cSJulian Elischer /* NOTREACHED */ 26871fad9fdSJulian Elischer case TDS_INACTIVE: 26944990b8cSJulian Elischer break; 27044990b8cSJulian Elischer default: 27144990b8cSJulian Elischer panic("bad thread state"); 27244990b8cSJulian Elischer /* NOTREACHED */ 27344990b8cSJulian Elischer } 27444990b8cSJulian Elischer #endif 2756e8525ceSRobert Watson #ifdef AUDIT 2766e8525ceSRobert Watson audit_thread_free(td); 2776e8525ceSRobert Watson #endif 2781ba4a712SPawel Jakub Dawidek /* Free all OSD associated to this thread. */ 2791ba4a712SPawel Jakub Dawidek osd_thread_exit(td); 280aca4bb91SKonstantin Belousov td_softdep_cleanup(td); 281aca4bb91SKonstantin Belousov MPASS(td->td_su == NULL); 28244990b8cSJulian Elischer } 28344990b8cSJulian Elischer 28444990b8cSJulian Elischer /* 28544990b8cSJulian Elischer * Initialize type-stable parts of a thread (when newly created). 28644990b8cSJulian Elischer */ 287b23f72e9SBrian Feldman static int 288b23f72e9SBrian Feldman thread_init(void *mem, int size, int flags) 28944990b8cSJulian Elischer { 29044990b8cSJulian Elischer struct thread *td; 29144990b8cSJulian Elischer 29244990b8cSJulian Elischer td = (struct thread *)mem; 293247aba24SMarcel Moolenaar 29444f3b092SJohn Baldwin td->td_sleepqueue = sleepq_alloc(); 295961a7b24SJohn Baldwin td->td_turnstile = turnstile_alloc(); 2968f0e9130SKonstantin Belousov td->td_rlqe = NULL; 2972ca45184SMatt Joras EVENTHANDLER_DIRECT_INVOKE(thread_init, td); 298d10183d9SDavid Xu umtx_thread_init(td); 29989b57fcfSKonstantin Belousov td->td_kstack = 0; 300ad8b1d85SKonstantin Belousov td->td_sel = NULL; 301b23f72e9SBrian Feldman return (0); 30244990b8cSJulian Elischer } 30344990b8cSJulian Elischer 30444990b8cSJulian Elischer /* 30544990b8cSJulian Elischer * Tear down type-stable parts of a thread (just before being discarded). 30644990b8cSJulian Elischer */ 30744990b8cSJulian Elischer static void 30844990b8cSJulian Elischer thread_fini(void *mem, int size) 30944990b8cSJulian Elischer { 31044990b8cSJulian Elischer struct thread *td; 31144990b8cSJulian Elischer 31244990b8cSJulian Elischer td = (struct thread *)mem; 3132ca45184SMatt Joras EVENTHANDLER_DIRECT_INVOKE(thread_fini, td); 3148f0e9130SKonstantin Belousov rlqentry_free(td->td_rlqe); 315961a7b24SJohn Baldwin turnstile_free(td->td_turnstile); 31644f3b092SJohn Baldwin sleepq_free(td->td_sleepqueue); 317d10183d9SDavid Xu umtx_thread_fini(td); 318ace8398dSJeff Roberson seltdfini(td); 31944990b8cSJulian Elischer } 3205215b187SJeff Roberson 3215c8329edSJulian Elischer /* 3225215b187SJeff Roberson * For a newly created process, 3235215b187SJeff Roberson * link up all the structures and its initial threads etc. 324ed062c8dSJulian Elischer * called from: 325e7d939bdSMarcel Moolenaar * {arch}/{arch}/machdep.c {arch}_init(), init386() etc. 326ed062c8dSJulian Elischer * proc_dtor() (should go away) 327ed062c8dSJulian Elischer * proc_init() 3285c8329edSJulian Elischer */ 3295c8329edSJulian Elischer void 33089b57fcfSKonstantin Belousov proc_linkup0(struct proc *p, struct thread *td) 33189b57fcfSKonstantin Belousov { 33289b57fcfSKonstantin Belousov TAILQ_INIT(&p->p_threads); /* all threads in proc */ 33389b57fcfSKonstantin Belousov proc_linkup(p, td); 33489b57fcfSKonstantin Belousov } 33589b57fcfSKonstantin Belousov 33689b57fcfSKonstantin Belousov void 3378460a577SJohn Birrell proc_linkup(struct proc *p, struct thread *td) 3385c8329edSJulian Elischer { 339a54e85fdSJeff Roberson 3409104847fSDavid Xu sigqueue_init(&p->p_sigqueue, p); 341ebceaf6dSDavid Xu p->p_ksi = ksiginfo_alloc(1); 342ebceaf6dSDavid Xu if (p->p_ksi != NULL) { 3435c474517SDavid Xu /* XXX p_ksi may be null if ksiginfo zone is not ready */ 344ebceaf6dSDavid Xu p->p_ksi->ksi_flags = KSI_EXT | KSI_INS; 345ebceaf6dSDavid Xu } 346b2f92ef9SDavid Xu LIST_INIT(&p->p_mqnotifier); 3475c8329edSJulian Elischer p->p_numthreads = 0; 3488460a577SJohn Birrell thread_link(td, p); 3495c8329edSJulian Elischer } 3505c8329edSJulian Elischer 3511bd3cf5dSMateusz Guzik extern int max_threads_per_proc; 3521bd3cf5dSMateusz Guzik 3535c8329edSJulian Elischer /* 35444990b8cSJulian Elischer * Initialize global thread allocation resources. 35544990b8cSJulian Elischer */ 35644990b8cSJulian Elischer void 35744990b8cSJulian Elischer threadinit(void) 35844990b8cSJulian Elischer { 3595aa5420fSMark Johnston uint32_t flags; 36044990b8cSJulian Elischer 3611bd3cf5dSMateusz Guzik /* 3621bd3cf5dSMateusz Guzik * Place an upper limit on threads which can be allocated. 3631bd3cf5dSMateusz Guzik * 3641bd3cf5dSMateusz Guzik * Note that other factors may make the de facto limit much lower. 3651bd3cf5dSMateusz Guzik * 3661bd3cf5dSMateusz Guzik * Platform limits are somewhat arbitrary but deemed "more than good 3671bd3cf5dSMateusz Guzik * enough" for the foreseable future. 3681bd3cf5dSMateusz Guzik */ 3691bd3cf5dSMateusz Guzik if (maxthread == 0) { 3701bd3cf5dSMateusz Guzik #ifdef _LP64 3711bd3cf5dSMateusz Guzik maxthread = MIN(maxproc * max_threads_per_proc, 1000000); 3721bd3cf5dSMateusz Guzik #else 3731bd3cf5dSMateusz Guzik maxthread = MIN(maxproc * max_threads_per_proc, 100000); 3741bd3cf5dSMateusz Guzik #endif 3751bd3cf5dSMateusz Guzik } 3761bd3cf5dSMateusz Guzik 3771ea7a6f8SPoul-Henning Kamp mtx_init(&tid_lock, "TID lock", NULL, MTX_DEF); 37835bb59edSMateusz Guzik tid_bitmap = bit_alloc(maxthread, M_TIDHASH, M_WAITOK); 3791ea7a6f8SPoul-Henning Kamp 3805aa5420fSMark Johnston flags = UMA_ZONE_NOFREE; 3815aa5420fSMark Johnston #ifdef __aarch64__ 3825aa5420fSMark Johnston /* 3835aa5420fSMark Johnston * Force thread structures to be allocated from the direct map. 3845aa5420fSMark Johnston * Otherwise, superpage promotions and demotions may temporarily 3855aa5420fSMark Johnston * invalidate thread structure mappings. For most dynamically allocated 3865aa5420fSMark Johnston * structures this is not a problem, but translation faults cannot be 3875aa5420fSMark Johnston * handled without accessing curthread. 3885aa5420fSMark Johnston */ 3895aa5420fSMark Johnston flags |= UMA_ZONE_CONTIG; 3905aa5420fSMark Johnston #endif 391de028f5aSJeff Roberson thread_zone = uma_zcreate("THREAD", sched_sizeof_thread(), 39244990b8cSJulian Elischer thread_ctor, thread_dtor, thread_init, thread_fini, 3935aa5420fSMark Johnston 32 - 1, flags); 394cf7d9a8cSDavid Xu tidhashtbl = hashinit(maxproc / 2, M_TIDHASH, &tidhash); 395cf7d9a8cSDavid Xu rw_init(&tidhash_lock, "tidhash"); 39644990b8cSJulian Elischer } 39744990b8cSJulian Elischer 39844990b8cSJulian Elischer /* 399ff8fbcffSJeff Roberson * Place an unused thread on the zombie list. 400ad1e7d28SJulian Elischer * Use the slpq as that must be unused by now. 40144990b8cSJulian Elischer */ 40244990b8cSJulian Elischer void 403ff8fbcffSJeff Roberson thread_zombie(struct thread *td) 40444990b8cSJulian Elischer { 405a54e85fdSJeff Roberson mtx_lock_spin(&zombie_lock); 406ad1e7d28SJulian Elischer TAILQ_INSERT_HEAD(&zombie_threads, td, td_slpq); 407a54e85fdSJeff Roberson mtx_unlock_spin(&zombie_lock); 40844990b8cSJulian Elischer } 40944990b8cSJulian Elischer 4105c8329edSJulian Elischer /* 411ff8fbcffSJeff Roberson * Release a thread that has exited after cpu_throw(). 412ff8fbcffSJeff Roberson */ 413ff8fbcffSJeff Roberson void 414ff8fbcffSJeff Roberson thread_stash(struct thread *td) 415ff8fbcffSJeff Roberson { 416ff8fbcffSJeff Roberson atomic_subtract_rel_int(&td->td_proc->p_exitthreads, 1); 417ff8fbcffSJeff Roberson thread_zombie(td); 418ff8fbcffSJeff Roberson } 419ff8fbcffSJeff Roberson 420ff8fbcffSJeff Roberson /* 4216617724cSJeff Roberson * Reap zombie resources. 42244990b8cSJulian Elischer */ 42344990b8cSJulian Elischer void 42444990b8cSJulian Elischer thread_reap(void) 42544990b8cSJulian Elischer { 4265c8329edSJulian Elischer struct thread *td_first, *td_next; 42744990b8cSJulian Elischer 42844990b8cSJulian Elischer /* 4295215b187SJeff Roberson * Don't even bother to lock if none at this instant, 4302d19b736SKonstantin Belousov * we really don't care about the next instant. 43144990b8cSJulian Elischer */ 4328460a577SJohn Birrell if (!TAILQ_EMPTY(&zombie_threads)) { 433a54e85fdSJeff Roberson mtx_lock_spin(&zombie_lock); 4345c8329edSJulian Elischer td_first = TAILQ_FIRST(&zombie_threads); 4355c8329edSJulian Elischer if (td_first) 4365c8329edSJulian Elischer TAILQ_INIT(&zombie_threads); 437a54e85fdSJeff Roberson mtx_unlock_spin(&zombie_lock); 4385c8329edSJulian Elischer while (td_first) { 439ad1e7d28SJulian Elischer td_next = TAILQ_NEXT(td_first, td_slpq); 4404ea6a9a2SMateusz Guzik thread_cow_free(td_first); 4415c8329edSJulian Elischer thread_free(td_first); 4425c8329edSJulian Elischer td_first = td_next; 44344990b8cSJulian Elischer } 44444990b8cSJulian Elischer } 445ed062c8dSJulian Elischer } 44644990b8cSJulian Elischer 4474f0db5e0SJulian Elischer /* 44844990b8cSJulian Elischer * Allocate a thread. 44944990b8cSJulian Elischer */ 45044990b8cSJulian Elischer struct thread * 4518a945d10SKonstantin Belousov thread_alloc(int pages) 45244990b8cSJulian Elischer { 45389b57fcfSKonstantin Belousov struct thread *td; 4541bd3cf5dSMateusz Guzik lwpid_t tid; 4558460a577SJohn Birrell 45644990b8cSJulian Elischer thread_reap(); /* check if any zombies to get */ 45789b57fcfSKonstantin Belousov 4581bd3cf5dSMateusz Guzik tid = tid_alloc(); 4591bd3cf5dSMateusz Guzik if (tid == -1) { 4601bd3cf5dSMateusz Guzik return (NULL); 4611bd3cf5dSMateusz Guzik } 4621bd3cf5dSMateusz Guzik 4631bd3cf5dSMateusz Guzik td = uma_zalloc(thread_zone, M_WAITOK); 46489b57fcfSKonstantin Belousov KASSERT(td->td_kstack == 0, ("thread_alloc got thread with kstack")); 4658a945d10SKonstantin Belousov if (!vm_thread_new(td, pages)) { 46689b57fcfSKonstantin Belousov uma_zfree(thread_zone, td); 4671bd3cf5dSMateusz Guzik tid_free(tid); 46889b57fcfSKonstantin Belousov return (NULL); 46989b57fcfSKonstantin Belousov } 4701bd3cf5dSMateusz Guzik td->td_tid = tid; 4710c3967e7SMarcel Moolenaar cpu_thread_alloc(td); 4721bd3cf5dSMateusz Guzik EVENTHANDLER_DIRECT_INVOKE(thread_ctor, td); 47389b57fcfSKonstantin Belousov return (td); 47444990b8cSJulian Elischer } 47544990b8cSJulian Elischer 4768a945d10SKonstantin Belousov int 4778a945d10SKonstantin Belousov thread_alloc_stack(struct thread *td, int pages) 4788a945d10SKonstantin Belousov { 4798a945d10SKonstantin Belousov 4808a945d10SKonstantin Belousov KASSERT(td->td_kstack == 0, 4818a945d10SKonstantin Belousov ("thread_alloc_stack called on a thread with kstack")); 4828a945d10SKonstantin Belousov if (!vm_thread_new(td, pages)) 4838a945d10SKonstantin Belousov return (0); 4848a945d10SKonstantin Belousov cpu_thread_alloc(td); 4858a945d10SKonstantin Belousov return (1); 4868a945d10SKonstantin Belousov } 4874f0db5e0SJulian Elischer 4884f0db5e0SJulian Elischer /* 48944990b8cSJulian Elischer * Deallocate a thread. 49044990b8cSJulian Elischer */ 49144990b8cSJulian Elischer void 49244990b8cSJulian Elischer thread_free(struct thread *td) 49344990b8cSJulian Elischer { 4942e6b8de4SJeff Roberson 4951bd3cf5dSMateusz Guzik EVENTHANDLER_DIRECT_INVOKE(thread_dtor, td); 4962e6b8de4SJeff Roberson lock_profile_thread_exit(td); 49745aea8deSJeff Roberson if (td->td_cpuset) 498d7f687fcSJeff Roberson cpuset_rel(td->td_cpuset); 499d7f687fcSJeff Roberson td->td_cpuset = NULL; 5000c3967e7SMarcel Moolenaar cpu_thread_free(td); 50189b57fcfSKonstantin Belousov if (td->td_kstack != 0) 50289b57fcfSKonstantin Belousov vm_thread_dispose(td); 5032d19b736SKonstantin Belousov callout_drain(&td->td_slpcallout); 5041bd3cf5dSMateusz Guzik tid_free(td->td_tid); 5051bd3cf5dSMateusz Guzik td->td_tid = -1; 50644990b8cSJulian Elischer uma_zfree(thread_zone, td); 50744990b8cSJulian Elischer } 50844990b8cSJulian Elischer 5094ea6a9a2SMateusz Guzik void 5104ea6a9a2SMateusz Guzik thread_cow_get_proc(struct thread *newtd, struct proc *p) 5114ea6a9a2SMateusz Guzik { 5124ea6a9a2SMateusz Guzik 5134ea6a9a2SMateusz Guzik PROC_LOCK_ASSERT(p, MA_OWNED); 5141724c563SMateusz Guzik newtd->td_realucred = crcowget(p->p_ucred); 5151724c563SMateusz Guzik newtd->td_ucred = newtd->td_realucred; 516f6f6d240SMateusz Guzik newtd->td_limit = lim_hold(p->p_limit); 5174ea6a9a2SMateusz Guzik newtd->td_cowgen = p->p_cowgen; 5184ea6a9a2SMateusz Guzik } 5194ea6a9a2SMateusz Guzik 5204ea6a9a2SMateusz Guzik void 5214ea6a9a2SMateusz Guzik thread_cow_get(struct thread *newtd, struct thread *td) 5224ea6a9a2SMateusz Guzik { 5234ea6a9a2SMateusz Guzik 5241724c563SMateusz Guzik MPASS(td->td_realucred == td->td_ucred); 5251724c563SMateusz Guzik newtd->td_realucred = crcowget(td->td_realucred); 5261724c563SMateusz Guzik newtd->td_ucred = newtd->td_realucred; 527f6f6d240SMateusz Guzik newtd->td_limit = lim_hold(td->td_limit); 5284ea6a9a2SMateusz Guzik newtd->td_cowgen = td->td_cowgen; 5294ea6a9a2SMateusz Guzik } 5304ea6a9a2SMateusz Guzik 5314ea6a9a2SMateusz Guzik void 5324ea6a9a2SMateusz Guzik thread_cow_free(struct thread *td) 5334ea6a9a2SMateusz Guzik { 5344ea6a9a2SMateusz Guzik 5351724c563SMateusz Guzik if (td->td_realucred != NULL) 5361724c563SMateusz Guzik crcowfree(td); 537cd672ca6SMateusz Guzik if (td->td_limit != NULL) 538f6f6d240SMateusz Guzik lim_free(td->td_limit); 5394ea6a9a2SMateusz Guzik } 5404ea6a9a2SMateusz Guzik 5414ea6a9a2SMateusz Guzik void 5424ea6a9a2SMateusz Guzik thread_cow_update(struct thread *td) 5434ea6a9a2SMateusz Guzik { 5444ea6a9a2SMateusz Guzik struct proc *p; 545cd672ca6SMateusz Guzik struct ucred *oldcred; 546cd672ca6SMateusz Guzik struct plimit *oldlimit; 5474ea6a9a2SMateusz Guzik 5484ea6a9a2SMateusz Guzik p = td->td_proc; 549cd672ca6SMateusz Guzik oldlimit = NULL; 5504ea6a9a2SMateusz Guzik PROC_LOCK(p); 5511724c563SMateusz Guzik oldcred = crcowsync(); 552cd672ca6SMateusz Guzik if (td->td_limit != p->p_limit) { 553cd672ca6SMateusz Guzik oldlimit = td->td_limit; 554cd672ca6SMateusz Guzik td->td_limit = lim_hold(p->p_limit); 555cd672ca6SMateusz Guzik } 5564ea6a9a2SMateusz Guzik td->td_cowgen = p->p_cowgen; 5574ea6a9a2SMateusz Guzik PROC_UNLOCK(p); 558cd672ca6SMateusz Guzik if (oldcred != NULL) 559cd672ca6SMateusz Guzik crfree(oldcred); 560cd672ca6SMateusz Guzik if (oldlimit != NULL) 561cd672ca6SMateusz Guzik lim_free(oldlimit); 5624ea6a9a2SMateusz Guzik } 5634ea6a9a2SMateusz Guzik 56444990b8cSJulian Elischer /* 56544990b8cSJulian Elischer * Discard the current thread and exit from its context. 56694e0a4cdSJulian Elischer * Always called with scheduler locked. 56744990b8cSJulian Elischer * 56844990b8cSJulian Elischer * Because we can't free a thread while we're operating under its context, 569696058c3SJulian Elischer * push the current thread into our CPU's deadthread holder. This means 570696058c3SJulian Elischer * we needn't worry about someone else grabbing our context before we 5716617724cSJeff Roberson * do a cpu_throw(). 57244990b8cSJulian Elischer */ 57344990b8cSJulian Elischer void 57444990b8cSJulian Elischer thread_exit(void) 57544990b8cSJulian Elischer { 5767e3a96eaSJohn Baldwin uint64_t runtime, new_switchtime; 57744990b8cSJulian Elischer struct thread *td; 5781c4bcd05SJeff Roberson struct thread *td2; 57944990b8cSJulian Elischer struct proc *p; 5807847a9daSJohn Baldwin int wakeup_swapper; 58144990b8cSJulian Elischer 58244990b8cSJulian Elischer td = curthread; 58344990b8cSJulian Elischer p = td->td_proc; 58444990b8cSJulian Elischer 585a54e85fdSJeff Roberson PROC_SLOCK_ASSERT(p, MA_OWNED); 586ed062c8dSJulian Elischer mtx_assert(&Giant, MA_NOTOWNED); 587a54e85fdSJeff Roberson 58844990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 589ed062c8dSJulian Elischer KASSERT(p != NULL, ("thread exiting without a process")); 590cc701b73SRobert Watson CTR3(KTR_PROC, "thread_exit: thread %p (pid %ld, %s)", td, 591e01eafefSJulian Elischer (long)p->p_pid, td->td_name); 5926c9271a9SAndriy Gapon SDT_PROBE0(proc, , , lwp__exit); 5939104847fSDavid Xu KASSERT(TAILQ_EMPTY(&td->td_sigqueue.sq_list), ("signal pending")); 594936c24faSMateusz Guzik MPASS(td->td_realucred == td->td_ucred); 59544990b8cSJulian Elischer 596ed062c8dSJulian Elischer /* 597ed062c8dSJulian Elischer * drop FPU & debug register state storage, or any other 598ed062c8dSJulian Elischer * architecture specific resources that 599ed062c8dSJulian Elischer * would not be on a new untouched process. 600ed062c8dSJulian Elischer */ 601bd07998eSKonstantin Belousov cpu_thread_exit(td); 60244990b8cSJulian Elischer 603ed062c8dSJulian Elischer /* 6041faf202eSJulian Elischer * The last thread is left attached to the process 6051faf202eSJulian Elischer * So that the whole bundle gets recycled. Skip 606ed062c8dSJulian Elischer * all this stuff if we never had threads. 607ed062c8dSJulian Elischer * EXIT clears all sign of other threads when 608ed062c8dSJulian Elischer * it goes to single threading, so the last thread always 609ed062c8dSJulian Elischer * takes the short path. 6101faf202eSJulian Elischer */ 611ed062c8dSJulian Elischer if (p->p_flag & P_HADTHREADS) { 6121faf202eSJulian Elischer if (p->p_numthreads > 1) { 613fd229b5bSKonstantin Belousov atomic_add_int(&td->td_proc->p_exitthreads, 1); 614d3a0bd78SJulian Elischer thread_unlink(td); 6151c4bcd05SJeff Roberson td2 = FIRST_THREAD_IN_PROC(p); 6161c4bcd05SJeff Roberson sched_exit_thread(td2, td); 617ed062c8dSJulian Elischer 618ed062c8dSJulian Elischer /* 61944990b8cSJulian Elischer * The test below is NOT true if we are the 6209182554aSKonstantin Belousov * sole exiting thread. P_STOPPED_SINGLE is unset 62144990b8cSJulian Elischer * in exit1() after it is the only survivor. 62244990b8cSJulian Elischer */ 6231279572aSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 62444990b8cSJulian Elischer if (p->p_numthreads == p->p_suspcount) { 625a54e85fdSJeff Roberson thread_lock(p->p_singlethread); 6267847a9daSJohn Baldwin wakeup_swapper = thread_unsuspend_one( 62784cdea97SKonstantin Belousov p->p_singlethread, p, false); 6287847a9daSJohn Baldwin if (wakeup_swapper) 6297847a9daSJohn Baldwin kick_proc0(); 63044990b8cSJulian Elischer } 63144990b8cSJulian Elischer } 63248bfcdddSJulian Elischer 633696058c3SJulian Elischer PCPU_SET(deadthread, td); 6341faf202eSJulian Elischer } else { 635ed062c8dSJulian Elischer /* 636ed062c8dSJulian Elischer * The last thread is exiting.. but not through exit() 637ed062c8dSJulian Elischer */ 638ed062c8dSJulian Elischer panic ("thread_exit: Last thread exiting on its own"); 639ed062c8dSJulian Elischer } 6401faf202eSJulian Elischer } 64116d95d4fSJoseph Koshy #ifdef HWPMC_HOOKS 64216d95d4fSJoseph Koshy /* 64316d95d4fSJoseph Koshy * If this thread is part of a process that is being tracked by hwpmc(4), 64416d95d4fSJoseph Koshy * inform the module of the thread's impending exit. 64516d95d4fSJoseph Koshy */ 6466161b98cSMatt Macy if (PMC_PROC_IS_USING_PMCS(td->td_proc)) { 64716d95d4fSJoseph Koshy PMC_SWITCH_CONTEXT(td, PMC_FN_CSW_OUT); 6486161b98cSMatt Macy PMC_CALL_HOOK_UNLOCKED(td, PMC_FN_THR_EXIT, NULL); 649ebfaf69cSMatt Macy } else if (PMC_SYSTEM_SAMPLING_ACTIVE()) 650ebfaf69cSMatt Macy PMC_CALL_HOOK_UNLOCKED(td, PMC_FN_THR_EXIT_LOG, NULL); 65116d95d4fSJoseph Koshy #endif 652a54e85fdSJeff Roberson PROC_UNLOCK(p); 6535c7bebf9SKonstantin Belousov PROC_STATLOCK(p); 6545c7bebf9SKonstantin Belousov thread_lock(td); 6555c7bebf9SKonstantin Belousov PROC_SUNLOCK(p); 6567e3a96eaSJohn Baldwin 6577e3a96eaSJohn Baldwin /* Do the same timestamp bookkeeping that mi_switch() would do. */ 6587e3a96eaSJohn Baldwin new_switchtime = cpu_ticks(); 6597e3a96eaSJohn Baldwin runtime = new_switchtime - PCPU_GET(switchtime); 6607e3a96eaSJohn Baldwin td->td_runtime += runtime; 6617e3a96eaSJohn Baldwin td->td_incruntime += runtime; 6627e3a96eaSJohn Baldwin PCPU_SET(switchtime, new_switchtime); 6637e3a96eaSJohn Baldwin PCPU_SET(switchticks, ticks); 66483c9dea1SGleb Smirnoff VM_CNT_INC(v_swtch); 6657e3a96eaSJohn Baldwin 6667e3a96eaSJohn Baldwin /* Save our resource usage in our process. */ 6677e3a96eaSJohn Baldwin td->td_ru.ru_nvcsw++; 66861a74c5cSJeff Roberson ruxagg_locked(p, td); 6697e3a96eaSJohn Baldwin rucollect(&p->p_ru, &td->td_ru); 6705c7bebf9SKonstantin Belousov PROC_STATUNLOCK(p); 6717e3a96eaSJohn Baldwin 672dcc9954eSJulian Elischer td->td_state = TDS_INACTIVE; 6733d06b4b3SAttilio Rao #ifdef WITNESS 6743d06b4b3SAttilio Rao witness_thread_exit(td); 6753d06b4b3SAttilio Rao #endif 676732d9528SJulian Elischer CTR1(KTR_PROC, "thread_exit: cpu_throw() thread %p", td); 677a54e85fdSJeff Roberson sched_throw(td); 678cc66ebe2SPeter Wemm panic("I'm a teapot!"); 67944990b8cSJulian Elischer /* NOTREACHED */ 68044990b8cSJulian Elischer } 68144990b8cSJulian Elischer 68244990b8cSJulian Elischer /* 683696058c3SJulian Elischer * Do any thread specific cleanups that may be needed in wait() 68437814395SPeter Wemm * called with Giant, proc and schedlock not held. 685696058c3SJulian Elischer */ 686696058c3SJulian Elischer void 687696058c3SJulian Elischer thread_wait(struct proc *p) 688696058c3SJulian Elischer { 689696058c3SJulian Elischer struct thread *td; 690696058c3SJulian Elischer 69137814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 692624bf9e1SKonstantin Belousov KASSERT(p->p_numthreads == 1, ("multiple threads in thread_wait()")); 693624bf9e1SKonstantin Belousov KASSERT(p->p_exitthreads == 0, ("p_exitthreads leaking")); 694ff8fbcffSJeff Roberson td = FIRST_THREAD_IN_PROC(p); 695ff8fbcffSJeff Roberson /* Lock the last thread so we spin until it exits cpu_throw(). */ 696ff8fbcffSJeff Roberson thread_lock(td); 697ff8fbcffSJeff Roberson thread_unlock(td); 6982e6b8de4SJeff Roberson lock_profile_thread_exit(td); 699d7f687fcSJeff Roberson cpuset_rel(td->td_cpuset); 700d7f687fcSJeff Roberson td->td_cpuset = NULL; 701696058c3SJulian Elischer cpu_thread_clean(td); 7024ea6a9a2SMateusz Guzik thread_cow_free(td); 7032d19b736SKonstantin Belousov callout_drain(&td->td_slpcallout); 704696058c3SJulian Elischer thread_reap(); /* check for zombie threads etc. */ 705696058c3SJulian Elischer } 706696058c3SJulian Elischer 707696058c3SJulian Elischer /* 70844990b8cSJulian Elischer * Link a thread to a process. 7091faf202eSJulian Elischer * set up anything that needs to be initialized for it to 7101faf202eSJulian Elischer * be used by the process. 71144990b8cSJulian Elischer */ 71244990b8cSJulian Elischer void 7138460a577SJohn Birrell thread_link(struct thread *td, struct proc *p) 71444990b8cSJulian Elischer { 71544990b8cSJulian Elischer 716a54e85fdSJeff Roberson /* 717a54e85fdSJeff Roberson * XXX This can't be enabled because it's called for proc0 before 718374ae2a3SJeff Roberson * its lock has been created. 719374ae2a3SJeff Roberson * PROC_LOCK_ASSERT(p, MA_OWNED); 720a54e85fdSJeff Roberson */ 72171fad9fdSJulian Elischer td->td_state = TDS_INACTIVE; 72244990b8cSJulian Elischer td->td_proc = p; 723b61ce5b0SJeff Roberson td->td_flags = TDF_INMEM; 72444990b8cSJulian Elischer 7251faf202eSJulian Elischer LIST_INIT(&td->td_contested); 726eea4f254SJeff Roberson LIST_INIT(&td->td_lprof[0]); 727eea4f254SJeff Roberson LIST_INIT(&td->td_lprof[1]); 728f6eccf96SGleb Smirnoff #ifdef EPOCH_TRACE 729dd902d01SGleb Smirnoff SLIST_INIT(&td->td_epochs); 730f6eccf96SGleb Smirnoff #endif 7319104847fSDavid Xu sigqueue_init(&td->td_sigqueue, p); 732fd90e2edSJung-uk Kim callout_init(&td->td_slpcallout, 1); 73366d8df9dSDaniel Eischen TAILQ_INSERT_TAIL(&p->p_threads, td, td_plist); 73444990b8cSJulian Elischer p->p_numthreads++; 73544990b8cSJulian Elischer } 73644990b8cSJulian Elischer 737ed062c8dSJulian Elischer /* 738ed062c8dSJulian Elischer * Called from: 739ed062c8dSJulian Elischer * thread_exit() 740ed062c8dSJulian Elischer */ 741d3a0bd78SJulian Elischer void 742d3a0bd78SJulian Elischer thread_unlink(struct thread *td) 743d3a0bd78SJulian Elischer { 744d3a0bd78SJulian Elischer struct proc *p = td->td_proc; 745d3a0bd78SJulian Elischer 746374ae2a3SJeff Roberson PROC_LOCK_ASSERT(p, MA_OWNED); 747f6eccf96SGleb Smirnoff #ifdef EPOCH_TRACE 748dd902d01SGleb Smirnoff MPASS(SLIST_EMPTY(&td->td_epochs)); 749f6eccf96SGleb Smirnoff #endif 750dd902d01SGleb Smirnoff 751d3a0bd78SJulian Elischer TAILQ_REMOVE(&p->p_threads, td, td_plist); 752d3a0bd78SJulian Elischer p->p_numthreads--; 753d3a0bd78SJulian Elischer /* could clear a few other things here */ 7548460a577SJohn Birrell /* Must NOT clear links to proc! */ 7555c8329edSJulian Elischer } 7565c8329edSJulian Elischer 75779799053SKonstantin Belousov static int 75879799053SKonstantin Belousov calc_remaining(struct proc *p, int mode) 75979799053SKonstantin Belousov { 76079799053SKonstantin Belousov int remaining; 76179799053SKonstantin Belousov 7627b519077SKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 7637b519077SKonstantin Belousov PROC_SLOCK_ASSERT(p, MA_OWNED); 76479799053SKonstantin Belousov if (mode == SINGLE_EXIT) 76579799053SKonstantin Belousov remaining = p->p_numthreads; 76679799053SKonstantin Belousov else if (mode == SINGLE_BOUNDARY) 76779799053SKonstantin Belousov remaining = p->p_numthreads - p->p_boundary_count; 7686ddcc233SKonstantin Belousov else if (mode == SINGLE_NO_EXIT || mode == SINGLE_ALLPROC) 76979799053SKonstantin Belousov remaining = p->p_numthreads - p->p_suspcount; 77079799053SKonstantin Belousov else 77179799053SKonstantin Belousov panic("calc_remaining: wrong mode %d", mode); 77279799053SKonstantin Belousov return (remaining); 77379799053SKonstantin Belousov } 77479799053SKonstantin Belousov 77507a9368aSKonstantin Belousov static int 77607a9368aSKonstantin Belousov remain_for_mode(int mode) 77707a9368aSKonstantin Belousov { 77807a9368aSKonstantin Belousov 7796ddcc233SKonstantin Belousov return (mode == SINGLE_ALLPROC ? 0 : 1); 78007a9368aSKonstantin Belousov } 78107a9368aSKonstantin Belousov 78207a9368aSKonstantin Belousov static int 78307a9368aSKonstantin Belousov weed_inhib(int mode, struct thread *td2, struct proc *p) 78407a9368aSKonstantin Belousov { 78507a9368aSKonstantin Belousov int wakeup_swapper; 78607a9368aSKonstantin Belousov 78707a9368aSKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 78807a9368aSKonstantin Belousov PROC_SLOCK_ASSERT(p, MA_OWNED); 78907a9368aSKonstantin Belousov THREAD_LOCK_ASSERT(td2, MA_OWNED); 79007a9368aSKonstantin Belousov 79107a9368aSKonstantin Belousov wakeup_swapper = 0; 79261a74c5cSJeff Roberson 79361a74c5cSJeff Roberson /* 79461a74c5cSJeff Roberson * Since the thread lock is dropped by the scheduler we have 79561a74c5cSJeff Roberson * to retry to check for races. 79661a74c5cSJeff Roberson */ 79761a74c5cSJeff Roberson restart: 79807a9368aSKonstantin Belousov switch (mode) { 79907a9368aSKonstantin Belousov case SINGLE_EXIT: 80061a74c5cSJeff Roberson if (TD_IS_SUSPENDED(td2)) { 80184cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td2, p, true); 80261a74c5cSJeff Roberson thread_lock(td2); 80361a74c5cSJeff Roberson goto restart; 80461a74c5cSJeff Roberson } 80561a74c5cSJeff Roberson if (TD_CAN_ABORT(td2)) { 80607a9368aSKonstantin Belousov wakeup_swapper |= sleepq_abort(td2, EINTR); 80761a74c5cSJeff Roberson return (wakeup_swapper); 80861a74c5cSJeff Roberson } 80907a9368aSKonstantin Belousov break; 81007a9368aSKonstantin Belousov case SINGLE_BOUNDARY: 81107a9368aSKonstantin Belousov case SINGLE_NO_EXIT: 81261a74c5cSJeff Roberson if (TD_IS_SUSPENDED(td2) && 81361a74c5cSJeff Roberson (td2->td_flags & TDF_BOUNDARY) == 0) { 81484cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td2, p, false); 81561a74c5cSJeff Roberson thread_lock(td2); 81661a74c5cSJeff Roberson goto restart; 81761a74c5cSJeff Roberson } 81861a74c5cSJeff Roberson if (TD_CAN_ABORT(td2)) { 81907a9368aSKonstantin Belousov wakeup_swapper |= sleepq_abort(td2, ERESTART); 82061a74c5cSJeff Roberson return (wakeup_swapper); 82161a74c5cSJeff Roberson } 822917dd390SKonstantin Belousov break; 8236ddcc233SKonstantin Belousov case SINGLE_ALLPROC: 8246ddcc233SKonstantin Belousov /* 8256ddcc233SKonstantin Belousov * ALLPROC suspend tries to avoid spurious EINTR for 8266ddcc233SKonstantin Belousov * threads sleeping interruptable, by suspending the 8276ddcc233SKonstantin Belousov * thread directly, similarly to sig_suspend_threads(). 8286ddcc233SKonstantin Belousov * Since such sleep is not performed at the user 8296ddcc233SKonstantin Belousov * boundary, TDF_BOUNDARY flag is not set, and TDF_ALLPROCSUSP 8306ddcc233SKonstantin Belousov * is used to avoid immediate un-suspend. 8316ddcc233SKonstantin Belousov */ 8326ddcc233SKonstantin Belousov if (TD_IS_SUSPENDED(td2) && (td2->td_flags & (TDF_BOUNDARY | 83361a74c5cSJeff Roberson TDF_ALLPROCSUSP)) == 0) { 83484cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td2, p, false); 83561a74c5cSJeff Roberson thread_lock(td2); 83661a74c5cSJeff Roberson goto restart; 83761a74c5cSJeff Roberson } 83861a74c5cSJeff Roberson if (TD_CAN_ABORT(td2)) { 8396ddcc233SKonstantin Belousov if ((td2->td_flags & TDF_SBDRY) == 0) { 8406ddcc233SKonstantin Belousov thread_suspend_one(td2); 8416ddcc233SKonstantin Belousov td2->td_flags |= TDF_ALLPROCSUSP; 8426ddcc233SKonstantin Belousov } else { 8436ddcc233SKonstantin Belousov wakeup_swapper |= sleepq_abort(td2, ERESTART); 84461a74c5cSJeff Roberson return (wakeup_swapper); 8456ddcc233SKonstantin Belousov } 8466ddcc233SKonstantin Belousov } 84707a9368aSKonstantin Belousov break; 84861a74c5cSJeff Roberson default: 84961a74c5cSJeff Roberson break; 85007a9368aSKonstantin Belousov } 85161a74c5cSJeff Roberson thread_unlock(td2); 85207a9368aSKonstantin Belousov return (wakeup_swapper); 85307a9368aSKonstantin Belousov } 85407a9368aSKonstantin Belousov 8555215b187SJeff Roberson /* 85644990b8cSJulian Elischer * Enforce single-threading. 85744990b8cSJulian Elischer * 85844990b8cSJulian Elischer * Returns 1 if the caller must abort (another thread is waiting to 85944990b8cSJulian Elischer * exit the process or similar). Process is locked! 86044990b8cSJulian Elischer * Returns 0 when you are successfully the only thread running. 86144990b8cSJulian Elischer * A process has successfully single threaded in the suspend mode when 86244990b8cSJulian Elischer * There are no threads in user mode. Threads in the kernel must be 86344990b8cSJulian Elischer * allowed to continue until they get to the user boundary. They may even 86444990b8cSJulian Elischer * copy out their return values and data before suspending. They may however be 865e2668f55SMaxim Konovalov * accelerated in reaching the user boundary as we will wake up 86644990b8cSJulian Elischer * any sleeping threads that are interruptable. (PCATCH). 86744990b8cSJulian Elischer */ 86844990b8cSJulian Elischer int 8696ddcc233SKonstantin Belousov thread_single(struct proc *p, int mode) 87044990b8cSJulian Elischer { 87144990b8cSJulian Elischer struct thread *td; 87244990b8cSJulian Elischer struct thread *td2; 873da7bbd2cSJohn Baldwin int remaining, wakeup_swapper; 87444990b8cSJulian Elischer 87544990b8cSJulian Elischer td = curthread; 8766ddcc233SKonstantin Belousov KASSERT(mode == SINGLE_EXIT || mode == SINGLE_BOUNDARY || 8776ddcc233SKonstantin Belousov mode == SINGLE_ALLPROC || mode == SINGLE_NO_EXIT, 8786ddcc233SKonstantin Belousov ("invalid mode %d", mode)); 8796ddcc233SKonstantin Belousov /* 8806ddcc233SKonstantin Belousov * If allowing non-ALLPROC singlethreading for non-curproc 8816ddcc233SKonstantin Belousov * callers, calc_remaining() and remain_for_mode() should be 8826ddcc233SKonstantin Belousov * adjusted to also account for td->td_proc != p. For now 8836ddcc233SKonstantin Belousov * this is not implemented because it is not used. 8846ddcc233SKonstantin Belousov */ 8856ddcc233SKonstantin Belousov KASSERT((mode == SINGLE_ALLPROC && td->td_proc != p) || 8866ddcc233SKonstantin Belousov (mode != SINGLE_ALLPROC && td->td_proc == p), 8876ddcc233SKonstantin Belousov ("mode %d proc %p curproc %p", mode, p, td->td_proc)); 88837814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 88944990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 89044990b8cSJulian Elischer 8916ddcc233SKonstantin Belousov if ((p->p_flag & P_HADTHREADS) == 0 && mode != SINGLE_ALLPROC) 89244990b8cSJulian Elischer return (0); 89344990b8cSJulian Elischer 894e3b9bf71SJulian Elischer /* Is someone already single threading? */ 895906ac69dSDavid Xu if (p->p_singlethread != NULL && p->p_singlethread != td) 89644990b8cSJulian Elischer return (1); 89744990b8cSJulian Elischer 898906ac69dSDavid Xu if (mode == SINGLE_EXIT) { 899906ac69dSDavid Xu p->p_flag |= P_SINGLE_EXIT; 900906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_BOUNDARY; 901906ac69dSDavid Xu } else { 902906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_EXIT; 903906ac69dSDavid Xu if (mode == SINGLE_BOUNDARY) 904906ac69dSDavid Xu p->p_flag |= P_SINGLE_BOUNDARY; 905906ac69dSDavid Xu else 906906ac69dSDavid Xu p->p_flag &= ~P_SINGLE_BOUNDARY; 907906ac69dSDavid Xu } 9086ddcc233SKonstantin Belousov if (mode == SINGLE_ALLPROC) 9096ddcc233SKonstantin Belousov p->p_flag |= P_TOTAL_STOP; 9101279572aSDavid Xu p->p_flag |= P_STOPPED_SINGLE; 9117b4a950aSDavid Xu PROC_SLOCK(p); 912112afcb2SJohn Baldwin p->p_singlethread = td; 91379799053SKonstantin Belousov remaining = calc_remaining(p, mode); 91407a9368aSKonstantin Belousov while (remaining != remain_for_mode(mode)) { 915bf1a3220SDavid Xu if (P_SHOULDSTOP(p) != P_STOPPED_SINGLE) 916bf1a3220SDavid Xu goto stopme; 917da7bbd2cSJohn Baldwin wakeup_swapper = 0; 91844990b8cSJulian Elischer FOREACH_THREAD_IN_PROC(p, td2) { 91944990b8cSJulian Elischer if (td2 == td) 92044990b8cSJulian Elischer continue; 921a54e85fdSJeff Roberson thread_lock(td2); 922b7edba77SJeff Roberson td2->td_flags |= TDF_ASTPENDING | TDF_NEEDSUSPCHK; 9236ddcc233SKonstantin Belousov if (TD_IS_INHIBITED(td2)) { 92407a9368aSKonstantin Belousov wakeup_swapper |= weed_inhib(mode, td2, p); 925d8267df7SDavid Xu #ifdef SMP 9266ddcc233SKonstantin Belousov } else if (TD_IS_RUNNING(td2) && td != td2) { 927d8267df7SDavid Xu forward_signal(td2); 92861a74c5cSJeff Roberson thread_unlock(td2); 929d8267df7SDavid Xu #endif 93061a74c5cSJeff Roberson } else 931a54e85fdSJeff Roberson thread_unlock(td2); 9329d102777SJulian Elischer } 933da7bbd2cSJohn Baldwin if (wakeup_swapper) 934da7bbd2cSJohn Baldwin kick_proc0(); 93579799053SKonstantin Belousov remaining = calc_remaining(p, mode); 936ec008e96SDavid Xu 9379d102777SJulian Elischer /* 9389d102777SJulian Elischer * Maybe we suspended some threads.. was it enough? 9399d102777SJulian Elischer */ 94007a9368aSKonstantin Belousov if (remaining == remain_for_mode(mode)) 9419d102777SJulian Elischer break; 9429d102777SJulian Elischer 943bf1a3220SDavid Xu stopme: 94444990b8cSJulian Elischer /* 94544990b8cSJulian Elischer * Wake us up when everyone else has suspended. 946e3b9bf71SJulian Elischer * In the mean time we suspend as well. 94744990b8cSJulian Elischer */ 9486ddcc233SKonstantin Belousov thread_suspend_switch(td, p); 94979799053SKonstantin Belousov remaining = calc_remaining(p, mode); 95044990b8cSJulian Elischer } 951906ac69dSDavid Xu if (mode == SINGLE_EXIT) { 95291599697SJulian Elischer /* 9538626a0ddSKonstantin Belousov * Convert the process to an unthreaded process. The 9548626a0ddSKonstantin Belousov * SINGLE_EXIT is called by exit1() or execve(), in 9558626a0ddSKonstantin Belousov * both cases other threads must be retired. 95691599697SJulian Elischer */ 9578626a0ddSKonstantin Belousov KASSERT(p->p_numthreads == 1, ("Unthreading with >1 threads")); 958ed062c8dSJulian Elischer p->p_singlethread = NULL; 9598626a0ddSKonstantin Belousov p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT | P_HADTHREADS); 960fd229b5bSKonstantin Belousov 961fd229b5bSKonstantin Belousov /* 962fd229b5bSKonstantin Belousov * Wait for any remaining threads to exit cpu_throw(). 963fd229b5bSKonstantin Belousov */ 964fd229b5bSKonstantin Belousov while (p->p_exitthreads != 0) { 965fd229b5bSKonstantin Belousov PROC_SUNLOCK(p); 966fd229b5bSKonstantin Belousov PROC_UNLOCK(p); 967fd229b5bSKonstantin Belousov sched_relinquish(td); 968fd229b5bSKonstantin Belousov PROC_LOCK(p); 969fd229b5bSKonstantin Belousov PROC_SLOCK(p); 970fd229b5bSKonstantin Belousov } 971ac437c07SKonstantin Belousov } else if (mode == SINGLE_BOUNDARY) { 972ac437c07SKonstantin Belousov /* 973ac437c07SKonstantin Belousov * Wait until all suspended threads are removed from 974ac437c07SKonstantin Belousov * the processors. The thread_suspend_check() 975ac437c07SKonstantin Belousov * increments p_boundary_count while it is still 976ac437c07SKonstantin Belousov * running, which makes it possible for the execve() 977ac437c07SKonstantin Belousov * to destroy vmspace while our other threads are 978ac437c07SKonstantin Belousov * still using the address space. 979ac437c07SKonstantin Belousov * 980ac437c07SKonstantin Belousov * We lock the thread, which is only allowed to 981ac437c07SKonstantin Belousov * succeed after context switch code finished using 982ac437c07SKonstantin Belousov * the address space. 983ac437c07SKonstantin Belousov */ 984ac437c07SKonstantin Belousov FOREACH_THREAD_IN_PROC(p, td2) { 985ac437c07SKonstantin Belousov if (td2 == td) 986ac437c07SKonstantin Belousov continue; 987ac437c07SKonstantin Belousov thread_lock(td2); 988ac437c07SKonstantin Belousov KASSERT((td2->td_flags & TDF_BOUNDARY) != 0, 989ac437c07SKonstantin Belousov ("td %p not on boundary", td2)); 990ac437c07SKonstantin Belousov KASSERT(TD_IS_SUSPENDED(td2), 991ac437c07SKonstantin Belousov ("td %p is not suspended", td2)); 992ac437c07SKonstantin Belousov thread_unlock(td2); 993ac437c07SKonstantin Belousov } 99491599697SJulian Elischer } 9957b4a950aSDavid Xu PROC_SUNLOCK(p); 99644990b8cSJulian Elischer return (0); 99744990b8cSJulian Elischer } 99844990b8cSJulian Elischer 9998638fe7bSKonstantin Belousov bool 10008638fe7bSKonstantin Belousov thread_suspend_check_needed(void) 10018638fe7bSKonstantin Belousov { 10028638fe7bSKonstantin Belousov struct proc *p; 10038638fe7bSKonstantin Belousov struct thread *td; 10048638fe7bSKonstantin Belousov 10058638fe7bSKonstantin Belousov td = curthread; 10068638fe7bSKonstantin Belousov p = td->td_proc; 10078638fe7bSKonstantin Belousov PROC_LOCK_ASSERT(p, MA_OWNED); 10088638fe7bSKonstantin Belousov return (P_SHOULDSTOP(p) || ((p->p_flag & P_TRACED) != 0 && 10098638fe7bSKonstantin Belousov (td->td_dbgflags & TDB_SUSPEND) != 0)); 10108638fe7bSKonstantin Belousov } 10118638fe7bSKonstantin Belousov 101244990b8cSJulian Elischer /* 101344990b8cSJulian Elischer * Called in from locations that can safely check to see 101444990b8cSJulian Elischer * whether we have to suspend or at least throttle for a 101544990b8cSJulian Elischer * single-thread event (e.g. fork). 101644990b8cSJulian Elischer * 101744990b8cSJulian Elischer * Such locations include userret(). 101844990b8cSJulian Elischer * If the "return_instead" argument is non zero, the thread must be able to 101944990b8cSJulian Elischer * accept 0 (caller may continue), or 1 (caller must abort) as a result. 102044990b8cSJulian Elischer * 102144990b8cSJulian Elischer * The 'return_instead' argument tells the function if it may do a 102244990b8cSJulian Elischer * thread_exit() or suspend, or whether the caller must abort and back 102344990b8cSJulian Elischer * out instead. 102444990b8cSJulian Elischer * 102544990b8cSJulian Elischer * If the thread that set the single_threading request has set the 102644990b8cSJulian Elischer * P_SINGLE_EXIT bit in the process flags then this call will never return 102744990b8cSJulian Elischer * if 'return_instead' is false, but will exit. 102844990b8cSJulian Elischer * 102944990b8cSJulian Elischer * P_SINGLE_EXIT | return_instead == 0| return_instead != 0 103044990b8cSJulian Elischer *---------------+--------------------+--------------------- 103144990b8cSJulian Elischer * 0 | returns 0 | returns 0 or 1 1032353374b5SJohn Baldwin * | when ST ends | immediately 103344990b8cSJulian Elischer *---------------+--------------------+--------------------- 103444990b8cSJulian Elischer * 1 | thread exits | returns 1 1035353374b5SJohn Baldwin * | | immediately 103644990b8cSJulian Elischer * 0 = thread_exit() or suspension ok, 103744990b8cSJulian Elischer * other = return error instead of stopping the thread. 103844990b8cSJulian Elischer * 103944990b8cSJulian Elischer * While a full suspension is under effect, even a single threading 104044990b8cSJulian Elischer * thread would be suspended if it made this call (but it shouldn't). 104144990b8cSJulian Elischer * This call should only be made from places where 104244990b8cSJulian Elischer * thread_exit() would be safe as that may be the outcome unless 104344990b8cSJulian Elischer * return_instead is set. 104444990b8cSJulian Elischer */ 104544990b8cSJulian Elischer int 104644990b8cSJulian Elischer thread_suspend_check(int return_instead) 104744990b8cSJulian Elischer { 1048ecafb24bSJuli Mallett struct thread *td; 1049ecafb24bSJuli Mallett struct proc *p; 105046e47c4fSKonstantin Belousov int wakeup_swapper; 105144990b8cSJulian Elischer 105244990b8cSJulian Elischer td = curthread; 105344990b8cSJulian Elischer p = td->td_proc; 105437814395SPeter Wemm mtx_assert(&Giant, MA_NOTOWNED); 105544990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 10568638fe7bSKonstantin Belousov while (thread_suspend_check_needed()) { 10571279572aSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 105844990b8cSJulian Elischer KASSERT(p->p_singlethread != NULL, 105944990b8cSJulian Elischer ("singlethread not set")); 106044990b8cSJulian Elischer /* 1061e3b9bf71SJulian Elischer * The only suspension in action is a 1062e3b9bf71SJulian Elischer * single-threading. Single threader need not stop. 1063bd07998eSKonstantin Belousov * It is safe to access p->p_singlethread unlocked 1064bd07998eSKonstantin Belousov * because it can only be set to our address by us. 106544990b8cSJulian Elischer */ 1066e3b9bf71SJulian Elischer if (p->p_singlethread == td) 106744990b8cSJulian Elischer return (0); /* Exempt from stopping. */ 106844990b8cSJulian Elischer } 106945a4bfa1SDavid Xu if ((p->p_flag & P_SINGLE_EXIT) && return_instead) 107094f0972bSDavid Xu return (EINTR); 107144990b8cSJulian Elischer 1072906ac69dSDavid Xu /* Should we goto user boundary if we didn't come from there? */ 1073906ac69dSDavid Xu if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE && 1074906ac69dSDavid Xu (p->p_flag & P_SINGLE_BOUNDARY) && return_instead) 107594f0972bSDavid Xu return (ERESTART); 1076906ac69dSDavid Xu 107744990b8cSJulian Elischer /* 10783077f938SKonstantin Belousov * Ignore suspend requests if they are deferred. 1079d071a6faSJohn Baldwin */ 10803077f938SKonstantin Belousov if ((td->td_flags & TDF_SBDRY) != 0) { 1081d071a6faSJohn Baldwin KASSERT(return_instead, 1082d071a6faSJohn Baldwin ("TDF_SBDRY set for unsafe thread_suspend_check")); 108346e47c4fSKonstantin Belousov KASSERT((td->td_flags & (TDF_SEINTR | TDF_SERESTART)) != 108446e47c4fSKonstantin Belousov (TDF_SEINTR | TDF_SERESTART), 108546e47c4fSKonstantin Belousov ("both TDF_SEINTR and TDF_SERESTART")); 108646e47c4fSKonstantin Belousov return (TD_SBDRY_INTR(td) ? TD_SBDRY_ERRNO(td) : 0); 1087d071a6faSJohn Baldwin } 1088d071a6faSJohn Baldwin 1089d071a6faSJohn Baldwin /* 109044990b8cSJulian Elischer * If the process is waiting for us to exit, 109144990b8cSJulian Elischer * this thread should just suicide. 10921279572aSDavid Xu * Assumes that P_SINGLE_EXIT implies P_STOPPED_SINGLE. 109344990b8cSJulian Elischer */ 1094cf7d9a8cSDavid Xu if ((p->p_flag & P_SINGLE_EXIT) && (p->p_singlethread != td)) { 1095cf7d9a8cSDavid Xu PROC_UNLOCK(p); 109691d1786fSDmitry Chagin 109791d1786fSDmitry Chagin /* 109891d1786fSDmitry Chagin * Allow Linux emulation layer to do some work 109991d1786fSDmitry Chagin * before thread suicide. 110091d1786fSDmitry Chagin */ 110191d1786fSDmitry Chagin if (__predict_false(p->p_sysent->sv_thread_detach != NULL)) 110291d1786fSDmitry Chagin (p->p_sysent->sv_thread_detach)(td); 11032a339d9eSKonstantin Belousov umtx_thread_exit(td); 1104d1e7a4a5SJohn Baldwin kern_thr_exit(td); 1105d1e7a4a5SJohn Baldwin panic("stopped thread did not exit"); 1106cf7d9a8cSDavid Xu } 110721ecd1e9SDavid Xu 110821ecd1e9SDavid Xu PROC_SLOCK(p); 110921ecd1e9SDavid Xu thread_stopped(p); 1110a54e85fdSJeff Roberson if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) { 1111a54e85fdSJeff Roberson if (p->p_numthreads == p->p_suspcount + 1) { 1112a54e85fdSJeff Roberson thread_lock(p->p_singlethread); 111384cdea97SKonstantin Belousov wakeup_swapper = thread_unsuspend_one( 111484cdea97SKonstantin Belousov p->p_singlethread, p, false); 11157847a9daSJohn Baldwin if (wakeup_swapper) 11167847a9daSJohn Baldwin kick_proc0(); 1117a54e85fdSJeff Roberson } 1118a54e85fdSJeff Roberson } 11193f9be10eSDavid Xu PROC_UNLOCK(p); 11207b4a950aSDavid Xu thread_lock(td); 112144990b8cSJulian Elischer /* 112244990b8cSJulian Elischer * When a thread suspends, it just 1123ad1e7d28SJulian Elischer * gets taken off all queues. 112444990b8cSJulian Elischer */ 112571fad9fdSJulian Elischer thread_suspend_one(td); 1126906ac69dSDavid Xu if (return_instead == 0) { 1127906ac69dSDavid Xu p->p_boundary_count++; 1128906ac69dSDavid Xu td->td_flags |= TDF_BOUNDARY; 1129cf19bf91SJulian Elischer } 11307b4a950aSDavid Xu PROC_SUNLOCK(p); 1131686bcb5cSJeff Roberson mi_switch(SW_INVOL | SWT_SUSPEND); 113244990b8cSJulian Elischer PROC_LOCK(p); 113344990b8cSJulian Elischer } 113444990b8cSJulian Elischer return (0); 113544990b8cSJulian Elischer } 113644990b8cSJulian Elischer 1137478ca4b0SKonstantin Belousov /* 1138478ca4b0SKonstantin Belousov * Check for possible stops and suspensions while executing a 1139478ca4b0SKonstantin Belousov * casueword or similar transiently failing operation. 1140478ca4b0SKonstantin Belousov * 1141478ca4b0SKonstantin Belousov * The sleep argument controls whether the function can handle a stop 1142478ca4b0SKonstantin Belousov * request itself or it should return ERESTART and the request is 1143478ca4b0SKonstantin Belousov * proceed at the kernel/user boundary in ast. 1144478ca4b0SKonstantin Belousov * 1145478ca4b0SKonstantin Belousov * Typically, when retrying due to casueword(9) failure (rv == 1), we 1146478ca4b0SKonstantin Belousov * should handle the stop requests there, with exception of cases when 1147478ca4b0SKonstantin Belousov * the thread owns a kernel resource, for instance busied the umtx 1148300b525dSKonstantin Belousov * key, or when functions return immediately if thread_check_susp() 1149478ca4b0SKonstantin Belousov * returned non-zero. On the other hand, retrying the whole lock 1150478ca4b0SKonstantin Belousov * operation, we better not stop there but delegate the handling to 1151478ca4b0SKonstantin Belousov * ast. 1152478ca4b0SKonstantin Belousov * 1153478ca4b0SKonstantin Belousov * If the request is for thread termination P_SINGLE_EXIT, we cannot 1154478ca4b0SKonstantin Belousov * handle it at all, and simply return EINTR. 1155478ca4b0SKonstantin Belousov */ 1156478ca4b0SKonstantin Belousov int 1157478ca4b0SKonstantin Belousov thread_check_susp(struct thread *td, bool sleep) 1158478ca4b0SKonstantin Belousov { 1159478ca4b0SKonstantin Belousov struct proc *p; 1160478ca4b0SKonstantin Belousov int error; 1161478ca4b0SKonstantin Belousov 1162478ca4b0SKonstantin Belousov /* 1163478ca4b0SKonstantin Belousov * The check for TDF_NEEDSUSPCHK is racy, but it is enough to 1164478ca4b0SKonstantin Belousov * eventually break the lockstep loop. 1165478ca4b0SKonstantin Belousov */ 1166478ca4b0SKonstantin Belousov if ((td->td_flags & TDF_NEEDSUSPCHK) == 0) 1167478ca4b0SKonstantin Belousov return (0); 1168478ca4b0SKonstantin Belousov error = 0; 1169478ca4b0SKonstantin Belousov p = td->td_proc; 1170478ca4b0SKonstantin Belousov PROC_LOCK(p); 1171478ca4b0SKonstantin Belousov if (p->p_flag & P_SINGLE_EXIT) 1172478ca4b0SKonstantin Belousov error = EINTR; 1173478ca4b0SKonstantin Belousov else if (P_SHOULDSTOP(p) || 1174478ca4b0SKonstantin Belousov ((p->p_flag & P_TRACED) && (td->td_dbgflags & TDB_SUSPEND))) 1175478ca4b0SKonstantin Belousov error = sleep ? thread_suspend_check(0) : ERESTART; 1176478ca4b0SKonstantin Belousov PROC_UNLOCK(p); 1177478ca4b0SKonstantin Belousov return (error); 1178478ca4b0SKonstantin Belousov } 1179478ca4b0SKonstantin Belousov 118035c32a76SDavid Xu void 11816ddcc233SKonstantin Belousov thread_suspend_switch(struct thread *td, struct proc *p) 1182a54e85fdSJeff Roberson { 1183a54e85fdSJeff Roberson 1184a54e85fdSJeff Roberson KASSERT(!TD_IS_SUSPENDED(td), ("already suspended")); 1185a54e85fdSJeff Roberson PROC_LOCK_ASSERT(p, MA_OWNED); 11867b4a950aSDavid Xu PROC_SLOCK_ASSERT(p, MA_OWNED); 1187a54e85fdSJeff Roberson /* 1188a54e85fdSJeff Roberson * We implement thread_suspend_one in stages here to avoid 1189a54e85fdSJeff Roberson * dropping the proc lock while the thread lock is owned. 1190a54e85fdSJeff Roberson */ 11916ddcc233SKonstantin Belousov if (p == td->td_proc) { 1192a54e85fdSJeff Roberson thread_stopped(p); 1193a54e85fdSJeff Roberson p->p_suspcount++; 11946ddcc233SKonstantin Belousov } 11953f9be10eSDavid Xu PROC_UNLOCK(p); 11967b4a950aSDavid Xu thread_lock(td); 1197b7edba77SJeff Roberson td->td_flags &= ~TDF_NEEDSUSPCHK; 1198a54e85fdSJeff Roberson TD_SET_SUSPENDED(td); 1199c5aa6b58SJeff Roberson sched_sleep(td, 0); 12007b4a950aSDavid Xu PROC_SUNLOCK(p); 1201a54e85fdSJeff Roberson DROP_GIANT(); 1202686bcb5cSJeff Roberson mi_switch(SW_VOL | SWT_SUSPEND); 1203a54e85fdSJeff Roberson PICKUP_GIANT(); 1204a54e85fdSJeff Roberson PROC_LOCK(p); 12057b4a950aSDavid Xu PROC_SLOCK(p); 1206a54e85fdSJeff Roberson } 1207a54e85fdSJeff Roberson 1208a54e85fdSJeff Roberson void 120935c32a76SDavid Xu thread_suspend_one(struct thread *td) 121035c32a76SDavid Xu { 12116ddcc233SKonstantin Belousov struct proc *p; 121235c32a76SDavid Xu 12136ddcc233SKonstantin Belousov p = td->td_proc; 12147b4a950aSDavid Xu PROC_SLOCK_ASSERT(p, MA_OWNED); 1215a54e85fdSJeff Roberson THREAD_LOCK_ASSERT(td, MA_OWNED); 1216e574e444SDavid Xu KASSERT(!TD_IS_SUSPENDED(td), ("already suspended")); 121735c32a76SDavid Xu p->p_suspcount++; 1218b7edba77SJeff Roberson td->td_flags &= ~TDF_NEEDSUSPCHK; 121971fad9fdSJulian Elischer TD_SET_SUSPENDED(td); 1220c5aa6b58SJeff Roberson sched_sleep(td, 0); 122135c32a76SDavid Xu } 122235c32a76SDavid Xu 122384cdea97SKonstantin Belousov static int 122484cdea97SKonstantin Belousov thread_unsuspend_one(struct thread *td, struct proc *p, bool boundary) 122535c32a76SDavid Xu { 122635c32a76SDavid Xu 1227a54e85fdSJeff Roberson THREAD_LOCK_ASSERT(td, MA_OWNED); 1228ad1e7d28SJulian Elischer KASSERT(TD_IS_SUSPENDED(td), ("Thread not suspended")); 122971fad9fdSJulian Elischer TD_CLR_SUSPENDED(td); 12306ddcc233SKonstantin Belousov td->td_flags &= ~TDF_ALLPROCSUSP; 12316ddcc233SKonstantin Belousov if (td->td_proc == p) { 12326ddcc233SKonstantin Belousov PROC_SLOCK_ASSERT(p, MA_OWNED); 123335c32a76SDavid Xu p->p_suspcount--; 123484cdea97SKonstantin Belousov if (boundary && (td->td_flags & TDF_BOUNDARY) != 0) { 123584cdea97SKonstantin Belousov td->td_flags &= ~TDF_BOUNDARY; 123684cdea97SKonstantin Belousov p->p_boundary_count--; 123784cdea97SKonstantin Belousov } 12386ddcc233SKonstantin Belousov } 123961a74c5cSJeff Roberson return (setrunnable(td, 0)); 124035c32a76SDavid Xu } 124135c32a76SDavid Xu 124244990b8cSJulian Elischer /* 124344990b8cSJulian Elischer * Allow all threads blocked by single threading to continue running. 124444990b8cSJulian Elischer */ 124544990b8cSJulian Elischer void 124644990b8cSJulian Elischer thread_unsuspend(struct proc *p) 124744990b8cSJulian Elischer { 124844990b8cSJulian Elischer struct thread *td; 12497847a9daSJohn Baldwin int wakeup_swapper; 125044990b8cSJulian Elischer 125144990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 12527b4a950aSDavid Xu PROC_SLOCK_ASSERT(p, MA_OWNED); 12537847a9daSJohn Baldwin wakeup_swapper = 0; 125444990b8cSJulian Elischer if (!P_SHOULDSTOP(p)) { 1255ad1e7d28SJulian Elischer FOREACH_THREAD_IN_PROC(p, td) { 1256a54e85fdSJeff Roberson thread_lock(td); 1257ad1e7d28SJulian Elischer if (TD_IS_SUSPENDED(td)) { 125884cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td, p, 125984cdea97SKonstantin Belousov true); 126061a74c5cSJeff Roberson } else 1261a54e85fdSJeff Roberson thread_unlock(td); 1262ad1e7d28SJulian Elischer } 126384cdea97SKonstantin Belousov } else if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE && 126484cdea97SKonstantin Belousov p->p_numthreads == p->p_suspcount) { 126544990b8cSJulian Elischer /* 126644990b8cSJulian Elischer * Stopping everything also did the job for the single 126744990b8cSJulian Elischer * threading request. Now we've downgraded to single-threaded, 126844990b8cSJulian Elischer * let it continue. 126944990b8cSJulian Elischer */ 12706ddcc233SKonstantin Belousov if (p->p_singlethread->td_proc == p) { 1271a54e85fdSJeff Roberson thread_lock(p->p_singlethread); 12726ddcc233SKonstantin Belousov wakeup_swapper = thread_unsuspend_one( 127384cdea97SKonstantin Belousov p->p_singlethread, p, false); 127444990b8cSJulian Elischer } 12756ddcc233SKonstantin Belousov } 12767847a9daSJohn Baldwin if (wakeup_swapper) 12777847a9daSJohn Baldwin kick_proc0(); 127844990b8cSJulian Elischer } 127944990b8cSJulian Elischer 1280ed062c8dSJulian Elischer /* 1281ed062c8dSJulian Elischer * End the single threading mode.. 1282ed062c8dSJulian Elischer */ 128344990b8cSJulian Elischer void 12846ddcc233SKonstantin Belousov thread_single_end(struct proc *p, int mode) 128544990b8cSJulian Elischer { 128644990b8cSJulian Elischer struct thread *td; 12877847a9daSJohn Baldwin int wakeup_swapper; 128844990b8cSJulian Elischer 12896ddcc233SKonstantin Belousov KASSERT(mode == SINGLE_EXIT || mode == SINGLE_BOUNDARY || 12906ddcc233SKonstantin Belousov mode == SINGLE_ALLPROC || mode == SINGLE_NO_EXIT, 12916ddcc233SKonstantin Belousov ("invalid mode %d", mode)); 129244990b8cSJulian Elischer PROC_LOCK_ASSERT(p, MA_OWNED); 12936ddcc233SKonstantin Belousov KASSERT((mode == SINGLE_ALLPROC && (p->p_flag & P_TOTAL_STOP) != 0) || 12946ddcc233SKonstantin Belousov (mode != SINGLE_ALLPROC && (p->p_flag & P_TOTAL_STOP) == 0), 12956ddcc233SKonstantin Belousov ("mode %d does not match P_TOTAL_STOP", mode)); 129684cdea97SKonstantin Belousov KASSERT(mode == SINGLE_ALLPROC || p->p_singlethread == curthread, 129784cdea97SKonstantin Belousov ("thread_single_end from other thread %p %p", 129884cdea97SKonstantin Belousov curthread, p->p_singlethread)); 129984cdea97SKonstantin Belousov KASSERT(mode != SINGLE_BOUNDARY || 130084cdea97SKonstantin Belousov (p->p_flag & P_SINGLE_BOUNDARY) != 0, 130184cdea97SKonstantin Belousov ("mis-matched SINGLE_BOUNDARY flags %x", p->p_flag)); 13026ddcc233SKonstantin Belousov p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT | P_SINGLE_BOUNDARY | 13036ddcc233SKonstantin Belousov P_TOTAL_STOP); 13047b4a950aSDavid Xu PROC_SLOCK(p); 130544990b8cSJulian Elischer p->p_singlethread = NULL; 13067847a9daSJohn Baldwin wakeup_swapper = 0; 130749539972SJulian Elischer /* 13087847a9daSJohn Baldwin * If there are other threads they may now run, 130949539972SJulian Elischer * unless of course there is a blanket 'stop order' 131049539972SJulian Elischer * on the process. The single threader must be allowed 131149539972SJulian Elischer * to continue however as this is a bad place to stop. 131249539972SJulian Elischer */ 13136ddcc233SKonstantin Belousov if (p->p_numthreads != remain_for_mode(mode) && !P_SHOULDSTOP(p)) { 1314ad1e7d28SJulian Elischer FOREACH_THREAD_IN_PROC(p, td) { 1315a54e85fdSJeff Roberson thread_lock(td); 1316ad1e7d28SJulian Elischer if (TD_IS_SUSPENDED(td)) { 131784cdea97SKonstantin Belousov wakeup_swapper |= thread_unsuspend_one(td, p, 131884cdea97SKonstantin Belousov mode == SINGLE_BOUNDARY); 131961a74c5cSJeff Roberson } else 1320a54e85fdSJeff Roberson thread_unlock(td); 132149539972SJulian Elischer } 1322ad1e7d28SJulian Elischer } 132384cdea97SKonstantin Belousov KASSERT(mode != SINGLE_BOUNDARY || p->p_boundary_count == 0, 132484cdea97SKonstantin Belousov ("inconsistent boundary count %d", p->p_boundary_count)); 13257b4a950aSDavid Xu PROC_SUNLOCK(p); 13267847a9daSJohn Baldwin if (wakeup_swapper) 13277847a9daSJohn Baldwin kick_proc0(); 132849539972SJulian Elischer } 13294fc21c09SDaniel Eischen 133044355392SDavid Xu struct thread * 133144355392SDavid Xu thread_find(struct proc *p, lwpid_t tid) 133244355392SDavid Xu { 133344355392SDavid Xu struct thread *td; 133444355392SDavid Xu 133544355392SDavid Xu PROC_LOCK_ASSERT(p, MA_OWNED); 133644355392SDavid Xu FOREACH_THREAD_IN_PROC(p, td) { 133744355392SDavid Xu if (td->td_tid == tid) 133844355392SDavid Xu break; 133944355392SDavid Xu } 134044355392SDavid Xu return (td); 134144355392SDavid Xu } 1342cf7d9a8cSDavid Xu 1343cf7d9a8cSDavid Xu /* Locate a thread by number; return with proc lock held. */ 1344cf7d9a8cSDavid Xu struct thread * 1345cf7d9a8cSDavid Xu tdfind(lwpid_t tid, pid_t pid) 1346cf7d9a8cSDavid Xu { 1347cf7d9a8cSDavid Xu #define RUN_THRESH 16 1348cf7d9a8cSDavid Xu struct thread *td; 1349cf7d9a8cSDavid Xu int run = 0; 1350cf7d9a8cSDavid Xu 13517cd4443fSMateusz Guzik td = curthread; 13527cd4443fSMateusz Guzik if (td->td_tid == tid) { 13537cd4443fSMateusz Guzik if (pid != -1 && td->td_proc->p_pid != pid) 13547cd4443fSMateusz Guzik return (NULL); 13557cd4443fSMateusz Guzik PROC_LOCK(td->td_proc); 13567cd4443fSMateusz Guzik return (td); 13577cd4443fSMateusz Guzik } 13587cd4443fSMateusz Guzik 1359cf7d9a8cSDavid Xu rw_rlock(&tidhash_lock); 1360cf7d9a8cSDavid Xu LIST_FOREACH(td, TIDHASH(tid), td_hash) { 1361cf7d9a8cSDavid Xu if (td->td_tid == tid) { 1362cf7d9a8cSDavid Xu if (pid != -1 && td->td_proc->p_pid != pid) { 1363cf7d9a8cSDavid Xu td = NULL; 1364cf7d9a8cSDavid Xu break; 1365cf7d9a8cSDavid Xu } 13668e6fa660SJohn Baldwin PROC_LOCK(td->td_proc); 1367cf7d9a8cSDavid Xu if (td->td_proc->p_state == PRS_NEW) { 13688e6fa660SJohn Baldwin PROC_UNLOCK(td->td_proc); 1369cf7d9a8cSDavid Xu td = NULL; 1370cf7d9a8cSDavid Xu break; 1371cf7d9a8cSDavid Xu } 1372cf7d9a8cSDavid Xu if (run > RUN_THRESH) { 1373cf7d9a8cSDavid Xu if (rw_try_upgrade(&tidhash_lock)) { 1374cf7d9a8cSDavid Xu LIST_REMOVE(td, td_hash); 1375cf7d9a8cSDavid Xu LIST_INSERT_HEAD(TIDHASH(td->td_tid), 1376cf7d9a8cSDavid Xu td, td_hash); 1377cf7d9a8cSDavid Xu rw_wunlock(&tidhash_lock); 1378cf7d9a8cSDavid Xu return (td); 1379cf7d9a8cSDavid Xu } 1380cf7d9a8cSDavid Xu } 1381cf7d9a8cSDavid Xu break; 1382cf7d9a8cSDavid Xu } 1383cf7d9a8cSDavid Xu run++; 1384cf7d9a8cSDavid Xu } 1385cf7d9a8cSDavid Xu rw_runlock(&tidhash_lock); 1386cf7d9a8cSDavid Xu return (td); 1387cf7d9a8cSDavid Xu } 1388cf7d9a8cSDavid Xu 1389cf7d9a8cSDavid Xu void 1390cf7d9a8cSDavid Xu tidhash_add(struct thread *td) 1391cf7d9a8cSDavid Xu { 1392cf7d9a8cSDavid Xu rw_wlock(&tidhash_lock); 1393cf7d9a8cSDavid Xu LIST_INSERT_HEAD(TIDHASH(td->td_tid), td, td_hash); 1394cf7d9a8cSDavid Xu rw_wunlock(&tidhash_lock); 1395cf7d9a8cSDavid Xu } 1396cf7d9a8cSDavid Xu 1397cf7d9a8cSDavid Xu void 1398cf7d9a8cSDavid Xu tidhash_remove(struct thread *td) 1399cf7d9a8cSDavid Xu { 1400cf7d9a8cSDavid Xu rw_wlock(&tidhash_lock); 1401cf7d9a8cSDavid Xu LIST_REMOVE(td, td_hash); 1402cf7d9a8cSDavid Xu rw_wunlock(&tidhash_lock); 1403cf7d9a8cSDavid Xu } 1404