xref: /freebsd/sys/kern/kern_thread.c (revision e2668f55632a7406dac32541cf739c980a2bc187)
19454b2d8SWarner Losh /*-
244990b8cSJulian Elischer  * Copyright (C) 2001 Julian Elischer <julian@freebsd.org>.
344990b8cSJulian Elischer  *  All rights reserved.
444990b8cSJulian Elischer  *
544990b8cSJulian Elischer  * Redistribution and use in source and binary forms, with or without
644990b8cSJulian Elischer  * modification, are permitted provided that the following conditions
744990b8cSJulian Elischer  * are met:
844990b8cSJulian Elischer  * 1. Redistributions of source code must retain the above copyright
944990b8cSJulian Elischer  *    notice(s), this list of conditions and the following disclaimer as
1044990b8cSJulian Elischer  *    the first lines of this file unmodified other than the possible
1144990b8cSJulian Elischer  *    addition of one or more copyright notices.
1244990b8cSJulian Elischer  * 2. Redistributions in binary form must reproduce the above copyright
1344990b8cSJulian Elischer  *    notice(s), this list of conditions and the following disclaimer in the
1444990b8cSJulian Elischer  *    documentation and/or other materials provided with the distribution.
1544990b8cSJulian Elischer  *
1644990b8cSJulian Elischer  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) ``AS IS'' AND ANY
1744990b8cSJulian Elischer  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
1844990b8cSJulian Elischer  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
1944990b8cSJulian Elischer  * DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY
2044990b8cSJulian Elischer  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
2144990b8cSJulian Elischer  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
2244990b8cSJulian Elischer  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
2344990b8cSJulian Elischer  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2444990b8cSJulian Elischer  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2544990b8cSJulian Elischer  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
2644990b8cSJulian Elischer  * DAMAGE.
2744990b8cSJulian Elischer  */
2844990b8cSJulian Elischer 
29677b542eSDavid E. O'Brien #include <sys/cdefs.h>
30677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
31677b542eSDavid E. O'Brien 
3244990b8cSJulian Elischer #include <sys/param.h>
3344990b8cSJulian Elischer #include <sys/systm.h>
3444990b8cSJulian Elischer #include <sys/kernel.h>
3544990b8cSJulian Elischer #include <sys/lock.h>
3644990b8cSJulian Elischer #include <sys/mutex.h>
3744990b8cSJulian Elischer #include <sys/proc.h>
38e170bfdaSDavid Xu #include <sys/resourcevar.h>
3994e0a4cdSJulian Elischer #include <sys/smp.h>
4044990b8cSJulian Elischer #include <sys/sysctl.h>
41de028f5aSJeff Roberson #include <sys/sched.h>
4244f3b092SJohn Baldwin #include <sys/sleepqueue.h>
43961a7b24SJohn Baldwin #include <sys/turnstile.h>
4444990b8cSJulian Elischer #include <sys/ktr.h>
45bc8e6d81SDavid Xu #include <sys/umtx.h>
4644990b8cSJulian Elischer 
47911b84b0SRobert Watson #include <security/audit/audit.h>
48911b84b0SRobert Watson 
4944990b8cSJulian Elischer #include <vm/vm.h>
5049a2507bSAlan Cox #include <vm/vm_extern.h>
5144990b8cSJulian Elischer #include <vm/uma.h>
5202fb42b0SPeter Wemm 
/*
 * KSEGRP and thread related storage: the UMA zones that ksegrp and thread
 * structures are allocated from.  Both zones are created in threadinit().
 */
static uma_zone_t ksegrp_zone;
static uma_zone_t thread_zone;

/* DEBUG ONLY: the kern.threads sysctl node and its debug knob. */
SYSCTL_NODE(_kern, OID_AUTO, threads, CTLFLAG_RW, 0, "thread allocation");
static int thread_debug = 0;
SYSCTL_INT(_kern_threads, OID_AUTO, debug, CTLFLAG_RW,
	&thread_debug, 0, "thread debug");

/* Read/write limit on threads per process (enforced outside this view). */
int max_threads_per_proc = 1500;
SYSCTL_INT(_kern_threads, OID_AUTO, max_threads_per_proc, CTLFLAG_RW,
	&max_threads_per_proc, 0, "Limit on threads per proc");

/* Read/write limit on thread groups per process (enforced outside this view). */
int max_groups_per_proc = 1500;
SYSCTL_INT(_kern_threads, OID_AUTO, max_groups_per_proc, CTLFLAG_RW,
	&max_groups_per_proc, 0, "Limit on thread groups per proc");

/*
 * Read-only counter exported without a description.
 * NOTE(review): presumably counts how often the per-process thread limit
 * was reached; nothing in this part of the file updates it -- confirm.
 */
int max_threads_hits;
SYSCTL_INT(_kern_threads, OID_AUTO, max_threads_hits, CTLFLAG_RD,
	&max_threads_hits, 0, "");

/*
 * Value behind the kern.threads.virtual_cpu sysctl.  While it is 0 the
 * handler sysctl_kse_virtual_cpu() reports mp_ncpus instead.
 */
int virtual_cpu;

/*
 * Threads and ksegrps parked by thread_stash()/ksegrp_stash() until
 * thread_reap() frees them.  Insertions and the harvest in thread_reap()
 * are done under the kse_zombie_lock spin mutex.
 */
TAILQ_HEAD(, thread) zombie_threads = TAILQ_HEAD_INITIALIZER(zombie_threads);
TAILQ_HEAD(, ksegrp) zombie_ksegrps = TAILQ_HEAD_INITIALIZER(zombie_ksegrps);
struct mtx kse_zombie_lock;
MTX_SYSINIT(kse_zombie_lock, &kse_zombie_lock, "kse zombie lock", MTX_SPIN);
8344990b8cSJulian Elischer 
8494e0a4cdSJulian Elischer static int
8594e0a4cdSJulian Elischer sysctl_kse_virtual_cpu(SYSCTL_HANDLER_ARGS)
8694e0a4cdSJulian Elischer {
8794e0a4cdSJulian Elischer 	int error, new_val;
8894e0a4cdSJulian Elischer 	int def_val;
8994e0a4cdSJulian Elischer 
9094e0a4cdSJulian Elischer 	def_val = mp_ncpus;
9194e0a4cdSJulian Elischer 	if (virtual_cpu == 0)
9294e0a4cdSJulian Elischer 		new_val = def_val;
9394e0a4cdSJulian Elischer 	else
9494e0a4cdSJulian Elischer 		new_val = virtual_cpu;
9594e0a4cdSJulian Elischer 	error = sysctl_handle_int(oidp, &new_val, 0, req);
9694e0a4cdSJulian Elischer 	if (error != 0 || req->newptr == NULL)
9794e0a4cdSJulian Elischer 		return (error);
9894e0a4cdSJulian Elischer 	if (new_val < 0)
9994e0a4cdSJulian Elischer 		return (EINVAL);
10094e0a4cdSJulian Elischer 	virtual_cpu = new_val;
10194e0a4cdSJulian Elischer 	return (0);
10294e0a4cdSJulian Elischer }
10394e0a4cdSJulian Elischer 
/* DEBUG ONLY: exposes virtual_cpu through sysctl_kse_virtual_cpu(). */
SYSCTL_PROC(_kern_threads, OID_AUTO, virtual_cpu, CTLTYPE_INT|CTLFLAG_RW,
	0, sizeof(virtual_cpu), sysctl_kse_virtual_cpu, "I",
	"debug virtual cpus");

/*
 * Thread ID allocation state, set up in threadinit(): tid_lock is the
 * mutex handed to new_unrhdr(), and tid_unrhdr is the unit-number
 * allocator that thread_ctor() takes TIDs from and thread_dtor() returns
 * them to.
 */
struct mtx tid_lock;
static struct unrhdr *tid_unrhdr;
111fdcac928SMarcel Moolenaar 
112fdcac928SMarcel Moolenaar /*
113696058c3SJulian Elischer  * Prepare a thread for use.
11444990b8cSJulian Elischer  */
115b23f72e9SBrian Feldman static int
116b23f72e9SBrian Feldman thread_ctor(void *mem, int size, void *arg, int flags)
11744990b8cSJulian Elischer {
11844990b8cSJulian Elischer 	struct thread	*td;
11944990b8cSJulian Elischer 
12044990b8cSJulian Elischer 	td = (struct thread *)mem;
12171fad9fdSJulian Elischer 	td->td_state = TDS_INACTIVE;
122060563ecSJulian Elischer 	td->td_oncpu = NOCPU;
1236c27c603SJuli Mallett 
124773eff9dSPoul-Henning Kamp 	td->td_tid = alloc_unr(tid_unrhdr);
125773eff9dSPoul-Henning Kamp 
1266c27c603SJuli Mallett 	/*
1276c27c603SJuli Mallett 	 * Note that td_critnest begins life as 1 because the thread is not
1286c27c603SJuli Mallett 	 * running and is thereby implicitly waiting to be on the receiving
1296c27c603SJuli Mallett 	 * end of a context switch.  A context switch must occur inside a
1306c27c603SJuli Mallett 	 * critical section, and in fact, includes hand-off of the sched_lock.
1316c27c603SJuli Mallett 	 * After a context switch to a newly created thread, it will release
1326c27c603SJuli Mallett 	 * sched_lock for the first time, and its td_critnest will hit 0 for
1336c27c603SJuli Mallett 	 * the first time.  This happens on the far end of a context switch,
1346c27c603SJuli Mallett 	 * and when it context switches away from itself, it will in fact go
1356c27c603SJuli Mallett 	 * back into a critical section, and hand off the sched lock to the
1366c27c603SJuli Mallett 	 * next thread.
1376c27c603SJuli Mallett 	 */
138139b7550SJohn Baldwin 	td->td_critnest = 1;
139911b84b0SRobert Watson 
140911b84b0SRobert Watson #ifdef AUDIT
141911b84b0SRobert Watson 	audit_thread_alloc(td);
142911b84b0SRobert Watson #endif
143b23f72e9SBrian Feldman 	return (0);
14444990b8cSJulian Elischer }
14544990b8cSJulian Elischer 
14644990b8cSJulian Elischer /*
14744990b8cSJulian Elischer  * Reclaim a thread after use.
14844990b8cSJulian Elischer  */
14944990b8cSJulian Elischer static void
15044990b8cSJulian Elischer thread_dtor(void *mem, int size, void *arg)
15144990b8cSJulian Elischer {
15244990b8cSJulian Elischer 	struct thread *td;
15344990b8cSJulian Elischer 
15444990b8cSJulian Elischer 	td = (struct thread *)mem;
15544990b8cSJulian Elischer 
15644990b8cSJulian Elischer #ifdef INVARIANTS
15744990b8cSJulian Elischer 	/* Verify that this thread is in a safe state to free. */
15844990b8cSJulian Elischer 	switch (td->td_state) {
15971fad9fdSJulian Elischer 	case TDS_INHIBITED:
16071fad9fdSJulian Elischer 	case TDS_RUNNING:
16171fad9fdSJulian Elischer 	case TDS_CAN_RUN:
16244990b8cSJulian Elischer 	case TDS_RUNQ:
16344990b8cSJulian Elischer 		/*
16444990b8cSJulian Elischer 		 * We must never unlink a thread that is in one of
16544990b8cSJulian Elischer 		 * these states, because it is currently active.
16644990b8cSJulian Elischer 		 */
16744990b8cSJulian Elischer 		panic("bad state for thread unlinking");
16844990b8cSJulian Elischer 		/* NOTREACHED */
16971fad9fdSJulian Elischer 	case TDS_INACTIVE:
17044990b8cSJulian Elischer 		break;
17144990b8cSJulian Elischer 	default:
17244990b8cSJulian Elischer 		panic("bad thread state");
17344990b8cSJulian Elischer 		/* NOTREACHED */
17444990b8cSJulian Elischer 	}
17544990b8cSJulian Elischer #endif
1766e8525ceSRobert Watson #ifdef AUDIT
1776e8525ceSRobert Watson 	audit_thread_free(td);
1786e8525ceSRobert Watson #endif
179773eff9dSPoul-Henning Kamp 	free_unr(tid_unrhdr, td->td_tid);
180ed062c8dSJulian Elischer 	sched_newthread(td);
18144990b8cSJulian Elischer }
18244990b8cSJulian Elischer 
18344990b8cSJulian Elischer /*
18444990b8cSJulian Elischer  * Initialize type-stable parts of a thread (when newly created).
18544990b8cSJulian Elischer  */
186b23f72e9SBrian Feldman static int
187b23f72e9SBrian Feldman thread_init(void *mem, int size, int flags)
18844990b8cSJulian Elischer {
18944990b8cSJulian Elischer 	struct thread *td;
19044990b8cSJulian Elischer 
19144990b8cSJulian Elischer 	td = (struct thread *)mem;
192247aba24SMarcel Moolenaar 
19349a2507bSAlan Cox 	vm_thread_new(td, 0);
19444990b8cSJulian Elischer 	cpu_thread_setup(td);
19544f3b092SJohn Baldwin 	td->td_sleepqueue = sleepq_alloc();
196961a7b24SJohn Baldwin 	td->td_turnstile = turnstile_alloc();
197bc8e6d81SDavid Xu 	td->td_umtxq = umtxq_alloc();
198de028f5aSJeff Roberson 	td->td_sched = (struct td_sched *)&td[1];
199ed062c8dSJulian Elischer 	sched_newthread(td);
200b23f72e9SBrian Feldman 	return (0);
20144990b8cSJulian Elischer }
20244990b8cSJulian Elischer 
20344990b8cSJulian Elischer /*
20444990b8cSJulian Elischer  * Tear down type-stable parts of a thread (just before being discarded).
20544990b8cSJulian Elischer  */
20644990b8cSJulian Elischer static void
20744990b8cSJulian Elischer thread_fini(void *mem, int size)
20844990b8cSJulian Elischer {
20944990b8cSJulian Elischer 	struct thread *td;
21044990b8cSJulian Elischer 
21144990b8cSJulian Elischer 	td = (struct thread *)mem;
212961a7b24SJohn Baldwin 	turnstile_free(td->td_turnstile);
21344f3b092SJohn Baldwin 	sleepq_free(td->td_sleepqueue);
214bc8e6d81SDavid Xu 	umtxq_free(td->td_umtxq);
21549a2507bSAlan Cox 	vm_thread_dispose(td);
21644990b8cSJulian Elischer }
2175215b187SJeff Roberson 
218de028f5aSJeff Roberson /*
219de028f5aSJeff Roberson  * Initialize type-stable parts of a ksegrp (when newly created).
220de028f5aSJeff Roberson  */
221b23f72e9SBrian Feldman static int
222a9b5dc7dSJulian Elischer ksegrp_ctor(void *mem, int size, void *arg, int flags)
223de028f5aSJeff Roberson {
224de028f5aSJeff Roberson 	struct ksegrp	*kg;
225de028f5aSJeff Roberson 
226de028f5aSJeff Roberson 	kg = (struct ksegrp *)mem;
227a9b5dc7dSJulian Elischer 	bzero(mem, size);
228de028f5aSJeff Roberson 	kg->kg_sched = (struct kg_sched *)&kg[1];
229b23f72e9SBrian Feldman 	return (0);
230de028f5aSJeff Roberson }
23144990b8cSJulian Elischer 
2325c8329edSJulian Elischer void
2335c8329edSJulian Elischer ksegrp_link(struct ksegrp *kg, struct proc *p)
2345c8329edSJulian Elischer {
2355c8329edSJulian Elischer 
2365c8329edSJulian Elischer 	TAILQ_INIT(&kg->kg_threads);
2375c8329edSJulian Elischer 	TAILQ_INIT(&kg->kg_runq);	/* links with td_runq */
2385215b187SJeff Roberson 	TAILQ_INIT(&kg->kg_upcalls);	/* all upcall structure in ksegrp */
2395c8329edSJulian Elischer 	kg->kg_proc = p;
2405215b187SJeff Roberson 	/*
2415215b187SJeff Roberson 	 * the following counters are in the -zero- section
2425215b187SJeff Roberson 	 * and may not need clearing
2435215b187SJeff Roberson 	 */
2445c8329edSJulian Elischer 	kg->kg_numthreads = 0;
2455215b187SJeff Roberson 	kg->kg_numupcalls = 0;
2465c8329edSJulian Elischer 	/* link it in now that it's consistent */
2475c8329edSJulian Elischer 	p->p_numksegrps++;
2485c8329edSJulian Elischer 	TAILQ_INSERT_HEAD(&p->p_ksegrps, kg, kg_ksegrp);
2495c8329edSJulian Elischer }
2505c8329edSJulian Elischer 
251ed062c8dSJulian Elischer /*
252ed062c8dSJulian Elischer  * Called from:
253ed062c8dSJulian Elischer  *   thread-exit()
254ed062c8dSJulian Elischer  */
2555c8329edSJulian Elischer void
2565c8329edSJulian Elischer ksegrp_unlink(struct ksegrp *kg)
2575c8329edSJulian Elischer {
2585c8329edSJulian Elischer 	struct proc *p;
2595c8329edSJulian Elischer 
2605c8329edSJulian Elischer 	mtx_assert(&sched_lock, MA_OWNED);
2615215b187SJeff Roberson 	KASSERT((kg->kg_numthreads == 0), ("ksegrp_unlink: residual threads"));
2625215b187SJeff Roberson 	KASSERT((kg->kg_numupcalls == 0), ("ksegrp_unlink: residual upcalls"));
2635215b187SJeff Roberson 
2645c8329edSJulian Elischer 	p = kg->kg_proc;
2655c8329edSJulian Elischer 	TAILQ_REMOVE(&p->p_ksegrps, kg, kg_ksegrp);
2665c8329edSJulian Elischer 	p->p_numksegrps--;
2675c8329edSJulian Elischer 	/*
2685c8329edSJulian Elischer 	 * Aggregate stats from the KSE
2695c8329edSJulian Elischer 	 */
27021fc3164SDavid Xu 	if (p->p_procscopegrp == kg)
27121fc3164SDavid Xu 		p->p_procscopegrp = NULL;
2725c8329edSJulian Elischer }
2735c8329edSJulian Elischer 
2745c8329edSJulian Elischer /*
2755215b187SJeff Roberson  * For a newly created process,
2765215b187SJeff Roberson  * link up all the structures and its initial threads etc.
277ed062c8dSJulian Elischer  * called from:
278ed062c8dSJulian Elischer  * {arch}/{arch}/machdep.c   ia64_init(), init386() etc.
279ed062c8dSJulian Elischer  * proc_dtor() (should go away)
280ed062c8dSJulian Elischer  * proc_init()
2815c8329edSJulian Elischer  */
2825c8329edSJulian Elischer void
283ed062c8dSJulian Elischer proc_linkup(struct proc *p, struct ksegrp *kg, struct thread *td)
2845c8329edSJulian Elischer {
2855c8329edSJulian Elischer 
2865c8329edSJulian Elischer 	TAILQ_INIT(&p->p_ksegrps);	     /* all ksegrps in proc */
2875c8329edSJulian Elischer 	TAILQ_INIT(&p->p_threads);	     /* all threads in proc */
2885c8329edSJulian Elischer 	TAILQ_INIT(&p->p_suspended);	     /* Threads suspended */
2899104847fSDavid Xu 	sigqueue_init(&p->p_sigqueue, p);
290ebceaf6dSDavid Xu 	p->p_ksi = ksiginfo_alloc(1);
291ebceaf6dSDavid Xu 	if (p->p_ksi != NULL) {
2925c474517SDavid Xu 		/* XXX p_ksi may be null if ksiginfo zone is not ready */
293ebceaf6dSDavid Xu 		p->p_ksi->ksi_flags = KSI_EXT | KSI_INS;
294ebceaf6dSDavid Xu 	}
295b2f92ef9SDavid Xu 	LIST_INIT(&p->p_mqnotifier);
2965c8329edSJulian Elischer 	p->p_numksegrps = 0;
2975c8329edSJulian Elischer 	p->p_numthreads = 0;
2985c8329edSJulian Elischer 
2995c8329edSJulian Elischer 	ksegrp_link(kg, p);
3005c8329edSJulian Elischer 	thread_link(td, kg);
3015c8329edSJulian Elischer }
3025c8329edSJulian Elischer 
3035c8329edSJulian Elischer /*
30444990b8cSJulian Elischer  * Initialize global thread allocation resources.
30544990b8cSJulian Elischer  */
30644990b8cSJulian Elischer void
30744990b8cSJulian Elischer threadinit(void)
30844990b8cSJulian Elischer {
30944990b8cSJulian Elischer 
3101ea7a6f8SPoul-Henning Kamp 	mtx_init(&tid_lock, "TID lock", NULL, MTX_DEF);
3111ea7a6f8SPoul-Henning Kamp 	tid_unrhdr = new_unrhdr(PID_MAX + 1, INT_MAX, &tid_lock);
3121ea7a6f8SPoul-Henning Kamp 
313de028f5aSJeff Roberson 	thread_zone = uma_zcreate("THREAD", sched_sizeof_thread(),
31444990b8cSJulian Elischer 	    thread_ctor, thread_dtor, thread_init, thread_fini,
31544990b8cSJulian Elischer 	    UMA_ALIGN_CACHE, 0);
316de028f5aSJeff Roberson 	ksegrp_zone = uma_zcreate("KSEGRP", sched_sizeof_ksegrp(),
317a9b5dc7dSJulian Elischer 	    ksegrp_ctor, NULL, NULL, NULL,
3184f0db5e0SJulian Elischer 	    UMA_ALIGN_CACHE, 0);
319ed062c8dSJulian Elischer 	kseinit();	/* set up kse specific stuff  e.g. upcall zone*/
32044990b8cSJulian Elischer }
32144990b8cSJulian Elischer 
32244990b8cSJulian Elischer /*
3231faf202eSJulian Elischer  * Stash an embarasingly extra thread into the zombie thread queue.
32444990b8cSJulian Elischer  */
32544990b8cSJulian Elischer void
32644990b8cSJulian Elischer thread_stash(struct thread *td)
32744990b8cSJulian Elischer {
3285215b187SJeff Roberson 	mtx_lock_spin(&kse_zombie_lock);
32944990b8cSJulian Elischer 	TAILQ_INSERT_HEAD(&zombie_threads, td, td_runq);
3305215b187SJeff Roberson 	mtx_unlock_spin(&kse_zombie_lock);
33144990b8cSJulian Elischer }
33244990b8cSJulian Elischer 
33344990b8cSJulian Elischer /*
3345c8329edSJulian Elischer  * Stash an embarasingly extra ksegrp into the zombie ksegrp queue.
3355c8329edSJulian Elischer  */
3365c8329edSJulian Elischer void
3375c8329edSJulian Elischer ksegrp_stash(struct ksegrp *kg)
3385c8329edSJulian Elischer {
3395215b187SJeff Roberson 	mtx_lock_spin(&kse_zombie_lock);
3405c8329edSJulian Elischer 	TAILQ_INSERT_HEAD(&zombie_ksegrps, kg, kg_ksegrp);
3415215b187SJeff Roberson 	mtx_unlock_spin(&kse_zombie_lock);
3425c8329edSJulian Elischer }
3435c8329edSJulian Elischer 
3445c8329edSJulian Elischer /*
3455215b187SJeff Roberson  * Reap zombie kse resource.
34644990b8cSJulian Elischer  */
34744990b8cSJulian Elischer void
34844990b8cSJulian Elischer thread_reap(void)
34944990b8cSJulian Elischer {
3505c8329edSJulian Elischer 	struct thread *td_first, *td_next;
3515c8329edSJulian Elischer 	struct ksegrp *kg_first, * kg_next;
35244990b8cSJulian Elischer 
35344990b8cSJulian Elischer 	/*
3545215b187SJeff Roberson 	 * Don't even bother to lock if none at this instant,
3555215b187SJeff Roberson 	 * we really don't care about the next instant..
35644990b8cSJulian Elischer 	 */
3575c8329edSJulian Elischer 	if ((!TAILQ_EMPTY(&zombie_threads))
358345ad866SJulian Elischer 	    || (!TAILQ_EMPTY(&zombie_ksegrps))) {
3595215b187SJeff Roberson 		mtx_lock_spin(&kse_zombie_lock);
3605c8329edSJulian Elischer 		td_first = TAILQ_FIRST(&zombie_threads);
3615c8329edSJulian Elischer 		kg_first = TAILQ_FIRST(&zombie_ksegrps);
3625c8329edSJulian Elischer 		if (td_first)
3635c8329edSJulian Elischer 			TAILQ_INIT(&zombie_threads);
3645c8329edSJulian Elischer 		if (kg_first)
3655c8329edSJulian Elischer 			TAILQ_INIT(&zombie_ksegrps);
3665215b187SJeff Roberson 		mtx_unlock_spin(&kse_zombie_lock);
3675c8329edSJulian Elischer 		while (td_first) {
3685c8329edSJulian Elischer 			td_next = TAILQ_NEXT(td_first, td_runq);
3695215b187SJeff Roberson 			if (td_first->td_ucred)
3705215b187SJeff Roberson 				crfree(td_first->td_ucred);
3715c8329edSJulian Elischer 			thread_free(td_first);
3725c8329edSJulian Elischer 			td_first = td_next;
37344990b8cSJulian Elischer 		}
3745c8329edSJulian Elischer 		while (kg_first) {
3755c8329edSJulian Elischer 			kg_next = TAILQ_NEXT(kg_first, kg_ksegrp);
3765c8329edSJulian Elischer 			ksegrp_free(kg_first);
3775c8329edSJulian Elischer 			kg_first = kg_next;
3785c8329edSJulian Elischer 		}
379ed062c8dSJulian Elischer 		/*
380ed062c8dSJulian Elischer 		 * there will always be a thread on the list if one of these
381ed062c8dSJulian Elischer 		 * is there.
382ed062c8dSJulian Elischer 		 */
383345ad866SJulian Elischer 		kse_GC();
38444990b8cSJulian Elischer 	}
385ed062c8dSJulian Elischer }
38644990b8cSJulian Elischer 
38744990b8cSJulian Elischer /*
3884f0db5e0SJulian Elischer  * Allocate a ksegrp.
3894f0db5e0SJulian Elischer  */
3904f0db5e0SJulian Elischer struct ksegrp *
3914f0db5e0SJulian Elischer ksegrp_alloc(void)
3924f0db5e0SJulian Elischer {
393a163d034SWarner Losh 	return (uma_zalloc(ksegrp_zone, M_WAITOK));
3944f0db5e0SJulian Elischer }
3954f0db5e0SJulian Elischer 
3964f0db5e0SJulian Elischer /*
39744990b8cSJulian Elischer  * Allocate a thread.
39844990b8cSJulian Elischer  */
39944990b8cSJulian Elischer struct thread *
40044990b8cSJulian Elischer thread_alloc(void)
40144990b8cSJulian Elischer {
40244990b8cSJulian Elischer 	thread_reap(); /* check if any zombies to get */
403a163d034SWarner Losh 	return (uma_zalloc(thread_zone, M_WAITOK));
40444990b8cSJulian Elischer }
40544990b8cSJulian Elischer 
40644990b8cSJulian Elischer /*
4074f0db5e0SJulian Elischer  * Deallocate a ksegrp.
4084f0db5e0SJulian Elischer  */
4094f0db5e0SJulian Elischer void
4104f0db5e0SJulian Elischer ksegrp_free(struct ksegrp *td)
4114f0db5e0SJulian Elischer {
4124f0db5e0SJulian Elischer 	uma_zfree(ksegrp_zone, td);
4134f0db5e0SJulian Elischer }
4144f0db5e0SJulian Elischer 
4154f0db5e0SJulian Elischer /*
41644990b8cSJulian Elischer  * Deallocate a thread.
41744990b8cSJulian Elischer  */
41844990b8cSJulian Elischer void
41944990b8cSJulian Elischer thread_free(struct thread *td)
42044990b8cSJulian Elischer {
421696058c3SJulian Elischer 
422696058c3SJulian Elischer 	cpu_thread_clean(td);
42344990b8cSJulian Elischer 	uma_zfree(thread_zone, td);
42444990b8cSJulian Elischer }
42544990b8cSJulian Elischer 
42644990b8cSJulian Elischer /*
42744990b8cSJulian Elischer  * Discard the current thread and exit from its context.
42894e0a4cdSJulian Elischer  * Always called with scheduler locked.
42944990b8cSJulian Elischer  *
43044990b8cSJulian Elischer  * Because we can't free a thread while we're operating under its context,
431696058c3SJulian Elischer  * push the current thread into our CPU's deadthread holder. This means
432696058c3SJulian Elischer  * we needn't worry about someone else grabbing our context before we
43394e0a4cdSJulian Elischer  * do a cpu_throw().  This may not be needed now as we are under schedlock.
43494e0a4cdSJulian Elischer  * Maybe we can just do a thread_stash() as thr_exit1 does.
43594e0a4cdSJulian Elischer  */
43694e0a4cdSJulian Elischer /*  XXX
43794e0a4cdSJulian Elischer  * libthr expects its thread exit to return for the last
43894e0a4cdSJulian Elischer  * thread, meaning that the program is back to non-threaded
43994e0a4cdSJulian Elischer  * mode I guess. Because we do this (cpu_throw) unconditionally
44094e0a4cdSJulian Elischer  * here, they have their own version of it. (thr_exit1())
44194e0a4cdSJulian Elischer  * that doesn't do it all if this was the last thread.
44294e0a4cdSJulian Elischer  * It is also called from thread_suspend_check().
44394e0a4cdSJulian Elischer  * Of course in the end, they end up coming here through exit1
44494e0a4cdSJulian Elischer  * anyhow..  After fixing 'thr' to play by the rules we should be able
44594e0a4cdSJulian Elischer  * to merge these two functions together.
446ed062c8dSJulian Elischer  *
447ed062c8dSJulian Elischer  * called from:
448ed062c8dSJulian Elischer  * exit1()
449ed062c8dSJulian Elischer  * kse_exit()
450ed062c8dSJulian Elischer  * thr_exit()
451ed062c8dSJulian Elischer  * thread_user_enter()
452ed062c8dSJulian Elischer  * thread_userret()
453ed062c8dSJulian Elischer  * thread_suspend_check()
45444990b8cSJulian Elischer  */
45544990b8cSJulian Elischer void
45644990b8cSJulian Elischer thread_exit(void)
45744990b8cSJulian Elischer {
458e170bfdaSDavid Xu 	uint64_t new_switchtime;
45944990b8cSJulian Elischer 	struct thread *td;
46044990b8cSJulian Elischer 	struct proc *p;
46144990b8cSJulian Elischer 	struct ksegrp	*kg;
46244990b8cSJulian Elischer 
46344990b8cSJulian Elischer 	td = curthread;
46444990b8cSJulian Elischer 	kg = td->td_ksegrp;
46544990b8cSJulian Elischer 	p = td->td_proc;
46644990b8cSJulian Elischer 
46744990b8cSJulian Elischer 	mtx_assert(&sched_lock, MA_OWNED);
468ed062c8dSJulian Elischer 	mtx_assert(&Giant, MA_NOTOWNED);
46944990b8cSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
470ed062c8dSJulian Elischer 	KASSERT(p != NULL, ("thread exiting without a process"));
471ed062c8dSJulian Elischer 	KASSERT(kg != NULL, ("thread exiting without a kse group"));
472cc701b73SRobert Watson 	CTR3(KTR_PROC, "thread_exit: thread %p (pid %ld, %s)", td,
473cc701b73SRobert Watson 	    (long)p->p_pid, p->p_comm);
4749104847fSDavid Xu 	KASSERT(TAILQ_EMPTY(&td->td_sigqueue.sq_list), ("signal pending"));
47544990b8cSJulian Elischer 
47689964dd2SRobert Watson #ifdef AUDIT
47789964dd2SRobert Watson 	AUDIT_SYSCALL_EXIT(0, td);
47889964dd2SRobert Watson #endif
47989964dd2SRobert Watson 
48048bfcdddSJulian Elischer 	if (td->td_standin != NULL) {
481ed062c8dSJulian Elischer 		/*
482ed062c8dSJulian Elischer 		 * Note that we don't need to free the cred here as it
483ed062c8dSJulian Elischer 		 * is done in thread_reap().
484ed062c8dSJulian Elischer 		 */
48548bfcdddSJulian Elischer 		thread_stash(td->td_standin);
48648bfcdddSJulian Elischer 		td->td_standin = NULL;
48748bfcdddSJulian Elischer 	}
48848bfcdddSJulian Elischer 
489ed062c8dSJulian Elischer 	/*
490ed062c8dSJulian Elischer 	 * drop FPU & debug register state storage, or any other
491ed062c8dSJulian Elischer 	 * architecture specific resources that
492ed062c8dSJulian Elischer 	 * would not be on a new untouched process.
493ed062c8dSJulian Elischer 	 */
49444990b8cSJulian Elischer 	cpu_thread_exit(td);	/* XXXSMP */
49544990b8cSJulian Elischer 
4961faf202eSJulian Elischer 	/*
497ed062c8dSJulian Elischer 	 * The thread is exiting. scheduler can release its stuff
498ed062c8dSJulian Elischer 	 * and collect stats etc.
499e170bfdaSDavid Xu 	 * XXX this is not very right, since PROC_UNLOCK may still
500e170bfdaSDavid Xu 	 * need scheduler stuff.
501ed062c8dSJulian Elischer 	 */
502ed062c8dSJulian Elischer 	sched_thread_exit(td);
503ed062c8dSJulian Elischer 
504e170bfdaSDavid Xu 	/* Do the same timestamp bookkeeping that mi_switch() would do. */
505e170bfdaSDavid Xu 	new_switchtime = cpu_ticks();
506e170bfdaSDavid Xu 	p->p_rux.rux_runtime += (new_switchtime - PCPU_GET(switchtime));
507e170bfdaSDavid Xu 	p->p_rux.rux_uticks += td->td_uticks;
508e170bfdaSDavid Xu 	p->p_rux.rux_sticks += td->td_sticks;
509e170bfdaSDavid Xu 	p->p_rux.rux_iticks += td->td_iticks;
510e170bfdaSDavid Xu 	PCPU_SET(switchtime, new_switchtime);
511e170bfdaSDavid Xu 	PCPU_SET(switchticks, ticks);
512e170bfdaSDavid Xu 	cnt.v_swtch++;
513e170bfdaSDavid Xu 
514e170bfdaSDavid Xu 	/* Add our usage into the usage of all our children. */
515e170bfdaSDavid Xu 	if (p->p_numthreads == 1)
516e170bfdaSDavid Xu 		ruadd(p->p_ru, &p->p_rux, &p->p_stats->p_cru, &p->p_crux);
517e170bfdaSDavid Xu 
518ed062c8dSJulian Elischer 	/*
5191faf202eSJulian Elischer 	 * The last thread is left attached to the process
5201faf202eSJulian Elischer 	 * So that the whole bundle gets recycled. Skip
521ed062c8dSJulian Elischer 	 * all this stuff if we never had threads.
522ed062c8dSJulian Elischer 	 * EXIT clears all sign of other threads when
523ed062c8dSJulian Elischer 	 * it goes to single threading, so the last thread always
524ed062c8dSJulian Elischer 	 * takes the short path.
5251faf202eSJulian Elischer 	 */
526ed062c8dSJulian Elischer 	if (p->p_flag & P_HADTHREADS) {
5271faf202eSJulian Elischer 		if (p->p_numthreads > 1) {
528d3a0bd78SJulian Elischer 			thread_unlink(td);
529ed062c8dSJulian Elischer 
530ed062c8dSJulian Elischer 			/* XXX first arg not used in 4BSD or ULE */
531ed062c8dSJulian Elischer 			sched_exit_thread(FIRST_THREAD_IN_PROC(p), td);
532ed062c8dSJulian Elischer 
533ed062c8dSJulian Elischer 			/*
53444990b8cSJulian Elischer 			 * The test below is NOT true if we are the
5351faf202eSJulian Elischer 			 * sole exiting thread. P_STOPPED_SNGL is unset
53644990b8cSJulian Elischer 			 * in exit1() after it is the only survivor.
53744990b8cSJulian Elischer 			 */
5381279572aSDavid Xu 			if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) {
53944990b8cSJulian Elischer 				if (p->p_numthreads == p->p_suspcount) {
54071fad9fdSJulian Elischer 					thread_unsuspend_one(p->p_singlethread);
54144990b8cSJulian Elischer 				}
54244990b8cSJulian Elischer 			}
54348bfcdddSJulian Elischer 
5445215b187SJeff Roberson 			/*
5455215b187SJeff Roberson 			 * Because each upcall structure has an owner thread,
5465215b187SJeff Roberson 			 * owner thread exits only when process is in exiting
5475215b187SJeff Roberson 			 * state, so upcall to userland is no longer needed,
5485215b187SJeff Roberson 			 * deleting upcall structure is safe here.
5495215b187SJeff Roberson 			 * So when all threads in a group is exited, all upcalls
5505215b187SJeff Roberson 			 * in the group should be automatically freed.
551ed062c8dSJulian Elischer 			 *  XXXKSE This is a KSE thing and should be exported
552ed062c8dSJulian Elischer 			 * there somehow.
5535215b187SJeff Roberson 			 */
5545215b187SJeff Roberson 			upcall_remove(td);
5556f8132a8SJulian Elischer 
55648bfcdddSJulian Elischer 			/*
557ed062c8dSJulian Elischer 			 * If the thread we unlinked above was the last one,
558ed062c8dSJulian Elischer 			 * then this ksegrp should go away too.
55948bfcdddSJulian Elischer 			 */
560ed062c8dSJulian Elischer 			if (kg->kg_numthreads == 0) {
561ed062c8dSJulian Elischer 				/*
562ed062c8dSJulian Elischer 				 * let the scheduler know about this in case
563ed062c8dSJulian Elischer 				 * it needs to recover stats or resources.
564ed062c8dSJulian Elischer 				 * Theoretically we could let
565ed062c8dSJulian Elischer 				 * sched_exit_ksegrp()  do the equivalent of
566ed062c8dSJulian Elischer 				 * setting the concurrency to 0
567ed062c8dSJulian Elischer 				 * but don't do it yet to avoid changing
568ed062c8dSJulian Elischer 				 * the existing scheduler code until we
569ed062c8dSJulian Elischer 				 * are ready.
570ed062c8dSJulian Elischer 				 * We supply a random other ksegrp
571ed062c8dSJulian Elischer 				 * as the recipient of any built up
572ed062c8dSJulian Elischer 				 * cpu usage etc. (If the scheduler wants it).
573ed062c8dSJulian Elischer 				 * XXXKSE
574ed062c8dSJulian Elischer 				 * This is probably not fair so think of
575ed062c8dSJulian Elischer  				 * a better answer.
576ed062c8dSJulian Elischer 				 */
57755d44f79SJulian Elischer 				sched_exit_ksegrp(FIRST_KSEGRP_IN_PROC(p), td);
578ed062c8dSJulian Elischer 				sched_set_concurrency(kg, 0); /* XXX TEMP */
579ab2baa72SDavid Xu 				ksegrp_unlink(kg);
580ed062c8dSJulian Elischer 				ksegrp_stash(kg);
581ab2baa72SDavid Xu 			}
5826f8132a8SJulian Elischer 			PROC_UNLOCK(p);
5835c8329edSJulian Elischer 			td->td_ksegrp	= NULL;
584696058c3SJulian Elischer 			PCPU_SET(deadthread, td);
5851faf202eSJulian Elischer 		} else {
586ed062c8dSJulian Elischer 			/*
587ed062c8dSJulian Elischer 			 * The last thread is exiting.. but not through exit()
588ed062c8dSJulian Elischer 			 * what should we do?
589ed062c8dSJulian Elischer 			 * Theoretically this can't happen
590ed062c8dSJulian Elischer  			 * exit1() - clears threading flags before coming here
591ed062c8dSJulian Elischer  			 * kse_exit() - treats last thread specially
592ed062c8dSJulian Elischer  			 * thr_exit() - treats last thread specially
593ed062c8dSJulian Elischer  			 * thread_user_enter() - only if more exist
594ed062c8dSJulian Elischer  			 * thread_userret() - only if more exist
595ed062c8dSJulian Elischer  			 * thread_suspend_check() - only if more exist
596ed062c8dSJulian Elischer 			 */
597ed062c8dSJulian Elischer 			panic ("thread_exit: Last thread exiting on its own");
598ed062c8dSJulian Elischer 		}
599ed062c8dSJulian Elischer 	} else {
600ed062c8dSJulian Elischer 		/*
601ed062c8dSJulian Elischer 		 * non threaded process comes here.
602ed062c8dSJulian Elischer 		 * This includes an EX threaded process that is coming
603ed062c8dSJulian Elischer 		 * here via exit1(). (exit1 dethreads the proc first).
604ed062c8dSJulian Elischer 		 */
6051faf202eSJulian Elischer 		PROC_UNLOCK(p);
6061faf202eSJulian Elischer 	}
607dcc9954eSJulian Elischer 	td->td_state = TDS_INACTIVE;
608732d9528SJulian Elischer 	CTR1(KTR_PROC, "thread_exit: cpu_throw() thread %p", td);
609cc66ebe2SPeter Wemm 	cpu_throw(td, choosethread());
610cc66ebe2SPeter Wemm 	panic("I'm a teapot!");
61144990b8cSJulian Elischer 	/* NOTREACHED */
61244990b8cSJulian Elischer }
61344990b8cSJulian Elischer 
61444990b8cSJulian Elischer /*
615696058c3SJulian Elischer  * Do any thread specific cleanups that may be needed in wait()
61637814395SPeter Wemm  * called with Giant, proc and schedlock not held.
617696058c3SJulian Elischer  */
618696058c3SJulian Elischer void
619696058c3SJulian Elischer thread_wait(struct proc *p)
620696058c3SJulian Elischer {
621696058c3SJulian Elischer 	struct thread *td;
622696058c3SJulian Elischer 
62337814395SPeter Wemm 	mtx_assert(&Giant, MA_NOTOWNED);
62485495c72SJens Schweikhardt 	KASSERT((p->p_numthreads == 1), ("Multiple threads in wait1()"));
62585495c72SJens Schweikhardt 	KASSERT((p->p_numksegrps == 1), ("Multiple ksegrps in wait1()"));
626696058c3SJulian Elischer 	FOREACH_THREAD_IN_PROC(p, td) {
627696058c3SJulian Elischer 		if (td->td_standin != NULL) {
628b75b0311SJulian Elischer 			if (td->td_standin->td_ucred != NULL) {
629b75b0311SJulian Elischer 				crfree(td->td_standin->td_ucred);
630b75b0311SJulian Elischer 				td->td_standin->td_ucred = NULL;
631b75b0311SJulian Elischer 			}
632696058c3SJulian Elischer 			thread_free(td->td_standin);
633696058c3SJulian Elischer 			td->td_standin = NULL;
634696058c3SJulian Elischer 		}
635696058c3SJulian Elischer 		cpu_thread_clean(td);
636ed062c8dSJulian Elischer 		crfree(td->td_ucred);
637696058c3SJulian Elischer 	}
638696058c3SJulian Elischer 	thread_reap();	/* check for zombie threads etc. */
639696058c3SJulian Elischer }
640696058c3SJulian Elischer 
641696058c3SJulian Elischer /*
64244990b8cSJulian Elischer  * Link a thread to a process.
6431faf202eSJulian Elischer  * set up anything that needs to be initialized for it to
6441faf202eSJulian Elischer  * be used by the process.
64544990b8cSJulian Elischer  *
64644990b8cSJulian Elischer  * Note that we do not link to the proc's ucred here.
64744990b8cSJulian Elischer  * The thread is linked as if running but no KSE assigned.
648ed062c8dSJulian Elischer  * Called from:
649ed062c8dSJulian Elischer  *  proc_linkup()
650ed062c8dSJulian Elischer  *  thread_schedule_upcall()
651ed062c8dSJulian Elischer  *  thr_create()
65244990b8cSJulian Elischer  */
65344990b8cSJulian Elischer void
65444990b8cSJulian Elischer thread_link(struct thread *td, struct ksegrp *kg)
65544990b8cSJulian Elischer {
65644990b8cSJulian Elischer 	struct proc *p;
65744990b8cSJulian Elischer 
65844990b8cSJulian Elischer 	p = kg->kg_proc;
65971fad9fdSJulian Elischer 	td->td_state    = TDS_INACTIVE;
66044990b8cSJulian Elischer 	td->td_proc     = p;
66144990b8cSJulian Elischer 	td->td_ksegrp   = kg;
6625215b187SJeff Roberson 	td->td_flags    = 0;
6634fc21c09SDaniel Eischen 	td->td_kflags	= 0;
66444990b8cSJulian Elischer 
6651faf202eSJulian Elischer 	LIST_INIT(&td->td_contested);
6669104847fSDavid Xu 	sigqueue_init(&td->td_sigqueue, p);
667c06eb4e2SSam Leffler 	callout_init(&td->td_slpcallout, CALLOUT_MPSAFE);
66844990b8cSJulian Elischer 	TAILQ_INSERT_HEAD(&p->p_threads, td, td_plist);
66944990b8cSJulian Elischer 	TAILQ_INSERT_HEAD(&kg->kg_threads, td, td_kglist);
67044990b8cSJulian Elischer 	p->p_numthreads++;
67144990b8cSJulian Elischer 	kg->kg_numthreads++;
67244990b8cSJulian Elischer }
67344990b8cSJulian Elischer 
674ed062c8dSJulian Elischer /*
675e5bedcefSJulian Elischer  * Convert a process with one thread to an unthreaded process.
676e5bedcefSJulian Elischer  * Called from:
677e5bedcefSJulian Elischer  *  thread_single(exit)  (called from execve and exit)
678e5bedcefSJulian Elischer  *  kse_exit()		XXX may need cleaning up wrt KSE stuff
679e5bedcefSJulian Elischer  */
680e5bedcefSJulian Elischer void
681e5bedcefSJulian Elischer thread_unthread(struct thread *td)
682e5bedcefSJulian Elischer {
683e5bedcefSJulian Elischer 	struct proc *p = td->td_proc;
684e5bedcefSJulian Elischer 
685e5bedcefSJulian Elischer 	KASSERT((p->p_numthreads == 1), ("Unthreading with >1 threads"));
686e5bedcefSJulian Elischer 	upcall_remove(td);
687e5bedcefSJulian Elischer 	p->p_flag &= ~(P_SA|P_HADTHREADS);
688e5bedcefSJulian Elischer 	td->td_mailbox = NULL;
689e5bedcefSJulian Elischer 	td->td_pflags &= ~(TDP_SA | TDP_CAN_UNBIND);
690e5bedcefSJulian Elischer 	if (td->td_standin != NULL) {
691e5bedcefSJulian Elischer 		thread_stash(td->td_standin);
692e5bedcefSJulian Elischer 		td->td_standin = NULL;
693e5bedcefSJulian Elischer 	}
694e5bedcefSJulian Elischer 	sched_set_concurrency(td->td_ksegrp, 1);
695e5bedcefSJulian Elischer }
696e5bedcefSJulian Elischer 
697e5bedcefSJulian Elischer /*
698ed062c8dSJulian Elischer  * Called from:
699ed062c8dSJulian Elischer  *  thread_exit()
700ed062c8dSJulian Elischer  */
701d3a0bd78SJulian Elischer void
702d3a0bd78SJulian Elischer thread_unlink(struct thread *td)
703d3a0bd78SJulian Elischer {
704d3a0bd78SJulian Elischer 	struct proc *p = td->td_proc;
705d3a0bd78SJulian Elischer 	struct ksegrp *kg = td->td_ksegrp;
706d3a0bd78SJulian Elischer 
707112afcb2SJohn Baldwin 	mtx_assert(&sched_lock, MA_OWNED);
708d3a0bd78SJulian Elischer 	TAILQ_REMOVE(&p->p_threads, td, td_plist);
709d3a0bd78SJulian Elischer 	p->p_numthreads--;
710d3a0bd78SJulian Elischer 	TAILQ_REMOVE(&kg->kg_threads, td, td_kglist);
711d3a0bd78SJulian Elischer 	kg->kg_numthreads--;
712d3a0bd78SJulian Elischer 	/* could clear a few other things here */
713ed062c8dSJulian Elischer 	/* Must  NOT clear links to proc and ksegrp! */
7145c8329edSJulian Elischer }
7155c8329edSJulian Elischer 
7165215b187SJeff Roberson /*
71744990b8cSJulian Elischer  * Enforce single-threading.
71844990b8cSJulian Elischer  *
71944990b8cSJulian Elischer  * Returns 1 if the caller must abort (another thread is waiting to
72044990b8cSJulian Elischer  * exit the process or similar). Process is locked!
72144990b8cSJulian Elischer  * Returns 0 when you are successfully the only thread running.
72244990b8cSJulian Elischer  * A process has successfully single threaded in the suspend mode when
72344990b8cSJulian Elischer  * There are no threads in user mode. Threads in the kernel must be
72444990b8cSJulian Elischer  * allowed to continue until they get to the user boundary. They may even
72544990b8cSJulian Elischer  * copy out their return values and data before suspending. They may however be
726e2668f55SMaxim Konovalov  * accelerated in reaching the user boundary as we will wake up
72744990b8cSJulian Elischer  * any sleeping threads that are interruptable. (PCATCH).
72844990b8cSJulian Elischer  */
72944990b8cSJulian Elischer int
730906ac69dSDavid Xu thread_single(int mode)
73144990b8cSJulian Elischer {
73244990b8cSJulian Elischer 	struct thread *td;
73344990b8cSJulian Elischer 	struct thread *td2;
73444990b8cSJulian Elischer 	struct proc *p;
735ec008e96SDavid Xu 	int remaining;
73644990b8cSJulian Elischer 
73744990b8cSJulian Elischer 	td = curthread;
73844990b8cSJulian Elischer 	p = td->td_proc;
73937814395SPeter Wemm 	mtx_assert(&Giant, MA_NOTOWNED);
74044990b8cSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
74144990b8cSJulian Elischer 	KASSERT((td != NULL), ("curthread is NULL"));
74244990b8cSJulian Elischer 
743ed062c8dSJulian Elischer 	if ((p->p_flag & P_HADTHREADS) == 0)
74444990b8cSJulian Elischer 		return (0);
74544990b8cSJulian Elischer 
746e3b9bf71SJulian Elischer 	/* Is someone already single threading? */
747906ac69dSDavid Xu 	if (p->p_singlethread != NULL && p->p_singlethread != td)
74844990b8cSJulian Elischer 		return (1);
74944990b8cSJulian Elischer 
750906ac69dSDavid Xu 	if (mode == SINGLE_EXIT) {
751906ac69dSDavid Xu 		p->p_flag |= P_SINGLE_EXIT;
752906ac69dSDavid Xu 		p->p_flag &= ~P_SINGLE_BOUNDARY;
753906ac69dSDavid Xu 	} else {
754906ac69dSDavid Xu 		p->p_flag &= ~P_SINGLE_EXIT;
755906ac69dSDavid Xu 		if (mode == SINGLE_BOUNDARY)
756906ac69dSDavid Xu 			p->p_flag |= P_SINGLE_BOUNDARY;
757906ac69dSDavid Xu 		else
758906ac69dSDavid Xu 			p->p_flag &= ~P_SINGLE_BOUNDARY;
759906ac69dSDavid Xu 	}
7601279572aSDavid Xu 	p->p_flag |= P_STOPPED_SINGLE;
76171fad9fdSJulian Elischer 	mtx_lock_spin(&sched_lock);
762112afcb2SJohn Baldwin 	p->p_singlethread = td;
763906ac69dSDavid Xu 	if (mode == SINGLE_EXIT)
764ec008e96SDavid Xu 		remaining = p->p_numthreads;
765906ac69dSDavid Xu 	else if (mode == SINGLE_BOUNDARY)
766906ac69dSDavid Xu 		remaining = p->p_numthreads - p->p_boundary_count;
767906ac69dSDavid Xu 	else
768ec008e96SDavid Xu 		remaining = p->p_numthreads - p->p_suspcount;
769ec008e96SDavid Xu 	while (remaining != 1) {
770bf1a3220SDavid Xu 		if (P_SHOULDSTOP(p) != P_STOPPED_SINGLE)
771bf1a3220SDavid Xu 			goto stopme;
77244990b8cSJulian Elischer 		FOREACH_THREAD_IN_PROC(p, td2) {
77344990b8cSJulian Elischer 			if (td2 == td)
77444990b8cSJulian Elischer 				continue;
775588257e8SDavid Xu 			td2->td_flags |= TDF_ASTPENDING;
77671fad9fdSJulian Elischer 			if (TD_IS_INHIBITED(td2)) {
777906ac69dSDavid Xu 				switch (mode) {
778906ac69dSDavid Xu 				case SINGLE_EXIT:
779cbf4e354SDavid Xu 					if (td->td_flags & TDF_DBSUSPEND)
780cbf4e354SDavid Xu 						td->td_flags &= ~TDF_DBSUSPEND;
781906ac69dSDavid Xu 					if (TD_IS_SUSPENDED(td2))
78271fad9fdSJulian Elischer 						thread_unsuspend_one(td2);
78333862f40SDavid Xu 					if (TD_ON_SLEEPQ(td2) &&
784906ac69dSDavid Xu 					    (td2->td_flags & TDF_SINTR))
78594f0972bSDavid Xu 						sleepq_abort(td2, EINTR);
786906ac69dSDavid Xu 					break;
787906ac69dSDavid Xu 				case SINGLE_BOUNDARY:
788906ac69dSDavid Xu 					if (TD_IS_SUSPENDED(td2) &&
789906ac69dSDavid Xu 					    !(td2->td_flags & TDF_BOUNDARY))
790906ac69dSDavid Xu 						thread_unsuspend_one(td2);
791906ac69dSDavid Xu 					if (TD_ON_SLEEPQ(td2) &&
792906ac69dSDavid Xu 					    (td2->td_flags & TDF_SINTR))
79394f0972bSDavid Xu 						sleepq_abort(td2, ERESTART);
794906ac69dSDavid Xu 					break;
795906ac69dSDavid Xu 				default:
7969d102777SJulian Elischer 					if (TD_IS_SUSPENDED(td2))
7979d102777SJulian Elischer 						continue;
7985215b187SJeff Roberson 					/*
7995215b187SJeff Roberson 					 * maybe other inhibitted states too?
8005215b187SJeff Roberson 					 */
8018acf6057SDavid Xu 					if ((td2->td_flags & TDF_SINTR) &&
8028acf6057SDavid Xu 					    (td2->td_inhibitors &
8038acf6057SDavid Xu 					    (TDI_SLEEPING | TDI_SWAPPED)))
8049d102777SJulian Elischer 						thread_suspend_one(td2);
805906ac69dSDavid Xu 					break;
80644990b8cSJulian Elischer 				}
80744990b8cSJulian Elischer 			}
808d8267df7SDavid Xu #ifdef SMP
809d8267df7SDavid Xu 			else if (TD_IS_RUNNING(td2) && td != td2) {
810d8267df7SDavid Xu 				forward_signal(td2);
811d8267df7SDavid Xu 			}
812d8267df7SDavid Xu #endif
8139d102777SJulian Elischer 		}
814906ac69dSDavid Xu 		if (mode == SINGLE_EXIT)
815ec008e96SDavid Xu 			remaining = p->p_numthreads;
816906ac69dSDavid Xu 		else if (mode == SINGLE_BOUNDARY)
817906ac69dSDavid Xu 			remaining = p->p_numthreads - p->p_boundary_count;
818ec008e96SDavid Xu 		else
819ec008e96SDavid Xu 			remaining = p->p_numthreads - p->p_suspcount;
820ec008e96SDavid Xu 
8219d102777SJulian Elischer 		/*
8229d102777SJulian Elischer 		 * Maybe we suspended some threads.. was it enough?
8239d102777SJulian Elischer 		 */
824ec008e96SDavid Xu 		if (remaining == 1)
8259d102777SJulian Elischer 			break;
8269d102777SJulian Elischer 
827bf1a3220SDavid Xu stopme:
82844990b8cSJulian Elischer 		/*
82944990b8cSJulian Elischer 		 * Wake us up when everyone else has suspended.
830e3b9bf71SJulian Elischer 		 * In the mean time we suspend as well.
83144990b8cSJulian Elischer 		 */
832568b4ebbSDavid Xu 		thread_stopped(p);
83371fad9fdSJulian Elischer 		thread_suspend_one(td);
83444990b8cSJulian Elischer 		PROC_UNLOCK(p);
835bf0acc27SJohn Baldwin 		mi_switch(SW_VOL, NULL);
83644990b8cSJulian Elischer 		mtx_unlock_spin(&sched_lock);
83744990b8cSJulian Elischer 		PROC_LOCK(p);
838112afcb2SJohn Baldwin 		mtx_lock_spin(&sched_lock);
839906ac69dSDavid Xu 		if (mode == SINGLE_EXIT)
840ec008e96SDavid Xu 			remaining = p->p_numthreads;
841906ac69dSDavid Xu 		else if (mode == SINGLE_BOUNDARY)
842906ac69dSDavid Xu 			remaining = p->p_numthreads - p->p_boundary_count;
843ec008e96SDavid Xu 		else
844ec008e96SDavid Xu 			remaining = p->p_numthreads - p->p_suspcount;
84544990b8cSJulian Elischer 	}
846906ac69dSDavid Xu 	if (mode == SINGLE_EXIT) {
84791599697SJulian Elischer 		/*
84891599697SJulian Elischer 		 * We have gotten rid of all the other threads and we
84991599697SJulian Elischer 		 * are about to either exit or exec. In either case,
85091599697SJulian Elischer 		 * we try our utmost  to revert to being a non-threaded
85191599697SJulian Elischer 		 * process.
85291599697SJulian Elischer 		 */
853ed062c8dSJulian Elischer 		p->p_singlethread = NULL;
85464895117SDavid Xu 		p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT);
855e5bedcefSJulian Elischer 		thread_unthread(td);
85691599697SJulian Elischer 	}
857112afcb2SJohn Baldwin 	mtx_unlock_spin(&sched_lock);
85844990b8cSJulian Elischer 	return (0);
85944990b8cSJulian Elischer }
86044990b8cSJulian Elischer 
86144990b8cSJulian Elischer /*
86244990b8cSJulian Elischer  * Called in from locations that can safely check to see
86344990b8cSJulian Elischer  * whether we have to suspend or at least throttle for a
86444990b8cSJulian Elischer  * single-thread event (e.g. fork).
86544990b8cSJulian Elischer  *
86644990b8cSJulian Elischer  * Such locations include userret().
86744990b8cSJulian Elischer  * If the "return_instead" argument is non zero, the thread must be able to
86844990b8cSJulian Elischer  * accept 0 (caller may continue), or 1 (caller must abort) as a result.
86944990b8cSJulian Elischer  *
87044990b8cSJulian Elischer  * The 'return_instead' argument tells the function if it may do a
87144990b8cSJulian Elischer  * thread_exit() or suspend, or whether the caller must abort and back
87244990b8cSJulian Elischer  * out instead.
87344990b8cSJulian Elischer  *
87444990b8cSJulian Elischer  * If the thread that set the single_threading request has set the
87544990b8cSJulian Elischer  * P_SINGLE_EXIT bit in the process flags then this call will never return
87644990b8cSJulian Elischer  * if 'return_instead' is false, but will exit.
87744990b8cSJulian Elischer  *
87844990b8cSJulian Elischer  * P_SINGLE_EXIT | return_instead == 0| return_instead != 0
87944990b8cSJulian Elischer  *---------------+--------------------+---------------------
88044990b8cSJulian Elischer  *       0       | returns 0          |   returns 0 or 1
88144990b8cSJulian Elischer  *               | when ST ends       |   immediatly
88244990b8cSJulian Elischer  *---------------+--------------------+---------------------
88344990b8cSJulian Elischer  *       1       | thread exits       |   returns 1
88444990b8cSJulian Elischer  *               |                    |  immediatly
88544990b8cSJulian Elischer  * 0 = thread_exit() or suspension ok,
88644990b8cSJulian Elischer  * other = return error instead of stopping the thread.
88744990b8cSJulian Elischer  *
88844990b8cSJulian Elischer  * While a full suspension is under effect, even a single threading
88944990b8cSJulian Elischer  * thread would be suspended if it made this call (but it shouldn't).
89044990b8cSJulian Elischer  * This call should only be made from places where
89144990b8cSJulian Elischer  * thread_exit() would be safe as that may be the outcome unless
89244990b8cSJulian Elischer  * return_instead is set.
89344990b8cSJulian Elischer  */
89444990b8cSJulian Elischer int
89544990b8cSJulian Elischer thread_suspend_check(int return_instead)
89644990b8cSJulian Elischer {
897ecafb24bSJuli Mallett 	struct thread *td;
898ecafb24bSJuli Mallett 	struct proc *p;
89944990b8cSJulian Elischer 
90044990b8cSJulian Elischer 	td = curthread;
90144990b8cSJulian Elischer 	p = td->td_proc;
90237814395SPeter Wemm 	mtx_assert(&Giant, MA_NOTOWNED);
90344990b8cSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
904cbf4e354SDavid Xu 	while (P_SHOULDSTOP(p) ||
905cbf4e354SDavid Xu 	      ((p->p_flag & P_TRACED) && (td->td_flags & TDF_DBSUSPEND))) {
9061279572aSDavid Xu 		if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) {
90744990b8cSJulian Elischer 			KASSERT(p->p_singlethread != NULL,
90844990b8cSJulian Elischer 			    ("singlethread not set"));
90944990b8cSJulian Elischer 			/*
910e3b9bf71SJulian Elischer 			 * The only suspension in action is a
911e3b9bf71SJulian Elischer 			 * single-threading. Single threader need not stop.
912b6d5995eSJulian Elischer 			 * XXX Should be safe to access unlocked
913b6d5995eSJulian Elischer 			 * as it can only be set to be true by us.
91444990b8cSJulian Elischer 			 */
915e3b9bf71SJulian Elischer 			if (p->p_singlethread == td)
91644990b8cSJulian Elischer 				return (0);	/* Exempt from stopping. */
91744990b8cSJulian Elischer 		}
91845a4bfa1SDavid Xu 		if ((p->p_flag & P_SINGLE_EXIT) && return_instead)
91994f0972bSDavid Xu 			return (EINTR);
92044990b8cSJulian Elischer 
921906ac69dSDavid Xu 		/* Should we goto user boundary if we didn't come from there? */
922906ac69dSDavid Xu 		if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE &&
923906ac69dSDavid Xu 		    (p->p_flag & P_SINGLE_BOUNDARY) && return_instead)
92494f0972bSDavid Xu 			return (ERESTART);
925906ac69dSDavid Xu 
9269104847fSDavid Xu 		/* If thread will exit, flush its pending signals */
9279104847fSDavid Xu 		if ((p->p_flag & P_SINGLE_EXIT) && (p->p_singlethread != td))
9289104847fSDavid Xu 			sigqueue_flush(&td->td_sigqueue);
9299104847fSDavid Xu 
930e574e444SDavid Xu 		mtx_lock_spin(&sched_lock);
931e574e444SDavid Xu 		thread_stopped(p);
93244990b8cSJulian Elischer 		/*
93344990b8cSJulian Elischer 		 * If the process is waiting for us to exit,
93444990b8cSJulian Elischer 		 * this thread should just suicide.
9351279572aSDavid Xu 		 * Assumes that P_SINGLE_EXIT implies P_STOPPED_SINGLE.
93644990b8cSJulian Elischer 		 */
937906ac69dSDavid Xu 		if ((p->p_flag & P_SINGLE_EXIT) && (p->p_singlethread != td))
93844990b8cSJulian Elischer 			thread_exit();
93944990b8cSJulian Elischer 
94044990b8cSJulian Elischer 		/*
94144990b8cSJulian Elischer 		 * When a thread suspends, it just
94244990b8cSJulian Elischer 		 * moves to the processes's suspend queue
94344990b8cSJulian Elischer 		 * and stays there.
94444990b8cSJulian Elischer 		 */
94571fad9fdSJulian Elischer 		thread_suspend_one(td);
946906ac69dSDavid Xu 		if (return_instead == 0) {
947906ac69dSDavid Xu 			p->p_boundary_count++;
948906ac69dSDavid Xu 			td->td_flags |= TDF_BOUNDARY;
949cf19bf91SJulian Elischer 		}
950906ac69dSDavid Xu 		if (P_SHOULDSTOP(p) == P_STOPPED_SINGLE) {
951906ac69dSDavid Xu 			if (p->p_numthreads == p->p_suspcount)
952906ac69dSDavid Xu 				thread_unsuspend_one(p->p_singlethread);
953cf19bf91SJulian Elischer 		}
954a6f37ac9SJohn Baldwin 		PROC_UNLOCK(p);
955bf0acc27SJohn Baldwin 		mi_switch(SW_INVOL, NULL);
956906ac69dSDavid Xu 		if (return_instead == 0) {
957906ac69dSDavid Xu 			p->p_boundary_count--;
958906ac69dSDavid Xu 			td->td_flags &= ~TDF_BOUNDARY;
959906ac69dSDavid Xu 		}
96044990b8cSJulian Elischer 		mtx_unlock_spin(&sched_lock);
96144990b8cSJulian Elischer 		PROC_LOCK(p);
96244990b8cSJulian Elischer 	}
96344990b8cSJulian Elischer 	return (0);
96444990b8cSJulian Elischer }
96544990b8cSJulian Elischer 
96635c32a76SDavid Xu void
96735c32a76SDavid Xu thread_suspend_one(struct thread *td)
96835c32a76SDavid Xu {
96935c32a76SDavid Xu 	struct proc *p = td->td_proc;
97035c32a76SDavid Xu 
97135c32a76SDavid Xu 	mtx_assert(&sched_lock, MA_OWNED);
972112afcb2SJohn Baldwin 	PROC_LOCK_ASSERT(p, MA_OWNED);
973e574e444SDavid Xu 	KASSERT(!TD_IS_SUSPENDED(td), ("already suspended"));
97435c32a76SDavid Xu 	p->p_suspcount++;
97571fad9fdSJulian Elischer 	TD_SET_SUSPENDED(td);
97635c32a76SDavid Xu 	TAILQ_INSERT_TAIL(&p->p_suspended, td, td_runq);
97735c32a76SDavid Xu }
97835c32a76SDavid Xu 
97935c32a76SDavid Xu void
98035c32a76SDavid Xu thread_unsuspend_one(struct thread *td)
98135c32a76SDavid Xu {
98235c32a76SDavid Xu 	struct proc *p = td->td_proc;
98335c32a76SDavid Xu 
98435c32a76SDavid Xu 	mtx_assert(&sched_lock, MA_OWNED);
985112afcb2SJohn Baldwin 	PROC_LOCK_ASSERT(p, MA_OWNED);
98635c32a76SDavid Xu 	TAILQ_REMOVE(&p->p_suspended, td, td_runq);
98771fad9fdSJulian Elischer 	TD_CLR_SUSPENDED(td);
98835c32a76SDavid Xu 	p->p_suspcount--;
98971fad9fdSJulian Elischer 	setrunnable(td);
99035c32a76SDavid Xu }
99135c32a76SDavid Xu 
99244990b8cSJulian Elischer /*
99344990b8cSJulian Elischer  * Allow all threads blocked by single threading to continue running.
99444990b8cSJulian Elischer  */
99544990b8cSJulian Elischer void
99644990b8cSJulian Elischer thread_unsuspend(struct proc *p)
99744990b8cSJulian Elischer {
99844990b8cSJulian Elischer 	struct thread *td;
99944990b8cSJulian Elischer 
1000b6d5995eSJulian Elischer 	mtx_assert(&sched_lock, MA_OWNED);
100144990b8cSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
100244990b8cSJulian Elischer 	if (!P_SHOULDSTOP(p)) {
100344990b8cSJulian Elischer 		while ((td = TAILQ_FIRST(&p->p_suspended))) {
100435c32a76SDavid Xu 			thread_unsuspend_one(td);
100544990b8cSJulian Elischer 		}
10061279572aSDavid Xu 	} else if ((P_SHOULDSTOP(p) == P_STOPPED_SINGLE) &&
100744990b8cSJulian Elischer 	    (p->p_numthreads == p->p_suspcount)) {
100844990b8cSJulian Elischer 		/*
100944990b8cSJulian Elischer 		 * Stopping everything also did the job for the single
101044990b8cSJulian Elischer 		 * threading request. Now we've downgraded to single-threaded,
101144990b8cSJulian Elischer 		 * let it continue.
101244990b8cSJulian Elischer 		 */
101335c32a76SDavid Xu 		thread_unsuspend_one(p->p_singlethread);
101444990b8cSJulian Elischer 	}
101544990b8cSJulian Elischer }
101644990b8cSJulian Elischer 
1017ed062c8dSJulian Elischer /*
1018ed062c8dSJulian Elischer  * End the single threading mode..
1019ed062c8dSJulian Elischer  */
102044990b8cSJulian Elischer void
102144990b8cSJulian Elischer thread_single_end(void)
102244990b8cSJulian Elischer {
102344990b8cSJulian Elischer 	struct thread *td;
102444990b8cSJulian Elischer 	struct proc *p;
102544990b8cSJulian Elischer 
102644990b8cSJulian Elischer 	td = curthread;
102744990b8cSJulian Elischer 	p = td->td_proc;
102844990b8cSJulian Elischer 	PROC_LOCK_ASSERT(p, MA_OWNED);
1029906ac69dSDavid Xu 	p->p_flag &= ~(P_STOPPED_SINGLE | P_SINGLE_EXIT | P_SINGLE_BOUNDARY);
1030112afcb2SJohn Baldwin 	mtx_lock_spin(&sched_lock);
103144990b8cSJulian Elischer 	p->p_singlethread = NULL;
103221fc3164SDavid Xu 	p->p_procscopegrp = NULL;
103349539972SJulian Elischer 	/*
103449539972SJulian Elischer 	 * If there are other threads they mey now run,
103549539972SJulian Elischer 	 * unless of course there is a blanket 'stop order'
103649539972SJulian Elischer 	 * on the process. The single threader must be allowed
103749539972SJulian Elischer 	 * to continue however as this is a bad place to stop.
103849539972SJulian Elischer 	 */
103949539972SJulian Elischer 	if ((p->p_numthreads != 1) && (!P_SHOULDSTOP(p))) {
104049539972SJulian Elischer 		while ((td = TAILQ_FIRST(&p->p_suspended))) {
104171fad9fdSJulian Elischer 			thread_unsuspend_one(td);
104244990b8cSJulian Elischer 		}
104349539972SJulian Elischer 	}
1044112afcb2SJohn Baldwin 	mtx_unlock_spin(&sched_lock);
104549539972SJulian Elischer }
10464fc21c09SDaniel Eischen 
104744355392SDavid Xu struct thread *
104844355392SDavid Xu thread_find(struct proc *p, lwpid_t tid)
104944355392SDavid Xu {
105044355392SDavid Xu 	struct thread *td;
105144355392SDavid Xu 
105244355392SDavid Xu 	PROC_LOCK_ASSERT(p, MA_OWNED);
105344355392SDavid Xu 	mtx_lock_spin(&sched_lock);
105444355392SDavid Xu 	FOREACH_THREAD_IN_PROC(p, td) {
105544355392SDavid Xu 		if (td->td_tid == tid)
105644355392SDavid Xu 			break;
105744355392SDavid Xu 	}
105844355392SDavid Xu 	mtx_unlock_spin(&sched_lock);
105944355392SDavid Xu 	return (td);
106044355392SDavid Xu }
1061