/* xref: /linux/include/linux/sched.h (revision d9345c65eb7930ac6755cf593ee7686f4029ccf4) */
#ifndef _LINUX_SCHED_H
#define _LINUX_SCHED_H

#include <uapi/linux/sched.h>

#include <linux/sched/prio.h>


struct sched_param {
	int sched_priority;
};

#include <asm/param.h>	/* for HZ */

#include <linux/capability.h>
#include <linux/threads.h>
#include <linux/kernel.h>
#include <linux/types.h>
#include <linux/timex.h>
#include <linux/jiffies.h>
#include <linux/plist.h>
#include <linux/rbtree.h>
#include <linux/thread_info.h>
#include <linux/cpumask.h>
#include <linux/errno.h>
#include <linux/nodemask.h>
#include <linux/mm_types.h>
#include <linux/preempt.h>

#include <asm/page.h>
#include <asm/ptrace.h>
#include <linux/cputime.h>

#include <linux/smp.h>
#include <linux/sem.h>
#include <linux/shm.h>
#include <linux/signal.h>
#include <linux/compiler.h>
#include <linux/completion.h>
#include <linux/pid.h>
#include <linux/percpu.h>
#include <linux/topology.h>
#include <linux/seccomp.h>
#include <linux/rcupdate.h>
#include <linux/rculist.h>
#include <linux/rtmutex.h>

#include <linux/time.h>
#include <linux/param.h>
#include <linux/resource.h>
#include <linux/timer.h>
#include <linux/hrtimer.h>
#include <linux/kcov.h>
#include <linux/task_io_accounting.h>
#include <linux/latencytop.h>
#include <linux/cred.h>
#include <linux/llist.h>
#include <linux/uidgid.h>
#include <linux/gfp.h>
#include <linux/magic.h>
#include <linux/cgroup-defs.h>

#include <asm/processor.h>

#define SCHED_ATTR_SIZE_VER0	48	/* sizeof first published struct */

/*
 * Extended scheduling parameters data structure.
 *
 * This is needed because the original struct sched_param cannot be
 * altered without introducing ABI issues with legacy applications
 * (e.g., in sched_getparam()).
 *
 * However, the possibility of specifying more than just a priority for
 * the tasks may be useful for a wide variety of application fields, e.g.,
 * multimedia, streaming, automation and control, and many others.
 *
 * This variant (sched_attr) is meant to describe a so-called
 * sporadic time-constrained task. In such a model, a task is specified by:
 *  - the activation period or minimum instance inter-arrival time;
 *  - the maximum (or average, depending on the actual scheduling
 *    discipline) computation time of all instances, a.k.a. runtime;
 *  - the deadline (relative to the actual activation time) of each
 *    instance.
 * Very briefly, a periodic (sporadic) task asks for the execution of
 * some specific computation --which is typically called an instance--
 * (at most) every period. Moreover, each instance typically lasts no more
 * than the runtime and must be completed by time instant t equal to
 * the instance activation time + the deadline.
 *
 * This is reflected by the actual fields of the sched_attr structure:
 *
 *  @size		size of the structure, for fwd/bwd compat.
 *
 *  @sched_policy	task's scheduling policy
 *  @sched_flags	for customizing the scheduler behaviour
 *  @sched_nice		task's nice value      (SCHED_NORMAL/BATCH)
 *  @sched_priority	task's static priority (SCHED_FIFO/RR)
 *  @sched_deadline	representative of the task's deadline
 *  @sched_runtime	representative of the task's runtime
 *  @sched_period	representative of the task's period
 *
 * Given this task model, there is a multiplicity of scheduling algorithms
 * and policies that can be used to ensure all tasks meet their
 * timing constraints.
 *
 * As of now, the SCHED_DEADLINE policy (sched_dl scheduling class) is the
 * only user of this new interface. More information about the algorithm
 * is available in the scheduling class file or in Documentation/.
 */
struct sched_attr {
	u32 size;

	u32 sched_policy;
	u64 sched_flags;

	/* SCHED_NORMAL, SCHED_BATCH */
	s32 sched_nice;

	/* SCHED_FIFO, SCHED_RR */
	u32 sched_priority;

	/* SCHED_DEADLINE */
	u64 sched_runtime;
	u64 sched_deadline;
	u64 sched_period;
};
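
/*
 * For illustration only -- a minimal userspace sketch of setting up a
 * SCHED_DEADLINE task via the sched_setattr() syscall (pid 0 means the
 * calling thread; the 10ms/30ms/100ms values below are hypothetical):
 *
 *	struct sched_attr attr = {
 *		.size		= sizeof(attr),
 *		.sched_policy	= SCHED_DEADLINE,
 *		.sched_runtime	=  10 * 1000 * 1000,	// 10ms,  in ns
 *		.sched_deadline	=  30 * 1000 * 1000,	// 30ms,  in ns
 *		.sched_period	= 100 * 1000 * 1000,	// 100ms, in ns
 *	};
 *
 *	if (sched_setattr(0, &attr, 0))
 *		perror("sched_setattr");
 */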

struct futex_pi_state;
struct robust_list_head;
struct bio_list;
struct fs_struct;
struct perf_event_context;
struct blk_plug;
struct filename;
struct nameidata;

#define VMACACHE_BITS 2
#define VMACACHE_SIZE (1U << VMACACHE_BITS)
#define VMACACHE_MASK (VMACACHE_SIZE - 1)

/*
 * These are the constants used to fake the fixed-point load-average
 * counting. Some notes:
 *  - 11 bit fractions expand to 22 bits by the multiplies: this gives
 *    a load-average precision of 10 bits integer + 11 bits fractional
 *  - if you want to count load-averages more often, you need more
 *    precision, or rounding will get you. With 2-second counting freq,
 *    the EXP_n values would be 1981, 2034 and 2043 if still using only
 *    11 bit fractions.
 */
extern unsigned long avenrun[];		/* Load averages */
extern void get_avenrun(unsigned long *loads, unsigned long offset, int shift);

#define FSHIFT		11		/* nr of bits of precision */
#define FIXED_1		(1<<FSHIFT)	/* 1.0 as fixed-point */
#define LOAD_FREQ	(5*HZ+1)	/* 5 sec intervals */
#define EXP_1		1884		/* 1/exp(5sec/1min) as fixed-point */
#define EXP_5		2014		/* 1/exp(5sec/5min) */
#define EXP_15		2037		/* 1/exp(5sec/15min) */

#define CALC_LOAD(load,exp,n) \
	load *= exp; \
	load += n*(FIXED_1-exp); \
	load >>= FSHIFT;
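
/*
 * Worked example (for illustration): with FIXED_1 == 2048 and EXP_1 == 1884,
 * one CALC_LOAD step on an idle system (n == 0) turns a load of 1.0 into
 * (2048 * 1884) >> 11 == 1884, i.e. ~0.92 -- the intended 1/exp(5sec/1min)
 * decay per LOAD_FREQ interval.
 */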

extern unsigned long total_forks;
extern int nr_threads;
DECLARE_PER_CPU(unsigned long, process_counts);
extern int nr_processes(void);
extern unsigned long nr_running(void);
extern bool single_task_running(void);
extern unsigned long nr_iowait(void);
extern unsigned long nr_iowait_cpu(int cpu);
extern void get_iowait_load(unsigned long *nr_waiters, unsigned long *load);

extern void calc_global_load(unsigned long ticks);

#if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON)
extern void cpu_load_update_nohz_start(void);
extern void cpu_load_update_nohz_stop(void);
#else
static inline void cpu_load_update_nohz_start(void) { }
static inline void cpu_load_update_nohz_stop(void) { }
#endif

extern void dump_cpu_task(int cpu);

struct seq_file;
struct cfs_rq;
struct task_group;
#ifdef CONFIG_SCHED_DEBUG
extern void proc_sched_show_task(struct task_struct *p, struct seq_file *m);
extern void proc_sched_set_task(struct task_struct *p);
#endif

/*
 * Task state bitmask. NOTE! These bits are also
 * encoded in fs/proc/array.c: get_task_state().
 *
 * We have two separate sets of flags: task->state
 * is about runnability, while task->exit_state is
 * about the task exiting. Confusing, but this way
 * modifying one set can't modify the other one by
 * mistake.
 */
#define TASK_RUNNING		0
#define TASK_INTERRUPTIBLE	1
#define TASK_UNINTERRUPTIBLE	2
#define __TASK_STOPPED		4
#define __TASK_TRACED		8
/* in tsk->exit_state */
#define EXIT_DEAD		16
#define EXIT_ZOMBIE		32
#define EXIT_TRACE		(EXIT_ZOMBIE | EXIT_DEAD)
/* in tsk->state again */
#define TASK_DEAD		64
#define TASK_WAKEKILL		128
#define TASK_WAKING		256
#define TASK_PARKED		512
#define TASK_NOLOAD		1024
#define TASK_NEW		2048
#define TASK_STATE_MAX		4096

#define TASK_STATE_TO_CHAR_STR "RSDTtXZxKWPNn"

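/*
 * Build-time assertion (the array size goes negative on a mismatch) that
 * TASK_STATE_TO_CHAR_STR has exactly one character per task state bit.
 */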
extern char ___assert_task_state[1 - 2*!!(
		sizeof(TASK_STATE_TO_CHAR_STR)-1 != ilog2(TASK_STATE_MAX)+1)];

/* Convenience macros for the sake of set_task_state */
#define TASK_KILLABLE		(TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
#define TASK_STOPPED		(TASK_WAKEKILL | __TASK_STOPPED)
#define TASK_TRACED		(TASK_WAKEKILL | __TASK_TRACED)

#define TASK_IDLE		(TASK_UNINTERRUPTIBLE | TASK_NOLOAD)

/* Convenience macros for the sake of wake_up */
#define TASK_NORMAL		(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)
#define TASK_ALL		(TASK_NORMAL | __TASK_STOPPED | __TASK_TRACED)

/* get_task_state() */
#define TASK_REPORT		(TASK_RUNNING | TASK_INTERRUPTIBLE | \
				 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
				 __TASK_TRACED | EXIT_ZOMBIE | EXIT_DEAD)

#define task_is_traced(task)	((task->state & __TASK_TRACED) != 0)
#define task_is_stopped(task)	((task->state & __TASK_STOPPED) != 0)
#define task_is_stopped_or_traced(task)	\
			((task->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)
#define task_contributes_to_load(task)	\
				((task->state & TASK_UNINTERRUPTIBLE) != 0 && \
				 (task->flags & PF_FROZEN) == 0 && \
				 (task->state & TASK_NOLOAD) == 0)

#ifdef CONFIG_DEBUG_ATOMIC_SLEEP

#define __set_task_state(tsk, state_value)			\
	do {							\
		(tsk)->task_state_change = _THIS_IP_;		\
		(tsk)->state = (state_value);			\
	} while (0)
#define set_task_state(tsk, state_value)			\
	do {							\
		(tsk)->task_state_change = _THIS_IP_;		\
		smp_store_mb((tsk)->state, (state_value));	\
	} while (0)

/*
 * set_current_state() includes a barrier so that the write of current->state
 * is correctly serialised wrt the caller's subsequent test of whether to
 * actually sleep:
 *
 *	set_current_state(TASK_UNINTERRUPTIBLE);
 *	if (do_i_need_to_sleep())
 *		schedule();
 *
 * If the caller does not need such serialisation then use __set_current_state()
 */
#define __set_current_state(state_value)			\
	do {							\
		current->task_state_change = _THIS_IP_;		\
		current->state = (state_value);			\
	} while (0)
#define set_current_state(state_value)				\
	do {							\
		current->task_state_change = _THIS_IP_;		\
		smp_store_mb(current->state, (state_value));	\
	} while (0)

#else

#define __set_task_state(tsk, state_value)		\
	do { (tsk)->state = (state_value); } while (0)
#define set_task_state(tsk, state_value)		\
	smp_store_mb((tsk)->state, (state_value))

/*
 * set_current_state() includes a barrier so that the write of current->state
 * is correctly serialised wrt the caller's subsequent test of whether to
 * actually sleep:
 *
 *	set_current_state(TASK_UNINTERRUPTIBLE);
 *	if (do_i_need_to_sleep())
 *		schedule();
 *
 * If the caller does not need such serialisation then use __set_current_state()
 */
#define __set_current_state(state_value)		\
	do { current->state = (state_value); } while (0)
#define set_current_state(state_value)			\
	smp_store_mb(current->state, (state_value))

#endif

/* Task command name length */
#define TASK_COMM_LEN 16

#include <linux/spinlock.h>

/*
 * This serializes "schedule()" and also protects
 * the run-queue from deletions/modifications (but
 * _adding_ to the beginning of the run-queue has
 * a separate lock).
 */
extern rwlock_t tasklist_lock;
extern spinlock_t mmlist_lock;

struct task_struct;

#ifdef CONFIG_PROVE_RCU
extern int lockdep_tasklist_lock_is_held(void);
#endif /* #ifdef CONFIG_PROVE_RCU */

extern void sched_init(void);
extern void sched_init_smp(void);
extern asmlinkage void schedule_tail(struct task_struct *prev);
extern void init_idle(struct task_struct *idle, int cpu);
extern void init_idle_bootup_task(struct task_struct *idle);

extern cpumask_var_t cpu_isolated_map;

extern int runqueue_is_locked(int cpu);

#if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON)
extern void nohz_balance_enter_idle(int cpu);
extern void set_cpu_sd_state_idle(void);
extern int get_nohz_timer_target(void);
#else
static inline void nohz_balance_enter_idle(int cpu) { }
static inline void set_cpu_sd_state_idle(void) { }
#endif

/*
 * Only dump TASK_* tasks. (0 for all tasks)
 */
extern void show_state_filter(unsigned long state_filter);

static inline void show_state(void)
{
	show_state_filter(0);
}

extern void show_regs(struct pt_regs *);

/*
 * TASK is a pointer to the task whose backtrace we want to see (or NULL for current
 * task), SP is the stack pointer of the first frame that should be shown in the back
 * trace (or NULL if the entire call-chain of the task should be shown).
 */
extern void show_stack(struct task_struct *task, unsigned long *sp);

extern void cpu_init(void);
extern void trap_init(void);
extern void update_process_times(int user);
extern void scheduler_tick(void);
extern int sched_cpu_starting(unsigned int cpu);
extern int sched_cpu_activate(unsigned int cpu);
extern int sched_cpu_deactivate(unsigned int cpu);

#ifdef CONFIG_HOTPLUG_CPU
extern int sched_cpu_dying(unsigned int cpu);
#else
# define sched_cpu_dying	NULL
#endif

extern void sched_show_task(struct task_struct *p);

#ifdef CONFIG_LOCKUP_DETECTOR
extern void touch_softlockup_watchdog_sched(void);
extern void touch_softlockup_watchdog(void);
extern void touch_softlockup_watchdog_sync(void);
extern void touch_all_softlockup_watchdogs(void);
extern int proc_dowatchdog_thresh(struct ctl_table *table, int write,
				  void __user *buffer,
				  size_t *lenp, loff_t *ppos);
extern unsigned int  softlockup_panic;
extern unsigned int  hardlockup_panic;
void lockup_detector_init(void);
#else
static inline void touch_softlockup_watchdog_sched(void)
{
}
static inline void touch_softlockup_watchdog(void)
{
}
static inline void touch_softlockup_watchdog_sync(void)
{
}
static inline void touch_all_softlockup_watchdogs(void)
{
}
static inline void lockup_detector_init(void)
{
}
#endif

#ifdef CONFIG_DETECT_HUNG_TASK
void reset_hung_task_detector(void);
#else
static inline void reset_hung_task_detector(void)
{
}
#endif

/* Attach to any functions which should be ignored in wchan output. */
#define __sched		__attribute__((__section__(".sched.text")))

/* Linker adds these: start and end of __sched functions */
extern char __sched_text_start[], __sched_text_end[];

/* Is this address in the __sched functions? */
extern int in_sched_functions(unsigned long addr);

#define	MAX_SCHEDULE_TIMEOUT	LONG_MAX
extern signed long schedule_timeout(signed long timeout);
extern signed long schedule_timeout_interruptible(signed long timeout);
extern signed long schedule_timeout_killable(signed long timeout);
extern signed long schedule_timeout_uninterruptible(signed long timeout);
extern signed long schedule_timeout_idle(signed long timeout);
asmlinkage void schedule(void);
extern void schedule_preempt_disabled(void);

extern long io_schedule_timeout(long timeout);

static inline void io_schedule(void)
{
	io_schedule_timeout(MAX_SCHEDULE_TIMEOUT);
}

void __noreturn do_task_dead(void);

struct nsproxy;
struct user_namespace;

#ifdef CONFIG_MMU
extern void arch_pick_mmap_layout(struct mm_struct *mm);
extern unsigned long
arch_get_unmapped_area(struct file *, unsigned long, unsigned long,
		       unsigned long, unsigned long);
extern unsigned long
arch_get_unmapped_area_topdown(struct file *filp, unsigned long addr,
			  unsigned long len, unsigned long pgoff,
			  unsigned long flags);
#else
static inline void arch_pick_mmap_layout(struct mm_struct *mm) {}
#endif

#define SUID_DUMP_DISABLE	0	/* No setuid dumping */
#define SUID_DUMP_USER		1	/* Dump as user of process */
#define SUID_DUMP_ROOT		2	/* Dump as root */

/* mm flags */

/* for SUID_DUMP_* above */
#define MMF_DUMPABLE_BITS 2
#define MMF_DUMPABLE_MASK ((1 << MMF_DUMPABLE_BITS) - 1)

extern void set_dumpable(struct mm_struct *mm, int value);
/*
 * This returns the actual value of the suid_dumpable flag. Code that
 * uses this to check for privilege transitions must test against
 * SUID_DUMP_USER rather than treating it as a boolean value.
 */
static inline int __get_dumpable(unsigned long mm_flags)
{
	return mm_flags & MMF_DUMPABLE_MASK;
}

static inline int get_dumpable(struct mm_struct *mm)
{
	return __get_dumpable(mm->flags);
}
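
/*
 * For illustration (hypothetical caller): a privilege-transition check
 * compares against the specific SUID_DUMP_* value instead of truth-testing:
 *
 *	if (get_dumpable(mm) != SUID_DUMP_USER)
 *		return -EPERM;	// treat as a privilege transition
 */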

/* coredump filter bits */
#define MMF_DUMP_ANON_PRIVATE	2
#define MMF_DUMP_ANON_SHARED	3
#define MMF_DUMP_MAPPED_PRIVATE	4
#define MMF_DUMP_MAPPED_SHARED	5
#define MMF_DUMP_ELF_HEADERS	6
#define MMF_DUMP_HUGETLB_PRIVATE 7
#define MMF_DUMP_HUGETLB_SHARED  8
#define MMF_DUMP_DAX_PRIVATE	9
#define MMF_DUMP_DAX_SHARED	10

#define MMF_DUMP_FILTER_SHIFT	MMF_DUMPABLE_BITS
#define MMF_DUMP_FILTER_BITS	9
#define MMF_DUMP_FILTER_MASK \
	(((1 << MMF_DUMP_FILTER_BITS) - 1) << MMF_DUMP_FILTER_SHIFT)
#define MMF_DUMP_FILTER_DEFAULT \
	((1 << MMF_DUMP_ANON_PRIVATE) |	(1 << MMF_DUMP_ANON_SHARED) |\
	 (1 << MMF_DUMP_HUGETLB_PRIVATE) | MMF_DUMP_MASK_DEFAULT_ELF)

#ifdef CONFIG_CORE_DUMP_DEFAULT_ELF_HEADERS
# define MMF_DUMP_MASK_DEFAULT_ELF	(1 << MMF_DUMP_ELF_HEADERS)
#else
# define MMF_DUMP_MASK_DEFAULT_ELF	0
#endif
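
/*
 * For illustration: these bits back /proc/<pid>/coredump_filter, where
 * userspace bit N corresponds to mm flag bit N + MMF_DUMP_FILTER_SHIFT,
 * so bit 0 selects anonymous private mappings and bit 1 anonymous shared
 * ones, e.g.:
 *
 *	echo 0x3 > /proc/self/coredump_filter
 */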
					/* leave room for more dump flags */
#define MMF_VM_MERGEABLE	16	/* KSM may merge identical pages */
#define MMF_VM_HUGEPAGE		17	/* set when VM_HUGEPAGE is set on vma */
#define MMF_EXE_FILE_CHANGED	18	/* see prctl_set_mm_exe_file() */

#define MMF_HAS_UPROBES		19	/* has uprobes */
#define MMF_RECALC_UPROBES	20	/* MMF_HAS_UPROBES can be wrong */
#define MMF_OOM_SKIP		21	/* mm is of no interest for the OOM killer */
#define MMF_UNSTABLE		22	/* mm is unstable for copy_from_user */
#define MMF_HUGE_ZERO_PAGE	23      /* mm has ever used the global huge zero page */

#define MMF_INIT_MASK		(MMF_DUMPABLE_MASK | MMF_DUMP_FILTER_MASK)

struct sighand_struct {
	atomic_t		count;
	struct k_sigaction	action[_NSIG];
	spinlock_t		siglock;
	wait_queue_head_t	signalfd_wqh;
};

struct pacct_struct {
	int			ac_flag;
	long			ac_exitcode;
	unsigned long		ac_mem;
	cputime_t		ac_utime, ac_stime;
	unsigned long		ac_minflt, ac_majflt;
};

struct cpu_itimer {
	cputime_t expires;
	cputime_t incr;
	u32 error;
	u32 incr_error;
};

/**
 * struct prev_cputime - snapshot of system and user cputime
 * @utime: time spent in user mode
 * @stime: time spent in system mode
 * @lock: protects the above two fields
 *
 * Stores previous user/system time values such that we can guarantee
 * monotonicity.
 */
struct prev_cputime {
#ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
	cputime_t utime;
	cputime_t stime;
	raw_spinlock_t lock;
#endif
};

static inline void prev_cputime_init(struct prev_cputime *prev)
{
#ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
	prev->utime = prev->stime = 0;
	raw_spin_lock_init(&prev->lock);
#endif
}

/**
 * struct task_cputime - collected CPU time counts
 * @utime:		time spent in user mode, in &cputime_t units
 * @stime:		time spent in kernel mode, in &cputime_t units
 * @sum_exec_runtime:	total time spent on the CPU, in nanoseconds
 *
 * This structure groups together three kinds of CPU time that are tracked for
 * threads and thread groups.  Most things considering CPU time want to group
 * these counts together and treat all three of them in parallel.
 */
struct task_cputime {
	cputime_t utime;
	cputime_t stime;
	unsigned long long sum_exec_runtime;
};

/* Alternate field names when used to cache expirations. */
#define virt_exp	utime
#define prof_exp	stime
#define sched_exp	sum_exec_runtime

#define INIT_CPUTIME	\
	(struct task_cputime) {					\
		.utime = 0,					\
		.stime = 0,					\
		.sum_exec_runtime = 0,				\
	}

/*
 * This is the atomic variant of task_cputime, which can be used for
 * storing and updating task_cputime statistics without locking.
 */
struct task_cputime_atomic {
	atomic64_t utime;
	atomic64_t stime;
	atomic64_t sum_exec_runtime;
};

#define INIT_CPUTIME_ATOMIC \
	(struct task_cputime_atomic) {				\
		.utime = ATOMIC64_INIT(0),			\
		.stime = ATOMIC64_INIT(0),			\
		.sum_exec_runtime = ATOMIC64_INIT(0),		\
	}

#define PREEMPT_DISABLED	(PREEMPT_DISABLE_OFFSET + PREEMPT_ENABLED)

/*
 * Disable preemption until the scheduler is running -- use an unconditional
 * value so that it also works on !PREEMPT_COUNT kernels.
 *
 * Reset by start_kernel()->sched_init()->init_idle()->init_idle_preempt_count().
 */
#define INIT_PREEMPT_COUNT	PREEMPT_OFFSET

/*
 * Initial preempt_count value; reflects the preempt_count schedule invariant
 * which states that during context switches:
 *
 *    preempt_count() == 2*PREEMPT_DISABLE_OFFSET
 *
 * Note: PREEMPT_DISABLE_OFFSET is 0 for !PREEMPT_COUNT kernels.
 * Note: See finish_task_switch().
 */
#define FORK_PREEMPT_COUNT	(2*PREEMPT_DISABLE_OFFSET + PREEMPT_ENABLED)
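
/*
 * For illustration (assuming a CONFIG_PREEMPT_COUNT kernel, where
 * PREEMPT_DISABLE_OFFSET is 1): a newly forked task starts with two
 * preemption-disable levels -- one for schedule()'s preempt_disable()
 * and one for the runqueue lock held across the switch, both of which
 * finish_task_switch() releases.
 */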

/**
 * struct thread_group_cputimer - thread group interval timer counts
 * @cputime_atomic:	atomic thread group interval timers.
 * @running:		true when there are timers running and
 *			@cputime_atomic receives updates.
 * @checking_timer:	true when a thread in the group is in the
 *			process of checking for thread group timers.
 *
 * This structure contains the version of task_cputime, above, that is
 * used for thread group CPU timer calculations.
 */
struct thread_group_cputimer {
	struct task_cputime_atomic cputime_atomic;
	bool running;
	bool checking_timer;
};

#include <linux/rwsem.h>
struct autogroup;

/*
 * NOTE! "signal_struct" does not have its own
 * locking, because a shared signal_struct always
 * implies a shared sighand_struct, so locking
 * sighand_struct is always a proper superset of
 * the locking of signal_struct.
 */
struct signal_struct {
	atomic_t		sigcnt;
	atomic_t		live;
	int			nr_threads;
	struct list_head	thread_head;

	wait_queue_head_t	wait_chldexit;	/* for wait4() */

	/* current thread group signal load-balancing target: */
	struct task_struct	*curr_target;

	/* shared signal handling: */
	struct sigpending	shared_pending;

	/* thread group exit support */
	int			group_exit_code;
	/* overloaded:
	 * - notify group_exit_task when ->count is equal to notify_count
	 * - everyone except group_exit_task is stopped during signal delivery
	 *   of fatal signals, group_exit_task processes the signal.
	 */
	int			notify_count;
	struct task_struct	*group_exit_task;

	/* thread group stop support, overloads group_exit_code too */
	int			group_stop_count;
	unsigned int		flags; /* see SIGNAL_* flags below */

	/*
	 * PR_SET_CHILD_SUBREAPER marks a process, like a service
	 * manager, to re-parent orphan (double-forking) child processes
	 * to this process instead of 'init'. The service manager is
	 * able to receive SIGCHLD signals and is able to investigate
	 * the process until it calls wait(). All children of this
	 * process will inherit a flag if they should look for a
	 * child_subreaper process at exit.
	 */
	unsigned int		is_child_subreaper:1;
	unsigned int		has_child_subreaper:1;

	/* POSIX.1b Interval Timers */
	int			posix_timer_id;
	struct list_head	posix_timers;

	/* ITIMER_REAL timer for the process */
	struct hrtimer real_timer;
	struct pid *leader_pid;
	ktime_t it_real_incr;

	/*
	 * ITIMER_PROF and ITIMER_VIRTUAL timers for the process, we use
	 * CPUCLOCK_PROF and CPUCLOCK_VIRT for indexing array as these
	 * values are defined to 0 and 1 respectively
	 */
	struct cpu_itimer it[2];

	/*
	 * Thread group totals for process CPU timers.
	 * See thread_group_cputimer(), et al, for details.
	 */
	struct thread_group_cputimer cputimer;

	/* Earliest-expiration cache. */
	struct task_cputime cputime_expires;

#ifdef CONFIG_NO_HZ_FULL
	atomic_t tick_dep_mask;
#endif

	struct list_head cpu_timers[3];

	struct pid *tty_old_pgrp;

	/* boolean value for session group leader */
	int leader;

	struct tty_struct *tty; /* NULL if no tty */

#ifdef CONFIG_SCHED_AUTOGROUP
	struct autogroup *autogroup;
#endif
	/*
	 * Cumulative resource counters for dead threads in the group,
	 * and for reaped dead child processes forked by this group.
	 * Live threads maintain their own counters and add to these
	 * in __exit_signal, except for the group leader.
	 */
	seqlock_t stats_lock;
	cputime_t utime, stime, cutime, cstime;
	cputime_t gtime;
	cputime_t cgtime;
	struct prev_cputime prev_cputime;
	unsigned long nvcsw, nivcsw, cnvcsw, cnivcsw;
	unsigned long min_flt, maj_flt, cmin_flt, cmaj_flt;
	unsigned long inblock, oublock, cinblock, coublock;
	unsigned long maxrss, cmaxrss;
	struct task_io_accounting ioac;

	/*
	 * Cumulative ns of scheduled CPU time for dead threads in the
	 * group, not including a zombie group leader. (This only differs
	 * from jiffies_to_ns(utime + stime) if sched_clock uses something
	 * other than jiffies.)
	 */
	unsigned long long sum_sched_runtime;

	/*
	 * We don't bother to synchronize most readers of this at all,
	 * because there is no reader checking a limit that actually needs
	 * to get both rlim_cur and rlim_max atomically, and either one
	 * alone is a single word that can safely be read normally.
	 * getrlimit/setrlimit use task_lock(current->group_leader) to
	 * protect this instead of the siglock, because they really
	 * have no need to disable irqs.
	 */
	struct rlimit rlim[RLIM_NLIMITS];

#ifdef CONFIG_BSD_PROCESS_ACCT
	struct pacct_struct pacct;	/* per-process accounting information */
#endif
#ifdef CONFIG_TASKSTATS
	struct taskstats *stats;
#endif
#ifdef CONFIG_AUDIT
	unsigned audit_tty;
	struct tty_audit_buf *tty_audit_buf;
#endif

	/*
	 * Thread is the potential origin of an oom condition; kill first on
	 * oom
	 */
	bool oom_flag_origin;
	short oom_score_adj;		/* OOM kill score adjustment */
	short oom_score_adj_min;	/* OOM kill score adjustment min value.
					 * Only settable by CAP_SYS_RESOURCE. */
	struct mm_struct *oom_mm;	/* recorded mm when the thread group got
					 * killed by the oom killer */

	struct mutex cred_guard_mutex;	/* guard against foreign influences on
					 * credential calculations
					 * (notably ptrace) */
};

/*
 * Bits in flags field of signal_struct.
 */
#define SIGNAL_STOP_STOPPED	0x00000001 /* job control stop in effect */
#define SIGNAL_STOP_CONTINUED	0x00000002 /* SIGCONT since WCONTINUED reap */
#define SIGNAL_GROUP_EXIT	0x00000004 /* group exit in progress */
#define SIGNAL_GROUP_COREDUMP	0x00000008 /* coredump in progress */
/*
 * Pending notifications to parent.
 */
#define SIGNAL_CLD_STOPPED	0x00000010
#define SIGNAL_CLD_CONTINUED	0x00000020
#define SIGNAL_CLD_MASK		(SIGNAL_CLD_STOPPED|SIGNAL_CLD_CONTINUED)

#define SIGNAL_UNKILLABLE	0x00000040 /* for init: ignore fatal signals */

/* If true, all threads except ->group_exit_task have pending SIGKILL */
static inline int signal_group_exit(const struct signal_struct *sig)
{
	return	(sig->flags & SIGNAL_GROUP_EXIT) ||
		(sig->group_exit_task != NULL);
}

/*
 * Some day this will be a full-fledged user tracking system.
 */
struct user_struct {
	atomic_t __count;	/* reference count */
	atomic_t processes;	/* How many processes does this user have? */
	atomic_t sigpending;	/* How many pending signals does this user have? */
#ifdef CONFIG_INOTIFY_USER
	atomic_t inotify_watches; /* How many inotify watches does this user have? */
	atomic_t inotify_devs;	/* How many inotify devs does this user have opened? */
#endif
#ifdef CONFIG_FANOTIFY
	atomic_t fanotify_listeners;
#endif
#ifdef CONFIG_EPOLL
	atomic_long_t epoll_watches; /* The number of file descriptors currently watched */
#endif
#ifdef CONFIG_POSIX_MQUEUE
	/* protected by mq_lock	*/
	unsigned long mq_bytes;	/* How many bytes can be allocated to mqueue? */
#endif
	unsigned long locked_shm; /* How many pages of mlocked shm ? */
	unsigned long unix_inflight;	/* How many files in flight in unix sockets */
	atomic_long_t pipe_bufs;  /* how many pages are allocated in pipe buffers */

#ifdef CONFIG_KEYS
	struct key *uid_keyring;	/* UID specific keyring */
	struct key *session_keyring;	/* UID's default session keyring */
#endif

	/* Hash table maintenance information */
	struct hlist_node uidhash_node;
	kuid_t uid;

#if defined(CONFIG_PERF_EVENTS) || defined(CONFIG_BPF_SYSCALL)
	atomic_long_t locked_vm;
#endif
};

extern int uids_sysfs_init(void);

extern struct user_struct *find_user(kuid_t);

extern struct user_struct root_user;
#define INIT_USER (&root_user)


struct backing_dev_info;
struct reclaim_state;

#ifdef CONFIG_SCHED_INFO
struct sched_info {
	/* cumulative counters */
	unsigned long pcount;	      /* # of times run on this cpu */
	unsigned long long run_delay; /* time spent waiting on a runqueue */

	/* timestamps */
	unsigned long long last_arrival,/* when we last ran on a cpu */
			   last_queued;	/* when we were last queued to run */
};
#endif /* CONFIG_SCHED_INFO */

#ifdef CONFIG_TASK_DELAY_ACCT
struct task_delay_info {
	spinlock_t	lock;
	unsigned int	flags;	/* Private per-task flags */

	/* For each stat XXX, add the following, aligned appropriately
	 *
	 * struct timespec XXX_start, XXX_end;
	 * u64 XXX_delay;
	 * u32 XXX_count;
	 *
	 * Atomicity of updates to XXX_delay, XXX_count protected by
	 * single lock above (split into XXX_lock if contention is an issue).
	 */

	/*
	 * XXX_count is incremented on every XXX operation, the delay
	 * associated with the operation is added to XXX_delay.
	 * XXX_delay contains the accumulated delay time in nanoseconds.
	 */
	u64 blkio_start;	/* Shared by blkio, swapin */
	u64 blkio_delay;	/* wait for sync block io completion */
	u64 swapin_delay;	/* wait for swapin block io completion */
	u32 blkio_count;	/* total count of the number of sync block */
				/* io operations performed */
	u32 swapin_count;	/* total count of the number of swapin block */
				/* io operations performed */

	u64 freepages_start;
	u64 freepages_delay;	/* wait for memory reclaim */
	u32 freepages_count;	/* total count of memory reclaim */
};
#endif	/* CONFIG_TASK_DELAY_ACCT */

static inline int sched_info_on(void)
{
#ifdef CONFIG_SCHEDSTATS
	return 1;
#elif defined(CONFIG_TASK_DELAY_ACCT)
	extern int delayacct_on;
	return delayacct_on;
#else
	return 0;
#endif
}

#ifdef CONFIG_SCHEDSTATS
void force_schedstat_enabled(void);
#endif

enum cpu_idle_type {
	CPU_IDLE,
	CPU_NOT_IDLE,
	CPU_NEWLY_IDLE,
	CPU_MAX_IDLE_TYPES
};

/*
 * Integer metrics need fixed point arithmetic, e.g., sched/fair
 * has a few: load, load_avg, util_avg, freq, and capacity.
 *
 * We define a basic fixed point arithmetic range, and then formalize
 * all these metrics based on that basic range.
 */
# define SCHED_FIXEDPOINT_SHIFT	10
# define SCHED_FIXEDPOINT_SCALE	(1L << SCHED_FIXEDPOINT_SHIFT)

/*
 * Increase resolution of cpu_capacity calculations
 */
#define SCHED_CAPACITY_SHIFT	SCHED_FIXEDPOINT_SHIFT
#define SCHED_CAPACITY_SCALE	(1L << SCHED_CAPACITY_SHIFT)
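
/*
 * For illustration: with SCHED_FIXEDPOINT_SHIFT == 10, the value 1.0 maps
 * to 1024, so a CPU running at half of its maximum capacity is reported
 * as SCHED_CAPACITY_SCALE / 2 == 512, and a utilization of 256 means
 * roughly a quarter of one full-capacity CPU.
 */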

/*
 * Wake-queues are lists of tasks with a pending wakeup, whose
 * callers have already marked the task as woken internally,
 * and can thus carry on. A common use case is being able to
 * do the wakeups once the corresponding user lock has been
 * released.
 *
 * We hold a reference to each task in the list across the wakeup,
 * thus guaranteeing that the memory is still valid by the time
 * the actual wakeups are performed in wake_up_q().
 *
 * One per task suffices, because there's never a need for a task to be
 * in two wake queues simultaneously; it is forbidden to abandon a task
 * in a wake queue (a call to wake_up_q() _must_ follow), so if a task is
 * already in a wake queue, the wakeup will happen soon and the second
 * waker can just skip it.
 *
 * The DEFINE_WAKE_Q macro declares and initializes the list head.
 * wake_up_q() does NOT reinitialize the list; it's expected to be
 * called near the end of a function, where the fact that the queue is
 * not used again will be easy to see by inspection.
 *
 * Note that this can cause spurious wakeups. schedule() callers
 * must ensure the call is done inside a loop, confirming that the
 * wakeup condition has in fact occurred.
 */
100176751049SPeter Zijlstra struct wake_q_node {
100276751049SPeter Zijlstra 	struct wake_q_node *next;
100376751049SPeter Zijlstra };
100476751049SPeter Zijlstra 
100576751049SPeter Zijlstra struct wake_q_head {
100676751049SPeter Zijlstra 	struct wake_q_node *first;
100776751049SPeter Zijlstra 	struct wake_q_node **lastp;
100876751049SPeter Zijlstra };
100976751049SPeter Zijlstra 
101076751049SPeter Zijlstra #define WAKE_Q_TAIL ((struct wake_q_node *) 0x01)
101176751049SPeter Zijlstra 
1012194a6b5bSWaiman Long #define DEFINE_WAKE_Q(name)				\
101376751049SPeter Zijlstra 	struct wake_q_head name = { WAKE_Q_TAIL, &name.first }
101476751049SPeter Zijlstra 
101576751049SPeter Zijlstra extern void wake_q_add(struct wake_q_head *head,
101676751049SPeter Zijlstra 		       struct task_struct *task);
101776751049SPeter Zijlstra extern void wake_up_q(struct wake_q_head *head);
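
/*
 * For illustration, a minimal usage sketch (not part of this header)
 * following the pattern described above: queue the wakeup while holding
 * a lock, then perform it after the lock is dropped. 'my_lock' and
 * 'waiter' are hypothetical.
 */
static inline void example_release_and_wake(spinlock_t *my_lock,
					    struct task_struct *waiter)
{
	DEFINE_WAKE_Q(wake_q);

	spin_lock(my_lock);
	wake_q_add(&wake_q, waiter);	/* task now has a pending wakeup */
	spin_unlock(my_lock);

	wake_up_q(&wake_q);		/* wakeups happen outside the lock */
}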
101876751049SPeter Zijlstra 
101976751049SPeter Zijlstra /*
10201399fa78SNikhil Rao  * sched-domains (multiprocessor balancing) declarations:
10211399fa78SNikhil Rao  */
10222dd73a4fSPeter Williams #ifdef CONFIG_SMP
1023b5d978e0SPeter Zijlstra #define SD_LOAD_BALANCE		0x0001	/* Do load balancing on this domain. */
1024b5d978e0SPeter Zijlstra #define SD_BALANCE_NEWIDLE	0x0002	/* Balance when about to become idle */
1025b5d978e0SPeter Zijlstra #define SD_BALANCE_EXEC		0x0004	/* Balance on exec */
1026b5d978e0SPeter Zijlstra #define SD_BALANCE_FORK		0x0008	/* Balance on fork, clone */
1027c88d5910SPeter Zijlstra #define SD_BALANCE_WAKE		0x0010  /* Balance on wakeup */
1028b5d978e0SPeter Zijlstra #define SD_WAKE_AFFINE		0x0020	/* Wake task to waking CPU */
10291f6e6c7cSMorten Rasmussen #define SD_ASYM_CPUCAPACITY	0x0040  /* Groups have different max cpu capacities */
1030bd425d4bSMorten Rasmussen #define SD_SHARE_CPUCAPACITY	0x0080	/* Domain members share cpu capacity */
1031d77b3ed5SVincent Guittot #define SD_SHARE_POWERDOMAIN	0x0100	/* Domain members share power domain */
1032b5d978e0SPeter Zijlstra #define SD_SHARE_PKG_RESOURCES	0x0200	/* Domain members share cpu pkg resources */
1033b5d978e0SPeter Zijlstra #define SD_SERIALIZE		0x0400	/* Only a single load balancing instance */
1034532cb4c4SMichael Neuling #define SD_ASYM_PACKING		0x0800  /* Place busy groups earlier in the domain */
1035b5d978e0SPeter Zijlstra #define SD_PREFER_SIBLING	0x1000	/* Prefer to place tasks in a sibling domain */
1036e3589f6cSPeter Zijlstra #define SD_OVERLAP		0x2000	/* sched_domains of this level overlap */
10373a7053b3SMel Gorman #define SD_NUMA			0x4000	/* cross-node balancing */
10385c45bf27SSiddha, Suresh B 
1039143e1e28SVincent Guittot #ifdef CONFIG_SCHED_SMT
1040b6220ad6SGuenter Roeck static inline int cpu_smt_flags(void)
1041143e1e28SVincent Guittot {
10425d4dfdddSNicolas Pitre 	return SD_SHARE_CPUCAPACITY | SD_SHARE_PKG_RESOURCES;
1043143e1e28SVincent Guittot }
1044143e1e28SVincent Guittot #endif
1045143e1e28SVincent Guittot 
1046143e1e28SVincent Guittot #ifdef CONFIG_SCHED_MC
1047b6220ad6SGuenter Roeck static inline int cpu_core_flags(void)
1048143e1e28SVincent Guittot {
1049143e1e28SVincent Guittot 	return SD_SHARE_PKG_RESOURCES;
1050143e1e28SVincent Guittot }
1051143e1e28SVincent Guittot #endif
1052143e1e28SVincent Guittot 
1053143e1e28SVincent Guittot #ifdef CONFIG_NUMA
1054b6220ad6SGuenter Roeck static inline int cpu_numa_flags(void)
1055143e1e28SVincent Guittot {
1056143e1e28SVincent Guittot 	return SD_NUMA;
1057143e1e28SVincent Guittot }
1058143e1e28SVincent Guittot #endif
1059532cb4c4SMichael Neuling 
10601d3504fcSHidetoshi Seto struct sched_domain_attr {
10611d3504fcSHidetoshi Seto 	int relax_domain_level;
10621d3504fcSHidetoshi Seto };
10631d3504fcSHidetoshi Seto 
10641d3504fcSHidetoshi Seto #define SD_ATTR_INIT	(struct sched_domain_attr) {	\
10651d3504fcSHidetoshi Seto 	.relax_domain_level = -1,			\
10661d3504fcSHidetoshi Seto }
10671d3504fcSHidetoshi Seto 
106860495e77SPeter Zijlstra extern int sched_domain_level_max;
106960495e77SPeter Zijlstra 
10705e6521eaSLi Zefan struct sched_group;
10715e6521eaSLi Zefan 
107224fc7edbSPeter Zijlstra struct sched_domain_shared {
107324fc7edbSPeter Zijlstra 	atomic_t	ref;
10740e369d75SPeter Zijlstra 	atomic_t	nr_busy_cpus;
107510e2f1acSPeter Zijlstra 	int		has_idle_cores;
107624fc7edbSPeter Zijlstra };
107724fc7edbSPeter Zijlstra 
10781da177e4SLinus Torvalds struct sched_domain {
10791da177e4SLinus Torvalds 	/* These fields must be setup */
10801da177e4SLinus Torvalds 	struct sched_domain *parent;	/* top domain must be null terminated */
10811a848870SSiddha, Suresh B 	struct sched_domain *child;	/* bottom domain must be null terminated */
10821da177e4SLinus Torvalds 	struct sched_group *groups;	/* the balancing groups of the domain */
10831da177e4SLinus Torvalds 	unsigned long min_interval;	/* Minimum balance interval ms */
10841da177e4SLinus Torvalds 	unsigned long max_interval;	/* Maximum balance interval ms */
10851da177e4SLinus Torvalds 	unsigned int busy_factor;	/* less balancing by factor if busy */
10861da177e4SLinus Torvalds 	unsigned int imbalance_pct;	/* No balance until over watermark */
10871da177e4SLinus Torvalds 	unsigned int cache_nice_tries;	/* Leave cache hot tasks for # tries */
10887897986bSNick Piggin 	unsigned int busy_idx;
10897897986bSNick Piggin 	unsigned int idle_idx;
10907897986bSNick Piggin 	unsigned int newidle_idx;
10917897986bSNick Piggin 	unsigned int wake_idx;
1092147cbb4bSNick Piggin 	unsigned int forkexec_idx;
1093a52bfd73SPeter Zijlstra 	unsigned int smt_gain;
109425f55d9dSVincent Guittot 
109525f55d9dSVincent Guittot 	int nohz_idle;			/* NOHZ IDLE status */
10961da177e4SLinus Torvalds 	int flags;			/* See SD_* */
109760495e77SPeter Zijlstra 	int level;
10981da177e4SLinus Torvalds 
10991da177e4SLinus Torvalds 	/* Runtime fields. */
11001da177e4SLinus Torvalds 	unsigned long last_balance;	/* init to jiffies. units in jiffies */
11011da177e4SLinus Torvalds 	unsigned int balance_interval;	/* initialise to 1. units in ms. */
11021da177e4SLinus Torvalds 	unsigned int nr_balance_failed; /* initialise to 0 */
11031da177e4SLinus Torvalds 
1104f48627e6SJason Low 	/* idle_balance() stats */
11059bd721c5SJason Low 	u64 max_newidle_lb_cost;
1106f48627e6SJason Low 	unsigned long next_decay_max_lb_cost;
11072398f2c6SPeter Zijlstra 
110810e2f1acSPeter Zijlstra 	u64 avg_scan_cost;		/* select_idle_sibling */
110910e2f1acSPeter Zijlstra 
11101da177e4SLinus Torvalds #ifdef CONFIG_SCHEDSTATS
11111da177e4SLinus Torvalds 	/* load_balance() stats */
1112480b9434SKen Chen 	unsigned int lb_count[CPU_MAX_IDLE_TYPES];
1113480b9434SKen Chen 	unsigned int lb_failed[CPU_MAX_IDLE_TYPES];
1114480b9434SKen Chen 	unsigned int lb_balanced[CPU_MAX_IDLE_TYPES];
1115480b9434SKen Chen 	unsigned int lb_imbalance[CPU_MAX_IDLE_TYPES];
1116480b9434SKen Chen 	unsigned int lb_gained[CPU_MAX_IDLE_TYPES];
1117480b9434SKen Chen 	unsigned int lb_hot_gained[CPU_MAX_IDLE_TYPES];
1118480b9434SKen Chen 	unsigned int lb_nobusyg[CPU_MAX_IDLE_TYPES];
1119480b9434SKen Chen 	unsigned int lb_nobusyq[CPU_MAX_IDLE_TYPES];
11201da177e4SLinus Torvalds 
11211da177e4SLinus Torvalds 	/* Active load balancing */
1122480b9434SKen Chen 	unsigned int alb_count;
1123480b9434SKen Chen 	unsigned int alb_failed;
1124480b9434SKen Chen 	unsigned int alb_pushed;
11251da177e4SLinus Torvalds 
112668767a0aSNick Piggin 	/* SD_BALANCE_EXEC stats */
1127480b9434SKen Chen 	unsigned int sbe_count;
1128480b9434SKen Chen 	unsigned int sbe_balanced;
1129480b9434SKen Chen 	unsigned int sbe_pushed;
11301da177e4SLinus Torvalds 
113168767a0aSNick Piggin 	/* SD_BALANCE_FORK stats */
1132480b9434SKen Chen 	unsigned int sbf_count;
1133480b9434SKen Chen 	unsigned int sbf_balanced;
1134480b9434SKen Chen 	unsigned int sbf_pushed;
113568767a0aSNick Piggin 
11361da177e4SLinus Torvalds 	/* try_to_wake_up() stats */
1137480b9434SKen Chen 	unsigned int ttwu_wake_remote;
1138480b9434SKen Chen 	unsigned int ttwu_move_affine;
1139480b9434SKen Chen 	unsigned int ttwu_move_balance;
11401da177e4SLinus Torvalds #endif
1141a5d8c348SIngo Molnar #ifdef CONFIG_SCHED_DEBUG
1142a5d8c348SIngo Molnar 	char *name;
1143a5d8c348SIngo Molnar #endif
1144dce840a0SPeter Zijlstra 	union {
1145dce840a0SPeter Zijlstra 		void *private;		/* used during construction */
1146dce840a0SPeter Zijlstra 		struct rcu_head rcu;	/* used during destruction */
1147dce840a0SPeter Zijlstra 	};
114824fc7edbSPeter Zijlstra 	struct sched_domain_shared *shared;
11496c99e9adSRusty Russell 
1150669c55e9SPeter Zijlstra 	unsigned int span_weight;
11514200efd9SIngo Molnar 	/*
11524200efd9SIngo Molnar 	 * Span of all CPUs in this domain.
11534200efd9SIngo Molnar 	 *
11544200efd9SIngo Molnar 	 * NOTE: this field is variable length. (Allocated dynamically
11554200efd9SIngo Molnar 	 * by attaching extra space to the end of the structure,
11564200efd9SIngo Molnar 	 * depending on how many CPUs the kernel has booted up with)
11574200efd9SIngo Molnar 	 */
11584200efd9SIngo Molnar 	unsigned long span[0];
11591da177e4SLinus Torvalds };
11601da177e4SLinus Torvalds 
1161758b2cdcSRusty Russell static inline struct cpumask *sched_domain_span(struct sched_domain *sd)
1162758b2cdcSRusty Russell {
11636c99e9adSRusty Russell 	return to_cpumask(sd->span);
1164758b2cdcSRusty Russell }
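
/*
 * For illustration (not part of this header): balance code typically
 * walks or weighs the mask returned above; example_count_domain_cpus()
 * is a hypothetical helper.
 */
static inline unsigned int example_count_domain_cpus(struct sched_domain *sd)
{
	return cpumask_weight(sched_domain_span(sd));
}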
1165758b2cdcSRusty Russell 
1166acc3f5d7SRusty Russell extern void partition_sched_domains(int ndoms_new, cpumask_var_t doms_new[],
11671d3504fcSHidetoshi Seto 				    struct sched_domain_attr *dattr_new);
1168029190c5SPaul Jackson 
1169acc3f5d7SRusty Russell /* Allocate an array of sched domains, for partition_sched_domains(). */
1170acc3f5d7SRusty Russell cpumask_var_t *alloc_sched_domains(unsigned int ndoms);
1171acc3f5d7SRusty Russell void free_sched_domains(cpumask_var_t doms[], unsigned int ndoms);
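
/*
 * For illustration, a hedged sketch (not part of this header) of how a
 * caller rebuilds the domains: allocate an array of one cpumask, fill
 * it, and hand it to partition_sched_domains(), which takes over
 * ownership of the array. example_rebuild_single_domain() is
 * hypothetical; cpu_active_mask comes from <linux/cpumask.h>.
 */
static inline void example_rebuild_single_domain(void)
{
	cpumask_var_t *doms = alloc_sched_domains(1);

	if (!doms)
		return;
	cpumask_copy(doms[0], cpu_active_mask);
	/* NULL attributes: every domain keeps SD_ATTR_INIT defaults */
	partition_sched_domains(1, doms, NULL);
}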
1172acc3f5d7SRusty Russell 
117339be3501SPeter Zijlstra bool cpus_share_cache(int this_cpu, int that_cpu);
117439be3501SPeter Zijlstra 
1175143e1e28SVincent Guittot typedef const struct cpumask *(*sched_domain_mask_f)(int cpu);
1176b6220ad6SGuenter Roeck typedef int (*sched_domain_flags_f)(void);
1177143e1e28SVincent Guittot 
1178143e1e28SVincent Guittot #define SDTL_OVERLAP	0x01
1179143e1e28SVincent Guittot 
1180143e1e28SVincent Guittot struct sd_data {
1181143e1e28SVincent Guittot 	struct sched_domain **__percpu sd;
118224fc7edbSPeter Zijlstra 	struct sched_domain_shared **__percpu sds;
1183143e1e28SVincent Guittot 	struct sched_group **__percpu sg;
118463b2ca30SNicolas Pitre 	struct sched_group_capacity **__percpu sgc;
1185143e1e28SVincent Guittot };
1186143e1e28SVincent Guittot 
1187143e1e28SVincent Guittot struct sched_domain_topology_level {
1188143e1e28SVincent Guittot 	sched_domain_mask_f mask;
1189143e1e28SVincent Guittot 	sched_domain_flags_f sd_flags;
1190143e1e28SVincent Guittot 	int		    flags;
1191143e1e28SVincent Guittot 	int		    numa_level;
1192143e1e28SVincent Guittot 	struct sd_data      data;
1193143e1e28SVincent Guittot #ifdef CONFIG_SCHED_DEBUG
1194143e1e28SVincent Guittot 	char                *name;
1195143e1e28SVincent Guittot #endif
1196143e1e28SVincent Guittot };
1197143e1e28SVincent Guittot 
1198143e1e28SVincent Guittot extern void set_sched_topology(struct sched_domain_topology_level *tl);
1199f6be8af1SChuansheng Liu extern void wake_up_if_idle(int cpu);
1200143e1e28SVincent Guittot 
1201143e1e28SVincent Guittot #ifdef CONFIG_SCHED_DEBUG
1202143e1e28SVincent Guittot # define SD_INIT_NAME(type)		.name = #type
1203143e1e28SVincent Guittot #else
1204143e1e28SVincent Guittot # define SD_INIT_NAME(type)
1205143e1e28SVincent Guittot #endif
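
/*
 * For illustration, a sketch (not part of this header) of the topology
 * table an architecture might hand to set_sched_topology(); the table
 * name is hypothetical, while cpu_smt_mask() and cpu_cpu_mask() come
 * from <linux/topology.h>.
 */
static struct sched_domain_topology_level example_topology[] = {
#ifdef CONFIG_SCHED_SMT
	{ cpu_smt_mask, cpu_smt_flags, SD_INIT_NAME(SMT) },
#endif
	{ cpu_cpu_mask, SD_INIT_NAME(DIE) },
	{ NULL, },
};
/* Installed once during early boot: set_sched_topology(example_topology); */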
1206143e1e28SVincent Guittot 
12071b427c15SIngo Molnar #else /* CONFIG_SMP */
12081da177e4SLinus Torvalds 
12091b427c15SIngo Molnar struct sched_domain_attr;
12101b427c15SIngo Molnar 
12111b427c15SIngo Molnar static inline void
1212acc3f5d7SRusty Russell partition_sched_domains(int ndoms_new, cpumask_var_t doms_new[],
12131b427c15SIngo Molnar 			struct sched_domain_attr *dattr_new)
1214d02c7a8cSCon Kolivas {
1215d02c7a8cSCon Kolivas }
121639be3501SPeter Zijlstra 
121739be3501SPeter Zijlstra static inline bool cpus_share_cache(int this_cpu, int that_cpu)
121839be3501SPeter Zijlstra {
121939be3501SPeter Zijlstra 	return true;
122039be3501SPeter Zijlstra }
122139be3501SPeter Zijlstra 
12221b427c15SIngo Molnar #endif	/* !CONFIG_SMP */
12231da177e4SLinus Torvalds 
122447fe38fcSPeter Zijlstra 
12251da177e4SLinus Torvalds struct io_context;			/* See blkdev.h */
12261da177e4SLinus Torvalds 
12271da177e4SLinus Torvalds 
1228383f2835SChen, Kenneth W #ifdef ARCH_HAS_PREFETCH_SWITCH_STACK
122936c8b586SIngo Molnar extern void prefetch_stack(struct task_struct *t);
1230383f2835SChen, Kenneth W #else
1231383f2835SChen, Kenneth W static inline void prefetch_stack(struct task_struct *t) { }
1232383f2835SChen, Kenneth W #endif
12331da177e4SLinus Torvalds 
12341da177e4SLinus Torvalds struct audit_context;		/* See audit.c */
12351da177e4SLinus Torvalds struct mempolicy;
1236b92ce558SJens Axboe struct pipe_inode_info;
12374865ecf1SSerge E. Hallyn struct uts_namespace;
12381da177e4SLinus Torvalds 
123920b8a59fSIngo Molnar struct load_weight {
12409dbdb155SPeter Zijlstra 	unsigned long weight;
12419dbdb155SPeter Zijlstra 	u32 inv_weight;
124220b8a59fSIngo Molnar };
124320b8a59fSIngo Molnar 
12449d89c257SYuyang Du /*
12457b595334SYuyang Du  * The load_avg/util_avg accumulates an infinite geometric series
12467b595334SYuyang Du  * (see __update_load_avg() in kernel/sched/fair.c).
12477b595334SYuyang Du  *
12487b595334SYuyang Du  * [load_avg definition]
12497b595334SYuyang Du  *
12507b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load)
12517b595334SYuyang Du  *
12527b595334SYuyang Du  * where runnable% is the time ratio that a sched_entity is runnable.
12537b595334SYuyang Du  * For cfs_rq, it is the aggregated load_avg of all runnable and
12549d89c257SYuyang Du  * blocked sched_entities.
12557b595334SYuyang Du  *
12567b595334SYuyang Du  * load_avg may also take frequency scaling into account:
12577b595334SYuyang Du  *
12587b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load) * freq%
12597b595334SYuyang Du  *
12607b595334SYuyang Du  * where freq% is the CPU frequency normalized to the highest frequency.
12617b595334SYuyang Du  *
12627b595334SYuyang Du  * [util_avg definition]
12637b595334SYuyang Du  *
12647b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE
12657b595334SYuyang Du  *
12667b595334SYuyang Du  * where running% is the time ratio that a sched_entity is running on
12677b595334SYuyang Du  * a CPU. For cfs_rq, it is the aggregated util_avg of all runnable
12687b595334SYuyang Du  * and blocked sched_entities.
12697b595334SYuyang Du  *
12707b595334SYuyang Du  * util_avg may also factor frequency scaling and CPU capacity scaling:
12717b595334SYuyang Du  *
12727b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE * freq% * capacity%
12737b595334SYuyang Du  *
12747b595334SYuyang Du  * where freq% is the same as above, and capacity% is the CPU capacity
12757b595334SYuyang Du  * normalized to the greatest capacity (due to uarch differences, etc).
12767b595334SYuyang Du  *
12777b595334SYuyang Du  * N.B., the above ratios (runnable%, running%, freq%, and capacity%)
12787b595334SYuyang Du  * themselves are in the range of [0, 1]. To do fixed point arithmetic,
12797b595334SYuyang Du  * we therefore scale them to as large a range as necessary. This is for
12807b595334SYuyang Du  * example reflected by util_avg's SCHED_CAPACITY_SCALE.
12817b595334SYuyang Du  *
12827b595334SYuyang Du  * [Overflow issue]
12837b595334SYuyang Du  *
12847b595334SYuyang Du  * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities
12857b595334SYuyang Du  * with the highest load (=88761), always runnable on a single cfs_rq,
12867b595334SYuyang Du  * and should not overflow as the number already hits PID_MAX_LIMIT.
12877b595334SYuyang Du  *
12887b595334SYuyang Du  * For all other cases (including 32-bit kernels), struct load_weight's
12897b595334SYuyang Du  * weight will overflow first before we do, because:
12907b595334SYuyang Du  *
12917b595334SYuyang Du  *    Max(load_avg) <= Max(load.weight)
12927b595334SYuyang Du  *
12937b595334SYuyang Du  * Then it is the load_weight's responsibility to consider overflow
12947b595334SYuyang Du  * issues.
12959d89c257SYuyang Du  */
12969d85f21cSPaul Turner struct sched_avg {
12979d89c257SYuyang Du 	u64 last_update_time, load_sum;
12989d89c257SYuyang Du 	u32 util_sum, period_contrib;
12999d89c257SYuyang Du 	unsigned long load_avg, util_avg;
13009d85f21cSPaul Turner };
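
/*
 * A worked example of the definitions above, with illustrative numbers:
 * an entity that is runnable 50% of the time at the nice-0 weight of
 * 1024 has load_avg = 0.5 * 1024 = 512; if it actually runs 25% of the
 * time, util_avg = 0.25 * SCHED_CAPACITY_SCALE = 256.
 */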
13019d85f21cSPaul Turner 
130294c18227SIngo Molnar #ifdef CONFIG_SCHEDSTATS
130341acab88SLucas De Marchi struct sched_statistics {
130494c18227SIngo Molnar 	u64			wait_start;
130594c18227SIngo Molnar 	u64			wait_max;
13066d082592SArjan van de Ven 	u64			wait_count;
13076d082592SArjan van de Ven 	u64			wait_sum;
13088f0dfc34SArjan van de Ven 	u64			iowait_count;
13098f0dfc34SArjan van de Ven 	u64			iowait_sum;
131094c18227SIngo Molnar 
131194c18227SIngo Molnar 	u64			sleep_start;
131220b8a59fSIngo Molnar 	u64			sleep_max;
131394c18227SIngo Molnar 	s64			sum_sleep_runtime;
131494c18227SIngo Molnar 
131594c18227SIngo Molnar 	u64			block_start;
131620b8a59fSIngo Molnar 	u64			block_max;
131720b8a59fSIngo Molnar 	u64			exec_max;
1318eba1ed4bSIngo Molnar 	u64			slice_max;
1319cc367732SIngo Molnar 
1320cc367732SIngo Molnar 	u64			nr_migrations_cold;
1321cc367732SIngo Molnar 	u64			nr_failed_migrations_affine;
1322cc367732SIngo Molnar 	u64			nr_failed_migrations_running;
1323cc367732SIngo Molnar 	u64			nr_failed_migrations_hot;
1324cc367732SIngo Molnar 	u64			nr_forced_migrations;
1325cc367732SIngo Molnar 
1326cc367732SIngo Molnar 	u64			nr_wakeups;
1327cc367732SIngo Molnar 	u64			nr_wakeups_sync;
1328cc367732SIngo Molnar 	u64			nr_wakeups_migrate;
1329cc367732SIngo Molnar 	u64			nr_wakeups_local;
1330cc367732SIngo Molnar 	u64			nr_wakeups_remote;
1331cc367732SIngo Molnar 	u64			nr_wakeups_affine;
1332cc367732SIngo Molnar 	u64			nr_wakeups_affine_attempts;
1333cc367732SIngo Molnar 	u64			nr_wakeups_passive;
1334cc367732SIngo Molnar 	u64			nr_wakeups_idle;
133541acab88SLucas De Marchi };
133641acab88SLucas De Marchi #endif
133741acab88SLucas De Marchi 
133841acab88SLucas De Marchi struct sched_entity {
133941acab88SLucas De Marchi 	struct load_weight	load;		/* for load-balancing */
134041acab88SLucas De Marchi 	struct rb_node		run_node;
134141acab88SLucas De Marchi 	struct list_head	group_node;
134241acab88SLucas De Marchi 	unsigned int		on_rq;
134341acab88SLucas De Marchi 
134441acab88SLucas De Marchi 	u64			exec_start;
134541acab88SLucas De Marchi 	u64			sum_exec_runtime;
134641acab88SLucas De Marchi 	u64			vruntime;
134741acab88SLucas De Marchi 	u64			prev_sum_exec_runtime;
134841acab88SLucas De Marchi 
134941acab88SLucas De Marchi 	u64			nr_migrations;
135041acab88SLucas De Marchi 
135141acab88SLucas De Marchi #ifdef CONFIG_SCHEDSTATS
135241acab88SLucas De Marchi 	struct sched_statistics statistics;
135394c18227SIngo Molnar #endif
135494c18227SIngo Molnar 
135520b8a59fSIngo Molnar #ifdef CONFIG_FAIR_GROUP_SCHED
1356fed14d45SPeter Zijlstra 	int			depth;
135720b8a59fSIngo Molnar 	struct sched_entity	*parent;
135820b8a59fSIngo Molnar 	/* rq on which this entity is (to be) queued: */
135920b8a59fSIngo Molnar 	struct cfs_rq		*cfs_rq;
136020b8a59fSIngo Molnar 	/* rq "owned" by this entity/group: */
136120b8a59fSIngo Molnar 	struct cfs_rq		*my_q;
136220b8a59fSIngo Molnar #endif
13638bd75c77SClark Williams 
1364141965c7SAlex Shi #ifdef CONFIG_SMP
13655a107804SJiri Olsa 	/*
13665a107804SJiri Olsa 	 * Per entity load average tracking.
13675a107804SJiri Olsa 	 *
13685a107804SJiri Olsa 	 * Put into separate cache line so it does not
13695a107804SJiri Olsa 	 * collide with read-mostly values above.
13705a107804SJiri Olsa 	 */
13715a107804SJiri Olsa 	struct sched_avg	avg ____cacheline_aligned_in_smp;
13729d85f21cSPaul Turner #endif
137320b8a59fSIngo Molnar };
137470b97a7fSIngo Molnar 
1375fa717060SPeter Zijlstra struct sched_rt_entity {
1376fa717060SPeter Zijlstra 	struct list_head run_list;
137778f2c7dbSPeter Zijlstra 	unsigned long timeout;
137857d2aa00SYing Xue 	unsigned long watchdog_stamp;
1379bee367edSRichard Kennedy 	unsigned int time_slice;
1380ff77e468SPeter Zijlstra 	unsigned short on_rq;
1381ff77e468SPeter Zijlstra 	unsigned short on_list;
13826f505b16SPeter Zijlstra 
138358d6c2d7SPeter Zijlstra 	struct sched_rt_entity *back;
1384052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED
13856f505b16SPeter Zijlstra 	struct sched_rt_entity	*parent;
13866f505b16SPeter Zijlstra 	/* rq on which this entity is (to be) queued: */
13876f505b16SPeter Zijlstra 	struct rt_rq		*rt_rq;
13886f505b16SPeter Zijlstra 	/* rq "owned" by this entity/group: */
13896f505b16SPeter Zijlstra 	struct rt_rq		*my_q;
13906f505b16SPeter Zijlstra #endif
1391fa717060SPeter Zijlstra };
1392fa717060SPeter Zijlstra 
1393aab03e05SDario Faggioli struct sched_dl_entity {
1394aab03e05SDario Faggioli 	struct rb_node	rb_node;
1395aab03e05SDario Faggioli 
1396aab03e05SDario Faggioli 	/*
1397aab03e05SDario Faggioli 	 * Original scheduling parameters. Copied here from sched_attr
13984027d080Sxiaofeng.yan 	 * during sched_setattr(), they will remain the same until
13994027d080Sxiaofeng.yan 	 * the next sched_setattr().
1400aab03e05SDario Faggioli 	 */
1401aab03e05SDario Faggioli 	u64 dl_runtime;		/* maximum runtime for each instance	*/
1402aab03e05SDario Faggioli 	u64 dl_deadline;	/* relative deadline of each instance	*/
1403755378a4SHarald Gustafsson 	u64 dl_period;		/* separation of two instances (period) */
1404332ac17eSDario Faggioli 	u64 dl_bw;		/* dl_runtime / dl_deadline		*/
1405aab03e05SDario Faggioli 
1406aab03e05SDario Faggioli 	/*
1407aab03e05SDario Faggioli 	 * Actual scheduling parameters. Initialized with the values above,
1408aab03e05SDario Faggioli 	 * they are continuously updated during task execution. Note that
1409aab03e05SDario Faggioli 	 * the remaining runtime could be < 0 in case we are in overrun.
1410aab03e05SDario Faggioli 	 */
1411aab03e05SDario Faggioli 	s64 runtime;		/* remaining runtime for this instance	*/
1412aab03e05SDario Faggioli 	u64 deadline;		/* absolute deadline for this instance	*/
1413aab03e05SDario Faggioli 	unsigned int flags;	/* specifying the scheduler behaviour	*/
1414aab03e05SDario Faggioli 
1415aab03e05SDario Faggioli 	/*
1416aab03e05SDario Faggioli 	 * Some bool flags:
1417aab03e05SDario Faggioli 	 *
1418aab03e05SDario Faggioli 	 * @dl_throttled tells if we exhausted the runtime. If so, the
1419aab03e05SDario Faggioli 	 * task has to wait for a replenishment to be performed at the
1420aab03e05SDario Faggioli 	 * next firing of dl_timer.
1421aab03e05SDario Faggioli 	 *
14222d3d891dSDario Faggioli 	 * @dl_boosted tells if we are boosted due to DI. If so we are
14232d3d891dSDario Faggioli 	 * outside bandwidth enforcement mechanism (but only until we
14245bfd126eSJuri Lelli 	 * exit the critical section);
14255bfd126eSJuri Lelli 	 *
14265bfd126eSJuri Lelli 	 * @dl_yielded tells if task gave up the cpu before consuming
14275bfd126eSJuri Lelli 	 * all its available runtime during the last job.
1428aab03e05SDario Faggioli 	 */
142972f9f3fdSLuca Abeni 	int dl_throttled, dl_boosted, dl_yielded;
1430aab03e05SDario Faggioli 
1431aab03e05SDario Faggioli 	/*
1432aab03e05SDario Faggioli 	 * Bandwidth enforcement timer. Each -deadline task has its
1433aab03e05SDario Faggioli 	 * own bandwidth to be enforced, thus we need one timer per task.
1434aab03e05SDario Faggioli 	 */
1435aab03e05SDario Faggioli 	struct hrtimer dl_timer;
1436aab03e05SDario Faggioli };
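
/*
 * A numeric illustration of the parameters above (hypothetical values):
 * dl_runtime = 10ms, dl_deadline = 30ms, dl_period = 100ms grants each
 * instance 10ms of budget that must be consumed within 30ms of its
 * activation, with activations 100ms apart; dl_bw caches the ratio
 * dl_runtime / dl_deadline used for bandwidth accounting.
 */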
14378bd75c77SClark Williams 
14381d082fd0SPaul E. McKenney union rcu_special {
14391d082fd0SPaul E. McKenney 	struct {
14408203d6d0SPaul E. McKenney 		u8 blocked;
14418203d6d0SPaul E. McKenney 		u8 need_qs;
14428203d6d0SPaul E. McKenney 		u8 exp_need_qs;
14438203d6d0SPaul E. McKenney 		u8 pad;	/* Otherwise the compiler can store garbage here. */
14448203d6d0SPaul E. McKenney 	} b; /* Bits. */
14458203d6d0SPaul E. McKenney 	u32 s; /* Set of bits. */
14461d082fd0SPaul E. McKenney };
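
/*
 * For illustration (not part of this header): the union lets RCU test or
 * clear every flag with a single access through '.s', while individual
 * flags are set through '.b', e.g.:
 *
 *	t->rcu_read_unlock_special.b.blocked = true;
 *	if (t->rcu_read_unlock_special.s)
 *		...;
 */
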
144786848966SPaul E. McKenney struct rcu_node;
144886848966SPaul E. McKenney 
14498dc85d54SPeter Zijlstra enum perf_event_task_context {
14508dc85d54SPeter Zijlstra 	perf_invalid_context = -1,
14518dc85d54SPeter Zijlstra 	perf_hw_context = 0,
145289a1e187SPeter Zijlstra 	perf_sw_context,
14538dc85d54SPeter Zijlstra 	perf_nr_task_contexts,
14548dc85d54SPeter Zijlstra };
14558dc85d54SPeter Zijlstra 
145672b252aeSMel Gorman /* Track pages that require TLB flushes */
145772b252aeSMel Gorman struct tlbflush_unmap_batch {
145872b252aeSMel Gorman 	/*
145972b252aeSMel Gorman 	 * Each bit set is a CPU that potentially has a TLB entry for one of
146072b252aeSMel Gorman 	 * the PFNs being flushed. See set_tlb_ubc_flush_pending().
146172b252aeSMel Gorman 	 */
146272b252aeSMel Gorman 	struct cpumask cpumask;
146372b252aeSMel Gorman 
146472b252aeSMel Gorman 	/* True if any bit in cpumask is set */
146572b252aeSMel Gorman 	bool flush_required;
1466d950c947SMel Gorman 
1467d950c947SMel Gorman 	/*
1468d950c947SMel Gorman 	 * If true then the PTE was dirty when unmapped. The entry must be
1469d950c947SMel Gorman 	 * flushed before IO is initiated or a stale TLB entry potentially
1470d950c947SMel Gorman 	 * allows an update without redirtying the page.
1471d950c947SMel Gorman 	 */
1472d950c947SMel Gorman 	bool writable;
147372b252aeSMel Gorman };
147472b252aeSMel Gorman 
14751da177e4SLinus Torvalds struct task_struct {
1476c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
1477c65eacbeSAndy Lutomirski 	/*
1478c65eacbeSAndy Lutomirski 	 * For reasons of header soup (see current_thread_info()), this
1479c65eacbeSAndy Lutomirski 	 * must be the first element of task_struct.
1480c65eacbeSAndy Lutomirski 	 */
1481c65eacbeSAndy Lutomirski 	struct thread_info thread_info;
1482c65eacbeSAndy Lutomirski #endif
14831da177e4SLinus Torvalds 	volatile long state;	/* -1 unrunnable, 0 runnable, >0 stopped */
1484f7e4217bSRoman Zippel 	void *stack;
14851da177e4SLinus Torvalds 	atomic_t usage;
148697dc32cdSWilliam Cohen 	unsigned int flags;	/* per process flags, defined below */
148797dc32cdSWilliam Cohen 	unsigned int ptrace;
14881da177e4SLinus Torvalds 
14892dd73a4fSPeter Williams #ifdef CONFIG_SMP
1490fa14ff4aSPeter Zijlstra 	struct llist_node wake_entry;
14913ca7a440SPeter Zijlstra 	int on_cpu;
1492c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
1493c65eacbeSAndy Lutomirski 	unsigned int cpu;	/* current CPU */
1494c65eacbeSAndy Lutomirski #endif
149563b0e9edSMike Galbraith 	unsigned int wakee_flips;
149662470419SMichael Wang 	unsigned long wakee_flip_decay_ts;
149763b0e9edSMike Galbraith 	struct task_struct *last_wakee;
1498ac66f547SPeter Zijlstra 
1499ac66f547SPeter Zijlstra 	int wake_cpu;
15004866cde0SNick Piggin #endif
1501fd2f4419SPeter Zijlstra 	int on_rq;
150250e645a8SIngo Molnar 
1503b29739f9SIngo Molnar 	int prio, static_prio, normal_prio;
1504c7aceabaSRichard Kennedy 	unsigned int rt_priority;
15055522d5d5SIngo Molnar 	const struct sched_class *sched_class;
150620b8a59fSIngo Molnar 	struct sched_entity se;
1507fa717060SPeter Zijlstra 	struct sched_rt_entity rt;
15088323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED
15098323f26cSPeter Zijlstra 	struct task_group *sched_task_group;
15108323f26cSPeter Zijlstra #endif
1511aab03e05SDario Faggioli 	struct sched_dl_entity dl;
15121da177e4SLinus Torvalds 
1513e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS
1514e107be36SAvi Kivity 	/* list of struct preempt_notifier: */
1515e107be36SAvi Kivity 	struct hlist_head preempt_notifiers;
1516e107be36SAvi Kivity #endif
1517e107be36SAvi Kivity 
15186c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE
15192056a782SJens Axboe 	unsigned int btrace_seq;
15206c5c9341SAlexey Dobriyan #endif
15211da177e4SLinus Torvalds 
152297dc32cdSWilliam Cohen 	unsigned int policy;
152329baa747SPeter Zijlstra 	int nr_cpus_allowed;
15241da177e4SLinus Torvalds 	cpumask_t cpus_allowed;
15251da177e4SLinus Torvalds 
1526a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU
1527e260be67SPaul E. McKenney 	int rcu_read_lock_nesting;
15281d082fd0SPaul E. McKenney 	union rcu_special rcu_read_unlock_special;
1529f41d911fSPaul E. McKenney 	struct list_head rcu_node_entry;
1530a57eb940SPaul E. McKenney 	struct rcu_node *rcu_blocked_node;
153128f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */
15328315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU
15338315f422SPaul E. McKenney 	unsigned long rcu_tasks_nvcsw;
15348315f422SPaul E. McKenney 	bool rcu_tasks_holdout;
15358315f422SPaul E. McKenney 	struct list_head rcu_tasks_holdout_list;
1536176f8f7aSPaul E. McKenney 	int rcu_tasks_idle_cpu;
15378315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */
1538e260be67SPaul E. McKenney 
1539f6db8347SNaveen N. Rao #ifdef CONFIG_SCHED_INFO
15401da177e4SLinus Torvalds 	struct sched_info sched_info;
15411da177e4SLinus Torvalds #endif
15421da177e4SLinus Torvalds 
15431da177e4SLinus Torvalds 	struct list_head tasks;
1544806c09a7SDario Faggioli #ifdef CONFIG_SMP
1545917b627dSGregory Haskins 	struct plist_node pushable_tasks;
15461baca4ceSJuri Lelli 	struct rb_node pushable_dl_tasks;
1547806c09a7SDario Faggioli #endif
15481da177e4SLinus Torvalds 
15491da177e4SLinus Torvalds 	struct mm_struct *mm, *active_mm;
1550615d6e87SDavidlohr Bueso 	/* per-thread vma caching */
1551615d6e87SDavidlohr Bueso 	u32 vmacache_seqnum;
1552615d6e87SDavidlohr Bueso 	struct vm_area_struct *vmacache[VMACACHE_SIZE];
155334e55232SKAMEZAWA Hiroyuki #if defined(SPLIT_RSS_COUNTING)
155434e55232SKAMEZAWA Hiroyuki 	struct task_rss_stat	rss_stat;
155534e55232SKAMEZAWA Hiroyuki #endif
15561da177e4SLinus Torvalds /* task state */
155797dc32cdSWilliam Cohen 	int exit_state;
15581da177e4SLinus Torvalds 	int exit_code, exit_signal;
15591da177e4SLinus Torvalds 	int pdeath_signal;  /*  The signal sent when the parent dies  */
1560e7cc4173SPalmer Dabbelt 	unsigned long jobctl;	/* JOBCTL_*, siglock protected */
15619b89f6baSAndrei Epure 
15629b89f6baSAndrei Epure 	/* Used for emulating ABI behavior of previous Linux versions */
156397dc32cdSWilliam Cohen 	unsigned int personality;
15649b89f6baSAndrei Epure 
1565be958bdcSPeter Zijlstra 	/* scheduler bits, serialized by scheduler locks */
1566ca94c442SLennart Poettering 	unsigned sched_reset_on_fork:1;
1567a8e4f2eaSPeter Zijlstra 	unsigned sched_contributes_to_load:1;
1568ff303e66SPeter Zijlstra 	unsigned sched_migrated:1;
1569b7e7ade3SPeter Zijlstra 	unsigned sched_remote_wakeup:1;
1570be958bdcSPeter Zijlstra 	unsigned :0; /* force alignment to the next boundary */
1571be958bdcSPeter Zijlstra 
1572be958bdcSPeter Zijlstra 	/* unserialized, strictly 'current' */
1573be958bdcSPeter Zijlstra 	unsigned in_execve:1; /* bit to tell LSMs we're in execve */
1574be958bdcSPeter Zijlstra 	unsigned in_iowait:1;
15757e781418SAndy Lutomirski #if !defined(TIF_RESTORE_SIGMASK)
15767e781418SAndy Lutomirski 	unsigned restore_sigmask:1;
15777e781418SAndy Lutomirski #endif
1578626ebc41STejun Heo #ifdef CONFIG_MEMCG
1579626ebc41STejun Heo 	unsigned memcg_may_oom:1;
1580127424c8SJohannes Weiner #ifndef CONFIG_SLOB
15816f185c29SVladimir Davydov 	unsigned memcg_kmem_skip_account:1;
15826f185c29SVladimir Davydov #endif
1583127424c8SJohannes Weiner #endif
1584ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK
1585ff303e66SPeter Zijlstra 	unsigned brk_randomized:1;
1586ff303e66SPeter Zijlstra #endif
15876f185c29SVladimir Davydov 
15881d4457f9SKees Cook 	unsigned long atomic_flags; /* Flags needing atomic access. */
15891d4457f9SKees Cook 
1590f56141e3SAndy Lutomirski 	struct restart_block restart_block;
1591f56141e3SAndy Lutomirski 
15921da177e4SLinus Torvalds 	pid_t pid;
15931da177e4SLinus Torvalds 	pid_t tgid;
15940a425405SArjan van de Ven 
15951314562aSHiroshi Shimamoto #ifdef CONFIG_CC_STACKPROTECTOR
15960a425405SArjan van de Ven 	/* Canary value for the -fstack-protector gcc feature */
15970a425405SArjan van de Ven 	unsigned long stack_canary;
15981314562aSHiroshi Shimamoto #endif
15991da177e4SLinus Torvalds 	/*
16001da177e4SLinus Torvalds 	 * pointers to (original) parent process, youngest child, younger sibling,
16011da177e4SLinus Torvalds 	 * older sibling, respectively.  (p->father can be replaced with
1602f470021aSRoland McGrath 	 * p->real_parent->pid)
16031da177e4SLinus Torvalds 	 */
1604abd63bc3SKees Cook 	struct task_struct __rcu *real_parent; /* real parent process */
1605abd63bc3SKees Cook 	struct task_struct __rcu *parent; /* recipient of SIGCHLD, wait4() reports */
16061da177e4SLinus Torvalds 	/*
1607f470021aSRoland McGrath 	 * children/sibling forms the list of my natural children
16081da177e4SLinus Torvalds 	 */
16091da177e4SLinus Torvalds 	struct list_head children;	/* list of my children */
16101da177e4SLinus Torvalds 	struct list_head sibling;	/* linkage in my parent's children list */
16111da177e4SLinus Torvalds 	struct task_struct *group_leader;	/* threadgroup leader */
16121da177e4SLinus Torvalds 
1613f470021aSRoland McGrath 	/*
1614f470021aSRoland McGrath 	 * ptraced is the list of tasks this task is using ptrace on.
1615f470021aSRoland McGrath 	 * This includes both natural children and PTRACE_ATTACH targets.
1616f470021aSRoland McGrath 	 * p->ptrace_entry is p's link on the p->parent->ptraced list.
1617f470021aSRoland McGrath 	 */
1618f470021aSRoland McGrath 	struct list_head ptraced;
1619f470021aSRoland McGrath 	struct list_head ptrace_entry;
1620f470021aSRoland McGrath 
16211da177e4SLinus Torvalds 	/* PID/PID hash table linkage. */
162292476d7fSEric W. Biederman 	struct pid_link pids[PIDTYPE_MAX];
162347e65328SOleg Nesterov 	struct list_head thread_group;
16240c740d0aSOleg Nesterov 	struct list_head thread_node;
16251da177e4SLinus Torvalds 
16261da177e4SLinus Torvalds 	struct completion *vfork_done;		/* for vfork() */
16271da177e4SLinus Torvalds 	int __user *set_child_tid;		/* CLONE_CHILD_SETTID */
16281da177e4SLinus Torvalds 	int __user *clear_child_tid;		/* CLONE_CHILD_CLEARTID */
16291da177e4SLinus Torvalds 
1630c66f08beSMichael Neuling 	cputime_t utime, stime, utimescaled, stimescaled;
16319ac52315SLaurent Vivier 	cputime_t gtime;
16329d7fb042SPeter Zijlstra 	struct prev_cputime prev_cputime;
16336a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
1634b7ce2277SFrederic Weisbecker 	seqcount_t vtime_seqcount;
16356a61671bSFrederic Weisbecker 	unsigned long long vtime_snap;
16366a61671bSFrederic Weisbecker 	enum {
16377098c1eaSFrederic Weisbecker 		/* Task is sleeping or running on a CPU with VTIME inactive */
16387098c1eaSFrederic Weisbecker 		VTIME_INACTIVE = 0,
16397098c1eaSFrederic Weisbecker 		/* Task runs in userspace on a CPU with VTIME active */
16406a61671bSFrederic Weisbecker 		VTIME_USER,
16417098c1eaSFrederic Weisbecker 		/* Task runs in kernelspace on a CPU with VTIME active */
16426a61671bSFrederic Weisbecker 		VTIME_SYS,
16436a61671bSFrederic Weisbecker 	} vtime_snap_whence;
16446a61671bSFrederic Weisbecker #endif
1645d027d45dSFrederic Weisbecker 
1646d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL
1647f009a7a7SFrederic Weisbecker 	atomic_t tick_dep_mask;
1648d027d45dSFrederic Weisbecker #endif
16491da177e4SLinus Torvalds 	unsigned long nvcsw, nivcsw; /* context switch counts */
1650ccbf62d8SThomas Gleixner 	u64 start_time;		/* monotonic time in nsec */
165157e0be04SThomas Gleixner 	u64 real_start_time;	/* boot based time in nsec */
16521da177e4SLinus Torvalds /* mm fault and swap info: this can arguably be seen as either mm-specific or thread-specific */
16531da177e4SLinus Torvalds 	unsigned long min_flt, maj_flt;
16541da177e4SLinus Torvalds 
1655f06febc9SFrank Mayhar 	struct task_cputime cputime_expires;
16561da177e4SLinus Torvalds 	struct list_head cpu_timers[3];
16571da177e4SLinus Torvalds 
16581da177e4SLinus Torvalds /* process credentials */
16591b0ba1c9SArnd Bergmann 	const struct cred __rcu *real_cred; /* objective and real subjective task
16603b11a1deSDavid Howells 					 * credentials (COW) */
16611b0ba1c9SArnd Bergmann 	const struct cred __rcu *cred;	/* effective (overridable) subjective task
16623b11a1deSDavid Howells 					 * credentials (COW) */
166336772092SPaolo 'Blaisorblade' Giarrusso 	char comm[TASK_COMM_LEN]; /* executable name excluding path
166436772092SPaolo 'Blaisorblade' Giarrusso 				     - access with [gs]et_task_comm (which lock
166536772092SPaolo 'Blaisorblade' Giarrusso 				       it with task_lock())
1666221af7f8SLinus Torvalds 				     - initialized normally by setup_new_exec */
16671da177e4SLinus Torvalds /* file system info */
1668756daf26SNeilBrown 	struct nameidata *nameidata;
16693d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC
16701da177e4SLinus Torvalds /* ipc stuff */
16711da177e4SLinus Torvalds 	struct sysv_sem sysvsem;
1672ab602f79SJack Miller 	struct sysv_shm sysvshm;
16733d5b6fccSAlexey Dobriyan #endif
1674e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK
167582a1fcb9SIngo Molnar /* hung task detection */
167682a1fcb9SIngo Molnar 	unsigned long last_switch_count;
167782a1fcb9SIngo Molnar #endif
16781da177e4SLinus Torvalds /* filesystem information */
16791da177e4SLinus Torvalds 	struct fs_struct *fs;
16801da177e4SLinus Torvalds /* open file information */
16811da177e4SLinus Torvalds 	struct files_struct *files;
16821651e14eSSerge E. Hallyn /* namespaces */
1683ab516013SSerge E. Hallyn 	struct nsproxy *nsproxy;
16841da177e4SLinus Torvalds /* signal handlers */
16851da177e4SLinus Torvalds 	struct signal_struct *signal;
16861da177e4SLinus Torvalds 	struct sighand_struct *sighand;
16871da177e4SLinus Torvalds 
16881da177e4SLinus Torvalds 	sigset_t blocked, real_blocked;
1689f3de272bSRoland McGrath 	sigset_t saved_sigmask;	/* restored if set_restore_sigmask() was used */
16901da177e4SLinus Torvalds 	struct sigpending pending;
16911da177e4SLinus Torvalds 
16921da177e4SLinus Torvalds 	unsigned long sas_ss_sp;
16931da177e4SLinus Torvalds 	size_t sas_ss_size;
16942a742138SStas Sergeev 	unsigned sas_ss_flags;
16952e01fabeSOleg Nesterov 
169667d12145SAl Viro 	struct callback_head *task_works;
1697e73f8959SOleg Nesterov 
16981da177e4SLinus Torvalds 	struct audit_context *audit_context;
1699bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL
1700e1760bd5SEric W. Biederman 	kuid_t loginuid;
17014746ec5bSEric Paris 	unsigned int sessionid;
1702bfef93a5SAl Viro #endif
1703932ecebbSWill Drewry 	struct seccomp seccomp;
17041da177e4SLinus Torvalds 
17051da177e4SLinus Torvalds /* Thread group tracking */
17061da177e4SLinus Torvalds 	u32 parent_exec_id;
17071da177e4SLinus Torvalds 	u32 self_exec_id;
170858568d2aSMiao Xie /* Protection of (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed,
170958568d2aSMiao Xie  * mempolicy */
17101da177e4SLinus Torvalds 	spinlock_t alloc_lock;
17111da177e4SLinus Torvalds 
1712b29739f9SIngo Molnar 	/* Protection of the PI data structures: */
17131d615482SThomas Gleixner 	raw_spinlock_t pi_lock;
1714b29739f9SIngo Molnar 
171576751049SPeter Zijlstra 	struct wake_q_node wake_q;
171676751049SPeter Zijlstra 
171723f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES
171823f78d4aSIngo Molnar 	/* PI waiters blocked on a rt_mutex held by this task */
1719fb00aca4SPeter Zijlstra 	struct rb_root pi_waiters;
1720fb00aca4SPeter Zijlstra 	struct rb_node *pi_waiters_leftmost;
172123f78d4aSIngo Molnar 	/* Deadlock detection and priority inheritance handling */
172223f78d4aSIngo Molnar 	struct rt_mutex_waiter *pi_blocked_on;
172323f78d4aSIngo Molnar #endif
172423f78d4aSIngo Molnar 
1725408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES
1726408894eeSIngo Molnar 	/* mutex deadlock detection */
1727408894eeSIngo Molnar 	struct mutex_waiter *blocked_on;
1728408894eeSIngo Molnar #endif
1729de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS
1730de30a2b3SIngo Molnar 	unsigned int irq_events;
1731de30a2b3SIngo Molnar 	unsigned long hardirq_enable_ip;
1732de30a2b3SIngo Molnar 	unsigned long hardirq_disable_ip;
1733fa1452e8SHiroshi Shimamoto 	unsigned int hardirq_enable_event;
1734de30a2b3SIngo Molnar 	unsigned int hardirq_disable_event;
1735fa1452e8SHiroshi Shimamoto 	int hardirqs_enabled;
1736de30a2b3SIngo Molnar 	int hardirq_context;
1737fa1452e8SHiroshi Shimamoto 	unsigned long softirq_disable_ip;
1738fa1452e8SHiroshi Shimamoto 	unsigned long softirq_enable_ip;
1739fa1452e8SHiroshi Shimamoto 	unsigned int softirq_disable_event;
1740fa1452e8SHiroshi Shimamoto 	unsigned int softirq_enable_event;
1741fa1452e8SHiroshi Shimamoto 	int softirqs_enabled;
1742de30a2b3SIngo Molnar 	int softirq_context;
1743de30a2b3SIngo Molnar #endif
1744fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP
1745bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH 48UL
1746fbb9ce95SIngo Molnar 	u64 curr_chain_key;
1747fbb9ce95SIngo Molnar 	int lockdep_depth;
1748fbb9ce95SIngo Molnar 	unsigned int lockdep_recursion;
1749c7aceabaSRichard Kennedy 	struct held_lock held_locks[MAX_LOCK_DEPTH];
1750cf40bd16SNick Piggin 	gfp_t lockdep_reclaim_gfp;
1751fbb9ce95SIngo Molnar #endif
1752c6d30853SAndrey Ryabinin #ifdef CONFIG_UBSAN
1753c6d30853SAndrey Ryabinin 	unsigned int in_ubsan;
1754c6d30853SAndrey Ryabinin #endif
1755408894eeSIngo Molnar 
17561da177e4SLinus Torvalds /* journalling filesystem info */
17571da177e4SLinus Torvalds 	void *journal_info;
17581da177e4SLinus Torvalds 
1759d89d8796SNeil Brown /* stacked block device info */
1760bddd87c7SAkinobu Mita 	struct bio_list *bio_list;
1761d89d8796SNeil Brown 
176273c10101SJens Axboe #ifdef CONFIG_BLOCK
176373c10101SJens Axboe /* stack plugging */
176473c10101SJens Axboe 	struct blk_plug *plug;
176573c10101SJens Axboe #endif
176673c10101SJens Axboe 
17671da177e4SLinus Torvalds /* VM state */
17681da177e4SLinus Torvalds 	struct reclaim_state *reclaim_state;
17691da177e4SLinus Torvalds 
17701da177e4SLinus Torvalds 	struct backing_dev_info *backing_dev_info;
17711da177e4SLinus Torvalds 
17721da177e4SLinus Torvalds 	struct io_context *io_context;
17731da177e4SLinus Torvalds 
17741da177e4SLinus Torvalds 	unsigned long ptrace_message;
17751da177e4SLinus Torvalds 	siginfo_t *last_siginfo; /* For ptrace use.  */
17767c3ab738SAndrew Morton 	struct task_io_accounting ioac;
17778f0ab514SJay Lan #if defined(CONFIG_TASK_XACCT)
17781da177e4SLinus Torvalds 	u64 acct_rss_mem1;	/* accumulated rss usage */
17791da177e4SLinus Torvalds 	u64 acct_vm_mem1;	/* accumulated virtual memory usage */
178049b5cf34SJonathan Lim 	cputime_t acct_timexpd;	/* stime + utime since last update */
17811da177e4SLinus Torvalds #endif
17821da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS
178358568d2aSMiao Xie 	nodemask_t mems_allowed;	/* Protected by alloc_lock */
1784cc9a6c87SMel Gorman 	seqcount_t mems_allowed_seq;	/* Sequence number to catch updates */
1785825a46afSPaul Jackson 	int cpuset_mem_spread_rotor;
17866adef3ebSJack Steiner 	int cpuset_slab_spread_rotor;
17871da177e4SLinus Torvalds #endif
1788ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS
1789817929ecSPaul Menage 	/* Control Group info protected by css_set_lock */
17902c392b8cSArnd Bergmann 	struct css_set __rcu *cgroups;
1791817929ecSPaul Menage 	/* cg_list protected by css_set_lock and tsk->alloc_lock */
1792817929ecSPaul Menage 	struct list_head cg_list;
1793ddbcc7e8SPaul Menage #endif
179442b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX
17950771dfefSIngo Molnar 	struct robust_list_head __user *robust_list;
179634f192c6SIngo Molnar #ifdef CONFIG_COMPAT
179734f192c6SIngo Molnar 	struct compat_robust_list_head __user *compat_robust_list;
179834f192c6SIngo Molnar #endif
1799c87e2837SIngo Molnar 	struct list_head pi_state_list;
1800c87e2837SIngo Molnar 	struct futex_pi_state *pi_state_cache;
180142b2dd0aSAlexey Dobriyan #endif
1802cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS
18038dc85d54SPeter Zijlstra 	struct perf_event_context *perf_event_ctxp[perf_nr_task_contexts];
1804cdd6c482SIngo Molnar 	struct mutex perf_event_mutex;
1805cdd6c482SIngo Molnar 	struct list_head perf_event_list;
1806a63eaf34SPaul Mackerras #endif
18078f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT
18088f47b187SThomas Gleixner 	unsigned long preempt_disable_ip;
18098f47b187SThomas Gleixner #endif
1810c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA
181158568d2aSMiao Xie 	struct mempolicy *mempolicy;	/* Protected by alloc_lock */
1812c7aceabaSRichard Kennedy 	short il_next;
1813207205a2SEric Dumazet 	short pref_node_fork;
1814c7aceabaSRichard Kennedy #endif
1815cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING
1816cbee9f88SPeter Zijlstra 	int numa_scan_seq;
1817cbee9f88SPeter Zijlstra 	unsigned int numa_scan_period;
1818598f0ec0SMel Gorman 	unsigned int numa_scan_period_max;
1819de1c9ce6SRik van Riel 	int numa_preferred_nid;
18206b9a7460SMel Gorman 	unsigned long numa_migrate_retry;
1821cbee9f88SPeter Zijlstra 	u64 node_stamp;			/* migration stamp  */
18227e2703e6SRik van Riel 	u64 last_task_numa_placement;
18237e2703e6SRik van Riel 	u64 last_sum_exec_runtime;
1824cbee9f88SPeter Zijlstra 	struct callback_head numa_work;
1825f809ca9aSMel Gorman 
18268c8a743cSPeter Zijlstra 	struct list_head numa_entry;
18278c8a743cSPeter Zijlstra 	struct numa_group *numa_group;
18288c8a743cSPeter Zijlstra 
1829745d6147SMel Gorman 	/*
183044dba3d5SIulia Manda 	 * numa_faults is an array split into four regions:
183144dba3d5SIulia Manda 	 * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer
183244dba3d5SIulia Manda 	 * in this precise order.
183344dba3d5SIulia Manda 	 *
183444dba3d5SIulia Manda 	 * faults_memory: Exponential decaying average of faults on a per-node
183544dba3d5SIulia Manda 	 * basis. Scheduling placement decisions are made based on these
183644dba3d5SIulia Manda 	 * counts. The values remain static for the duration of a PTE scan.
183744dba3d5SIulia Manda 	 * faults_cpu: Track the nodes the process was running on when a NUMA
183844dba3d5SIulia Manda 	 * hinting fault was incurred.
183944dba3d5SIulia Manda 	 * faults_memory_buffer and faults_cpu_buffer: Record faults per node
184044dba3d5SIulia Manda 	 * during the current scan window. When the scan completes, the counts
184144dba3d5SIulia Manda 	 * in faults_memory and faults_cpu decay and these values are copied.
1842745d6147SMel Gorman 	 */
184344dba3d5SIulia Manda 	unsigned long *numa_faults;
184483e1d2cdSMel Gorman 	unsigned long total_numa_faults;
1845745d6147SMel Gorman 
1846745d6147SMel Gorman 	/*
184704bb2f94SRik van Riel 	 * numa_faults_locality tracks if faults recorded during the last
1848074c2381SMel Gorman 	 * scan window were remote/local or failed to migrate. The task scan
1849074c2381SMel Gorman 	 * period is adapted based on the locality of the faults with different
1850074c2381SMel Gorman 	 * weights depending on whether they were shared or private faults.
185104bb2f94SRik van Riel 	 */
1852074c2381SMel Gorman 	unsigned long numa_faults_locality[3];
185304bb2f94SRik van Riel 
1854b32e86b4SIngo Molnar 	unsigned long numa_pages_migrated;
1855cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */
1856cbee9f88SPeter Zijlstra 
185772b252aeSMel Gorman #ifdef CONFIG_ARCH_WANT_BATCHED_UNMAP_TLB_FLUSH
185872b252aeSMel Gorman 	struct tlbflush_unmap_batch tlb_ubc;
185972b252aeSMel Gorman #endif
186072b252aeSMel Gorman 
1861e56d0903SIngo Molnar 	struct rcu_head rcu;
1862b92ce558SJens Axboe 
1863b92ce558SJens Axboe 	/*
1864b92ce558SJens Axboe 	 * cache last used pipe for splice
1865b92ce558SJens Axboe 	 */
1866b92ce558SJens Axboe 	struct pipe_inode_info *splice_pipe;
18675640f768SEric Dumazet 
18685640f768SEric Dumazet 	struct page_frag task_frag;
18695640f768SEric Dumazet 
1870ca74e92bSShailabh Nagar #ifdef	CONFIG_TASK_DELAY_ACCT
1871ca74e92bSShailabh Nagar 	struct task_delay_info *delays;
1872ca74e92bSShailabh Nagar #endif
1873f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION
1874f4f154fdSAkinobu Mita 	int make_it_fail;
1875f4f154fdSAkinobu Mita #endif
18769d823e8fSWu Fengguang 	/*
18779d823e8fSWu Fengguang 	 * when (nr_dirtied >= nr_dirtied_pause), it's time to call
18789d823e8fSWu Fengguang 	 * balance_dirty_pages() for some dirty throttling pause
18799d823e8fSWu Fengguang 	 */
18809d823e8fSWu Fengguang 	int nr_dirtied;
18819d823e8fSWu Fengguang 	int nr_dirtied_pause;
188283712358SWu Fengguang 	unsigned long dirty_paused_when; /* start of a write-and-pause period */
18839d823e8fSWu Fengguang 
18849745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP
18859745512cSArjan van de Ven 	int latency_record_count;
18869745512cSArjan van de Ven 	struct latency_record latency_record[LT_SAVECOUNT];
18879745512cSArjan van de Ven #endif
18886976675dSArjan van de Ven 	/*
18896976675dSArjan van de Ven 	 * time slack values; these are used to round up poll() and
18906976675dSArjan van de Ven 	 * select() etc timeout values. These are in nanoseconds.
18916976675dSArjan van de Ven 	 */
1892da8b44d5SJohn Stultz 	u64 timer_slack_ns;
1893da8b44d5SJohn Stultz 	u64 default_timer_slack_ns;
1894f8d570a4SDavid Miller 
18950b24beccSAndrey Ryabinin #ifdef CONFIG_KASAN
18960b24beccSAndrey Ryabinin 	unsigned int kasan_depth;
18970b24beccSAndrey Ryabinin #endif
1898fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER
18993ad2f3fbSDaniel Mack 	/* Index of currently stored address in ret_stack */
1900f201ae23SFrederic Weisbecker 	int curr_ret_stack;
1901f201ae23SFrederic Weisbecker 	/* Stack of return addresses for return function tracing */
1902f201ae23SFrederic Weisbecker 	struct ftrace_ret_stack	*ret_stack;
19038aef2d28SSteven Rostedt 	/* time stamp for last schedule */
19048aef2d28SSteven Rostedt 	unsigned long long ftrace_timestamp;
1905f201ae23SFrederic Weisbecker 	/*
1906f201ae23SFrederic Weisbecker 	 * Number of functions that haven't been traced
1907f201ae23SFrederic Weisbecker 	 * because of depth overrun.
1908f201ae23SFrederic Weisbecker 	 */
1909f201ae23SFrederic Weisbecker 	atomic_t trace_overrun;
1910380c4b14SFrederic Weisbecker 	/* Pause for the tracing */
1911380c4b14SFrederic Weisbecker 	atomic_t tracing_graph_pause;
1912f201ae23SFrederic Weisbecker #endif
1913ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING
1914ea4e2bc4SSteven Rostedt 	/* state flags for use by tracers */
1915ea4e2bc4SSteven Rostedt 	unsigned long trace;
1916b1cff0adSSteven Rostedt 	/* bitmask and counter of trace recursion */
1917261842b7SSteven Rostedt 	unsigned long trace_recursion;
1918261842b7SSteven Rostedt #endif /* CONFIG_TRACING */
19195c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV
19205c9a8750SDmitry Vyukov 	/* Coverage collection mode enabled for this task (0 if disabled). */
19215c9a8750SDmitry Vyukov 	enum kcov_mode kcov_mode;
19225c9a8750SDmitry Vyukov 	/* Size of the kcov_area. */
19235c9a8750SDmitry Vyukov 	unsigned	kcov_size;
19245c9a8750SDmitry Vyukov 	/* Buffer for coverage collection. */
19255c9a8750SDmitry Vyukov 	void		*kcov_area;
19265c9a8750SDmitry Vyukov 	/* kcov descriptor wired with this task or NULL. */
19275c9a8750SDmitry Vyukov 	struct kcov	*kcov;
19285c9a8750SDmitry Vyukov #endif
19296f185c29SVladimir Davydov #ifdef CONFIG_MEMCG
1930626ebc41STejun Heo 	struct mem_cgroup *memcg_in_oom;
1931626ebc41STejun Heo 	gfp_t memcg_oom_gfp_mask;
1932626ebc41STejun Heo 	int memcg_oom_order;
1933b23afb93STejun Heo 
1934b23afb93STejun Heo 	/* number of pages to reclaim on returning to userland */
1935b23afb93STejun Heo 	unsigned int memcg_nr_pages_over_high;
1936569b846dSKAMEZAWA Hiroyuki #endif
19370326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES
19380326f5a9SSrikar Dronamraju 	struct uprobe_task *utask;
19390326f5a9SSrikar Dronamraju #endif
1940cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE)
1941cafe5635SKent Overstreet 	unsigned int	sequential_io;
1942cafe5635SKent Overstreet 	unsigned int	sequential_io_avg;
1943cafe5635SKent Overstreet #endif
19448eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
19458eb23b9fSPeter Zijlstra 	unsigned long	task_state_change;
19468eb23b9fSPeter Zijlstra #endif
19478bcbde54SDavid Hildenbrand 	int pagefault_disabled;
194803049269SMichal Hocko #ifdef CONFIG_MMU
194929c696e1SVladimir Davydov 	struct task_struct *oom_reaper_list;
195003049269SMichal Hocko #endif
1951ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK
1952ba14a194SAndy Lutomirski 	struct vm_struct *stack_vm_area;
1953ba14a194SAndy Lutomirski #endif
195468f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
195568f24b08SAndy Lutomirski 	/* A live task holds one reference. */
195668f24b08SAndy Lutomirski 	atomic_t stack_refcount;
195768f24b08SAndy Lutomirski #endif
19580c8c0f03SDave Hansen /* CPU-specific state of this task */
19590c8c0f03SDave Hansen 	struct thread_struct thread;
19600c8c0f03SDave Hansen /*
19610c8c0f03SDave Hansen  * WARNING: on x86, 'thread_struct' contains a variable-sized
19620c8c0f03SDave Hansen  * structure.  It *MUST* be at the end of 'task_struct'.
19630c8c0f03SDave Hansen  *
19640c8c0f03SDave Hansen  * Do not put anything below here!
19650c8c0f03SDave Hansen  */
19661da177e4SLinus Torvalds };
19671da177e4SLinus Torvalds 
19685aaeb5c0SIngo Molnar #ifdef CONFIG_ARCH_WANTS_DYNAMIC_TASK_STRUCT
19695aaeb5c0SIngo Molnar extern int arch_task_struct_size __read_mostly;
19705aaeb5c0SIngo Molnar #else
19715aaeb5c0SIngo Molnar # define arch_task_struct_size (sizeof(struct task_struct))
19725aaeb5c0SIngo Molnar #endif
19730c8c0f03SDave Hansen 
1974ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK
1975ba14a194SAndy Lutomirski static inline struct vm_struct *task_stack_vm_area(const struct task_struct *t)
1976ba14a194SAndy Lutomirski {
1977ba14a194SAndy Lutomirski 	return t->stack_vm_area;
1978ba14a194SAndy Lutomirski }
1979ba14a194SAndy Lutomirski #else
1980ba14a194SAndy Lutomirski static inline struct vm_struct *task_stack_vm_area(const struct task_struct *t)
1981ba14a194SAndy Lutomirski {
1982ba14a194SAndy Lutomirski 	return NULL;
1983ba14a194SAndy Lutomirski }
1984ba14a194SAndy Lutomirski #endif
1985ba14a194SAndy Lutomirski 
198676e6eee0SRusty Russell /* Future-safe accessor for struct task_struct's cpus_allowed. */
1987a4636818SRusty Russell #define tsk_cpus_allowed(tsk) (&(tsk)->cpus_allowed)
198876e6eee0SRusty Russell 
198950605ffbSThomas Gleixner static inline int tsk_nr_cpus_allowed(struct task_struct *p)
199050605ffbSThomas Gleixner {
199150605ffbSThomas Gleixner 	return p->nr_cpus_allowed;
199250605ffbSThomas Gleixner }
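
/*
 * For illustration (not part of this header), the common affinity test
 * done through these accessors; example_can_run_on() is hypothetical.
 */
static inline bool example_can_run_on(struct task_struct *p, int cpu)
{
	return cpumask_test_cpu(cpu, tsk_cpus_allowed(p));
}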
199350605ffbSThomas Gleixner 
19946688cc05SPeter Zijlstra #define TNF_MIGRATED	0x01
19956688cc05SPeter Zijlstra #define TNF_NO_GROUP	0x02
1996dabe1d99SRik van Riel #define TNF_SHARED	0x04
199704bb2f94SRik van Riel #define TNF_FAULT_LOCAL	0x08
1998074c2381SMel Gorman #define TNF_MIGRATE_FAIL 0x10
19996688cc05SPeter Zijlstra 
2000b18dc5f2SMichal Hocko static inline bool in_vfork(struct task_struct *tsk)
2001b18dc5f2SMichal Hocko {
2002b18dc5f2SMichal Hocko 	bool ret;
2003b18dc5f2SMichal Hocko 
2004b18dc5f2SMichal Hocko 	/*
2005b18dc5f2SMichal Hocko 	 * need RCU to access ->real_parent if CLONE_VM was used along with
2006b18dc5f2SMichal Hocko 	 * CLONE_PARENT.
2007b18dc5f2SMichal Hocko 	 *
2008b18dc5f2SMichal Hocko 	 * We check real_parent->mm == tsk->mm because CLONE_VFORK does not
2009b18dc5f2SMichal Hocko 	 * imply CLONE_VM
2010b18dc5f2SMichal Hocko 	 *
2011b18dc5f2SMichal Hocko 	 * CLONE_VFORK can be used with CLONE_PARENT/CLONE_THREAD and thus
2012b18dc5f2SMichal Hocko 	 * ->real_parent is not necessarily the task doing vfork(), so in
2013b18dc5f2SMichal Hocko 	 * theory we can't rely on task_lock() if we want to dereference it.
2014b18dc5f2SMichal Hocko 	 *
2015b18dc5f2SMichal Hocko 	 * And in this case we can't trust the real_parent->mm == tsk->mm
2016b18dc5f2SMichal Hocko 	 * check, it can be false negative. But we do not care, if init or
2017b18dc5f2SMichal Hocko 	 * another oom-unkillable task does this it should blame itself.
2018b18dc5f2SMichal Hocko 	 */
2019b18dc5f2SMichal Hocko 	rcu_read_lock();
2020b18dc5f2SMichal Hocko 	ret = tsk->vfork_done && tsk->real_parent->mm == tsk->mm;
2021b18dc5f2SMichal Hocko 	rcu_read_unlock();
2022b18dc5f2SMichal Hocko 
2023b18dc5f2SMichal Hocko 	return ret;
2024b18dc5f2SMichal Hocko }
2025b18dc5f2SMichal Hocko 
2026cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING
20276688cc05SPeter Zijlstra extern void task_numa_fault(int last_node, int node, int pages, int flags);
2028e29cf08bSMel Gorman extern pid_t task_numa_group_id(struct task_struct *p);
20291a687c2eSMel Gorman extern void set_numabalancing_state(bool enabled);
203082727018SRik van Riel extern void task_numa_free(struct task_struct *p);
203110f39042SRik van Riel extern bool should_numa_migrate_memory(struct task_struct *p, struct page *page,
203210f39042SRik van Riel 					int src_nid, int dst_cpu);
2033cbee9f88SPeter Zijlstra #else
2034ac8e895bSMel Gorman static inline void task_numa_fault(int last_node, int node, int pages,
20356688cc05SPeter Zijlstra 				   int flags)
2036cbee9f88SPeter Zijlstra {
2037cbee9f88SPeter Zijlstra }
2038e29cf08bSMel Gorman static inline pid_t task_numa_group_id(struct task_struct *p)
2039e29cf08bSMel Gorman {
2040e29cf08bSMel Gorman 	return 0;
2041e29cf08bSMel Gorman }
20421a687c2eSMel Gorman static inline void set_numabalancing_state(bool enabled)
20431a687c2eSMel Gorman {
20441a687c2eSMel Gorman }
204582727018SRik van Riel static inline void task_numa_free(struct task_struct *p)
204682727018SRik van Riel {
204782727018SRik van Riel }
204810f39042SRik van Riel static inline bool should_numa_migrate_memory(struct task_struct *p,
204910f39042SRik van Riel 				struct page *page, int src_nid, int dst_cpu)
205010f39042SRik van Riel {
205110f39042SRik van Riel 	return true;
205210f39042SRik van Riel }
2053cbee9f88SPeter Zijlstra #endif
2054cbee9f88SPeter Zijlstra 
2055e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task)
205622c935f4SEric W. Biederman {
205722c935f4SEric W. Biederman 	return task->pids[PIDTYPE_PID].pid;
205822c935f4SEric W. Biederman }
205922c935f4SEric W. Biederman 
2060e868171aSAlexey Dobriyan static inline struct pid *task_tgid(struct task_struct *task)
206122c935f4SEric W. Biederman {
206222c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_PID].pid;
206322c935f4SEric W. Biederman }
206422c935f4SEric W. Biederman 
20656dda81f4SOleg Nesterov /*
20666dda81f4SOleg Nesterov  * Without tasklist or rcu lock it is not safe to dereference
20676dda81f4SOleg Nesterov  * the result of task_pgrp/task_session even if task == current;
20686dda81f4SOleg Nesterov  * we can race with another thread doing sys_setsid/sys_setpgid.
20696dda81f4SOleg Nesterov  */
2070e868171aSAlexey Dobriyan static inline struct pid *task_pgrp(struct task_struct *task)
207122c935f4SEric W. Biederman {
207222c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_PGID].pid;
207322c935f4SEric W. Biederman }
207422c935f4SEric W. Biederman 
2075e868171aSAlexey Dobriyan static inline struct pid *task_session(struct task_struct *task)
207622c935f4SEric W. Biederman {
207722c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_SID].pid;
207822c935f4SEric W. Biederman }
207922c935f4SEric W. Biederman 
20807af57294SPavel Emelyanov struct pid_namespace;
20817af57294SPavel Emelyanov 
20827af57294SPavel Emelyanov /*
20837af57294SPavel Emelyanov  * Helpers to get the task's different pids as they are seen
20847af57294SPavel Emelyanov  * from various namespaces:
20857af57294SPavel Emelyanov  *
20867af57294SPavel Emelyanov  * task_xid_nr()     : global id, i.e. the id seen from the init namespace;
208744c4e1b2SEric W. Biederman  * task_xid_vnr()    : virtual id, i.e. the id seen from the pid namespace of
208844c4e1b2SEric W. Biederman  *                     current.
20897af57294SPavel Emelyanov  * task_xid_nr_ns()  : id seen from the ns specified;
20907af57294SPavel Emelyanov  *
20917af57294SPavel Emelyanov  * set_task_vxid()   : assigns a virtual id to a task;
20927af57294SPavel Emelyanov  *
20937af57294SPavel Emelyanov  * see also pid_nr() etc in include/linux/pid.h; a usage sketch follows the helpers below.
20947af57294SPavel Emelyanov  */
209552ee2dfdSOleg Nesterov pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type,
209652ee2dfdSOleg Nesterov 			struct pid_namespace *ns);
20977af57294SPavel Emelyanov 
2098e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk)
20997af57294SPavel Emelyanov {
21007af57294SPavel Emelyanov 	return tsk->pid;
21017af57294SPavel Emelyanov }
21027af57294SPavel Emelyanov 
210352ee2dfdSOleg Nesterov static inline pid_t task_pid_nr_ns(struct task_struct *tsk,
210452ee2dfdSOleg Nesterov 					struct pid_namespace *ns)
210552ee2dfdSOleg Nesterov {
210652ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
210752ee2dfdSOleg Nesterov }
21087af57294SPavel Emelyanov 
21097af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk)
21107af57294SPavel Emelyanov {
211152ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
21127af57294SPavel Emelyanov }
21137af57294SPavel Emelyanov 
21147af57294SPavel Emelyanov 
2115e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk)
21167af57294SPavel Emelyanov {
21177af57294SPavel Emelyanov 	return tsk->tgid;
21187af57294SPavel Emelyanov }
21197af57294SPavel Emelyanov 
21202f2a3a46SPavel Emelyanov pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns);
21217af57294SPavel Emelyanov 
21227af57294SPavel Emelyanov static inline pid_t task_tgid_vnr(struct task_struct *tsk)
21237af57294SPavel Emelyanov {
21247af57294SPavel Emelyanov 	return pid_vnr(task_tgid(tsk));
21257af57294SPavel Emelyanov }
21267af57294SPavel Emelyanov 
21277af57294SPavel Emelyanov 
212880e0b6e8SRichard Guy Briggs static inline int pid_alive(const struct task_struct *p);
2129ad36d282SRichard Guy Briggs static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns)
2130ad36d282SRichard Guy Briggs {
2131ad36d282SRichard Guy Briggs 	pid_t pid = 0;
2132ad36d282SRichard Guy Briggs 
2133ad36d282SRichard Guy Briggs 	rcu_read_lock();
2134ad36d282SRichard Guy Briggs 	if (pid_alive(tsk))
2135ad36d282SRichard Guy Briggs 		pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns);
2136ad36d282SRichard Guy Briggs 	rcu_read_unlock();
2137ad36d282SRichard Guy Briggs 
2138ad36d282SRichard Guy Briggs 	return pid;
2139ad36d282SRichard Guy Briggs }
2140ad36d282SRichard Guy Briggs 
2141ad36d282SRichard Guy Briggs static inline pid_t task_ppid_nr(const struct task_struct *tsk)
2142ad36d282SRichard Guy Briggs {
2143ad36d282SRichard Guy Briggs 	return task_ppid_nr_ns(tsk, &init_pid_ns);
2144ad36d282SRichard Guy Briggs }
2145ad36d282SRichard Guy Briggs 
214652ee2dfdSOleg Nesterov static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk,
214752ee2dfdSOleg Nesterov 					struct pid_namespace *ns)
21487af57294SPavel Emelyanov {
214952ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
21507af57294SPavel Emelyanov }
21517af57294SPavel Emelyanov 
21527af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
21537af57294SPavel Emelyanov {
215452ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
21557af57294SPavel Emelyanov }
21567af57294SPavel Emelyanov 
21577af57294SPavel Emelyanov 
215852ee2dfdSOleg Nesterov static inline pid_t task_session_nr_ns(struct task_struct *tsk,
215952ee2dfdSOleg Nesterov 					struct pid_namespace *ns)
21607af57294SPavel Emelyanov {
216152ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
21627af57294SPavel Emelyanov }
21637af57294SPavel Emelyanov 
21647af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk)
21657af57294SPavel Emelyanov {
216652ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
21677af57294SPavel Emelyanov }
21687af57294SPavel Emelyanov 
21691b0f7ffdSOleg Nesterov /* obsolete, do not use */
21701b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk)
21711b0f7ffdSOleg Nesterov {
21721b0f7ffdSOleg Nesterov 	return task_pgrp_nr_ns(tsk, &init_pid_ns);
21731b0f7ffdSOleg Nesterov }
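/*
 * A usage sketch of the naming scheme above (illustrative only;
 * example_report_pids() is hypothetical and not part of this header):
 * the same task yields different numbers depending on the observer's
 * pid namespace.
 */
static inline void example_report_pids(struct task_struct *tsk)
{
	pid_t global = task_pid_nr(tsk);	/* id in the init namespace */
	pid_t virt = task_pid_vnr(tsk);		/* id in current's namespace */

	printk(KERN_DEBUG "task is pid %d globally, pid %d in my ns\n",
	       global, virt);
}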
21747af57294SPavel Emelyanov 
21751da177e4SLinus Torvalds /**
21761da177e4SLinus Torvalds  * pid_alive - check that a task structure is not stale
21771da177e4SLinus Torvalds  * @p: Task structure to be checked.
21781da177e4SLinus Torvalds  *
21791da177e4SLinus Torvalds  * Test if a process is not yet dead (at most zombie state).
21801da177e4SLinus Torvalds  * If pid_alive fails, then pointers within the task structure
21811da177e4SLinus Torvalds  * can be stale and must not be dereferenced.
2182e69f6186SYacine Belkadi  *
2183e69f6186SYacine Belkadi  * Return: 1 if the process is alive. 0 otherwise.
21841da177e4SLinus Torvalds  */
2185ad36d282SRichard Guy Briggs static inline int pid_alive(const struct task_struct *p)
21861da177e4SLinus Torvalds {
218792476d7fSEric W. Biederman 	return p->pids[PIDTYPE_PID].pid != NULL;
21881da177e4SLinus Torvalds }
21891da177e4SLinus Torvalds 
2190f400e198SSukadev Bhattiprolu /**
2191570f5241SSergey Senozhatsky  * is_global_init - check if a task structure is init
21933260259fSHenne  * @tsk: Task structure to be checked.
21943260259fSHenne  *
21953260259fSHenne  * Check if a task structure is the first user space task the kernel created.
2192570f5241SSergey Senozhatsky  * Since init is free to have sub-threads, we check the tgid.
2196e69f6186SYacine Belkadi  *
2197e69f6186SYacine Belkadi  * Return: 1 if the task structure is init. 0 otherwise.
2198f400e198SSukadev Bhattiprolu  */
2199e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk)
2200b461cc03SPavel Emelyanov {
2201570f5241SSergey Senozhatsky 	return task_tgid_nr(tsk) == 1;
2202b461cc03SPavel Emelyanov }
2203b460cbc5SSerge E. Hallyn 
22049ec52099SCedric Le Goater extern struct pid *cad_pid;
22059ec52099SCedric Le Goater 
22061da177e4SLinus Torvalds extern void free_task(struct task_struct *tsk);
22071da177e4SLinus Torvalds #define get_task_struct(tsk) do { atomic_inc(&(tsk)->usage); } while(0)
2208e56d0903SIngo Molnar 
2209158d9ebdSAndrew Morton extern void __put_task_struct(struct task_struct *t);
2210e56d0903SIngo Molnar 
2211e56d0903SIngo Molnar static inline void put_task_struct(struct task_struct *t)
2212e56d0903SIngo Molnar {
2213e56d0903SIngo Molnar 	if (atomic_dec_and_test(&t->usage))
22148c7904a0SEric W. Biederman 		__put_task_struct(t);
2215e56d0903SIngo Molnar }
22161da177e4SLinus Torvalds 
2217150593bfSOleg Nesterov struct task_struct *task_rcu_dereference(struct task_struct **ptask);
2218150593bfSOleg Nesterov struct task_struct *try_get_task_struct(struct task_struct **ptask);
2219150593bfSOleg Nesterov 
22206a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
22216a61671bSFrederic Weisbecker extern void task_cputime(struct task_struct *t,
22226a61671bSFrederic Weisbecker 			 cputime_t *utime, cputime_t *stime);
22236a61671bSFrederic Weisbecker extern void task_cputime_scaled(struct task_struct *t,
22246a61671bSFrederic Weisbecker 				cputime_t *utimescaled, cputime_t *stimescaled);
22256a61671bSFrederic Weisbecker extern cputime_t task_gtime(struct task_struct *t);
22266a61671bSFrederic Weisbecker #else
22276fac4829SFrederic Weisbecker static inline void task_cputime(struct task_struct *t,
22286fac4829SFrederic Weisbecker 				cputime_t *utime, cputime_t *stime)
22296fac4829SFrederic Weisbecker {
22306fac4829SFrederic Weisbecker 	if (utime)
22316fac4829SFrederic Weisbecker 		*utime = t->utime;
22326fac4829SFrederic Weisbecker 	if (stime)
22336fac4829SFrederic Weisbecker 		*stime = t->stime;
22346fac4829SFrederic Weisbecker }
22356fac4829SFrederic Weisbecker 
22366fac4829SFrederic Weisbecker static inline void task_cputime_scaled(struct task_struct *t,
22376fac4829SFrederic Weisbecker 				       cputime_t *utimescaled,
22386fac4829SFrederic Weisbecker 				       cputime_t *stimescaled)
22396fac4829SFrederic Weisbecker {
22406fac4829SFrederic Weisbecker 	if (utimescaled)
22416fac4829SFrederic Weisbecker 		*utimescaled = t->utimescaled;
22426fac4829SFrederic Weisbecker 	if (stimescaled)
22436fac4829SFrederic Weisbecker 		*stimescaled = t->stimescaled;
22446fac4829SFrederic Weisbecker }
22456a61671bSFrederic Weisbecker 
22466a61671bSFrederic Weisbecker static inline cputime_t task_gtime(struct task_struct *t)
22476a61671bSFrederic Weisbecker {
22486a61671bSFrederic Weisbecker 	return t->gtime;
22496a61671bSFrederic Weisbecker }
22506a61671bSFrederic Weisbecker #endif
2251e80d0a1aSFrederic Weisbecker extern void task_cputime_adjusted(struct task_struct *p, cputime_t *ut, cputime_t *st);
2252e80d0a1aSFrederic Weisbecker extern void thread_group_cputime_adjusted(struct task_struct *p, cputime_t *ut, cputime_t *st);
225349048622SBalbir Singh 
22541da177e4SLinus Torvalds /*
22551da177e4SLinus Torvalds  * Per process flags
22561da177e4SLinus Torvalds  */
22571da177e4SLinus Torvalds #define PF_EXITING	0x00000004	/* getting shut down */
2258778e9a9cSAlexey Kuznetsov #define PF_EXITPIDONE	0x00000008	/* pi exit done on shut down */
225994886b84SLaurent Vivier #define PF_VCPU		0x00000010	/* I'm a virtual CPU */
226021aa9af0STejun Heo #define PF_WQ_WORKER	0x00000020	/* I'm a workqueue worker */
22611da177e4SLinus Torvalds #define PF_FORKNOEXEC	0x00000040	/* forked but didn't exec */
22624db96cf0SAndi Kleen #define PF_MCE_PROCESS  0x00000080      /* process policy on mce errors */
22631da177e4SLinus Torvalds #define PF_SUPERPRIV	0x00000100	/* used super-user privileges */
22641da177e4SLinus Torvalds #define PF_DUMPCORE	0x00000200	/* dumped core */
22651da177e4SLinus Torvalds #define PF_SIGNALED	0x00000400	/* killed by a signal */
22661da177e4SLinus Torvalds #define PF_MEMALLOC	0x00000800	/* Allocating memory */
226772fa5997SVasiliy Kulikov #define PF_NPROC_EXCEEDED 0x00001000	/* set_user noticed that RLIMIT_NPROC was exceeded */
22681da177e4SLinus Torvalds #define PF_USED_MATH	0x00002000	/* if unset the fpu must be initialized before use */
2269774a1221STejun Heo #define PF_USED_ASYNC	0x00004000	/* used async_schedule*(), used by module init */
22701da177e4SLinus Torvalds #define PF_NOFREEZE	0x00008000	/* this thread should not be frozen */
22711da177e4SLinus Torvalds #define PF_FROZEN	0x00010000	/* frozen for system suspend */
22721da177e4SLinus Torvalds #define PF_FSTRANS	0x00020000	/* inside a filesystem transaction */
22731da177e4SLinus Torvalds #define PF_KSWAPD	0x00040000	/* I am kswapd */
227421caf2fcSMing Lei #define PF_MEMALLOC_NOIO 0x00080000	/* Allocating memory without IO involved */
22751da177e4SLinus Torvalds #define PF_LESS_THROTTLE 0x00100000	/* Throttle me less: I clean memory */
2276246bb0b1SOleg Nesterov #define PF_KTHREAD	0x00200000	/* I am a kernel thread */
2277b31dc66aSJens Axboe #define PF_RANDOMIZE	0x00400000	/* randomize virtual address space */
2278b31dc66aSJens Axboe #define PF_SWAPWRITE	0x00800000	/* Allowed to write to swap */
227914a40ffcSTejun Heo #define PF_NO_SETAFFINITY 0x04000000	/* Userland is not allowed to meddle with cpus_allowed */
22804db96cf0SAndi Kleen #define PF_MCE_EARLY    0x08000000      /* Early kill for mce process policy */
228161a87122SThomas Gleixner #define PF_MUTEX_TESTER	0x20000000	/* Thread belongs to the rt mutex tester */
228258a69cb4STejun Heo #define PF_FREEZER_SKIP	0x40000000	/* Freezer should not count it as freezable */
22832b44c4dbSColin Cross #define PF_SUSPEND_TASK 0x80000000      /* this thread called freeze_processes and should not be frozen */
22841da177e4SLinus Torvalds 
22851da177e4SLinus Torvalds /*
22861da177e4SLinus Torvalds  * Only the _current_ task can read/write to tsk->flags, but other
22871da177e4SLinus Torvalds  * tasks can access tsk->flags in readonly mode, for example
22881da177e4SLinus Torvalds  * with tsk_used_math() (like during threaded core dumping).
22891da177e4SLinus Torvalds  * There is, however, an exception to this rule during ptrace
22901da177e4SLinus Torvalds  * or during fork: the ptracer task is allowed to write to the
22911da177e4SLinus Torvalds  * child->flags of its traced child (same goes for fork, the parent
22921da177e4SLinus Torvalds  * can write to the child->flags), because we're guaranteed the
22931da177e4SLinus Torvalds  * child is not running and in turn not changing child->flags
22941da177e4SLinus Torvalds  * at the same time the parent does it.
22951da177e4SLinus Torvalds  */
22961da177e4SLinus Torvalds #define clear_stopped_child_used_math(child) do { (child)->flags &= ~PF_USED_MATH; } while (0)
22971da177e4SLinus Torvalds #define set_stopped_child_used_math(child) do { (child)->flags |= PF_USED_MATH; } while (0)
22981da177e4SLinus Torvalds #define clear_used_math() clear_stopped_child_used_math(current)
22991da177e4SLinus Torvalds #define set_used_math() set_stopped_child_used_math(current)
23001da177e4SLinus Torvalds #define conditional_stopped_child_used_math(condition, child) \
23011da177e4SLinus Torvalds 	do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= (condition) ? PF_USED_MATH : 0; } while (0)
23021da177e4SLinus Torvalds #define conditional_used_math(condition) \
23031da177e4SLinus Torvalds 	conditional_stopped_child_used_math(condition, current)
23041da177e4SLinus Torvalds #define copy_to_stopped_child_used_math(child) \
23051da177e4SLinus Torvalds 	do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= current->flags & PF_USED_MATH; } while (0)
23061da177e4SLinus Torvalds /* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */
23071da177e4SLinus Torvalds #define tsk_used_math(p) ((p)->flags & PF_USED_MATH)
23081da177e4SLinus Torvalds #define used_math() tsk_used_math(current)
23091da177e4SLinus Torvalds 
2310934f3072SJunxiao Bi /*
2310934f3072SJunxiao Bi  * __GFP_IO isn't allowed if PF_MEMALLOC_NOIO is set in current->flags;
2311934f3072SJunxiao Bi  * __GFP_FS is also cleared as it implies __GFP_IO.
2312934f3072SJunxiao Bi  */
231321caf2fcSMing Lei static inline gfp_t memalloc_noio_flags(gfp_t flags)
231421caf2fcSMing Lei {
231521caf2fcSMing Lei 	if (unlikely(current->flags & PF_MEMALLOC_NOIO))
2316934f3072SJunxiao Bi 		flags &= ~(__GFP_IO | __GFP_FS);
231721caf2fcSMing Lei 	return flags;
231821caf2fcSMing Lei }
231921caf2fcSMing Lei 
232021caf2fcSMing Lei static inline unsigned int memalloc_noio_save(void)
232121caf2fcSMing Lei {
232221caf2fcSMing Lei 	unsigned int flags = current->flags & PF_MEMALLOC_NOIO;
232321caf2fcSMing Lei 	current->flags |= PF_MEMALLOC_NOIO;
232421caf2fcSMing Lei 	return flags;
232521caf2fcSMing Lei }
232621caf2fcSMing Lei 
232721caf2fcSMing Lei static inline void memalloc_noio_restore(unsigned int flags)
232821caf2fcSMing Lei {
232921caf2fcSMing Lei 	current->flags = (current->flags & ~PF_MEMALLOC_NOIO) | flags;
233021caf2fcSMing Lei }
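/*
 * A minimal usage sketch (example_alloc_noio() is hypothetical, and
 * kmalloc() needs <linux/slab.h>, which this header does not include):
 * any reclaim triggered inside the save/restore bracket has
 * __GFP_IO/__GFP_FS stripped via memalloc_noio_flags().
 */
static inline void *example_alloc_noio(size_t size)
{
	unsigned int noio_flags = memalloc_noio_save();
	void *p = kmalloc(size, GFP_KERNEL);	/* reclaim here won't do I/O */

	memalloc_noio_restore(noio_flags);
	return p;
}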
233121caf2fcSMing Lei 
23321d4457f9SKees Cook /* Per-process atomic flags. */
2333a2b86f77SZefan Li #define PFA_NO_NEW_PRIVS 0	/* May not gain new privileges. */
23342ad654bcSZefan Li #define PFA_SPREAD_PAGE  1      /* Spread page cache over cpuset */
23352ad654bcSZefan Li #define PFA_SPREAD_SLAB  2      /* Spread some slab caches over cpuset */
233677ed2c57STetsuo Handa #define PFA_LMK_WAITING  3      /* Lowmemorykiller is waiting */
23371d4457f9SKees Cook 
23381d4457f9SKees Cook 
2339e0e5070bSZefan Li #define TASK_PFA_TEST(name, func)					\
2340e0e5070bSZefan Li 	static inline bool task_##func(struct task_struct *p)		\
2341e0e5070bSZefan Li 	{ return test_bit(PFA_##name, &p->atomic_flags); }
2342e0e5070bSZefan Li #define TASK_PFA_SET(name, func)					\
2343e0e5070bSZefan Li 	static inline void task_set_##func(struct task_struct *p)	\
2344e0e5070bSZefan Li 	{ set_bit(PFA_##name, &p->atomic_flags); }
2345e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func)					\
2346e0e5070bSZefan Li 	static inline void task_clear_##func(struct task_struct *p)	\
2347e0e5070bSZefan Li 	{ clear_bit(PFA_##name, &p->atomic_flags); }
23481d4457f9SKees Cook 
2349e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs)
2350e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs)
23511d4457f9SKees Cook 
23522ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page)
23532ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page)
23542ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
23552ad654bcSZefan Li 
23562ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
23572ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab)
23582ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
2359544b2c91STejun Heo 
236077ed2c57STetsuo Handa TASK_PFA_TEST(LMK_WAITING, lmk_waiting)
236177ed2c57STetsuo Handa TASK_PFA_SET(LMK_WAITING, lmk_waiting)
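/*
 * For illustration, TASK_PFA_TEST(SPREAD_PAGE, spread_page) above
 * expands to:
 *
 *	static inline bool task_spread_page(struct task_struct *p)
 *	{ return test_bit(PFA_SPREAD_PAGE, &p->atomic_flags); }
 *
 * so callers write task_spread_page(p) / task_set_spread_page(p)
 * instead of open-coding the bit operations.
 */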
236277ed2c57STetsuo Handa 
236339efa3efSTejun Heo /*
2364e5c1902eSTejun Heo  * task->jobctl flags
2365d79fdd6dSTejun Heo  */
2366ee77f075SOleg Nesterov #define JOBCTL_STOP_SIGMASK	0xffff	/* signr of the last group stop */
2367e5c1902eSTejun Heo 
2368f41d911fSPaul E. McKenney #define JOBCTL_STOP_DEQUEUED_BIT 16	/* stop signal dequeued */
2369a8f072c1STejun Heo #define JOBCTL_STOP_PENDING_BIT	17	/* task should stop for group stop */
2370a8f072c1STejun Heo #define JOBCTL_STOP_CONSUME_BIT	18	/* consume group stop count */
2371a8f072c1STejun Heo #define JOBCTL_TRAP_STOP_BIT	19	/* trap for STOP */
237273ddff2bSTejun Heo #define JOBCTL_TRAP_NOTIFY_BIT	20	/* trap for NOTIFY */
2373fb1d910cSTejun Heo #define JOBCTL_TRAPPING_BIT	21	/* switching to TRACED */
2374a8f072c1STejun Heo #define JOBCTL_LISTENING_BIT	22	/* ptracer is listening for events */
2375a8f072c1STejun Heo 
2376b76808e6SPalmer Dabbelt #define JOBCTL_STOP_DEQUEUED	(1UL << JOBCTL_STOP_DEQUEUED_BIT)
2377b76808e6SPalmer Dabbelt #define JOBCTL_STOP_PENDING	(1UL << JOBCTL_STOP_PENDING_BIT)
2378b76808e6SPalmer Dabbelt #define JOBCTL_STOP_CONSUME	(1UL << JOBCTL_STOP_CONSUME_BIT)
2379b76808e6SPalmer Dabbelt #define JOBCTL_TRAP_STOP	(1UL << JOBCTL_TRAP_STOP_BIT)
2380b76808e6SPalmer Dabbelt #define JOBCTL_TRAP_NOTIFY	(1UL << JOBCTL_TRAP_NOTIFY_BIT)
2381b76808e6SPalmer Dabbelt #define JOBCTL_TRAPPING		(1UL << JOBCTL_TRAPPING_BIT)
2382b76808e6SPalmer Dabbelt #define JOBCTL_LISTENING	(1UL << JOBCTL_LISTENING_BIT)
2383a8f072c1STejun Heo 
2384fb1d910cSTejun Heo #define JOBCTL_TRAP_MASK	(JOBCTL_TRAP_STOP | JOBCTL_TRAP_NOTIFY)
238573ddff2bSTejun Heo #define JOBCTL_PENDING_MASK	(JOBCTL_STOP_PENDING | JOBCTL_TRAP_MASK)
23863759a0d9STejun Heo 
23877dd3db54STejun Heo extern bool task_set_jobctl_pending(struct task_struct *task,
2388b76808e6SPalmer Dabbelt 				    unsigned long mask);
238973ddff2bSTejun Heo extern void task_clear_jobctl_trapping(struct task_struct *task);
23903759a0d9STejun Heo extern void task_clear_jobctl_pending(struct task_struct *task,
2391b76808e6SPalmer Dabbelt 				      unsigned long mask);
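/*
 * Sketch of typical use (signal delivery code, under ->sighand->siglock);
 * handle_jobctl_trap() is a hypothetical stand-in for the handling in
 * kernel/signal.c:
 *
 *	if (current->jobctl & JOBCTL_TRAP_MASK)
 *		handle_jobctl_trap();
 */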
239239efa3efSTejun Heo 
2393f41d911fSPaul E. McKenney static inline void rcu_copy_process(struct task_struct *p)
2394f41d911fSPaul E. McKenney {
23951da177e4SLinus Torvalds #ifdef CONFIG_PREEMPT_RCU
2396f41d911fSPaul E. McKenney 	p->rcu_read_lock_nesting = 0;
23971d082fd0SPaul E. McKenney 	p->rcu_read_unlock_special.s = 0;
2398dd5d19baSPaul E. McKenney 	p->rcu_blocked_node = NULL;
2399f41d911fSPaul E. McKenney 	INIT_LIST_HEAD(&p->rcu_node_entry);
24008315f422SPaul E. McKenney #endif /* #ifdef CONFIG_PREEMPT_RCU */
24018315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU
24028315f422SPaul E. McKenney 	p->rcu_tasks_holdout = false;
24038315f422SPaul E. McKenney 	INIT_LIST_HEAD(&p->rcu_tasks_holdout_list);
2404176f8f7aSPaul E. McKenney 	p->rcu_tasks_idle_cpu = -1;
24058315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */
2406f41d911fSPaul E. McKenney }
2407f41d911fSPaul E. McKenney 
2408907aed48SMel Gorman static inline void tsk_restore_flags(struct task_struct *task,
2409907aed48SMel Gorman 				unsigned long orig_flags, unsigned long flags)
2410907aed48SMel Gorman {
2411907aed48SMel Gorman 	task->flags &= ~flags;
2412907aed48SMel Gorman 	task->flags |= orig_flags & flags;
2413907aed48SMel Gorman }
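/*
 * Usage sketch (example_with_memalloc() is hypothetical): save the bits
 * of interest, set them for a critical section, then restore only those
 * bits, leaving any other flag changes made meanwhile intact.
 */
static inline void example_with_memalloc(void)
{
	unsigned long pflags = current->flags & PF_MEMALLOC;

	current->flags |= PF_MEMALLOC;
	/* ... allocations here must not recurse into reclaim ... */
	tsk_restore_flags(current, pflags, PF_MEMALLOC);
}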
2414907aed48SMel Gorman 
2415f82f8042SJuri Lelli extern int cpuset_cpumask_can_shrink(const struct cpumask *cur,
2416f82f8042SJuri Lelli 				     const struct cpumask *trial);
24177f51412aSJuri Lelli extern int task_can_attach(struct task_struct *p,
24187f51412aSJuri Lelli 			   const struct cpumask *cs_cpus_allowed);
24191da177e4SLinus Torvalds #ifdef CONFIG_SMP
24201e1b6c51SKOSAKI Motohiro extern void do_set_cpus_allowed(struct task_struct *p,
24211e1b6c51SKOSAKI Motohiro 			       const struct cpumask *new_mask);
24221e1b6c51SKOSAKI Motohiro 
2423cd8ba7cdSMike Travis extern int set_cpus_allowed_ptr(struct task_struct *p,
242496f874e2SRusty Russell 				const struct cpumask *new_mask);
24251da177e4SLinus Torvalds #else
24261e1b6c51SKOSAKI Motohiro static inline void do_set_cpus_allowed(struct task_struct *p,
24271e1b6c51SKOSAKI Motohiro 				      const struct cpumask *new_mask)
24281e1b6c51SKOSAKI Motohiro {
24291e1b6c51SKOSAKI Motohiro }
2430cd8ba7cdSMike Travis static inline int set_cpus_allowed_ptr(struct task_struct *p,
243196f874e2SRusty Russell 				       const struct cpumask *new_mask)
24321da177e4SLinus Torvalds {
243396f874e2SRusty Russell 	if (!cpumask_test_cpu(0, new_mask))
24341da177e4SLinus Torvalds 		return -EINVAL;
24351da177e4SLinus Torvalds 	return 0;
24361da177e4SLinus Torvalds }
24371da177e4SLinus Torvalds #endif
2438e0ad9556SRusty Russell 
24393451d024SFrederic Weisbecker #ifdef CONFIG_NO_HZ_COMMON
24405167e8d5SPeter Zijlstra void calc_load_enter_idle(void);
24415167e8d5SPeter Zijlstra void calc_load_exit_idle(void);
24425167e8d5SPeter Zijlstra #else
24435167e8d5SPeter Zijlstra static inline void calc_load_enter_idle(void) { }
24445167e8d5SPeter Zijlstra static inline void calc_load_exit_idle(void) { }
24453451d024SFrederic Weisbecker #endif /* CONFIG_NO_HZ_COMMON */
24465167e8d5SPeter Zijlstra 
24476d0d2878SChristian Borntraeger #ifndef cpu_relax_yield
24486d0d2878SChristian Borntraeger #define cpu_relax_yield() cpu_relax()
24496d0d2878SChristian Borntraeger #endif
24506d0d2878SChristian Borntraeger 
2451b342501cSIngo Molnar /*
2452c676329aSPeter Zijlstra  * Do not use outside of architecture code which knows its limitations.
2453c676329aSPeter Zijlstra  *
2454c676329aSPeter Zijlstra  * sched_clock() has no promise of monotonicity or bounded drift between
2455c676329aSPeter Zijlstra  * CPUs; using it (which you should not) requires disabling IRQs.
2456c676329aSPeter Zijlstra  *
2457c676329aSPeter Zijlstra  * Please use one of the three interfaces below.
2458b342501cSIngo Molnar  */
24591bbfa6f2SMike Frysinger extern unsigned long long notrace sched_clock(void);
2460c676329aSPeter Zijlstra /*
2461489a71b0SHiroshi Shimamoto  * See the comment in kernel/sched/clock.c
2462c676329aSPeter Zijlstra  */
2463545a2bf7SCyril Bur extern u64 running_clock(void);
2464c676329aSPeter Zijlstra extern u64 sched_clock_cpu(int cpu);
2465c676329aSPeter Zijlstra 
2466e436d800SIngo Molnar 
2467c1955a3dSPeter Zijlstra extern void sched_clock_init(void);
2468c1955a3dSPeter Zijlstra 
24693e51f33fSPeter Zijlstra #ifndef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
24703e51f33fSPeter Zijlstra static inline void sched_clock_tick(void)
24713e51f33fSPeter Zijlstra {
24723e51f33fSPeter Zijlstra }
24733e51f33fSPeter Zijlstra 
24743e51f33fSPeter Zijlstra static inline void sched_clock_idle_sleep_event(void)
24753e51f33fSPeter Zijlstra {
24763e51f33fSPeter Zijlstra }
24773e51f33fSPeter Zijlstra 
24783e51f33fSPeter Zijlstra static inline void sched_clock_idle_wakeup_event(u64 delta_ns)
24793e51f33fSPeter Zijlstra {
24803e51f33fSPeter Zijlstra }
24812c923e94SDaniel Lezcano 
24822c923e94SDaniel Lezcano static inline u64 cpu_clock(int cpu)
24832c923e94SDaniel Lezcano {
24842c923e94SDaniel Lezcano 	return sched_clock();
24852c923e94SDaniel Lezcano }
24862c923e94SDaniel Lezcano 
24872c923e94SDaniel Lezcano static inline u64 local_clock(void)
24882c923e94SDaniel Lezcano {
24892c923e94SDaniel Lezcano 	return sched_clock();
24902c923e94SDaniel Lezcano }
24913e51f33fSPeter Zijlstra #else
2492c676329aSPeter Zijlstra /*
2493c676329aSPeter Zijlstra  * Architectures that select CONFIG_HAVE_UNSTABLE_SCHED_CLOCK in their
2494c676329aSPeter Zijlstra  * arch Kconfig may still find during bootup that sched_clock()
2495c676329aSPeter Zijlstra  * is reliable after all; these hooks track that state:
2497c676329aSPeter Zijlstra  */
249835af99e6SPeter Zijlstra extern int sched_clock_stable(void);
249935af99e6SPeter Zijlstra extern void set_sched_clock_stable(void);
250035af99e6SPeter Zijlstra extern void clear_sched_clock_stable(void);
2501c676329aSPeter Zijlstra 
25023e51f33fSPeter Zijlstra extern void sched_clock_tick(void);
25033e51f33fSPeter Zijlstra extern void sched_clock_idle_sleep_event(void);
25043e51f33fSPeter Zijlstra extern void sched_clock_idle_wakeup_event(u64 delta_ns);
25052c923e94SDaniel Lezcano 
25062c923e94SDaniel Lezcano /*
25072c923e94SDaniel Lezcano  * As outlined in clock.c, provides a fast, high resolution, nanosecond
25082c923e94SDaniel Lezcano  * time source that is monotonic for a given cpu argument and has
25092c923e94SDaniel Lezcano  * bounded drift between cpus.
25102c923e94SDaniel Lezcano  *
25112c923e94SDaniel Lezcano  * ######################### BIG FAT WARNING ##########################
25122c923e94SDaniel Lezcano  * # when comparing cpu_clock(i) to cpu_clock(j) for i != j, time can #
25132c923e94SDaniel Lezcano  * # go backwards !!                                                  #
25142c923e94SDaniel Lezcano  * ####################################################################
25152c923e94SDaniel Lezcano  */
25162c923e94SDaniel Lezcano static inline u64 cpu_clock(int cpu)
25172c923e94SDaniel Lezcano {
25182c923e94SDaniel Lezcano 	return sched_clock_cpu(cpu);
25192c923e94SDaniel Lezcano }
25202c923e94SDaniel Lezcano 
25212c923e94SDaniel Lezcano static inline u64 local_clock(void)
25222c923e94SDaniel Lezcano {
25232c923e94SDaniel Lezcano 	return sched_clock_cpu(raw_smp_processor_id());
25242c923e94SDaniel Lezcano }
25253e51f33fSPeter Zijlstra #endif
25263e51f33fSPeter Zijlstra 
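/*
 * Illustrative sketch (example_measure_ns() is hypothetical): given the
 * warning above, cross-CPU comparisons are unsafe, but a delta taken on
 * one CPU is meaningful, assuming the caller tolerates (or prevents)
 * migration between the two reads.
 */
static inline u64 example_measure_ns(void (*fn)(void))
{
	u64 t0 = local_clock();

	fn();
	return local_clock() - t0;	/* same-CPU delta, in nanoseconds */
}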
2527b52bfee4SVenkatesh Pallipadi #ifdef CONFIG_IRQ_TIME_ACCOUNTING
2528b52bfee4SVenkatesh Pallipadi /*
2529b52bfee4SVenkatesh Pallipadi  * An interface for runtime opt-in of irq time accounting, based on sched_clock.
2530b52bfee4SVenkatesh Pallipadi  * The opt-in is explicit to avoid a performance penalty on architectures
2531b52bfee4SVenkatesh Pallipadi  * with slow sched_clocks.
2532b52bfee4SVenkatesh Pallipadi  */
2533b52bfee4SVenkatesh Pallipadi extern void enable_sched_clock_irqtime(void);
2534b52bfee4SVenkatesh Pallipadi extern void disable_sched_clock_irqtime(void);
2535b52bfee4SVenkatesh Pallipadi #else
2536b52bfee4SVenkatesh Pallipadi static inline void enable_sched_clock_irqtime(void) {}
2537b52bfee4SVenkatesh Pallipadi static inline void disable_sched_clock_irqtime(void) {}
2538b52bfee4SVenkatesh Pallipadi #endif
2539b52bfee4SVenkatesh Pallipadi 
254036c8b586SIngo Molnar extern unsigned long long
254141b86e9cSIngo Molnar task_sched_runtime(struct task_struct *task);
25421da177e4SLinus Torvalds 
25431da177e4SLinus Torvalds /* sched_exec is called by processes performing an exec */
25441da177e4SLinus Torvalds #ifdef CONFIG_SMP
25451da177e4SLinus Torvalds extern void sched_exec(void);
25461da177e4SLinus Torvalds #else
25471da177e4SLinus Torvalds #define sched_exec()   {}
25481da177e4SLinus Torvalds #endif
25491da177e4SLinus Torvalds 
25502aa44d05SIngo Molnar extern void sched_clock_idle_sleep_event(void);
25512aa44d05SIngo Molnar extern void sched_clock_idle_wakeup_event(u64 delta_ns);
2552bb29ab26SIngo Molnar 
25531da177e4SLinus Torvalds #ifdef CONFIG_HOTPLUG_CPU
25541da177e4SLinus Torvalds extern void idle_task_exit(void);
25551da177e4SLinus Torvalds #else
25561da177e4SLinus Torvalds static inline void idle_task_exit(void) {}
25571da177e4SLinus Torvalds #endif
25581da177e4SLinus Torvalds 
25593451d024SFrederic Weisbecker #if defined(CONFIG_NO_HZ_COMMON) && defined(CONFIG_SMP)
25601c20091eSFrederic Weisbecker extern void wake_up_nohz_cpu(int cpu);
256106d8308cSThomas Gleixner #else
25621c20091eSFrederic Weisbecker static inline void wake_up_nohz_cpu(int cpu) { }
256306d8308cSThomas Gleixner #endif
256406d8308cSThomas Gleixner 
2565ce831b38SFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL
2566265f22a9SFrederic Weisbecker extern u64 scheduler_tick_max_deferment(void);
2567bf0f6f24SIngo Molnar #endif
2568bf0f6f24SIngo Molnar 
25695091faa4SMike Galbraith #ifdef CONFIG_SCHED_AUTOGROUP
25705091faa4SMike Galbraith extern void sched_autogroup_create_attach(struct task_struct *p);
25715091faa4SMike Galbraith extern void sched_autogroup_detach(struct task_struct *p);
25725091faa4SMike Galbraith extern void sched_autogroup_fork(struct signal_struct *sig);
25735091faa4SMike Galbraith extern void sched_autogroup_exit(struct signal_struct *sig);
25745091faa4SMike Galbraith #ifdef CONFIG_PROC_FS
25755091faa4SMike Galbraith extern void proc_sched_autogroup_show_task(struct task_struct *p, struct seq_file *m);
25762e5b5b3aSHiroshi Shimamoto extern int proc_sched_autogroup_set_nice(struct task_struct *p, int nice);
25775091faa4SMike Galbraith #endif
25785091faa4SMike Galbraith #else
25795091faa4SMike Galbraith static inline void sched_autogroup_create_attach(struct task_struct *p) { }
25805091faa4SMike Galbraith static inline void sched_autogroup_detach(struct task_struct *p) { }
25815091faa4SMike Galbraith static inline void sched_autogroup_fork(struct signal_struct *sig) { }
25825091faa4SMike Galbraith static inline void sched_autogroup_exit(struct signal_struct *sig) { }
25835091faa4SMike Galbraith #endif
25845091faa4SMike Galbraith 
2585fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt);
258636c8b586SIngo Molnar extern void set_user_nice(struct task_struct *p, long nice);
258736c8b586SIngo Molnar extern int task_prio(const struct task_struct *p);
2588d0ea0268SDongsheng Yang /**
2589d0ea0268SDongsheng Yang  * task_nice - return the nice value of a given task.
2590d0ea0268SDongsheng Yang  * @p: the task in question.
2591d0ea0268SDongsheng Yang  *
2592d0ea0268SDongsheng Yang  * Return: The nice value [ -20 ... 0 ... 19 ].
2593d0ea0268SDongsheng Yang  */
2594d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p)
2595d0ea0268SDongsheng Yang {
2596d0ea0268SDongsheng Yang 	return PRIO_TO_NICE((p)->static_prio);
2597d0ea0268SDongsheng Yang }
259836c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice);
259936c8b586SIngo Molnar extern int task_curr(const struct task_struct *p);
26001da177e4SLinus Torvalds extern int idle_cpu(int cpu);
2601fe7de49fSKOSAKI Motohiro extern int sched_setscheduler(struct task_struct *, int,
2602fe7de49fSKOSAKI Motohiro 			      const struct sched_param *);
2603961ccdddSRusty Russell extern int sched_setscheduler_nocheck(struct task_struct *, int,
2604fe7de49fSKOSAKI Motohiro 				      const struct sched_param *);
2605d50dde5aSDario Faggioli extern int sched_setattr(struct task_struct *,
2606d50dde5aSDario Faggioli 			 const struct sched_attr *);
260736c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu);
2608c4f30608SPaul E. McKenney /**
2609c4f30608SPaul E. McKenney  * is_idle_task - is the specified task an idle task?
2610fa757281SRandy Dunlap  * @p: the task in question.
2611e69f6186SYacine Belkadi  *
2612e69f6186SYacine Belkadi  * Return: 1 if @p is an idle task. 0 otherwise.
2613c4f30608SPaul E. McKenney  */
26147061ca3bSPaul E. McKenney static inline bool is_idle_task(const struct task_struct *p)
2615c4f30608SPaul E. McKenney {
2616c4f30608SPaul E. McKenney 	return p->pid == 0;
2617c4f30608SPaul E. McKenney }
261836c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu);
2619a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p);
26201da177e4SLinus Torvalds 
26211da177e4SLinus Torvalds void yield(void);
26221da177e4SLinus Torvalds 
26231da177e4SLinus Torvalds union thread_union {
2624c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK
26251da177e4SLinus Torvalds 	struct thread_info thread_info;
2626c65eacbeSAndy Lutomirski #endif
26271da177e4SLinus Torvalds 	unsigned long stack[THREAD_SIZE/sizeof(long)];
26281da177e4SLinus Torvalds };
26291da177e4SLinus Torvalds 
26301da177e4SLinus Torvalds #ifndef __HAVE_ARCH_KSTACK_END
26311da177e4SLinus Torvalds static inline int kstack_end(void *addr)
26321da177e4SLinus Torvalds {
26331da177e4SLinus Torvalds 	/* Reliable end of stack detection:
26341da177e4SLinus Torvalds 	 * some APM BIOS versions misalign the stack.
26351da177e4SLinus Torvalds 	 */
26361da177e4SLinus Torvalds 	return !(((unsigned long)addr+sizeof(void*)-1) & (THREAD_SIZE-sizeof(void*)));
26371da177e4SLinus Torvalds }
26381da177e4SLinus Torvalds #endif
26391da177e4SLinus Torvalds 
26401da177e4SLinus Torvalds extern union thread_union init_thread_union;
26411da177e4SLinus Torvalds extern struct task_struct init_task;
26421da177e4SLinus Torvalds 
26431da177e4SLinus Torvalds extern struct   mm_struct init_mm;
26441da177e4SLinus Torvalds 
2645198fe21bSPavel Emelyanov extern struct pid_namespace init_pid_ns;
2646198fe21bSPavel Emelyanov 
2647198fe21bSPavel Emelyanov /*
2648198fe21bSPavel Emelyanov  * find a task by one of its numerical ids
2649198fe21bSPavel Emelyanov  *
2650198fe21bSPavel Emelyanov  * find_task_by_pid_ns():
2651198fe21bSPavel Emelyanov  *      finds a task by its pid in the specified namespace
2652228ebcbeSPavel Emelyanov  * find_task_by_vpid():
2653228ebcbeSPavel Emelyanov  *      finds a task by its virtual pid
2654198fe21bSPavel Emelyanov  *
2655e49859e7SPavel Emelyanov  * see also find_vpid() etc in include/linux/pid.h
2656198fe21bSPavel Emelyanov  */
2657198fe21bSPavel Emelyanov 
2658228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr);
2659228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_pid_ns(pid_t nr,
2660228ebcbeSPavel Emelyanov 		struct pid_namespace *ns);
2661198fe21bSPavel Emelyanov 
26621da177e4SLinus Torvalds /* per-UID process charging. */
26637b44ab97SEric W. Biederman extern struct user_struct * alloc_uid(kuid_t);
26641da177e4SLinus Torvalds static inline struct user_struct *get_uid(struct user_struct *u)
26651da177e4SLinus Torvalds {
26661da177e4SLinus Torvalds 	atomic_inc(&u->__count);
26671da177e4SLinus Torvalds 	return u;
26681da177e4SLinus Torvalds }
26691da177e4SLinus Torvalds extern void free_uid(struct user_struct *);
26701da177e4SLinus Torvalds 
26711da177e4SLinus Torvalds #include <asm/current.h>
26721da177e4SLinus Torvalds 
2673f0af911aSTorben Hohn extern void xtime_update(unsigned long ticks);
26741da177e4SLinus Torvalds 
2675b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state);
2676b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk);
26773e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk);
26781da177e4SLinus Torvalds #ifdef CONFIG_SMP
26791da177e4SLinus Torvalds  extern void kick_process(struct task_struct *tsk);
26801da177e4SLinus Torvalds #else
26811da177e4SLinus Torvalds  static inline void kick_process(struct task_struct *tsk) { }
26821da177e4SLinus Torvalds #endif
2683aab03e05SDario Faggioli extern int sched_fork(unsigned long clone_flags, struct task_struct *p);
2684ad46c2c4SIngo Molnar extern void sched_dead(struct task_struct *p);
26851da177e4SLinus Torvalds 
26861da177e4SLinus Torvalds extern void proc_caches_init(void);
26871da177e4SLinus Torvalds extern void flush_signals(struct task_struct *);
268810ab825bSOleg Nesterov extern void ignore_signals(struct task_struct *);
26891da177e4SLinus Torvalds extern void flush_signal_handlers(struct task_struct *, int force_default);
26901da177e4SLinus Torvalds extern int dequeue_signal(struct task_struct *tsk, sigset_t *mask, siginfo_t *info);
26911da177e4SLinus Torvalds 
2692be0e6f29SOleg Nesterov static inline int kernel_dequeue_signal(siginfo_t *info)
26931da177e4SLinus Torvalds {
2694be0e6f29SOleg Nesterov 	struct task_struct *tsk = current;
2695be0e6f29SOleg Nesterov 	siginfo_t __info;
26961da177e4SLinus Torvalds 	int ret;
26971da177e4SLinus Torvalds 
2698be0e6f29SOleg Nesterov 	spin_lock_irq(&tsk->sighand->siglock);
2699be0e6f29SOleg Nesterov 	ret = dequeue_signal(tsk, &tsk->blocked, info ?: &__info);
2700be0e6f29SOleg Nesterov 	spin_unlock_irq(&tsk->sighand->siglock);
27011da177e4SLinus Torvalds 
27021da177e4SLinus Torvalds 	return ret;
27031da177e4SLinus Torvalds }
27041da177e4SLinus Torvalds 
27059a13049eSOleg Nesterov static inline void kernel_signal_stop(void)
27069a13049eSOleg Nesterov {
27079a13049eSOleg Nesterov 	spin_lock_irq(&current->sighand->siglock);
27089a13049eSOleg Nesterov 	if (current->jobctl & JOBCTL_STOP_DEQUEUED)
27099a13049eSOleg Nesterov 		__set_current_state(TASK_STOPPED);
27109a13049eSOleg Nesterov 	spin_unlock_irq(&current->sighand->siglock);
27119a13049eSOleg Nesterov 
27129a13049eSOleg Nesterov 	schedule();
27139a13049eSOleg Nesterov }
27149a13049eSOleg Nesterov 
27151da177e4SLinus Torvalds extern void release_task(struct task_struct * p);
27161da177e4SLinus Torvalds extern int send_sig_info(int, struct siginfo *, struct task_struct *);
27171da177e4SLinus Torvalds extern int force_sigsegv(int, struct task_struct *);
27181da177e4SLinus Torvalds extern int force_sig_info(int, struct siginfo *, struct task_struct *);
2719c4b92fc1SEric W. Biederman extern int __kill_pgrp_info(int sig, struct siginfo *info, struct pid *pgrp);
2720c4b92fc1SEric W. Biederman extern int kill_pid_info(int sig, struct siginfo *info, struct pid *pid);
2721d178bc3aSSerge Hallyn extern int kill_pid_info_as_cred(int, struct siginfo *, struct pid *,
2722d178bc3aSSerge Hallyn 				const struct cred *, u32);
2723c4b92fc1SEric W. Biederman extern int kill_pgrp(struct pid *pid, int sig, int priv);
2724c4b92fc1SEric W. Biederman extern int kill_pid(struct pid *pid, int sig, int priv);
2725c3de4b38SMatthew Wilcox extern int kill_proc_info(int, struct siginfo *, pid_t);
272686773473SOleg Nesterov extern __must_check bool do_notify_parent(struct task_struct *, int);
2727a7f0765eSOleg Nesterov extern void __wake_up_parent(struct task_struct *p, struct task_struct *parent);
27281da177e4SLinus Torvalds extern void force_sig(int, struct task_struct *);
27291da177e4SLinus Torvalds extern int send_sig(int, struct task_struct *, int);
273009faef11SOleg Nesterov extern int zap_other_threads(struct task_struct *p);
27311da177e4SLinus Torvalds extern struct sigqueue *sigqueue_alloc(void);
27321da177e4SLinus Torvalds extern void sigqueue_free(struct sigqueue *);
2733ac5c2153SOleg Nesterov extern int send_sigqueue(struct sigqueue *,  struct task_struct *, int group);
27349ac95f2fSOleg Nesterov extern int do_sigaction(int, struct k_sigaction *, struct k_sigaction *);
27351da177e4SLinus Torvalds 
27367e781418SAndy Lutomirski #ifdef TIF_RESTORE_SIGMASK
27377e781418SAndy Lutomirski /*
27387e781418SAndy Lutomirski  * Legacy restore_sigmask accessors.  These are inefficient on
27397e781418SAndy Lutomirski  * SMP architectures because they require atomic operations.
27407e781418SAndy Lutomirski  */
27417e781418SAndy Lutomirski 
27427e781418SAndy Lutomirski /**
27437e781418SAndy Lutomirski  * set_restore_sigmask() - make sure saved_sigmask processing gets done
27447e781418SAndy Lutomirski  *
27457e781418SAndy Lutomirski  * This sets TIF_RESTORE_SIGMASK and ensures that the arch signal code
27467e781418SAndy Lutomirski  * will run before returning to user mode, to process the flag.  For
27477e781418SAndy Lutomirski  * all callers, TIF_SIGPENDING is already set or it's no harm to set
27487e781418SAndy Lutomirski  * it.  TIF_RESTORE_SIGMASK need not be in the set of bits that the
27497e781418SAndy Lutomirski  * arch code will notice on return to user mode, in case those bits
27507e781418SAndy Lutomirski  * are scarce.  We set TIF_SIGPENDING here to ensure that the arch
27517e781418SAndy Lutomirski  * signal code always gets run when TIF_RESTORE_SIGMASK is set.
27527e781418SAndy Lutomirski  */
27537e781418SAndy Lutomirski static inline void set_restore_sigmask(void)
27547e781418SAndy Lutomirski {
27557e781418SAndy Lutomirski 	set_thread_flag(TIF_RESTORE_SIGMASK);
27567e781418SAndy Lutomirski 	WARN_ON(!test_thread_flag(TIF_SIGPENDING));
27577e781418SAndy Lutomirski }
27587e781418SAndy Lutomirski static inline void clear_restore_sigmask(void)
27597e781418SAndy Lutomirski {
27607e781418SAndy Lutomirski 	clear_thread_flag(TIF_RESTORE_SIGMASK);
27617e781418SAndy Lutomirski }
27627e781418SAndy Lutomirski static inline bool test_restore_sigmask(void)
27637e781418SAndy Lutomirski {
27647e781418SAndy Lutomirski 	return test_thread_flag(TIF_RESTORE_SIGMASK);
27657e781418SAndy Lutomirski }
27667e781418SAndy Lutomirski static inline bool test_and_clear_restore_sigmask(void)
27677e781418SAndy Lutomirski {
27687e781418SAndy Lutomirski 	return test_and_clear_thread_flag(TIF_RESTORE_SIGMASK);
27697e781418SAndy Lutomirski }
27707e781418SAndy Lutomirski 
27717e781418SAndy Lutomirski #else	/* TIF_RESTORE_SIGMASK */
27727e781418SAndy Lutomirski 
27737e781418SAndy Lutomirski /* Higher-quality implementation, used if TIF_RESTORE_SIGMASK doesn't exist. */
27747e781418SAndy Lutomirski static inline void set_restore_sigmask(void)
27757e781418SAndy Lutomirski {
27767e781418SAndy Lutomirski 	current->restore_sigmask = true;
27777e781418SAndy Lutomirski 	WARN_ON(!test_thread_flag(TIF_SIGPENDING));
27787e781418SAndy Lutomirski }
27797e781418SAndy Lutomirski static inline void clear_restore_sigmask(void)
27807e781418SAndy Lutomirski {
27817e781418SAndy Lutomirski 	current->restore_sigmask = false;
27827e781418SAndy Lutomirski }
27837e781418SAndy Lutomirski static inline bool test_restore_sigmask(void)
27847e781418SAndy Lutomirski {
27857e781418SAndy Lutomirski 	return current->restore_sigmask;
27867e781418SAndy Lutomirski }
27877e781418SAndy Lutomirski static inline bool test_and_clear_restore_sigmask(void)
27887e781418SAndy Lutomirski {
27897e781418SAndy Lutomirski 	if (!current->restore_sigmask)
27907e781418SAndy Lutomirski 		return false;
27917e781418SAndy Lutomirski 	current->restore_sigmask = false;
27927e781418SAndy Lutomirski 	return true;
27937e781418SAndy Lutomirski }
27947e781418SAndy Lutomirski #endif
27957e781418SAndy Lutomirski 
279651a7b448SAl Viro static inline void restore_saved_sigmask(void)
279751a7b448SAl Viro {
279851a7b448SAl Viro 	if (test_and_clear_restore_sigmask())
279977097ae5SAl Viro 		__set_current_blocked(&current->saved_sigmask);
280051a7b448SAl Viro }
280151a7b448SAl Viro 
2802b7f9a11aSAl Viro static inline sigset_t *sigmask_to_save(void)
2803b7f9a11aSAl Viro {
2804b7f9a11aSAl Viro 	sigset_t *res = &current->blocked;
2805b7f9a11aSAl Viro 	if (unlikely(test_restore_sigmask()))
2806b7f9a11aSAl Viro 		res = &current->saved_sigmask;
2807b7f9a11aSAl Viro 	return res;
2808b7f9a11aSAl Viro }
2809b7f9a11aSAl Viro 
28109ec52099SCedric Le Goater static inline int kill_cad_pid(int sig, int priv)
28119ec52099SCedric Le Goater {
28129ec52099SCedric Le Goater 	return kill_pid(cad_pid, sig, priv);
28139ec52099SCedric Le Goater }
28149ec52099SCedric Le Goater 
28151da177e4SLinus Torvalds /* These can be the second arg to send_sig_info/send_group_sig_info.  */
28161da177e4SLinus Torvalds #define SEND_SIG_NOINFO ((struct siginfo *) 0)
28171da177e4SLinus Torvalds #define SEND_SIG_PRIV	((struct siginfo *) 1)
28181da177e4SLinus Torvalds #define SEND_SIG_FORCED	((struct siginfo *) 2)
28191da177e4SLinus Torvalds 
28202a855dd0SSebastian Andrzej Siewior /*
28212a855dd0SSebastian Andrzej Siewior  * True if we are on the alternate signal stack.
28222a855dd0SSebastian Andrzej Siewior  */
28231da177e4SLinus Torvalds static inline int on_sig_stack(unsigned long sp)
28241da177e4SLinus Torvalds {
2825c876eeabSAndy Lutomirski 	/*
2826c876eeabSAndy Lutomirski 	 * If the signal stack is SS_AUTODISARM then, by construction, we
2827c876eeabSAndy Lutomirski 	 * can't be on the signal stack unless user code deliberately set
2828c876eeabSAndy Lutomirski 	 * SS_AUTODISARM when we were already on it.
2829c876eeabSAndy Lutomirski 	 *
2830c876eeabSAndy Lutomirski 	 * This improves reliability: if user state gets corrupted such that
2831c876eeabSAndy Lutomirski 	 * the stack pointer points very close to the end of the signal stack,
2832c876eeabSAndy Lutomirski 	 * then this check will enable the signal to be handled anyway.
2833c876eeabSAndy Lutomirski 	 */
2834c876eeabSAndy Lutomirski 	if (current->sas_ss_flags & SS_AUTODISARM)
2835c876eeabSAndy Lutomirski 		return 0;
2836c876eeabSAndy Lutomirski 
28372a855dd0SSebastian Andrzej Siewior #ifdef CONFIG_STACK_GROWSUP
28382a855dd0SSebastian Andrzej Siewior 	return sp >= current->sas_ss_sp &&
28392a855dd0SSebastian Andrzej Siewior 		sp - current->sas_ss_sp < current->sas_ss_size;
28402a855dd0SSebastian Andrzej Siewior #else
28412a855dd0SSebastian Andrzej Siewior 	return sp > current->sas_ss_sp &&
28422a855dd0SSebastian Andrzej Siewior 		sp - current->sas_ss_sp <= current->sas_ss_size;
28432a855dd0SSebastian Andrzej Siewior #endif
28441da177e4SLinus Torvalds }
28451da177e4SLinus Torvalds 
28461da177e4SLinus Torvalds static inline int sas_ss_flags(unsigned long sp)
28471da177e4SLinus Torvalds {
284872f15c03SRichard Weinberger 	if (!current->sas_ss_size)
284972f15c03SRichard Weinberger 		return SS_DISABLE;
285072f15c03SRichard Weinberger 
285172f15c03SRichard Weinberger 	return on_sig_stack(sp) ? SS_ONSTACK : 0;
28521da177e4SLinus Torvalds }
28531da177e4SLinus Torvalds 
28542a742138SStas Sergeev static inline void sas_ss_reset(struct task_struct *p)
28552a742138SStas Sergeev {
28562a742138SStas Sergeev 	p->sas_ss_sp = 0;
28572a742138SStas Sergeev 	p->sas_ss_size = 0;
28582a742138SStas Sergeev 	p->sas_ss_flags = SS_DISABLE;
28592a742138SStas Sergeev }
28602a742138SStas Sergeev 
28615a1b98d3SAl Viro static inline unsigned long sigsp(unsigned long sp, struct ksignal *ksig)
28625a1b98d3SAl Viro {
28635a1b98d3SAl Viro 	if (unlikely((ksig->ka.sa.sa_flags & SA_ONSTACK)) && ! sas_ss_flags(sp))
28645a1b98d3SAl Viro #ifdef CONFIG_STACK_GROWSUP
28655a1b98d3SAl Viro 		return current->sas_ss_sp;
28665a1b98d3SAl Viro #else
28675a1b98d3SAl Viro 		return current->sas_ss_sp + current->sas_ss_size;
28685a1b98d3SAl Viro #endif
28695a1b98d3SAl Viro 	return sp;
28705a1b98d3SAl Viro }
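/*
 * Sketch: architecture signal-frame setup typically derives the handler
 * stack pointer from the interrupted one, e.g. (hypothetical arch code)
 *
 *	unsigned long sp = sigsp(regs->sp, ksig);
 *
 * which lands on the alternate stack only when SA_ONSTACK was requested
 * and we are not already on it.
 */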
28715a1b98d3SAl Viro 
28721da177e4SLinus Torvalds /*
28731da177e4SLinus Torvalds  * Routines for handling mm_structs
28741da177e4SLinus Torvalds  */
28751da177e4SLinus Torvalds extern struct mm_struct * mm_alloc(void);
28761da177e4SLinus Torvalds 
28771da177e4SLinus Torvalds /* mmdrop drops the mm and the page tables */
2878b3c97528SHarvey Harrison extern void __mmdrop(struct mm_struct *);
28791da177e4SLinus Torvalds static inline void mmdrop(struct mm_struct *mm)
28801da177e4SLinus Torvalds {
28816fb43d7bSIngo Molnar 	if (unlikely(atomic_dec_and_test(&mm->mm_count)))
28821da177e4SLinus Torvalds 		__mmdrop(mm);
28831da177e4SLinus Torvalds }
28841da177e4SLinus Torvalds 
28857283094eSMichal Hocko static inline void mmdrop_async_fn(struct work_struct *work)
28867283094eSMichal Hocko {
28877283094eSMichal Hocko 	struct mm_struct *mm = container_of(work, struct mm_struct, async_put_work);
28887283094eSMichal Hocko 	__mmdrop(mm);
28897283094eSMichal Hocko }
28907283094eSMichal Hocko 
28917283094eSMichal Hocko static inline void mmdrop_async(struct mm_struct *mm)
28927283094eSMichal Hocko {
28937283094eSMichal Hocko 	if (unlikely(atomic_dec_and_test(&mm->mm_count))) {
28947283094eSMichal Hocko 		INIT_WORK(&mm->async_put_work, mmdrop_async_fn);
28957283094eSMichal Hocko 		schedule_work(&mm->async_put_work);
28967283094eSMichal Hocko 	}
28977283094eSMichal Hocko }
28987283094eSMichal Hocko 
2899d2005e3fSOleg Nesterov static inline bool mmget_not_zero(struct mm_struct *mm)
2900d2005e3fSOleg Nesterov {
2901d2005e3fSOleg Nesterov 	return atomic_inc_not_zero(&mm->mm_users);
29021da177e4SLinus Torvalds }
29031da177e4SLinus Torvalds 
29041da177e4SLinus Torvalds /* mmput gets rid of the mappings and all user-space */
29051da177e4SLinus Torvalds extern void mmput(struct mm_struct *);
29067ef949d7SMichal Hocko #ifdef CONFIG_MMU
29077ef949d7SMichal Hocko /*
29077ef949d7SMichal Hocko  * Same as above, but performs the slow path from async context.  Can
2908ec8d7c14SMichal Hocko  * be called from atomic context as well.
2909ec8d7c14SMichal Hocko  */
2910ec8d7c14SMichal Hocko extern void mmput_async(struct mm_struct *);
29117ef949d7SMichal Hocko #endif
2912ec8d7c14SMichal Hocko 
29131da177e4SLinus Torvalds /* Grab a reference to a task's mm, if it is not already going away */
29141da177e4SLinus Torvalds extern struct mm_struct *get_task_mm(struct task_struct *task);
29158cdb878dSChristopher Yeoh /*
29168cdb878dSChristopher Yeoh  * Grab a reference to a task's mm, if it is not already going away
29178cdb878dSChristopher Yeoh  * and ptrace_may_access() with the given mode parameter
29188cdb878dSChristopher Yeoh  * succeeds.
29198cdb878dSChristopher Yeoh  */
29208cdb878dSChristopher Yeoh extern struct mm_struct *mm_access(struct task_struct *task, unsigned int mode);
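/*
 * Usage sketch (example_mm_size() is hypothetical): get_task_mm() pins
 * the mm against teardown, so it must be balanced with mmput() once the
 * caller is done.
 */
static inline unsigned long example_mm_size(struct task_struct *task)
{
	struct mm_struct *mm = get_task_mm(task);
	unsigned long size = 0;

	if (mm) {
		size = mm->total_vm;	/* pages mapped by the task */
		mmput(mm);
	}
	return size;
}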
29211da177e4SLinus Torvalds /* Remove the current task's stale references to the old mm_struct */
29221da177e4SLinus Torvalds extern void mm_release(struct task_struct *, struct mm_struct *);
29231da177e4SLinus Torvalds 
29243033f14aSJosh Triplett #ifdef CONFIG_HAVE_COPY_THREAD_TLS
29253033f14aSJosh Triplett extern int copy_thread_tls(unsigned long, unsigned long, unsigned long,
29263033f14aSJosh Triplett 			struct task_struct *, unsigned long);
29273033f14aSJosh Triplett #else
29286f2c55b8SAlexey Dobriyan extern int copy_thread(unsigned long, unsigned long, unsigned long,
2929afa86fc4SAl Viro 			struct task_struct *);
29303033f14aSJosh Triplett 
29313033f14aSJosh Triplett /* Architectures that haven't opted into copy_thread_tls get the tls argument
29323033f14aSJosh Triplett  * via pt_regs, so ignore the tls argument passed via C. */
29333033f14aSJosh Triplett static inline int copy_thread_tls(
29343033f14aSJosh Triplett 		unsigned long clone_flags, unsigned long sp, unsigned long arg,
29353033f14aSJosh Triplett 		struct task_struct *p, unsigned long tls)
29363033f14aSJosh Triplett {
29373033f14aSJosh Triplett 	return copy_thread(clone_flags, sp, arg, p);
29383033f14aSJosh Triplett }
29393033f14aSJosh Triplett #endif
29401da177e4SLinus Torvalds extern void flush_thread(void);
29415f56a5dfSJiri Slaby 
29425f56a5dfSJiri Slaby #ifdef CONFIG_HAVE_EXIT_THREAD
2943e6464694SJiri Slaby extern void exit_thread(struct task_struct *tsk);
29445f56a5dfSJiri Slaby #else
2945e6464694SJiri Slaby static inline void exit_thread(struct task_struct *tsk)
29465f56a5dfSJiri Slaby {
29475f56a5dfSJiri Slaby }
29485f56a5dfSJiri Slaby #endif
29491da177e4SLinus Torvalds 
29501da177e4SLinus Torvalds extern void exit_files(struct task_struct *);
2951a7e5328aSOleg Nesterov extern void __cleanup_sighand(struct sighand_struct *);
2952cbaffba1SOleg Nesterov 
29531da177e4SLinus Torvalds extern void exit_itimers(struct signal_struct *);
2954cbaffba1SOleg Nesterov extern void flush_itimer_signals(void);
29551da177e4SLinus Torvalds 
29569402c95fSJoe Perches extern void do_group_exit(int);
29571da177e4SLinus Torvalds 
2958c4ad8f98SLinus Torvalds extern int do_execve(struct filename *,
2959d7627467SDavid Howells 		     const char __user * const __user *,
2960da3d4c5fSAl Viro 		     const char __user * const __user *);
296151f39a1fSDavid Drysdale extern int do_execveat(int, struct filename *,
296251f39a1fSDavid Drysdale 		       const char __user * const __user *,
296351f39a1fSDavid Drysdale 		       const char __user * const __user *,
296451f39a1fSDavid Drysdale 		       int);
29653033f14aSJosh Triplett extern long _do_fork(unsigned long, unsigned long, unsigned long, int __user *, int __user *, unsigned long);
2966e80d6661SAl Viro extern long do_fork(unsigned long, unsigned long, unsigned long, int __user *, int __user *);
296736c8b586SIngo Molnar struct task_struct *fork_idle(int);
29682aa3a7f8SAl Viro extern pid_t kernel_thread(int (*fn)(void *), void *arg, unsigned long flags);
29691da177e4SLinus Torvalds 
297082b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);
297182b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from)
297282b89778SAdrian Hunter {
297382b89778SAdrian Hunter 	__set_task_comm(tsk, from, false);
297482b89778SAdrian Hunter }
297559714d65SAndrew Morton extern char *get_task_comm(char *to, struct task_struct *tsk);
29761da177e4SLinus Torvalds 
29771da177e4SLinus Torvalds #ifdef CONFIG_SMP
2978317f3941SPeter Zijlstra void scheduler_ipi(void);
297985ba2d86SRoland McGrath extern unsigned long wait_task_inactive(struct task_struct *, long match_state);
29801da177e4SLinus Torvalds #else
2981184748ccSPeter Zijlstra static inline void scheduler_ipi(void) { }
298285ba2d86SRoland McGrath static inline unsigned long wait_task_inactive(struct task_struct *p,
298385ba2d86SRoland McGrath 					       long match_state)
298485ba2d86SRoland McGrath {
298585ba2d86SRoland McGrath 	return 1;
298685ba2d86SRoland McGrath }
29871da177e4SLinus Torvalds #endif
29881da177e4SLinus Torvalds 
2989fafe870fSFrederic Weisbecker #define tasklist_empty() \
2990fafe870fSFrederic Weisbecker 	list_empty(&init_task.tasks)
2991fafe870fSFrederic Weisbecker 
299205725f7eSJiri Pirko #define next_task(p) \
299305725f7eSJiri Pirko 	list_entry_rcu((p)->tasks.next, struct task_struct, tasks)
29941da177e4SLinus Torvalds 
29951da177e4SLinus Torvalds #define for_each_process(p) \
29961da177e4SLinus Torvalds 	for (p = &init_task ; (p = next_task(p)) != &init_task ; )
29971da177e4SLinus Torvalds 
29985bb459bbSOleg Nesterov extern bool current_is_single_threaded(void);
2999d84f4f99SDavid Howells 
30001da177e4SLinus Torvalds /*
30011da177e4SLinus Torvalds  * Careful: do_each_thread/while_each_thread is a double loop, so
30021da177e4SLinus Torvalds  *          'break' will not work as expected - use goto instead.
30031da177e4SLinus Torvalds  */
30041da177e4SLinus Torvalds #define do_each_thread(g, t) \
30051da177e4SLinus Torvalds 	for (g = t = &init_task ; (g = t = next_task(g)) != &init_task ; ) do
30061da177e4SLinus Torvalds 
30071da177e4SLinus Torvalds #define while_each_thread(g, t) \
30081da177e4SLinus Torvalds 	while ((t = next_thread(t)) != g)
30091da177e4SLinus Torvalds 
30100c740d0aSOleg Nesterov #define __for_each_thread(signal, t)	\
30110c740d0aSOleg Nesterov 	list_for_each_entry_rcu(t, &(signal)->thread_head, thread_node)
30120c740d0aSOleg Nesterov 
30130c740d0aSOleg Nesterov #define for_each_thread(p, t)		\
30140c740d0aSOleg Nesterov 	__for_each_thread((p)->signal, t)
30150c740d0aSOleg Nesterov 
30160c740d0aSOleg Nesterov /* Careful: this is a double loop, 'break' won't work as expected. */
30170c740d0aSOleg Nesterov #define for_each_process_thread(p, t)	\
30180c740d0aSOleg Nesterov 	for_each_process(p) for_each_thread(p, t)
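
/*
 * Example (editor's sketch): walking every thread in the system with the
 * macro above.  The list linkage is RCU-protected, so the walk must be
 * done under rcu_read_lock() (or with tasklist_lock read-held).  The
 * function name is illustrative.
 */
static inline int example_count_threads(void)
{
	struct task_struct *p, *t;
	int nr = 0;

	rcu_read_lock();
	for_each_process_thread(p, t)
		nr++;
	rcu_read_unlock();

	return nr;
}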
30190c740d0aSOleg Nesterov 
30207e49827cSOleg Nesterov static inline int get_nr_threads(struct task_struct *tsk)
30217e49827cSOleg Nesterov {
3022b3ac022cSOleg Nesterov 	return tsk->signal->nr_threads;
30237e49827cSOleg Nesterov }
30247e49827cSOleg Nesterov 
3025087806b1SOleg Nesterov static inline bool thread_group_leader(struct task_struct *p)
3026087806b1SOleg Nesterov {
3027087806b1SOleg Nesterov 	return p->exit_signal >= 0;
3028087806b1SOleg Nesterov }
30291da177e4SLinus Torvalds 
30300804ef4bSEric W. Biederman /* Due to the insanities of de_thread() it is possible for a process
30310804ef4bSEric W. Biederman  * to have the pid of the thread group leader without actually being
30320804ef4bSEric W. Biederman  * the thread group leader.  For iteration through the pids in proc
30330804ef4bSEric W. Biederman  * all we care about is that we have a task with the appropriate
30340804ef4bSEric W. Biederman  * pid; we don't actually care whether we have the right task.
30350804ef4bSEric W. Biederman  */
3036e1403b8eSOleg Nesterov static inline bool has_group_leader_pid(struct task_struct *p)
30370804ef4bSEric W. Biederman {
3038e1403b8eSOleg Nesterov 	return task_pid(p) == p->signal->leader_pid;
30390804ef4bSEric W. Biederman }
30400804ef4bSEric W. Biederman 
3041bac0abd6SPavel Emelyanov static inline
3042e1403b8eSOleg Nesterov bool same_thread_group(struct task_struct *p1, struct task_struct *p2)
3043bac0abd6SPavel Emelyanov {
3044e1403b8eSOleg Nesterov 	return p1->signal == p2->signal;
3045bac0abd6SPavel Emelyanov }
3046bac0abd6SPavel Emelyanov 
304736c8b586SIngo Molnar static inline struct task_struct *next_thread(const struct task_struct *p)
304847e65328SOleg Nesterov {
304905725f7eSJiri Pirko 	return list_entry_rcu(p->thread_group.next,
305036c8b586SIngo Molnar 			      struct task_struct, thread_group);
305147e65328SOleg Nesterov }
305247e65328SOleg Nesterov 
3053e868171aSAlexey Dobriyan static inline int thread_group_empty(struct task_struct *p)
30541da177e4SLinus Torvalds {
305547e65328SOleg Nesterov 	return list_empty(&p->thread_group);
30561da177e4SLinus Torvalds }
30571da177e4SLinus Torvalds 
30581da177e4SLinus Torvalds #define delay_group_leader(p) \
30591da177e4SLinus Torvalds 		(thread_group_leader(p) && !thread_group_empty(p))
30601da177e4SLinus Torvalds 
30611da177e4SLinus Torvalds /*
3062260ea101SEric W. Biederman  * Protects ->fs, ->files, ->mm, ->group_info, ->comm and keyring
306322e2c507SJens Axboe  * subscriptions, and synchronises with wait4().  Also used in procfs and
3064ddbcc7e8SPaul Menage  * pins the final release of task.io_context.  Also protects ->cpuset,
3065d68b46feSOleg Nesterov  * ->cgroup.subsys[] and ->vfork_done.
30661da177e4SLinus Torvalds  *
30671da177e4SLinus Torvalds  * Nests both inside and outside of read_lock(&tasklist_lock).
30681da177e4SLinus Torvalds  * It must not be nested with write_lock_irq(&tasklist_lock),
30691da177e4SLinus Torvalds  * neither inside nor outside.
30701da177e4SLinus Torvalds  */
30711da177e4SLinus Torvalds static inline void task_lock(struct task_struct *p)
30721da177e4SLinus Torvalds {
30731da177e4SLinus Torvalds 	spin_lock(&p->alloc_lock);
30741da177e4SLinus Torvalds }
30751da177e4SLinus Torvalds 
30761da177e4SLinus Torvalds static inline void task_unlock(struct task_struct *p)
30771da177e4SLinus Torvalds {
30781da177e4SLinus Torvalds 	spin_unlock(&p->alloc_lock);
30791da177e4SLinus Torvalds }
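
/*
 * Example (editor's sketch): task_lock() is what makes a test of another
 * task's ->mm pointer stable; the helper name is hypothetical.
 */
static inline bool example_task_has_mm(struct task_struct *p)
{
	bool ret;

	task_lock(p);
	ret = p->mm != NULL;
	task_unlock(p);

	return ret;
}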
30801da177e4SLinus Torvalds 
3081b8ed374eSNamhyung Kim extern struct sighand_struct *__lock_task_sighand(struct task_struct *tsk,
3082f63ee72eSOleg Nesterov 							unsigned long *flags);
3083f63ee72eSOleg Nesterov 
30849388dc30SAnton Vorontsov static inline struct sighand_struct *lock_task_sighand(struct task_struct *tsk,
30859388dc30SAnton Vorontsov 						       unsigned long *flags)
30869388dc30SAnton Vorontsov {
30879388dc30SAnton Vorontsov 	struct sighand_struct *ret;
30889388dc30SAnton Vorontsov 
30899388dc30SAnton Vorontsov 	ret = __lock_task_sighand(tsk, flags);
30909388dc30SAnton Vorontsov 	(void)__cond_lock(&tsk->sighand->siglock, ret);
30919388dc30SAnton Vorontsov 	return ret;
30929388dc30SAnton Vorontsov }
3093b8ed374eSNamhyung Kim 
3094f63ee72eSOleg Nesterov static inline void unlock_task_sighand(struct task_struct *tsk,
3095f63ee72eSOleg Nesterov 						unsigned long *flags)
3096f63ee72eSOleg Nesterov {
3097f63ee72eSOleg Nesterov 	spin_unlock_irqrestore(&tsk->sighand->siglock, *flags);
3098f63ee72eSOleg Nesterov }
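
/*
 * Example (editor's sketch): lock_task_sighand() fails with NULL when the
 * task is being released, so the return value must be checked before
 * touching anything protected by ->siglock.  The helper is illustrative.
 */
static inline int example_nr_threads_locked(struct task_struct *tsk)
{
	unsigned long flags;
	int nr = 0;

	if (lock_task_sighand(tsk, &flags)) {
		nr = tsk->signal->nr_threads;
		unlock_task_sighand(tsk, &flags);
	}

	return nr;
}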
3099f63ee72eSOleg Nesterov 
31007d7efec3STejun Heo /**
31017d7efec3STejun Heo  * threadgroup_change_begin - mark the beginning of changes to a threadgroup
31027d7efec3STejun Heo  * @tsk: task causing the changes
31037d7efec3STejun Heo  *
31047d7efec3STejun Heo  * All operations which modify a threadgroup - a new thread joining the
31057d7efec3STejun Heo  * group, death of a member thread (the assertion of PF_EXITING) and
31067d7efec3STejun Heo  * exec(2) dethreading the process and replacing the leader - are wrapped
31077d7efec3STejun Heo  * by threadgroup_change_{begin|end}().  This is to provide a place that
31087d7efec3STejun Heo  * subsystems needing threadgroup stability can hook into for
31097d7efec3STejun Heo  * synchronization.
31107d7efec3STejun Heo  */
3111257058aeSTejun Heo static inline void threadgroup_change_begin(struct task_struct *tsk)
31124714d1d3SBen Blum {
31137d7efec3STejun Heo 	might_sleep();
31147d7efec3STejun Heo 	cgroup_threadgroup_change_begin(tsk);
31154714d1d3SBen Blum }
31167d7efec3STejun Heo 
31177d7efec3STejun Heo /**
31187d7efec3STejun Heo  * threadgroup_change_end - mark the end of changes to a threadgroup
31197d7efec3STejun Heo  * @tsk: task causing the changes
31207d7efec3STejun Heo  *
31217d7efec3STejun Heo  * See threadgroup_change_begin().
31227d7efec3STejun Heo  */
3123257058aeSTejun Heo static inline void threadgroup_change_end(struct task_struct *tsk)
31244714d1d3SBen Blum {
31257d7efec3STejun Heo 	cgroup_threadgroup_change_end(tsk);
31264714d1d3SBen Blum }
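
/*
 * Example (editor's sketch): a subsystem that needs a stable thread set
 * brackets its work as below; the begin side may sleep, so this is only
 * valid in process context.
 */
static inline void example_threadgroup_op(struct task_struct *tsk)
{
	threadgroup_change_begin(tsk);
	/*
	 * No thread can enter or leave tsk's group here: clone(),
	 * exit() and exec() are all held off until ..._end().
	 */
	threadgroup_change_end(tsk);
}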
312777e4ef99STejun Heo 
3128c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
3129c65eacbeSAndy Lutomirski 
3130c65eacbeSAndy Lutomirski static inline struct thread_info *task_thread_info(struct task_struct *task)
3131c65eacbeSAndy Lutomirski {
3132c65eacbeSAndy Lutomirski 	return &task->thread_info;
3133c65eacbeSAndy Lutomirski }
3134c6c314a6SAndy Lutomirski 
3135c6c314a6SAndy Lutomirski /*
3136c6c314a6SAndy Lutomirski  * When accessing the stack of a non-current task that might exit, use
3137c6c314a6SAndy Lutomirski  * try_get_task_stack() instead.  task_stack_page() will return a pointer
3138c6c314a6SAndy Lutomirski  * that could get freed out from under you.
3139c6c314a6SAndy Lutomirski  */
3140c65eacbeSAndy Lutomirski static inline void *task_stack_page(const struct task_struct *task)
3141c65eacbeSAndy Lutomirski {
3142c65eacbeSAndy Lutomirski 	return task->stack;
3143c65eacbeSAndy Lutomirski }
3144c6c314a6SAndy Lutomirski 
3145c65eacbeSAndy Lutomirski #define setup_thread_stack(new, old)	do { } while (0)
3146c6c314a6SAndy Lutomirski 
3147c65eacbeSAndy Lutomirski static inline unsigned long *end_of_stack(const struct task_struct *task)
3148c65eacbeSAndy Lutomirski {
3149c65eacbeSAndy Lutomirski 	return task->stack;
3150c65eacbeSAndy Lutomirski }
3151c65eacbeSAndy Lutomirski 
3152c65eacbeSAndy Lutomirski #elif !defined(__HAVE_THREAD_FUNCTIONS)
3153f037360fSAl Viro 
3154f7e4217bSRoman Zippel #define task_thread_info(task)	((struct thread_info *)(task)->stack)
3155c65eacbeSAndy Lutomirski #define task_stack_page(task)	((void *)(task)->stack)
3156a1261f54SAl Viro 
315710ebffdeSAl Viro static inline void setup_thread_stack(struct task_struct *p, struct task_struct *org)
315810ebffdeSAl Viro {
315910ebffdeSAl Viro 	*task_thread_info(p) = *task_thread_info(org);
316010ebffdeSAl Viro 	task_thread_info(p)->task = p;
316110ebffdeSAl Viro }
316210ebffdeSAl Viro 
31636a40281aSChuck Ebbert /*
31646a40281aSChuck Ebbert  * Return the address of the last usable long on the stack.
31656a40281aSChuck Ebbert  *
31666a40281aSChuck Ebbert  * When the stack grows down, this is just above the thread
31686a40281aSChuck Ebbert  * info struct. Going any lower will corrupt the thread_info.
31686a40281aSChuck Ebbert  *
31696a40281aSChuck Ebbert  * When the stack grows up, this is the highest address.
31706a40281aSChuck Ebbert  * Beyond that position, we corrupt data on the next page.
31716a40281aSChuck Ebbert  */
317210ebffdeSAl Viro static inline unsigned long *end_of_stack(struct task_struct *p)
317310ebffdeSAl Viro {
31746a40281aSChuck Ebbert #ifdef CONFIG_STACK_GROWSUP
31756a40281aSChuck Ebbert 	return (unsigned long *)((unsigned long)task_thread_info(p) + THREAD_SIZE) - 1;
31766a40281aSChuck Ebbert #else
3177f7e4217bSRoman Zippel 	return (unsigned long *)(task_thread_info(p) + 1);
31786a40281aSChuck Ebbert #endif
317910ebffdeSAl Viro }
318010ebffdeSAl Viro 
3181f037360fSAl Viro #endif
3182c6c314a6SAndy Lutomirski 
318368f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
318468f24b08SAndy Lutomirski static inline void *try_get_task_stack(struct task_struct *tsk)
318568f24b08SAndy Lutomirski {
318668f24b08SAndy Lutomirski 	return atomic_inc_not_zero(&tsk->stack_refcount) ?
318768f24b08SAndy Lutomirski 		task_stack_page(tsk) : NULL;
318868f24b08SAndy Lutomirski }
318968f24b08SAndy Lutomirski 
319068f24b08SAndy Lutomirski extern void put_task_stack(struct task_struct *tsk);
319168f24b08SAndy Lutomirski #else
3192c6c314a6SAndy Lutomirski static inline void *try_get_task_stack(struct task_struct *tsk)
3193c6c314a6SAndy Lutomirski {
3194c6c314a6SAndy Lutomirski 	return task_stack_page(tsk);
3195c6c314a6SAndy Lutomirski }
3196c6c314a6SAndy Lutomirski 
3197c6c314a6SAndy Lutomirski static inline void put_task_stack(struct task_struct *tsk) {}
319868f24b08SAndy Lutomirski #endif
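
/*
 * Example (editor's sketch): with CONFIG_THREAD_INFO_IN_TASK the stack of
 * an exiting task can be freed before the task_struct itself, so every
 * successful try_get_task_stack() must be paired with put_task_stack().
 * The helper name is hypothetical.
 */
static inline unsigned long example_peek_stack_word(struct task_struct *tsk)
{
	unsigned long *stack = try_get_task_stack(tsk);
	unsigned long word = 0;

	if (stack) {
		word = *stack;
		put_task_stack(tsk);
	}

	return word;
}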
3199c6c314a6SAndy Lutomirski 
3200a70857e4SAaron Tomlin #define task_stack_end_corrupted(task) \
3201a70857e4SAaron Tomlin 		(*(end_of_stack(task)) != STACK_END_MAGIC)
3202f037360fSAl Viro 
32038b05c7e6SFUJITA Tomonori static inline int object_is_on_stack(void *obj)
32048b05c7e6SFUJITA Tomonori {
32058b05c7e6SFUJITA Tomonori 	void *stack = task_stack_page(current);
32068b05c7e6SFUJITA Tomonori 
32078b05c7e6SFUJITA Tomonori 	return (obj >= stack) && (obj < (stack + THREAD_SIZE));
32088b05c7e6SFUJITA Tomonori }
32098b05c7e6SFUJITA Tomonori 
3210b235beeaSLinus Torvalds extern void thread_stack_cache_init(void);
32118c9843e5SBenjamin Herrenschmidt 
32127c9f8861SEric Sandeen #ifdef CONFIG_DEBUG_STACK_USAGE
32137c9f8861SEric Sandeen static inline unsigned long stack_not_used(struct task_struct *p)
32147c9f8861SEric Sandeen {
32157c9f8861SEric Sandeen 	unsigned long *n = end_of_stack(p);
32167c9f8861SEric Sandeen 
32177c9f8861SEric Sandeen 	do { 	/* Skip over canary */
32186c31da34SHelge Deller # ifdef CONFIG_STACK_GROWSUP
32196c31da34SHelge Deller 		n--;
32206c31da34SHelge Deller # else
32217c9f8861SEric Sandeen 		n++;
32226c31da34SHelge Deller # endif
32237c9f8861SEric Sandeen 	} while (!*n);
32247c9f8861SEric Sandeen 
32256c31da34SHelge Deller # ifdef CONFIG_STACK_GROWSUP
32266c31da34SHelge Deller 	return (unsigned long)end_of_stack(p) - (unsigned long)n;
32276c31da34SHelge Deller # else
32287c9f8861SEric Sandeen 	return (unsigned long)n - (unsigned long)end_of_stack(p);
32296c31da34SHelge Deller # endif
32307c9f8861SEric Sandeen }
32317c9f8861SEric Sandeen #endif
3232d4311ff1SAaron Tomlin extern void set_task_stack_end_magic(struct task_struct *tsk);
32337c9f8861SEric Sandeen 
32341da177e4SLinus Torvalds /* Set thread flags in another task's structures.
32351da177e4SLinus Torvalds  * - see asm/thread_info.h for the available TIF_xxxx flags
32361da177e4SLinus Torvalds  */
32371da177e4SLinus Torvalds static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag)
32381da177e4SLinus Torvalds {
3239a1261f54SAl Viro 	set_ti_thread_flag(task_thread_info(tsk), flag);
32401da177e4SLinus Torvalds }
32411da177e4SLinus Torvalds 
32421da177e4SLinus Torvalds static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag)
32431da177e4SLinus Torvalds {
3244a1261f54SAl Viro 	clear_ti_thread_flag(task_thread_info(tsk), flag);
32451da177e4SLinus Torvalds }
32461da177e4SLinus Torvalds 
32471da177e4SLinus Torvalds static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag)
32481da177e4SLinus Torvalds {
3249a1261f54SAl Viro 	return test_and_set_ti_thread_flag(task_thread_info(tsk), flag);
32501da177e4SLinus Torvalds }
32511da177e4SLinus Torvalds 
32521da177e4SLinus Torvalds static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag)
32531da177e4SLinus Torvalds {
3254a1261f54SAl Viro 	return test_and_clear_ti_thread_flag(task_thread_info(tsk), flag);
32551da177e4SLinus Torvalds }
32561da177e4SLinus Torvalds 
32571da177e4SLinus Torvalds static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag)
32581da177e4SLinus Torvalds {
3259a1261f54SAl Viro 	return test_ti_thread_flag(task_thread_info(tsk), flag);
32601da177e4SLinus Torvalds }
32611da177e4SLinus Torvalds 
32621da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk)
32631da177e4SLinus Torvalds {
32641da177e4SLinus Torvalds 	set_tsk_thread_flag(tsk, TIF_NEED_RESCHED);
32651da177e4SLinus Torvalds }
32661da177e4SLinus Torvalds 
32671da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk)
32681da177e4SLinus Torvalds {
32691da177e4SLinus Torvalds 	clear_tsk_thread_flag(tsk, TIF_NEED_RESCHED);
32701da177e4SLinus Torvalds }
32711da177e4SLinus Torvalds 
32728ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk)
32738ae121acSGregory Haskins {
32748ae121acSGregory Haskins 	return unlikely(test_tsk_thread_flag(tsk, TIF_NEED_RESCHED));
32758ae121acSGregory Haskins }
32768ae121acSGregory Haskins 
3277690cc3ffSEric W. Biederman static inline int restart_syscall(void)
3278690cc3ffSEric W. Biederman {
3279690cc3ffSEric W. Biederman 	set_tsk_thread_flag(current, TIF_SIGPENDING);
3280690cc3ffSEric W. Biederman 	return -ERESTARTNOINTR;
3281690cc3ffSEric W. Biederman }
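
/*
 * Example (editor's sketch): restart_syscall() is for syscalls that hit a
 * transient condition and want the whole call replayed after returning to
 * user space; the condition tested here is hypothetical.
 */
static inline long example_syscall_body(bool config_in_flux)
{
	if (config_in_flux)
		return restart_syscall();

	/* ... normal syscall work ... */
	return 0;
}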
3282690cc3ffSEric W. Biederman 
32831da177e4SLinus Torvalds static inline int signal_pending(struct task_struct *p)
32841da177e4SLinus Torvalds {
32851da177e4SLinus Torvalds 	return unlikely(test_tsk_thread_flag(p, TIF_SIGPENDING));
32861da177e4SLinus Torvalds }
32871da177e4SLinus Torvalds 
3288d9588725SRoland McGrath static inline int __fatal_signal_pending(struct task_struct *p)
3289d9588725SRoland McGrath {
3290d9588725SRoland McGrath 	return unlikely(sigismember(&p->pending.signal, SIGKILL));
3291d9588725SRoland McGrath }
3292f776d12dSMatthew Wilcox 
3293f776d12dSMatthew Wilcox static inline int fatal_signal_pending(struct task_struct *p)
3294f776d12dSMatthew Wilcox {
3295f776d12dSMatthew Wilcox 	return signal_pending(p) && __fatal_signal_pending(p);
3296f776d12dSMatthew Wilcox }
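
/*
 * Example (editor's sketch): long-running, killable kernel work commonly
 * polls fatal_signal_pending() so SIGKILL is honoured promptly; the loop
 * body is illustrative.
 */
static inline int example_killable_loop(int nr_steps)
{
	int i;

	for (i = 0; i < nr_steps; i++) {
		if (fatal_signal_pending(current))
			return -EINTR;
		/* ... one bounded unit of work ... */
	}

	return 0;
}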
3297f776d12dSMatthew Wilcox 
329816882c1eSOleg Nesterov static inline int signal_pending_state(long state, struct task_struct *p)
329916882c1eSOleg Nesterov {
330016882c1eSOleg Nesterov 	if (!(state & (TASK_INTERRUPTIBLE | TASK_WAKEKILL)))
330116882c1eSOleg Nesterov 		return 0;
330216882c1eSOleg Nesterov 	if (!signal_pending(p))
330316882c1eSOleg Nesterov 		return 0;
330416882c1eSOleg Nesterov 
330516882c1eSOleg Nesterov 	return (state & TASK_INTERRUPTIBLE) || __fatal_signal_pending(p);
330616882c1eSOleg Nesterov }
330716882c1eSOleg Nesterov 
33081da177e4SLinus Torvalds /*
33091da177e4SLinus Torvalds  * cond_resched() and cond_resched_lock(): latency reduction via
33101da177e4SLinus Torvalds  * explicit rescheduling in places that are safe. The return
33111da177e4SLinus Torvalds  * value indicates whether a reschedule actually took place.
33121da177e4SLinus Torvalds  * cond_resched_lock() will drop the spinlock before scheduling,
33131da177e4SLinus Torvalds  * cond_resched_softirq() will enable bhs before scheduling.
33141da177e4SLinus Torvalds  */
331535a773a0SPeter Zijlstra #ifndef CONFIG_PREEMPT
3316c3921ab7SLinus Torvalds extern int _cond_resched(void);
331735a773a0SPeter Zijlstra #else
331835a773a0SPeter Zijlstra static inline int _cond_resched(void) { return 0; }
331935a773a0SPeter Zijlstra #endif
33206f80bd98SFrederic Weisbecker 
3321613afbf8SFrederic Weisbecker #define cond_resched() ({			\
33223427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, 0);	\
3323613afbf8SFrederic Weisbecker 	_cond_resched();			\
3324613afbf8SFrederic Weisbecker })
33256f80bd98SFrederic Weisbecker 
3326613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock);
3327613afbf8SFrederic Weisbecker 
3328613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({				\
33293427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\
3330613afbf8SFrederic Weisbecker 	__cond_resched_lock(lock);				\
3331613afbf8SFrederic Weisbecker })
3332613afbf8SFrederic Weisbecker 
3333613afbf8SFrederic Weisbecker extern int __cond_resched_softirq(void);
3334613afbf8SFrederic Weisbecker 
3335613afbf8SFrederic Weisbecker #define cond_resched_softirq() ({					\
33363427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, SOFTIRQ_DISABLE_OFFSET);	\
3337613afbf8SFrederic Weisbecker 	__cond_resched_softirq();					\
3338613afbf8SFrederic Weisbecker })
33391da177e4SLinus Torvalds 
3340f6f3c437SSimon Horman static inline void cond_resched_rcu(void)
3341f6f3c437SSimon Horman {
3342f6f3c437SSimon Horman #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU)
3343f6f3c437SSimon Horman 	rcu_read_unlock();
3344f6f3c437SSimon Horman 	cond_resched();
3345f6f3c437SSimon Horman 	rcu_read_lock();
3346f6f3c437SSimon Horman #endif
3347f6f3c437SSimon Horman }
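
/*
 * Example (editor's sketch): a long loop in process context yields the
 * CPU voluntarily once per iteration; cond_resched() may sleep, so this
 * must not be used with locks held or from atomic context.
 */
static inline void example_long_loop(unsigned long nr)
{
	unsigned long i;

	for (i = 0; i < nr; i++) {
		/* ... one unit of work ... */
		cond_resched();
	}
}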
3348f6f3c437SSimon Horman 
3349d1c6d149SVegard Nossum static inline unsigned long get_preempt_disable_ip(struct task_struct *p)
3350d1c6d149SVegard Nossum {
3351d1c6d149SVegard Nossum #ifdef CONFIG_DEBUG_PREEMPT
3352d1c6d149SVegard Nossum 	return p->preempt_disable_ip;
3353d1c6d149SVegard Nossum #else
3354d1c6d149SVegard Nossum 	return 0;
3355d1c6d149SVegard Nossum #endif
3356d1c6d149SVegard Nossum }
3357d1c6d149SVegard Nossum 
33581da177e4SLinus Torvalds /*
33591da177e4SLinus Torvalds  * Does a critical section need to be broken due to another
336095c354feSNick Piggin  * task waiting?  (Technically this does not depend on CONFIG_PREEMPT,
336195c354feSNick Piggin  * but it reflects a general need for low latency.)
33621da177e4SLinus Torvalds  */
336395c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock)
33641da177e4SLinus Torvalds {
336595c354feSNick Piggin #ifdef CONFIG_PREEMPT
336695c354feSNick Piggin 	return spin_is_contended(lock);
336795c354feSNick Piggin #else
33681da177e4SLinus Torvalds 	return 0;
336995c354feSNick Piggin #endif
33701da177e4SLinus Torvalds }
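
/*
 * Example (editor's sketch): __cond_resched_lock() uses spin_needbreak()
 * internally, so a lock-holding scan only needs to call
 * cond_resched_lock() to briefly drop the lock when it is contended or a
 * reschedule is due.  The scan body is illustrative.
 */
static inline void example_scan_under_lock(spinlock_t *lock, unsigned long nr)
{
	unsigned long i;

	spin_lock(lock);
	for (i = 0; i < nr; i++) {
		/* ... examine one entry ... */
		cond_resched_lock(lock);
	}
	spin_unlock(lock);
}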
33711da177e4SLinus Torvalds 
33727bb44adeSRoland McGrath /*
3373ee761f62SThomas Gleixner  * Idle thread specific functions to determine the need_resched
337469dd0f84SPeter Zijlstra  * polling state.
3375ee761f62SThomas Gleixner  */
337669dd0f84SPeter Zijlstra #ifdef TIF_POLLING_NRFLAG
3377ee761f62SThomas Gleixner static inline int tsk_is_polling(struct task_struct *p)
3378ee761f62SThomas Gleixner {
3379ee761f62SThomas Gleixner 	return test_tsk_thread_flag(p, TIF_POLLING_NRFLAG);
3380ee761f62SThomas Gleixner }
3381ea811747SPeter Zijlstra 
3382ea811747SPeter Zijlstra static inline void __current_set_polling(void)
33833a98f871SThomas Gleixner {
33843a98f871SThomas Gleixner 	set_thread_flag(TIF_POLLING_NRFLAG);
33853a98f871SThomas Gleixner }
33863a98f871SThomas Gleixner 
3387ea811747SPeter Zijlstra static inline bool __must_check current_set_polling_and_test(void)
3388ea811747SPeter Zijlstra {
3389ea811747SPeter Zijlstra 	__current_set_polling();
3390ea811747SPeter Zijlstra 
3391ea811747SPeter Zijlstra 	/*
3392ea811747SPeter Zijlstra 	 * Polling state must be visible before we test NEED_RESCHED,
33938875125eSKirill Tkhai 	 * paired by resched_curr()
3394ea811747SPeter Zijlstra 	 */
33954e857c58SPeter Zijlstra 	smp_mb__after_atomic();
3396ea811747SPeter Zijlstra 
3397ea811747SPeter Zijlstra 	return unlikely(tif_need_resched());
3398ea811747SPeter Zijlstra }
3399ea811747SPeter Zijlstra 
3400ea811747SPeter Zijlstra static inline void __current_clr_polling(void)
34013a98f871SThomas Gleixner {
34023a98f871SThomas Gleixner 	clear_thread_flag(TIF_POLLING_NRFLAG);
34033a98f871SThomas Gleixner }
3404ea811747SPeter Zijlstra 
3405ea811747SPeter Zijlstra static inline bool __must_check current_clr_polling_and_test(void)
3406ea811747SPeter Zijlstra {
3407ea811747SPeter Zijlstra 	__current_clr_polling();
3408ea811747SPeter Zijlstra 
3409ea811747SPeter Zijlstra 	/*
3410ea811747SPeter Zijlstra 	 * Polling state must be visible before we test NEED_RESCHED,
34118875125eSKirill Tkhai 	 * paired by resched_curr()
3412ea811747SPeter Zijlstra 	 */
34134e857c58SPeter Zijlstra 	smp_mb__after_atomic();
3414ea811747SPeter Zijlstra 
3415ea811747SPeter Zijlstra 	return unlikely(tif_need_resched());
3416ea811747SPeter Zijlstra }
3417ea811747SPeter Zijlstra 
3418ee761f62SThomas Gleixner #else
3419ee761f62SThomas Gleixner static inline int tsk_is_polling(struct task_struct *p) { return 0; }
3420ea811747SPeter Zijlstra static inline void __current_set_polling(void) { }
3421ea811747SPeter Zijlstra static inline void __current_clr_polling(void) { }
3422ea811747SPeter Zijlstra 
3423ea811747SPeter Zijlstra static inline bool __must_check current_set_polling_and_test(void)
3424ea811747SPeter Zijlstra {
3425ea811747SPeter Zijlstra 	return unlikely(tif_need_resched());
3426ea811747SPeter Zijlstra }
3427ea811747SPeter Zijlstra static inline bool __must_check current_clr_polling_and_test(void)
3428ea811747SPeter Zijlstra {
3429ea811747SPeter Zijlstra 	return unlikely(tif_need_resched());
3430ea811747SPeter Zijlstra }
3431ee761f62SThomas Gleixner #endif
3432ee761f62SThomas Gleixner 
34338cb75e0cSPeter Zijlstra static inline void current_clr_polling(void)
34348cb75e0cSPeter Zijlstra {
34358cb75e0cSPeter Zijlstra 	__current_clr_polling();
34368cb75e0cSPeter Zijlstra 
34378cb75e0cSPeter Zijlstra 	/*
34388cb75e0cSPeter Zijlstra 	 * Ensure we check TIF_NEED_RESCHED after we clear the polling bit.
34398cb75e0cSPeter Zijlstra 	 * Once the bit is cleared, we'll get IPIs with every new
34408cb75e0cSPeter Zijlstra 	 * TIF_NEED_RESCHED and the IPI handler, scheduler_ipi(), will also
34418cb75e0cSPeter Zijlstra 	 * fold.
34428cb75e0cSPeter Zijlstra 	 */
34438875125eSKirill Tkhai 	smp_mb(); /* paired with resched_curr() */
34448cb75e0cSPeter Zijlstra 
34458cb75e0cSPeter Zijlstra 	preempt_fold_need_resched();
34468cb75e0cSPeter Zijlstra }
34478cb75e0cSPeter Zijlstra 
344875f93fedSPeter Zijlstra static __always_inline bool need_resched(void)
344975f93fedSPeter Zijlstra {
345075f93fedSPeter Zijlstra 	return unlikely(tif_need_resched());
345175f93fedSPeter Zijlstra }
345275f93fedSPeter Zijlstra 
3453ee761f62SThomas Gleixner /*
3454f06febc9SFrank Mayhar  * Thread group CPU time accounting.
3455f06febc9SFrank Mayhar  */
34564cd4c1b4SPeter Zijlstra void thread_group_cputime(struct task_struct *tsk, struct task_cputime *times);
34574da94d49SPeter Zijlstra void thread_group_cputimer(struct task_struct *tsk, struct task_cputime *times);
3458f06febc9SFrank Mayhar 
3459f06febc9SFrank Mayhar /*
34607bb44adeSRoland McGrath  * Reevaluate whether the task has signals pending delivery.
34617bb44adeSRoland McGrath  * Wake the task if so.
34627bb44adeSRoland McGrath  * This is required every time the blocked sigset_t changes.
34637bb44adeSRoland McGrath  * Callers must hold ->sighand->siglock.
34647bb44adeSRoland McGrath  */
34657bb44adeSRoland McGrath extern void recalc_sigpending_and_wake(struct task_struct *t);
34661da177e4SLinus Torvalds extern void recalc_sigpending(void);
34671da177e4SLinus Torvalds 
3468910ffdb1SOleg Nesterov extern void signal_wake_up_state(struct task_struct *t, unsigned int state);
3469910ffdb1SOleg Nesterov 
3470910ffdb1SOleg Nesterov static inline void signal_wake_up(struct task_struct *t, bool resume)
3471910ffdb1SOleg Nesterov {
3472910ffdb1SOleg Nesterov 	signal_wake_up_state(t, resume ? TASK_WAKEKILL : 0);
3473910ffdb1SOleg Nesterov }
3474910ffdb1SOleg Nesterov static inline void ptrace_signal_wake_up(struct task_struct *t, bool resume)
3475910ffdb1SOleg Nesterov {
3476910ffdb1SOleg Nesterov 	signal_wake_up_state(t, resume ? __TASK_TRACED : 0);
3477910ffdb1SOleg Nesterov }
34781da177e4SLinus Torvalds 
34791da177e4SLinus Torvalds /*
34801da177e4SLinus Torvalds  * Wrappers for p->thread_info->cpu access (p->cpu with CONFIG_THREAD_INFO_IN_TASK). No-op on UP.
34811da177e4SLinus Torvalds  */
34821da177e4SLinus Torvalds #ifdef CONFIG_SMP
34831da177e4SLinus Torvalds 
34841da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p)
34851da177e4SLinus Torvalds {
3486c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
3487c65eacbeSAndy Lutomirski 	return p->cpu;
3488c65eacbeSAndy Lutomirski #else
3489a1261f54SAl Viro 	return task_thread_info(p)->cpu;
3490c65eacbeSAndy Lutomirski #endif
34911da177e4SLinus Torvalds }
34921da177e4SLinus Torvalds 
3493b32e86b4SIngo Molnar static inline int task_node(const struct task_struct *p)
3494b32e86b4SIngo Molnar {
3495b32e86b4SIngo Molnar 	return cpu_to_node(task_cpu(p));
3496b32e86b4SIngo Molnar }
3497b32e86b4SIngo Molnar 
3498c65cc870SIngo Molnar extern void set_task_cpu(struct task_struct *p, unsigned int cpu);
34991da177e4SLinus Torvalds 
35001da177e4SLinus Torvalds #else
35011da177e4SLinus Torvalds 
35021da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p)
35031da177e4SLinus Torvalds {
35041da177e4SLinus Torvalds 	return 0;
35051da177e4SLinus Torvalds }
35061da177e4SLinus Torvalds 
35071da177e4SLinus Torvalds static inline void set_task_cpu(struct task_struct *p, unsigned int cpu)
35081da177e4SLinus Torvalds {
35091da177e4SLinus Torvalds }
35101da177e4SLinus Torvalds 
35111da177e4SLinus Torvalds #endif /* CONFIG_SMP */
35121da177e4SLinus Torvalds 
3513*d9345c65SPan Xinhui /*
3514*d9345c65SPan Xinhui  * In order to reduce various lock holder preemption latencies provide an
3515*d9345c65SPan Xinhui  * interface to see if a vCPU is currently running or not.
3516*d9345c65SPan Xinhui  *
3517*d9345c65SPan Xinhui  * This allows us to terminate optimistic spin loops and block, analogous to
3518*d9345c65SPan Xinhui  * the native optimistic spin heuristic of testing if the lock owner task is
3519*d9345c65SPan Xinhui  * running or not.
3520*d9345c65SPan Xinhui  */
3521*d9345c65SPan Xinhui #ifndef vcpu_is_preempted
3522*d9345c65SPan Xinhui # define vcpu_is_preempted(cpu)	false
3523*d9345c65SPan Xinhui #endif
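
/*
 * Example (editor's sketch): an optimistic spin loop in the spirit of the
 * mutex/rwsem spinners.  Spinning stops when a reschedule is needed or
 * the owner's vCPU has been preempted by the hypervisor; the acquire
 * callback and helper name are hypothetical.
 */
static inline bool example_optimistic_spin(bool (*lock_acquired)(void),
					   struct task_struct *owner)
{
	while (!lock_acquired()) {
		if (need_resched() || vcpu_is_preempted(task_cpu(owner)))
			return false;	/* give up spinning, block instead */
		cpu_relax();
	}

	return true;
}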
3524*d9345c65SPan Xinhui 
352596f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask);
352696f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask);
35275c45bf27SSiddha, Suresh B 
35287c941438SDhaval Giani #ifdef CONFIG_CGROUP_SCHED
352907e06b01SYong Zhang extern struct task_group root_task_group;
35308323f26cSPeter Zijlstra #endif /* CONFIG_CGROUP_SCHED */
35319b5b7751SSrivatsa Vaddagiri 
353254e99124SDhaval Giani extern int task_can_switch_user(struct user_struct *up,
353354e99124SDhaval Giani 					struct task_struct *tsk);
353454e99124SDhaval Giani 
35354b98d11bSAlexey Dobriyan #ifdef CONFIG_TASK_XACCT
35364b98d11bSAlexey Dobriyan static inline void add_rchar(struct task_struct *tsk, ssize_t amt)
35374b98d11bSAlexey Dobriyan {
3538940389b8SAndrea Righi 	tsk->ioac.rchar += amt;
35394b98d11bSAlexey Dobriyan }
35404b98d11bSAlexey Dobriyan 
35414b98d11bSAlexey Dobriyan static inline void add_wchar(struct task_struct *tsk, ssize_t amt)
35424b98d11bSAlexey Dobriyan {
3543940389b8SAndrea Righi 	tsk->ioac.wchar += amt;
35444b98d11bSAlexey Dobriyan }
35454b98d11bSAlexey Dobriyan 
35464b98d11bSAlexey Dobriyan static inline void inc_syscr(struct task_struct *tsk)
35474b98d11bSAlexey Dobriyan {
3548940389b8SAndrea Righi 	tsk->ioac.syscr++;
35494b98d11bSAlexey Dobriyan }
35504b98d11bSAlexey Dobriyan 
35514b98d11bSAlexey Dobriyan static inline void inc_syscw(struct task_struct *tsk)
35524b98d11bSAlexey Dobriyan {
3553940389b8SAndrea Righi 	tsk->ioac.syscw++;
35544b98d11bSAlexey Dobriyan }
35554b98d11bSAlexey Dobriyan #else
35564b98d11bSAlexey Dobriyan static inline void add_rchar(struct task_struct *tsk, ssize_t amt)
35574b98d11bSAlexey Dobriyan {
35584b98d11bSAlexey Dobriyan }
35594b98d11bSAlexey Dobriyan 
35604b98d11bSAlexey Dobriyan static inline void add_wchar(struct task_struct *tsk, ssize_t amt)
35614b98d11bSAlexey Dobriyan {
35624b98d11bSAlexey Dobriyan }
35634b98d11bSAlexey Dobriyan 
35644b98d11bSAlexey Dobriyan static inline void inc_syscr(struct task_struct *tsk)
35654b98d11bSAlexey Dobriyan {
35664b98d11bSAlexey Dobriyan }
35674b98d11bSAlexey Dobriyan 
35684b98d11bSAlexey Dobriyan static inline void inc_syscw(struct task_struct *tsk)
35694b98d11bSAlexey Dobriyan {
35704b98d11bSAlexey Dobriyan }
35714b98d11bSAlexey Dobriyan #endif
35724b98d11bSAlexey Dobriyan 
357382455257SDave Hansen #ifndef TASK_SIZE_OF
357482455257SDave Hansen #define TASK_SIZE_OF(tsk)	TASK_SIZE
357582455257SDave Hansen #endif
357682455257SDave Hansen 
3577f98bafa0SOleg Nesterov #ifdef CONFIG_MEMCG
3578cf475ad2SBalbir Singh extern void mm_update_next_owner(struct mm_struct *mm);
3579cf475ad2SBalbir Singh #else
3580cf475ad2SBalbir Singh static inline void mm_update_next_owner(struct mm_struct *mm)
3581cf475ad2SBalbir Singh {
3582cf475ad2SBalbir Singh }
3583f98bafa0SOleg Nesterov #endif /* CONFIG_MEMCG */
3584cf475ad2SBalbir Singh 
35853e10e716SJiri Slaby static inline unsigned long task_rlimit(const struct task_struct *tsk,
35863e10e716SJiri Slaby 		unsigned int limit)
35873e10e716SJiri Slaby {
3588316c1608SJason Low 	return READ_ONCE(tsk->signal->rlim[limit].rlim_cur);
35893e10e716SJiri Slaby }
35903e10e716SJiri Slaby 
35913e10e716SJiri Slaby static inline unsigned long task_rlimit_max(const struct task_struct *tsk,
35923e10e716SJiri Slaby 		unsigned int limit)
35933e10e716SJiri Slaby {
3594316c1608SJason Low 	return READ_ONCE(tsk->signal->rlim[limit].rlim_max);
35953e10e716SJiri Slaby }
35963e10e716SJiri Slaby 
35973e10e716SJiri Slaby static inline unsigned long rlimit(unsigned int limit)
35983e10e716SJiri Slaby {
35993e10e716SJiri Slaby 	return task_rlimit(current, limit);
36003e10e716SJiri Slaby }
36013e10e716SJiri Slaby 
36023e10e716SJiri Slaby static inline unsigned long rlimit_max(unsigned int limit)
36033e10e716SJiri Slaby {
36043e10e716SJiri Slaby 	return task_rlimit_max(current, limit);
36053e10e716SJiri Slaby }
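
/*
 * Example (editor's sketch): enforcing a soft resource limit for the
 * current task; the count being checked is hypothetical.
 */
static inline int example_check_file_limit(unsigned long nr_open_files)
{
	if (nr_open_files >= rlimit(RLIMIT_NOFILE))
		return -EMFILE;

	return 0;
}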
36063e10e716SJiri Slaby 
360758919e83SRafael J. Wysocki #define SCHED_CPUFREQ_RT	(1U << 0)
360858919e83SRafael J. Wysocki #define SCHED_CPUFREQ_DL	(1U << 1)
36098c34ab19SRafael J. Wysocki #define SCHED_CPUFREQ_IOWAIT	(1U << 2)
361058919e83SRafael J. Wysocki 
361158919e83SRafael J. Wysocki #define SCHED_CPUFREQ_RT_DL	(SCHED_CPUFREQ_RT | SCHED_CPUFREQ_DL)
361258919e83SRafael J. Wysocki 
3613adaf9fcdSRafael J. Wysocki #ifdef CONFIG_CPU_FREQ
3614adaf9fcdSRafael J. Wysocki struct update_util_data {
361558919e83SRafael J. Wysocki        void (*func)(struct update_util_data *data, u64 time, unsigned int flags);
3616adaf9fcdSRafael J. Wysocki };
3617adaf9fcdSRafael J. Wysocki 
36180bed612bSRafael J. Wysocki void cpufreq_add_update_util_hook(int cpu, struct update_util_data *data,
36190bed612bSRafael J. Wysocki                        void (*func)(struct update_util_data *data, u64 time,
362058919e83SRafael J. Wysocki 				    unsigned int flags));
36210bed612bSRafael J. Wysocki void cpufreq_remove_update_util_hook(int cpu);
3622adaf9fcdSRafael J. Wysocki #endif /* CONFIG_CPU_FREQ */
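
/*
 * Example (editor's sketch): how a cpufreq governor might wire itself
 * into the scheduler, as it would appear in the governor's .c file.  The
 * callback runs from scheduler context with the runqueue lock held and
 * must not sleep; all names below are illustrative.
 */
#ifdef CONFIG_CPU_FREQ
static DEFINE_PER_CPU(struct update_util_data, example_uu_data);

static void example_update_util(struct update_util_data *data, u64 time,
				unsigned int flags)
{
	/* e.g. raise frequency at once if (flags & SCHED_CPUFREQ_IOWAIT) */
}

static inline void example_register_update_util(void)
{
	int cpu;

	for_each_online_cpu(cpu)
		cpufreq_add_update_util_hook(cpu,
					     &per_cpu(example_uu_data, cpu),
					     example_update_util);
}
#endif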
3623adaf9fcdSRafael J. Wysocki 
36241da177e4SLinus Torvalds #endif
3625