xref: /linux/include/linux/sched.h (revision 356e4bfff2c5489e016fdb925adbf12a1e3950ee)
1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */
21da177e4SLinus Torvalds #ifndef _LINUX_SCHED_H
31da177e4SLinus Torvalds #define _LINUX_SCHED_H
41da177e4SLinus Torvalds 
55eca1c10SIngo Molnar /*
65eca1c10SIngo Molnar  * Define 'struct task_struct' and provide the main scheduler
75eca1c10SIngo Molnar  * APIs (schedule(), wakeup variants, etc.)
85eca1c10SIngo Molnar  */
95eca1c10SIngo Molnar 
10607ca46eSDavid Howells #include <uapi/linux/sched.h>
11b7b3c76aSDavid Woodhouse 
1270b8157eSIngo Molnar #include <asm/current.h>
1370b8157eSIngo Molnar 
145eca1c10SIngo Molnar #include <linux/pid.h>
155eca1c10SIngo Molnar #include <linux/sem.h>
165eca1c10SIngo Molnar #include <linux/shm.h>
175eca1c10SIngo Molnar #include <linux/kcov.h>
185eca1c10SIngo Molnar #include <linux/mutex.h>
195eca1c10SIngo Molnar #include <linux/plist.h>
205eca1c10SIngo Molnar #include <linux/hrtimer.h>
215eca1c10SIngo Molnar #include <linux/seccomp.h>
225eca1c10SIngo Molnar #include <linux/nodemask.h>
235eca1c10SIngo Molnar #include <linux/rcupdate.h>
245eca1c10SIngo Molnar #include <linux/resource.h>
255eca1c10SIngo Molnar #include <linux/latencytop.h>
265eca1c10SIngo Molnar #include <linux/sched/prio.h>
275eca1c10SIngo Molnar #include <linux/signal_types.h>
285eca1c10SIngo Molnar #include <linux/mm_types_task.h>
295eca1c10SIngo Molnar #include <linux/task_io_accounting.h>
305eca1c10SIngo Molnar 
315eca1c10SIngo Molnar /* task_struct member predeclarations (sorted alphabetically): */
/*
 * These are incomplete-type (forward) declarations only. They are enough for
 * the places in this header that merely name such a type through a pointer,
 * e.g. 'struct cfs_rq *' in struct sched_entity or 'struct task_group *' in
 * struct task_struct. Keep the list alphabetically sorted when adding to it.
 */
32c7af7877SIngo Molnar struct audit_context;
33c7af7877SIngo Molnar struct backing_dev_info;
34c7af7877SIngo Molnar struct bio_list;
35c7af7877SIngo Molnar struct blk_plug;
36c7af7877SIngo Molnar struct cfs_rq;
37c7af7877SIngo Molnar struct fs_struct;
38c7af7877SIngo Molnar struct futex_pi_state;
39c7af7877SIngo Molnar struct io_context;
40c7af7877SIngo Molnar struct mempolicy;
41c7af7877SIngo Molnar struct nameidata;
42c7af7877SIngo Molnar struct nsproxy;
43c7af7877SIngo Molnar struct perf_event_context;
44c7af7877SIngo Molnar struct pid_namespace;
45c7af7877SIngo Molnar struct pipe_inode_info;
46c7af7877SIngo Molnar struct rcu_node;
47c7af7877SIngo Molnar struct reclaim_state;
48c7af7877SIngo Molnar struct robust_list_head;
49e2d1e2aeSIngo Molnar struct sched_attr;
50e2d1e2aeSIngo Molnar struct sched_param;
5143ae34cbSIngo Molnar struct seq_file;
52c7af7877SIngo Molnar struct sighand_struct;
53c7af7877SIngo Molnar struct signal_struct;
54c7af7877SIngo Molnar struct task_delay_info;
554cf86d77SIngo Molnar struct task_group;
561da177e4SLinus Torvalds 
/*
 * Task state bitmask. NOTE! These bits are also
 * encoded in fs/proc/array.c: get_task_state().
 *
 * We have two separate sets of flags: task->state
 * is about runnability, while task->exit_state are
 * about the task exiting. Confusing, but this way
 * modifying one set can't modify the other one by
 * mistake.
 */

/* Used in tsk->state: */
#define TASK_RUNNING			0x0000
#define TASK_INTERRUPTIBLE		0x0001
#define TASK_UNINTERRUPTIBLE		0x0002
#define __TASK_STOPPED			0x0004
#define __TASK_TRACED			0x0008
/* Used in tsk->exit_state: */
#define EXIT_DEAD			0x0010
#define EXIT_ZOMBIE			0x0020
#define EXIT_TRACE			(EXIT_ZOMBIE | EXIT_DEAD)
/* Used in tsk->state again: */
#define TASK_PARKED			0x0040
#define TASK_DEAD			0x0080
#define TASK_WAKEKILL			0x0100
#define TASK_WAKING			0x0200
#define TASK_NOLOAD			0x0400
#define TASK_NEW			0x0800
/* First bit above all state bits defined here (not itself a state): */
#define TASK_STATE_MAX			0x1000

/* Convenience macros for the sake of set_current_state: */
#define TASK_KILLABLE			(TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
#define TASK_STOPPED			(TASK_WAKEKILL | __TASK_STOPPED)
#define TASK_TRACED			(TASK_WAKEKILL | __TASK_TRACED)

/* Uninterruptible sleep that task_contributes_to_load() does not count: */
#define TASK_IDLE			(TASK_UNINTERRUPTIBLE | TASK_NOLOAD)

/* Convenience macros for the sake of wake_up(): */
#define TASK_NORMAL			(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)

/* get_task_state(): */
#define TASK_REPORT			(TASK_RUNNING | TASK_INTERRUPTIBLE | \
					 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
					 __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \
					 TASK_PARKED)

/*
 * State predicates.
 *
 * @task: pointer to an object with a ->state member (and, for
 *        task_contributes_to_load(), a ->flags member).
 *
 * Each macro evaluates to 1 when the condition holds and to 0 otherwise.
 *
 * The argument is parenthesized before it is dereferenced, so any pointer
 * expression may be passed (e.g. '&tsk' or 'array + i'); '->' binds tighter
 * than unary '&' and binary '+', which would otherwise apply it to the wrong
 * operand.
 *
 * task_contributes_to_load() may evaluate @task up to three times: do not
 * pass an expression with side effects.
 */
#define task_is_traced(task)		(((task)->state & __TASK_TRACED) != 0)

#define task_is_stopped(task)		(((task)->state & __TASK_STOPPED) != 0)

#define task_is_stopped_or_traced(task)	(((task)->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)

/* True for an uninterruptible, non-frozen task that does not carry TASK_NOLOAD: */
#define task_contributes_to_load(task)	(((task)->state & TASK_UNINTERRUPTIBLE) != 0 && \
					 ((task)->flags & PF_FROZEN) == 0 && \
					 ((task)->state & TASK_NOLOAD) == 0)
1121da177e4SLinus Torvalds 
1138eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
1148eb23b9fSPeter Zijlstra 
/*
 * CONFIG_DEBUG_ATOMIC_SLEEP variants of the state setters.
 *
 * Both first record _THIS_IP_ in current->task_state_change and then write
 * @state_value to current->state. __set_current_state() uses a plain
 * assignment; set_current_state() uses smp_store_mb().
 */
1158eb23b9fSPeter Zijlstra #define __set_current_state(state_value)			\
1168eb23b9fSPeter Zijlstra 	do {							\
1178eb23b9fSPeter Zijlstra 		current->task_state_change = _THIS_IP_;		\
1188eb23b9fSPeter Zijlstra 		current->state = (state_value);			\
1198eb23b9fSPeter Zijlstra 	} while (0)
1208eb23b9fSPeter Zijlstra #define set_current_state(state_value)				\
1218eb23b9fSPeter Zijlstra 	do {							\
1228eb23b9fSPeter Zijlstra 		current->task_state_change = _THIS_IP_;		\
123b92b8b35SPeter Zijlstra 		smp_store_mb(current->state, (state_value));	\
1248eb23b9fSPeter Zijlstra 	} while (0)
1258eb23b9fSPeter Zijlstra 
1268eb23b9fSPeter Zijlstra #else
127498d0c57SAndrew Morton /*
128498d0c57SAndrew Morton  * set_current_state() includes a barrier so that the write of current->state
129498d0c57SAndrew Morton  * is correctly serialised wrt the caller's subsequent test of whether to
130498d0c57SAndrew Morton  * actually sleep:
131498d0c57SAndrew Morton  *
132a2250238SPeter Zijlstra  *   for (;;) {
133498d0c57SAndrew Morton  *	set_current_state(TASK_UNINTERRUPTIBLE);
134a2250238SPeter Zijlstra  *	if (!need_sleep)
135a2250238SPeter Zijlstra  *		break;
136498d0c57SAndrew Morton  *
137a2250238SPeter Zijlstra  *	schedule();
138a2250238SPeter Zijlstra  *   }
139a2250238SPeter Zijlstra  *   __set_current_state(TASK_RUNNING);
140a2250238SPeter Zijlstra  *
141a2250238SPeter Zijlstra  * If the caller does not need such serialisation (because, for instance, the
142a2250238SPeter Zijlstra  * condition test and condition change and wakeup are under the same lock) then
143a2250238SPeter Zijlstra  * use __set_current_state().
144a2250238SPeter Zijlstra  *
145a2250238SPeter Zijlstra  * The above is typically ordered against the wakeup, which does:
146a2250238SPeter Zijlstra  *
147a2250238SPeter Zijlstra  *	need_sleep = false;
148a2250238SPeter Zijlstra  *	wake_up_state(p, TASK_UNINTERRUPTIBLE);
149a2250238SPeter Zijlstra  *
150a2250238SPeter Zijlstra  * Where wake_up_state() (and all other wakeup primitives) imply enough
151a2250238SPeter Zijlstra  * barriers to order the store of the variable against wakeup.
152a2250238SPeter Zijlstra  *
153a2250238SPeter Zijlstra  * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is,
154a2250238SPeter Zijlstra  * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a
155a2250238SPeter Zijlstra  * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING).
156a2250238SPeter Zijlstra  *
157a2250238SPeter Zijlstra  * This is obviously fine, since they both store the exact same value.
158a2250238SPeter Zijlstra  *
159a2250238SPeter Zijlstra  * Also see the comments of try_to_wake_up().
160498d0c57SAndrew Morton  */
/*
 * Variants used when CONFIG_DEBUG_ATOMIC_SLEEP is not set:
 * __set_current_state() is a plain assignment to current->state,
 * set_current_state() writes it with smp_store_mb().
 */
1615eca1c10SIngo Molnar #define __set_current_state(state_value) do { current->state = (state_value); } while (0)
1625eca1c10SIngo Molnar #define set_current_state(state_value)	 smp_store_mb(current->state, (state_value))
1638eb23b9fSPeter Zijlstra #endif
1648eb23b9fSPeter Zijlstra 
1655eca1c10SIngo Molnar /* Task command name length: */
1661da177e4SLinus Torvalds #define TASK_COMM_LEN			16
1671da177e4SLinus Torvalds 
1681da177e4SLinus Torvalds extern void scheduler_tick(void);
1691da177e4SLinus Torvalds 
/*
 * Largest value that fits in the 'long timeout' argument of the
 * schedule_timeout*() functions declared below.
 * NOTE(review): presumably treated as "no timeout" by those functions;
 * confirm against their implementation.
 */
1701da177e4SLinus Torvalds #define	MAX_SCHEDULE_TIMEOUT		LONG_MAX
1715eca1c10SIngo Molnar 
/*
 * Timed sleep entry points. Each takes a timeout and returns a long.
 * NOTE(review): the unit of @timeout, the meaning of the return value and the
 * task state used by each suffixed variant are not visible here; confirm
 * against the implementation.
 */
1725eca1c10SIngo Molnar extern long schedule_timeout(long timeout);
1735eca1c10SIngo Molnar extern long schedule_timeout_interruptible(long timeout);
1745eca1c10SIngo Molnar extern long schedule_timeout_killable(long timeout);
1755eca1c10SIngo Molnar extern long schedule_timeout_uninterruptible(long timeout);
1765eca1c10SIngo Molnar extern long schedule_timeout_idle(long timeout);
1771da177e4SLinus Torvalds asmlinkage void schedule(void);
178c5491ea7SThomas Gleixner extern void schedule_preempt_disabled(void);
1791da177e4SLinus Torvalds 
/*
 * io_schedule_prepare() is __must_check: its int result must not be ignored.
 * NOTE(review): presumably that result is the @token later handed to
 * io_schedule_finish(); confirm against the implementation.
 */
18010ab5643STejun Heo extern int __must_check io_schedule_prepare(void);
18110ab5643STejun Heo extern void io_schedule_finish(int token);
1829cff8adeSNeilBrown extern long io_schedule_timeout(long timeout);
18310ab5643STejun Heo extern void io_schedule(void);
1849cff8adeSNeilBrown 
185f06febc9SFrank Mayhar /**
1860ba42a59SMasanari Iida  * struct prev_cputime - snapshot of system and user cputime
187d37f761dSFrederic Weisbecker  * @utime: time spent in user mode
188d37f761dSFrederic Weisbecker  * @stime: time spent in system mode
1899d7fb042SPeter Zijlstra  * @lock: protects the above two fields
190d37f761dSFrederic Weisbecker  *
1919d7fb042SPeter Zijlstra  * Stores previous user/system time values such that we can guarantee
1929d7fb042SPeter Zijlstra  * monotonicity.
 *
 * All three members exist only when CONFIG_VIRT_CPU_ACCOUNTING_NATIVE is not
 * defined; with that option set the structure has no members at all.
193d37f761dSFrederic Weisbecker  */
1949d7fb042SPeter Zijlstra struct prev_cputime {
1959d7fb042SPeter Zijlstra #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
1965613fda9SFrederic Weisbecker 	u64				utime;
1975613fda9SFrederic Weisbecker 	u64				stime;
1989d7fb042SPeter Zijlstra 	raw_spinlock_t			lock;
1999d7fb042SPeter Zijlstra #endif
200d37f761dSFrederic Weisbecker };
201d37f761dSFrederic Weisbecker 
202d37f761dSFrederic Weisbecker /**
203f06febc9SFrank Mayhar  * struct task_cputime - collected CPU time counts
2045613fda9SFrederic Weisbecker  * @utime:		time spent in user mode, in nanoseconds
2055613fda9SFrederic Weisbecker  * @stime:		time spent in kernel mode, in nanoseconds
206f06febc9SFrank Mayhar  * @sum_exec_runtime:	total time spent on the CPU, in nanoseconds
207f06febc9SFrank Mayhar  *
2089d7fb042SPeter Zijlstra  * This structure groups together three kinds of CPU time that are tracked for
2099d7fb042SPeter Zijlstra  * threads and thread groups.  Most things considering CPU time want to group
2109d7fb042SPeter Zijlstra  * these counts together and treat all three of them in parallel.
 *
 * Note that @utime and @stime are declared u64 while @sum_exec_runtime is
 * declared unsigned long long. The member names are also reachable through
 * the virt_exp/prof_exp/sched_exp aliases defined right after this structure.
211f06febc9SFrank Mayhar  */
212f06febc9SFrank Mayhar struct task_cputime {
2135613fda9SFrederic Weisbecker 	u64				utime;
2145613fda9SFrederic Weisbecker 	u64				stime;
215f06febc9SFrank Mayhar 	unsigned long long		sum_exec_runtime;
216f06febc9SFrank Mayhar };
2179d7fb042SPeter Zijlstra 
2185eca1c10SIngo Molnar /* Alternate field names when used on cache expirations: */
/*
 * These are plain object-like macros: from here on, every occurrence of the
 * identifiers virt_exp, prof_exp and sched_exp in any code that includes this
 * header is replaced by utime, stime and sum_exec_runtime respectively, not
 * only member accesses on struct task_cputime.
 */
219f06febc9SFrank Mayhar #define virt_exp			utime
2209d7fb042SPeter Zijlstra #define prof_exp			stime
221f06febc9SFrank Mayhar #define sched_exp			sum_exec_runtime
222f06febc9SFrank Mayhar 
/*
 * Accounting state of a task, stored in struct vtime::state.
 * VTIME_INACTIVE is explicitly 0; VTIME_USER and VTIME_SYS follow as 1 and 2.
 */
223bac5b6b6SFrederic Weisbecker enum vtime_state {
224bac5b6b6SFrederic Weisbecker 	/* Task is sleeping or running in a CPU with VTIME inactive: */
225bac5b6b6SFrederic Weisbecker 	VTIME_INACTIVE = 0,
226bac5b6b6SFrederic Weisbecker 	/* Task runs in userspace in a CPU with VTIME active: */
227bac5b6b6SFrederic Weisbecker 	VTIME_USER,
228bac5b6b6SFrederic Weisbecker 	/* Task runs in kernelspace in a CPU with VTIME active: */
229bac5b6b6SFrederic Weisbecker 	VTIME_SYS,
230bac5b6b6SFrederic Weisbecker };
231bac5b6b6SFrederic Weisbecker 
/*
 * Per-task vtime bookkeeping: a seqcount, a start timestamp, the current
 * enum vtime_state and three u64 time accumulators.
 *
 * NOTE(review): presumably @seqcount guards the other members against
 * concurrent readers and utime/stime/gtime hold user, system and guest time
 * not yet folded into the task totals; confirm in kernel/sched/cputime.c.
 */
232bac5b6b6SFrederic Weisbecker struct vtime {
233bac5b6b6SFrederic Weisbecker 	seqcount_t		seqcount;
234bac5b6b6SFrederic Weisbecker 	unsigned long long	starttime;
235bac5b6b6SFrederic Weisbecker 	enum vtime_state	state;
2362a42eb95SWanpeng Li 	u64			utime;
2372a42eb95SWanpeng Li 	u64			stime;
2382a42eb95SWanpeng Li 	u64			gtime;
239bac5b6b6SFrederic Weisbecker };
240bac5b6b6SFrederic Weisbecker 
/*
 * Run-count and run-queue delay bookkeeping for a task.
 *
 * The members exist only when CONFIG_SCHED_INFO is defined; otherwise the
 * structure is empty.
 */
2411da177e4SLinus Torvalds struct sched_info {
2427f5f8e8dSIngo Molnar #ifdef CONFIG_SCHED_INFO
2435eca1c10SIngo Molnar 	/* Cumulative counters: */
2441da177e4SLinus Torvalds 
2455eca1c10SIngo Molnar 	/* # of times we have run on this CPU: */
2465eca1c10SIngo Molnar 	unsigned long			pcount;
2475eca1c10SIngo Molnar 
2485eca1c10SIngo Molnar 	/* Time spent waiting on a runqueue: */
2495eca1c10SIngo Molnar 	unsigned long long		run_delay;
2505eca1c10SIngo Molnar 
2515eca1c10SIngo Molnar 	/* Timestamps: */
2525eca1c10SIngo Molnar 
2535eca1c10SIngo Molnar 	/* When did we last run on a CPU? */
2545eca1c10SIngo Molnar 	unsigned long long		last_arrival;
2555eca1c10SIngo Molnar 
2565eca1c10SIngo Molnar 	/* When were we last queued to run? */
2575eca1c10SIngo Molnar 	unsigned long long		last_queued;
2585eca1c10SIngo Molnar 
259f6db8347SNaveen N. Rao #endif /* CONFIG_SCHED_INFO */
2607f5f8e8dSIngo Molnar };
2611da177e4SLinus Torvalds 
2621da177e4SLinus Torvalds /*
2636ecdd749SYuyang Du  * Integer metrics need fixed point arithmetic, e.g., sched/fair
2646ecdd749SYuyang Du  * has a few: load, load_avg, util_avg, freq, and capacity.
2656ecdd749SYuyang Du  *
2666ecdd749SYuyang Du  * We define a basic fixed point arithmetic range, and then formalize
2676ecdd749SYuyang Du  * all these metrics based on that basic range.
2686ecdd749SYuyang Du  */
/* 10 fractional bits: SCHED_FIXEDPOINT_SCALE is the long constant 1024. */
2696ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SHIFT		10
2706ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SCALE		(1L << SCHED_FIXEDPOINT_SHIFT)
2716ecdd749SYuyang Du 
/*
 * Load weight of a scheduling entity (see struct sched_entity::load).
 *
 * NOTE(review): @inv_weight is presumably a precomputed inverse of @weight
 * used to avoid divisions; confirm in kernel/sched/fair.c.
 */
27220b8a59fSIngo Molnar struct load_weight {
2739dbdb155SPeter Zijlstra 	unsigned long			weight;
2749dbdb155SPeter Zijlstra 	u32				inv_weight;
27520b8a59fSIngo Molnar };
27620b8a59fSIngo Molnar 
2777f65ea42SPatrick Bellasi /**
2787f65ea42SPatrick Bellasi  * struct util_est - Estimated utilization of FAIR tasks
2797f65ea42SPatrick Bellasi  * @enqueued: instantaneous estimated utilization of a task/cpu
2807f65ea42SPatrick Bellasi  * @ewma:     the Exponential Weighted Moving Average (EWMA)
2817f65ea42SPatrick Bellasi  *            utilization of a task
2827f65ea42SPatrick Bellasi  *
2837f65ea42SPatrick Bellasi  * Support data structure to track an Exponential Weighted Moving Average
2847f65ea42SPatrick Bellasi  * (EWMA) of a FAIR task's utilization. New samples are added to the moving
2857f65ea42SPatrick Bellasi  * average each time a task completes an activation. Sample's weight is chosen
2867f65ea42SPatrick Bellasi  * so that the EWMA will be relatively insensitive to transient changes to the
2877f65ea42SPatrick Bellasi  * task's workload.
2887f65ea42SPatrick Bellasi  *
2897f65ea42SPatrick Bellasi  * The enqueued attribute has a slightly different meaning for tasks and cpus:
2907f65ea42SPatrick Bellasi  * - task:   the task's util_avg at last task dequeue time
2917f65ea42SPatrick Bellasi  * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU
2927f65ea42SPatrick Bellasi  * Thus, the util_est.enqueued of a task represents the contribution on the
2937f65ea42SPatrick Bellasi  * estimated utilization of the CPU where that task is currently enqueued.
2947f65ea42SPatrick Bellasi  *
2957f65ea42SPatrick Bellasi  * Only for tasks we track a moving average of the past instantaneous
2967f65ea42SPatrick Bellasi  * estimated utilization. This makes it possible to absorb sporadic drops in
2977f65ea42SPatrick Bellasi  * utilization of an otherwise almost periodic task.
 *
 * The structure is aligned to sizeof(u64).
 * NOTE(review): presumably so that both members can be accessed together as
 * one 64-bit quantity; confirm with the users in kernel/sched/fair.c.
2987f65ea42SPatrick Bellasi  */
2997f65ea42SPatrick Bellasi struct util_est {
3007f65ea42SPatrick Bellasi 	unsigned int			enqueued;
3017f65ea42SPatrick Bellasi 	unsigned int			ewma;
	/* NOTE(review): presumably a new sample weighs 1/2^SHIFT (1/4) in @ewma; confirm. */
3027f65ea42SPatrick Bellasi #define UTIL_EST_WEIGHT_SHIFT		2
303317d359dSPeter Zijlstra } __attribute__((__aligned__(sizeof(u64))));
3047f65ea42SPatrick Bellasi 
3059d89c257SYuyang Du /*
3067b595334SYuyang Du  * The load_avg/util_avg accumulates an infinite geometric series
3077b595334SYuyang Du  * (see __update_load_avg() in kernel/sched/fair.c).
3087b595334SYuyang Du  *
3097b595334SYuyang Du  * [load_avg definition]
3107b595334SYuyang Du  *
3117b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load)
3127b595334SYuyang Du  *
3137b595334SYuyang Du  * where runnable% is the time ratio that a sched_entity is runnable.
3147b595334SYuyang Du  * For cfs_rq, it is the aggregated load_avg of all runnable and
3159d89c257SYuyang Du  * blocked sched_entities.
3167b595334SYuyang Du  *
3177b595334SYuyang Du  * load_avg may also take frequency scaling into account:
3187b595334SYuyang Du  *
3197b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load) * freq%
3207b595334SYuyang Du  *
3217b595334SYuyang Du  * where freq% is the CPU frequency normalized to the highest frequency.
3227b595334SYuyang Du  *
3237b595334SYuyang Du  * [util_avg definition]
3247b595334SYuyang Du  *
3257b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE
3267b595334SYuyang Du  *
3277b595334SYuyang Du  * where running% is the time ratio that a sched_entity is running on
3287b595334SYuyang Du  * a CPU. For cfs_rq, it is the aggregated util_avg of all runnable
3297b595334SYuyang Du  * and blocked sched_entities.
3307b595334SYuyang Du  *
3317b595334SYuyang Du  * util_avg may also factor frequency scaling and CPU capacity scaling:
3327b595334SYuyang Du  *
3337b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE * freq% * capacity%
3347b595334SYuyang Du  *
3357b595334SYuyang Du  * where freq% is the same as above, and capacity% is the CPU capacity
3367b595334SYuyang Du  * normalized to the greatest capacity (due to uarch differences, etc).
3377b595334SYuyang Du  *
3387b595334SYuyang Du  * N.B., the above ratios (runnable%, running%, freq%, and capacity%)
3397b595334SYuyang Du  * themselves are in the range of [0, 1]. To do fixed point arithmetics,
3407b595334SYuyang Du  * we therefore scale them to as large a range as necessary. This is for
3417b595334SYuyang Du  * example reflected by util_avg's SCHED_CAPACITY_SCALE.
3427b595334SYuyang Du  *
3437b595334SYuyang Du  * [Overflow issue]
3447b595334SYuyang Du  *
3457b595334SYuyang Du  * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities
3467b595334SYuyang Du  * with the highest load (=88761), always runnable on a single cfs_rq,
3477b595334SYuyang Du  * and should not overflow as the number already hits PID_MAX_LIMIT.
3487b595334SYuyang Du  *
3497b595334SYuyang Du  * For all other cases (including 32-bit kernels), struct load_weight's
3507b595334SYuyang Du  * weight will overflow first before we do, because:
3517b595334SYuyang Du  *
3527b595334SYuyang Du  *    Max(load_avg) <= Max(load.weight)
3537b595334SYuyang Du  *
3547b595334SYuyang Du  * Then it is the load_weight's responsibility to consider overflow
3557b595334SYuyang Du  * issues.
3569d89c257SYuyang Du  */
/*
 * Load/utilization tracking state; load_avg and util_avg are defined in the
 * comment above. The type carries ____cacheline_aligned.
 *
 * NOTE(review): presumably the *_sum members are the running sums from which
 * the matching *_avg members are derived and period_contrib is the part of
 * the current period already accounted; confirm in kernel/sched/fair.c.
 */
3579d85f21cSPaul Turner struct sched_avg {
3585eca1c10SIngo Molnar 	u64				last_update_time;
3595eca1c10SIngo Molnar 	u64				load_sum;
3601ea6c46aSPeter Zijlstra 	u64				runnable_load_sum;
3615eca1c10SIngo Molnar 	u32				util_sum;
3625eca1c10SIngo Molnar 	u32				period_contrib;
3635eca1c10SIngo Molnar 	unsigned long			load_avg;
3641ea6c46aSPeter Zijlstra 	unsigned long			runnable_load_avg;
3655eca1c10SIngo Molnar 	unsigned long			util_avg;
	/* Estimated utilization, see struct util_est: */
3667f65ea42SPatrick Bellasi 	struct util_est			util_est;
367317d359dSPeter Zijlstra } ____cacheline_aligned;
3689d85f21cSPaul Turner 
/*
 * Statistics counters embedded in struct sched_entity as 'statistics'.
 *
 * The members exist only when CONFIG_SCHEDSTATS is defined; otherwise the
 * structure is empty. All members are u64 except sum_sleep_runtime, which is
 * signed (s64).
 *
 * NOTE(review): going by the names, the groups below cover waiting, sleeping,
 * blocking/execution maxima, migrations and wakeups; the exact meaning and
 * units of each counter are defined by the code that updates them.
 */
36941acab88SLucas De Marchi struct sched_statistics {
3707f5f8e8dSIngo Molnar #ifdef CONFIG_SCHEDSTATS
37194c18227SIngo Molnar 	u64				wait_start;
37294c18227SIngo Molnar 	u64				wait_max;
3736d082592SArjan van de Ven 	u64				wait_count;
3746d082592SArjan van de Ven 	u64				wait_sum;
3758f0dfc34SArjan van de Ven 	u64				iowait_count;
3768f0dfc34SArjan van de Ven 	u64				iowait_sum;
37794c18227SIngo Molnar 
37894c18227SIngo Molnar 	u64				sleep_start;
37920b8a59fSIngo Molnar 	u64				sleep_max;
38094c18227SIngo Molnar 	s64				sum_sleep_runtime;
38194c18227SIngo Molnar 
38294c18227SIngo Molnar 	u64				block_start;
38320b8a59fSIngo Molnar 	u64				block_max;
38420b8a59fSIngo Molnar 	u64				exec_max;
385eba1ed4bSIngo Molnar 	u64				slice_max;
386cc367732SIngo Molnar 
387cc367732SIngo Molnar 	u64				nr_migrations_cold;
388cc367732SIngo Molnar 	u64				nr_failed_migrations_affine;
389cc367732SIngo Molnar 	u64				nr_failed_migrations_running;
390cc367732SIngo Molnar 	u64				nr_failed_migrations_hot;
391cc367732SIngo Molnar 	u64				nr_forced_migrations;
392cc367732SIngo Molnar 
393cc367732SIngo Molnar 	u64				nr_wakeups;
394cc367732SIngo Molnar 	u64				nr_wakeups_sync;
395cc367732SIngo Molnar 	u64				nr_wakeups_migrate;
396cc367732SIngo Molnar 	u64				nr_wakeups_local;
397cc367732SIngo Molnar 	u64				nr_wakeups_remote;
398cc367732SIngo Molnar 	u64				nr_wakeups_affine;
399cc367732SIngo Molnar 	u64				nr_wakeups_affine_attempts;
400cc367732SIngo Molnar 	u64				nr_wakeups_passive;
401cc367732SIngo Molnar 	u64				nr_wakeups_idle;
40241acab88SLucas De Marchi #endif
4037f5f8e8dSIngo Molnar };
40441acab88SLucas De Marchi 
/*
 * Scheduling entity, embedded in struct task_struct as 'se'.
 *
 * With CONFIG_FAIR_GROUP_SCHED an entity also records its depth, its parent
 * entity, the cfs_rq it is (to be) queued on and the cfs_rq it owns. With
 * CONFIG_SMP it additionally carries a struct sched_avg, kept last so that it
 * sits apart from the members above (see the comment next to it).
 *
 * NOTE(review): the cfs_rq pointers suggest this is the entity type of the
 * fair scheduling class; confirm in kernel/sched/fair.c.
 */
40541acab88SLucas De Marchi struct sched_entity {
4065eca1c10SIngo Molnar 	/* For load-balancing: */
4075eca1c10SIngo Molnar 	struct load_weight		load;
4081ea6c46aSPeter Zijlstra 	unsigned long			runnable_weight;
40941acab88SLucas De Marchi 	struct rb_node			run_node;
41041acab88SLucas De Marchi 	struct list_head		group_node;
41141acab88SLucas De Marchi 	unsigned int			on_rq;
41241acab88SLucas De Marchi 
	/* NOTE(review): runtime accounting; units are presumably nanoseconds, confirm. */
41341acab88SLucas De Marchi 	u64				exec_start;
41441acab88SLucas De Marchi 	u64				sum_exec_runtime;
41541acab88SLucas De Marchi 	u64				vruntime;
41641acab88SLucas De Marchi 	u64				prev_sum_exec_runtime;
41741acab88SLucas De Marchi 
41841acab88SLucas De Marchi 	u64				nr_migrations;
41941acab88SLucas De Marchi 
	/* Empty unless CONFIG_SCHEDSTATS is defined: */
42041acab88SLucas De Marchi 	struct sched_statistics		statistics;
42194c18227SIngo Molnar 
42220b8a59fSIngo Molnar #ifdef CONFIG_FAIR_GROUP_SCHED
423fed14d45SPeter Zijlstra 	int				depth;
42420b8a59fSIngo Molnar 	struct sched_entity		*parent;
42520b8a59fSIngo Molnar 	/* rq on which this entity is (to be) queued: */
42620b8a59fSIngo Molnar 	struct cfs_rq			*cfs_rq;
42720b8a59fSIngo Molnar 	/* rq "owned" by this entity/group: */
42820b8a59fSIngo Molnar 	struct cfs_rq			*my_q;
42920b8a59fSIngo Molnar #endif
4308bd75c77SClark Williams 
431141965c7SAlex Shi #ifdef CONFIG_SMP
4325a107804SJiri Olsa 	/*
4335a107804SJiri Olsa 	 * Per entity load average tracking.
4345a107804SJiri Olsa 	 *
4355a107804SJiri Olsa 	 * Put into separate cache line so it does not
4365a107804SJiri Olsa 	 * collide with read-mostly values above.
4375a107804SJiri Olsa 	 */
438317d359dSPeter Zijlstra 	struct sched_avg		avg;
4399d85f21cSPaul Turner #endif
44020b8a59fSIngo Molnar };
44170b97a7fSIngo Molnar 
/*
 * Scheduling entity embedded in struct task_struct as 'rt'.
 *
 * With CONFIG_RT_GROUP_SCHED an entity also records its parent entity, the
 * rt_rq it is (to be) queued on and the rt_rq it owns.
 *
 * The type is marked __randomize_layout.
 * NOTE(review): presumably this allows the member order to be randomized at
 * build time, so code must not depend on it; confirm against the
 * compiler-attribute definitions.
 */
442fa717060SPeter Zijlstra struct sched_rt_entity {
443fa717060SPeter Zijlstra 	struct list_head		run_list;
44478f2c7dbSPeter Zijlstra 	unsigned long			timeout;
44557d2aa00SYing Xue 	unsigned long			watchdog_stamp;
446bee367edSRichard Kennedy 	unsigned int			time_slice;
447ff77e468SPeter Zijlstra 	unsigned short			on_rq;
448ff77e468SPeter Zijlstra 	unsigned short			on_list;
4496f505b16SPeter Zijlstra 
45058d6c2d7SPeter Zijlstra 	struct sched_rt_entity		*back;
451052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED
4526f505b16SPeter Zijlstra 	struct sched_rt_entity		*parent;
4536f505b16SPeter Zijlstra 	/* rq on which this entity is (to be) queued: */
4546f505b16SPeter Zijlstra 	struct rt_rq			*rt_rq;
4556f505b16SPeter Zijlstra 	/* rq "owned" by this entity/group: */
4566f505b16SPeter Zijlstra 	struct rt_rq			*my_q;
4576f505b16SPeter Zijlstra #endif
4583859a271SKees Cook } __randomize_layout;
459fa717060SPeter Zijlstra 
/*
 * Scheduling entity embedded in struct task_struct as 'dl'.
 *
 * It holds the parameters copied from sched_attr, the values that evolve
 * while the task runs, five one-bit status flags and two hrtimers.
 */
460aab03e05SDario Faggioli struct sched_dl_entity {
461aab03e05SDario Faggioli 	struct rb_node			rb_node;
462aab03e05SDario Faggioli 
463aab03e05SDario Faggioli 	/*
464aab03e05SDario Faggioli 	 * Original scheduling parameters. Copied here from sched_attr
4654027d080Sxiaofeng.yan 	 * during sched_setattr(), they will remain the same until
4664027d080Sxiaofeng.yan 	 * the next sched_setattr().
467aab03e05SDario Faggioli 	 */
4685eca1c10SIngo Molnar 	u64				dl_runtime;	/* Maximum runtime for each instance	*/
4695eca1c10SIngo Molnar 	u64				dl_deadline;	/* Relative deadline of each instance	*/
4705eca1c10SIngo Molnar 	u64				dl_period;	/* Separation of two instances (period) */
47154d6d303SDaniel Bristot de Oliveira 	u64				dl_bw;		/* dl_runtime / dl_period		*/
4723effcb42SDaniel Bristot de Oliveira 	u64				dl_density;	/* dl_runtime / dl_deadline		*/
473aab03e05SDario Faggioli 
474aab03e05SDario Faggioli 	/*
475aab03e05SDario Faggioli 	 * Actual scheduling parameters. Initialized with the values above,
476aab03e05SDario Faggioli 	 * they are continuously updated during task execution. Note that
477aab03e05SDario Faggioli 	 * the remaining runtime could be < 0 in case we are in overrun.
478aab03e05SDario Faggioli 	 */
4795eca1c10SIngo Molnar 	s64				runtime;	/* Remaining runtime for this instance	*/
4805eca1c10SIngo Molnar 	u64				deadline;	/* Absolute deadline for this instance	*/
4815eca1c10SIngo Molnar 	unsigned int			flags;		/* Specifying the scheduler behaviour	*/
482aab03e05SDario Faggioli 
483aab03e05SDario Faggioli 	/*
484aab03e05SDario Faggioli 	 * Some bool flags:
485aab03e05SDario Faggioli 	 *
486aab03e05SDario Faggioli 	 * @dl_throttled tells if we exhausted the runtime. If so, the
487aab03e05SDario Faggioli 	 * task has to wait for a replenishment to be performed at the
488aab03e05SDario Faggioli 	 * next firing of dl_timer.
489aab03e05SDario Faggioli 	 *
4902d3d891dSDario Faggioli 	 * @dl_boosted tells if we are boosted due to DI. If so we are
4912d3d891dSDario Faggioli 	 * outside bandwidth enforcement mechanism (but only until we
4925bfd126eSJuri Lelli 	 * exit the critical section);
4935bfd126eSJuri Lelli 	 *
4945eca1c10SIngo Molnar 	 * @dl_yielded tells if task gave up the CPU before consuming
4955bfd126eSJuri Lelli 	 * all its available runtime during the last job.
496209a0cbdSLuca Abeni 	 *
497209a0cbdSLuca Abeni 	 * @dl_non_contending tells if the task is inactive while still
498209a0cbdSLuca Abeni 	 * contributing to the active utilization. In other words, it
499209a0cbdSLuca Abeni 	 * indicates if the inactive timer has been armed and its handler
500209a0cbdSLuca Abeni 	 * has not been executed yet. This flag is useful to avoid race
501209a0cbdSLuca Abeni 	 * conditions between the inactive timer handler and the wakeup
502209a0cbdSLuca Abeni 	 * code.
50334be3930SJuri Lelli 	 *
50434be3930SJuri Lelli 	 * @dl_overrun tells if the task asked to be informed about runtime
50534be3930SJuri Lelli 	 * overruns.
506aab03e05SDario Faggioli 	 */
	/* Each flag is a one-bit unsigned bit-field, so it only holds 0 or 1: */
507aa5222e9SDan Carpenter 	unsigned int			dl_throttled      : 1;
508aa5222e9SDan Carpenter 	unsigned int			dl_boosted        : 1;
509aa5222e9SDan Carpenter 	unsigned int			dl_yielded        : 1;
510aa5222e9SDan Carpenter 	unsigned int			dl_non_contending : 1;
51134be3930SJuri Lelli 	unsigned int			dl_overrun	  : 1;
512aab03e05SDario Faggioli 
513aab03e05SDario Faggioli 	/*
514aab03e05SDario Faggioli 	 * Bandwidth enforcement timer. Each -deadline task has its
515aab03e05SDario Faggioli 	 * own bandwidth to be enforced, thus we need one timer per task.
516aab03e05SDario Faggioli 	 */
517aab03e05SDario Faggioli 	struct hrtimer			dl_timer;
518209a0cbdSLuca Abeni 
519209a0cbdSLuca Abeni 	/*
520209a0cbdSLuca Abeni 	 * Inactive timer, responsible for decreasing the active utilization
521209a0cbdSLuca Abeni 	 * at the "0-lag time". When a -deadline task blocks, it contributes
522209a0cbdSLuca Abeni 	 * to GRUB's active utilization until the "0-lag time", hence a
523209a0cbdSLuca Abeni 	 * timer is needed to decrease the active utilization at the correct
524209a0cbdSLuca Abeni 	 * time.
525209a0cbdSLuca Abeni 	 */
526209a0cbdSLuca Abeni 	struct hrtimer inactive_timer;
527aab03e05SDario Faggioli };
5288bd75c77SClark Williams 
/*
 * Four one-byte flags overlaid with a single u32, so the flags can be
 * accessed individually through 'b' or all together through 's'.
 * Used in struct task_struct as 'rcu_read_unlock_special'.
 */
5291d082fd0SPaul E. McKenney union rcu_special {
5301d082fd0SPaul E. McKenney 	struct {
5318203d6d0SPaul E. McKenney 		u8			blocked;
5328203d6d0SPaul E. McKenney 		u8			need_qs;
5338203d6d0SPaul E. McKenney 		u8			exp_need_qs;
5345eca1c10SIngo Molnar 
5355eca1c10SIngo Molnar 		/* Otherwise the compiler can store garbage here: */
5365eca1c10SIngo Molnar 		u8			pad;
5378203d6d0SPaul E. McKenney 	} b; /* Bits. */
5388203d6d0SPaul E. McKenney 	u32 s; /* Set of bits. */
5391d082fd0SPaul E. McKenney };
54086848966SPaul E. McKenney 
/*
 * Identifiers of the per-task perf event contexts.
 *
 * perf_invalid_context is -1; the valid contexts count up from 0, so
 * perf_nr_task_contexts (2) equals the number of valid contexts and must
 * stay the last enumerator.
 */
5418dc85d54SPeter Zijlstra enum perf_event_task_context {
5428dc85d54SPeter Zijlstra 	perf_invalid_context = -1,
5438dc85d54SPeter Zijlstra 	perf_hw_context = 0,
54489a1e187SPeter Zijlstra 	perf_sw_context,
5458dc85d54SPeter Zijlstra 	perf_nr_task_contexts,
5468dc85d54SPeter Zijlstra };
5478dc85d54SPeter Zijlstra 
/*
 * Link of a singly linked list: the only member is the pointer to the next
 * node.
 * NOTE(review): presumably embedded in task_struct to queue tasks for a
 * deferred wakeup; that use is not visible in this part of the file.
 */
548eb61baf6SIngo Molnar struct wake_q_node {
549eb61baf6SIngo Molnar 	struct wake_q_node *next;
550eb61baf6SIngo Molnar };
551eb61baf6SIngo Molnar 
5521da177e4SLinus Torvalds struct task_struct {
553c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
554c65eacbeSAndy Lutomirski 	/*
555c65eacbeSAndy Lutomirski 	 * For reasons of header soup (see current_thread_info()), this
556c65eacbeSAndy Lutomirski 	 * must be the first element of task_struct.
557c65eacbeSAndy Lutomirski 	 */
558c65eacbeSAndy Lutomirski 	struct thread_info		thread_info;
559c65eacbeSAndy Lutomirski #endif
5605eca1c10SIngo Molnar 	/* -1 unrunnable, 0 runnable, >0 stopped: */
5615eca1c10SIngo Molnar 	volatile long			state;
56229e48ce8SKees Cook 
56329e48ce8SKees Cook 	/*
56429e48ce8SKees Cook 	 * This begins the randomizable portion of task_struct. Only
56529e48ce8SKees Cook 	 * scheduling-critical items should be added above here.
56629e48ce8SKees Cook 	 */
56729e48ce8SKees Cook 	randomized_struct_fields_start
56829e48ce8SKees Cook 
569f7e4217bSRoman Zippel 	void				*stack;
5701da177e4SLinus Torvalds 	atomic_t			usage;
5715eca1c10SIngo Molnar 	/* Per task flags (PF_*), defined further below: */
5725eca1c10SIngo Molnar 	unsigned int			flags;
57397dc32cdSWilliam Cohen 	unsigned int			ptrace;
5741da177e4SLinus Torvalds 
5752dd73a4fSPeter Williams #ifdef CONFIG_SMP
576fa14ff4aSPeter Zijlstra 	struct llist_node		wake_entry;
5773ca7a440SPeter Zijlstra 	int				on_cpu;
578c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
5795eca1c10SIngo Molnar 	/* Current CPU: */
5805eca1c10SIngo Molnar 	unsigned int			cpu;
581c65eacbeSAndy Lutomirski #endif
58263b0e9edSMike Galbraith 	unsigned int			wakee_flips;
58362470419SMichael Wang 	unsigned long			wakee_flip_decay_ts;
58463b0e9edSMike Galbraith 	struct task_struct		*last_wakee;
585ac66f547SPeter Zijlstra 
58632e839ddSMel Gorman 	/*
58732e839ddSMel Gorman 	 * recent_used_cpu is initially set as the last CPU used by a task
58832e839ddSMel Gorman 	 * that wakes affine another task. Waker/wakee relationships can
58932e839ddSMel Gorman 	 * push tasks around a CPU where each wakeup moves to the next one.
59032e839ddSMel Gorman 	 * Tracking a recently used CPU allows a quick search for a recently
59132e839ddSMel Gorman 	 * used CPU that may be idle.
59232e839ddSMel Gorman 	 */
59332e839ddSMel Gorman 	int				recent_used_cpu;
594ac66f547SPeter Zijlstra 	int				wake_cpu;
5954866cde0SNick Piggin #endif
596fd2f4419SPeter Zijlstra 	int				on_rq;
59750e645a8SIngo Molnar 
5985eca1c10SIngo Molnar 	int				prio;
5995eca1c10SIngo Molnar 	int				static_prio;
6005eca1c10SIngo Molnar 	int				normal_prio;
601c7aceabaSRichard Kennedy 	unsigned int			rt_priority;
6025eca1c10SIngo Molnar 
6035522d5d5SIngo Molnar 	const struct sched_class	*sched_class;
60420b8a59fSIngo Molnar 	struct sched_entity		se;
605fa717060SPeter Zijlstra 	struct sched_rt_entity		rt;
6068323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED
6078323f26cSPeter Zijlstra 	struct task_group		*sched_task_group;
6088323f26cSPeter Zijlstra #endif
609aab03e05SDario Faggioli 	struct sched_dl_entity		dl;
6101da177e4SLinus Torvalds 
611e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS
6125eca1c10SIngo Molnar 	/* List of struct preempt_notifier: */
613e107be36SAvi Kivity 	struct hlist_head		preempt_notifiers;
614e107be36SAvi Kivity #endif
615e107be36SAvi Kivity 
6166c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE
6172056a782SJens Axboe 	unsigned int			btrace_seq;
6186c5c9341SAlexey Dobriyan #endif
6191da177e4SLinus Torvalds 
62097dc32cdSWilliam Cohen 	unsigned int			policy;
62129baa747SPeter Zijlstra 	int				nr_cpus_allowed;
6221da177e4SLinus Torvalds 	cpumask_t			cpus_allowed;
6231da177e4SLinus Torvalds 
624a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU
625e260be67SPaul E. McKenney 	int				rcu_read_lock_nesting;
6261d082fd0SPaul E. McKenney 	union rcu_special		rcu_read_unlock_special;
627f41d911fSPaul E. McKenney 	struct list_head		rcu_node_entry;
628a57eb940SPaul E. McKenney 	struct rcu_node			*rcu_blocked_node;
62928f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */
6305eca1c10SIngo Molnar 
6318315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU
6328315f422SPaul E. McKenney 	unsigned long			rcu_tasks_nvcsw;
633ccdd29ffSPaul E. McKenney 	u8				rcu_tasks_holdout;
634ccdd29ffSPaul E. McKenney 	u8				rcu_tasks_idx;
635176f8f7aSPaul E. McKenney 	int				rcu_tasks_idle_cpu;
636ccdd29ffSPaul E. McKenney 	struct list_head		rcu_tasks_holdout_list;
6378315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */
638e260be67SPaul E. McKenney 
6391da177e4SLinus Torvalds 	struct sched_info		sched_info;
6401da177e4SLinus Torvalds 
6411da177e4SLinus Torvalds 	struct list_head		tasks;
642806c09a7SDario Faggioli #ifdef CONFIG_SMP
643917b627dSGregory Haskins 	struct plist_node		pushable_tasks;
6441baca4ceSJuri Lelli 	struct rb_node			pushable_dl_tasks;
645806c09a7SDario Faggioli #endif
6461da177e4SLinus Torvalds 
6475eca1c10SIngo Molnar 	struct mm_struct		*mm;
6485eca1c10SIngo Molnar 	struct mm_struct		*active_mm;
649314ff785SIngo Molnar 
650314ff785SIngo Molnar 	/* Per-thread vma caching: */
651314ff785SIngo Molnar 	struct vmacache			vmacache;
652314ff785SIngo Molnar 
6535eca1c10SIngo Molnar #ifdef SPLIT_RSS_COUNTING
65434e55232SKAMEZAWA Hiroyuki 	struct task_rss_stat		rss_stat;
65534e55232SKAMEZAWA Hiroyuki #endif
65697dc32cdSWilliam Cohen 	int				exit_state;
6575eca1c10SIngo Molnar 	int				exit_code;
6585eca1c10SIngo Molnar 	int				exit_signal;
6595eca1c10SIngo Molnar 	/* The signal sent when the parent dies: */
6605eca1c10SIngo Molnar 	int				pdeath_signal;
6615eca1c10SIngo Molnar 	/* JOBCTL_*, siglock protected: */
6625eca1c10SIngo Molnar 	unsigned long			jobctl;
6639b89f6baSAndrei Epure 
6645eca1c10SIngo Molnar 	/* Used for emulating ABI behavior of previous Linux versions: */
66597dc32cdSWilliam Cohen 	unsigned int			personality;
6669b89f6baSAndrei Epure 
6675eca1c10SIngo Molnar 	/* Scheduler bits, serialized by scheduler locks: */
668ca94c442SLennart Poettering 	unsigned			sched_reset_on_fork:1;
669a8e4f2eaSPeter Zijlstra 	unsigned			sched_contributes_to_load:1;
670ff303e66SPeter Zijlstra 	unsigned			sched_migrated:1;
671b7e7ade3SPeter Zijlstra 	unsigned			sched_remote_wakeup:1;
6725eca1c10SIngo Molnar 	/* Force alignment to the next boundary: */
6735eca1c10SIngo Molnar 	unsigned			:0;
674be958bdcSPeter Zijlstra 
6755eca1c10SIngo Molnar 	/* Unserialized, strictly 'current' */
6765eca1c10SIngo Molnar 
6775eca1c10SIngo Molnar 	/* Bit to tell LSMs we're in execve(): */
6785eca1c10SIngo Molnar 	unsigned			in_execve:1;
679be958bdcSPeter Zijlstra 	unsigned			in_iowait:1;
6805eca1c10SIngo Molnar #ifndef TIF_RESTORE_SIGMASK
6817e781418SAndy Lutomirski 	unsigned			restore_sigmask:1;
6827e781418SAndy Lutomirski #endif
683626ebc41STejun Heo #ifdef CONFIG_MEMCG
684626ebc41STejun Heo 	unsigned			memcg_may_oom:1;
685127424c8SJohannes Weiner #ifndef CONFIG_SLOB
6866f185c29SVladimir Davydov 	unsigned			memcg_kmem_skip_account:1;
6876f185c29SVladimir Davydov #endif
688127424c8SJohannes Weiner #endif
689ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK
690ff303e66SPeter Zijlstra 	unsigned			brk_randomized:1;
691ff303e66SPeter Zijlstra #endif
69277f88796STejun Heo #ifdef CONFIG_CGROUPS
69377f88796STejun Heo 	/* disallow userland-initiated cgroup migration */
69477f88796STejun Heo 	unsigned			no_cgroup_migration:1;
69577f88796STejun Heo #endif
6966f185c29SVladimir Davydov 
6975eca1c10SIngo Molnar 	unsigned long			atomic_flags; /* Flags requiring atomic access. */
6981d4457f9SKees Cook 
699f56141e3SAndy Lutomirski 	struct restart_block		restart_block;
700f56141e3SAndy Lutomirski 
7011da177e4SLinus Torvalds 	pid_t				pid;
7021da177e4SLinus Torvalds 	pid_t				tgid;
7030a425405SArjan van de Ven 
7041314562aSHiroshi Shimamoto #ifdef CONFIG_CC_STACKPROTECTOR
7055eca1c10SIngo Molnar 	/* Canary value for the -fstack-protector GCC feature: */
7060a425405SArjan van de Ven 	unsigned long			stack_canary;
7071314562aSHiroshi Shimamoto #endif
7081da177e4SLinus Torvalds 	/*
7095eca1c10SIngo Molnar 	 * Pointers to the (original) parent process, youngest child, younger sibling,
7101da177e4SLinus Torvalds 	 * older sibling, respectively.  (p->father can be replaced with
711f470021aSRoland McGrath 	 * p->real_parent->pid)
7121da177e4SLinus Torvalds 	 */
7135eca1c10SIngo Molnar 
7145eca1c10SIngo Molnar 	/* Real parent process: */
7155eca1c10SIngo Molnar 	struct task_struct __rcu	*real_parent;
7165eca1c10SIngo Molnar 
7175eca1c10SIngo Molnar 	/* Recipient of SIGCHLD, wait4() reports: */
7185eca1c10SIngo Molnar 	struct task_struct __rcu	*parent;
7191da177e4SLinus Torvalds 
720f470021aSRoland McGrath 	/*
7215eca1c10SIngo Molnar 	 * Children/sibling form the list of natural children:
7225eca1c10SIngo Molnar 	 */
7235eca1c10SIngo Molnar 	struct list_head		children;
7245eca1c10SIngo Molnar 	struct list_head		sibling;
7255eca1c10SIngo Molnar 	struct task_struct		*group_leader;
7265eca1c10SIngo Molnar 
7275eca1c10SIngo Molnar 	/*
7285eca1c10SIngo Molnar 	 * 'ptraced' is the list of tasks this task is using ptrace() on.
7295eca1c10SIngo Molnar 	 *
730f470021aSRoland McGrath 	 * This includes both natural children and PTRACE_ATTACH targets.
7315eca1c10SIngo Molnar 	 * 'ptrace_entry' is this task's link on the p->parent->ptraced list.
732f470021aSRoland McGrath 	 */
733f470021aSRoland McGrath 	struct list_head		ptraced;
734f470021aSRoland McGrath 	struct list_head		ptrace_entry;
735f470021aSRoland McGrath 
7361da177e4SLinus Torvalds 	/* PID/PID hash table linkage. */
73792476d7fSEric W. Biederman 	struct pid_link			pids[PIDTYPE_MAX];
73847e65328SOleg Nesterov 	struct list_head		thread_group;
7390c740d0aSOleg Nesterov 	struct list_head		thread_node;
7401da177e4SLinus Torvalds 
7415eca1c10SIngo Molnar 	struct completion		*vfork_done;
7421da177e4SLinus Torvalds 
7435eca1c10SIngo Molnar 	/* CLONE_CHILD_SETTID: */
7445eca1c10SIngo Molnar 	int __user			*set_child_tid;
7455eca1c10SIngo Molnar 
7465eca1c10SIngo Molnar 	/* CLONE_CHILD_CLEARTID: */
7475eca1c10SIngo Molnar 	int __user			*clear_child_tid;
7485eca1c10SIngo Molnar 
7495eca1c10SIngo Molnar 	u64				utime;
7505eca1c10SIngo Molnar 	u64				stime;
75140565b5aSStanislaw Gruszka #ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME
7525eca1c10SIngo Molnar 	u64				utimescaled;
7535eca1c10SIngo Molnar 	u64				stimescaled;
75440565b5aSStanislaw Gruszka #endif
75516a6d9beSFrederic Weisbecker 	u64				gtime;
7569d7fb042SPeter Zijlstra 	struct prev_cputime		prev_cputime;
7576a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
758bac5b6b6SFrederic Weisbecker 	struct vtime			vtime;
7596a61671bSFrederic Weisbecker #endif
760d027d45dSFrederic Weisbecker 
761d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL
762f009a7a7SFrederic Weisbecker 	atomic_t			tick_dep_mask;
763d027d45dSFrederic Weisbecker #endif
7645eca1c10SIngo Molnar 	/* Context switch counts: */
7655eca1c10SIngo Molnar 	unsigned long			nvcsw;
7665eca1c10SIngo Molnar 	unsigned long			nivcsw;
7675eca1c10SIngo Molnar 
7685eca1c10SIngo Molnar 	/* Monotonic time in nsecs: */
7695eca1c10SIngo Molnar 	u64				start_time;
7705eca1c10SIngo Molnar 
7715eca1c10SIngo Molnar 	/* Boot based time in nsecs: */
7725eca1c10SIngo Molnar 	u64				real_start_time;
7735eca1c10SIngo Molnar 
7745eca1c10SIngo Molnar 	/* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */
7755eca1c10SIngo Molnar 	unsigned long			min_flt;
7765eca1c10SIngo Molnar 	unsigned long			maj_flt;
7771da177e4SLinus Torvalds 
778b18b6a9cSNicolas Pitre #ifdef CONFIG_POSIX_TIMERS
779f06febc9SFrank Mayhar 	struct task_cputime		cputime_expires;
7801da177e4SLinus Torvalds 	struct list_head		cpu_timers[3];
781b18b6a9cSNicolas Pitre #endif
7821da177e4SLinus Torvalds 
7835eca1c10SIngo Molnar 	/* Process credentials: */
7845eca1c10SIngo Molnar 
7855eca1c10SIngo Molnar 	/* Tracer's credentials at attach: */
7865eca1c10SIngo Molnar 	const struct cred __rcu		*ptracer_cred;
7875eca1c10SIngo Molnar 
7885eca1c10SIngo Molnar 	/* Objective and real subjective task credentials (COW): */
7895eca1c10SIngo Molnar 	const struct cred __rcu		*real_cred;
7905eca1c10SIngo Molnar 
7915eca1c10SIngo Molnar 	/* Effective (overridable) subjective task credentials (COW): */
7925eca1c10SIngo Molnar 	const struct cred __rcu		*cred;
7935eca1c10SIngo Molnar 
7945eca1c10SIngo Molnar 	/*
7955eca1c10SIngo Molnar 	 * executable name, excluding path.
7965eca1c10SIngo Molnar 	 *
7975eca1c10SIngo Molnar 	 * - normally initialized setup_new_exec()
7985eca1c10SIngo Molnar 	 * - access it with [gs]et_task_comm()
7995eca1c10SIngo Molnar 	 * - lock it with task_lock()
8005eca1c10SIngo Molnar 	 */
8015eca1c10SIngo Molnar 	char				comm[TASK_COMM_LEN];
8025eca1c10SIngo Molnar 
803756daf26SNeilBrown 	struct nameidata		*nameidata;
8045eca1c10SIngo Molnar 
8053d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC
8061da177e4SLinus Torvalds 	struct sysv_sem			sysvsem;
807ab602f79SJack Miller 	struct sysv_shm			sysvshm;
8083d5b6fccSAlexey Dobriyan #endif
809e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK
81082a1fcb9SIngo Molnar 	unsigned long			last_switch_count;
81182a1fcb9SIngo Molnar #endif
8125eca1c10SIngo Molnar 	/* Filesystem information: */
8131da177e4SLinus Torvalds 	struct fs_struct		*fs;
8145eca1c10SIngo Molnar 
8155eca1c10SIngo Molnar 	/* Open file information: */
8161da177e4SLinus Torvalds 	struct files_struct		*files;
8175eca1c10SIngo Molnar 
8185eca1c10SIngo Molnar 	/* Namespaces: */
819ab516013SSerge E. Hallyn 	struct nsproxy			*nsproxy;
8205eca1c10SIngo Molnar 
8215eca1c10SIngo Molnar 	/* Signal handlers: */
8221da177e4SLinus Torvalds 	struct signal_struct		*signal;
8231da177e4SLinus Torvalds 	struct sighand_struct		*sighand;
8245eca1c10SIngo Molnar 	sigset_t			blocked;
8255eca1c10SIngo Molnar 	sigset_t			real_blocked;
8265eca1c10SIngo Molnar 	/* Restored if set_restore_sigmask() was used: */
8275eca1c10SIngo Molnar 	sigset_t			saved_sigmask;
8281da177e4SLinus Torvalds 	struct sigpending		pending;
8291da177e4SLinus Torvalds 	unsigned long			sas_ss_sp;
8301da177e4SLinus Torvalds 	size_t				sas_ss_size;
8315eca1c10SIngo Molnar 	unsigned int			sas_ss_flags;
8322e01fabeSOleg Nesterov 
83367d12145SAl Viro 	struct callback_head		*task_works;
834e73f8959SOleg Nesterov 
8351da177e4SLinus Torvalds 	struct audit_context		*audit_context;
836bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL
837e1760bd5SEric W. Biederman 	kuid_t				loginuid;
8384746ec5bSEric Paris 	unsigned int			sessionid;
839bfef93a5SAl Viro #endif
840932ecebbSWill Drewry 	struct seccomp			seccomp;
8411da177e4SLinus Torvalds 
8425eca1c10SIngo Molnar 	/* Thread group tracking: */
8431da177e4SLinus Torvalds 	u32				parent_exec_id;
8441da177e4SLinus Torvalds 	u32				self_exec_id;
8455eca1c10SIngo Molnar 
8465eca1c10SIngo Molnar 	/* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */
8471da177e4SLinus Torvalds 	spinlock_t			alloc_lock;
8481da177e4SLinus Torvalds 
849b29739f9SIngo Molnar 	/* Protection of the PI data structures: */
8501d615482SThomas Gleixner 	raw_spinlock_t			pi_lock;
851b29739f9SIngo Molnar 
85276751049SPeter Zijlstra 	struct wake_q_node		wake_q;
85376751049SPeter Zijlstra 
85423f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES
8555eca1c10SIngo Molnar 	/* PI waiters blocked on a rt_mutex held by this task: */
856a23ba907SDavidlohr Bueso 	struct rb_root_cached		pi_waiters;
857e96a7705SXunlei Pang 	/* Updated under owner's pi_lock and rq lock */
858e96a7705SXunlei Pang 	struct task_struct		*pi_top_task;
8595eca1c10SIngo Molnar 	/* Deadlock detection and priority inheritance handling: */
86023f78d4aSIngo Molnar 	struct rt_mutex_waiter		*pi_blocked_on;
86123f78d4aSIngo Molnar #endif
86223f78d4aSIngo Molnar 
863408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES
8645eca1c10SIngo Molnar 	/* Mutex deadlock detection: */
865408894eeSIngo Molnar 	struct mutex_waiter		*blocked_on;
866408894eeSIngo Molnar #endif
8675eca1c10SIngo Molnar 
868de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS
869de30a2b3SIngo Molnar 	unsigned int			irq_events;
870de30a2b3SIngo Molnar 	unsigned long			hardirq_enable_ip;
871de30a2b3SIngo Molnar 	unsigned long			hardirq_disable_ip;
872fa1452e8SHiroshi Shimamoto 	unsigned int			hardirq_enable_event;
873de30a2b3SIngo Molnar 	unsigned int			hardirq_disable_event;
874fa1452e8SHiroshi Shimamoto 	int				hardirqs_enabled;
875de30a2b3SIngo Molnar 	int				hardirq_context;
876fa1452e8SHiroshi Shimamoto 	unsigned long			softirq_disable_ip;
877fa1452e8SHiroshi Shimamoto 	unsigned long			softirq_enable_ip;
878fa1452e8SHiroshi Shimamoto 	unsigned int			softirq_disable_event;
879fa1452e8SHiroshi Shimamoto 	unsigned int			softirq_enable_event;
880fa1452e8SHiroshi Shimamoto 	int				softirqs_enabled;
881de30a2b3SIngo Molnar 	int				softirq_context;
882de30a2b3SIngo Molnar #endif
8835eca1c10SIngo Molnar 
884fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP
885bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH			48UL
886fbb9ce95SIngo Molnar 	u64				curr_chain_key;
887fbb9ce95SIngo Molnar 	int				lockdep_depth;
888fbb9ce95SIngo Molnar 	unsigned int			lockdep_recursion;
889c7aceabaSRichard Kennedy 	struct held_lock		held_locks[MAX_LOCK_DEPTH];
890fbb9ce95SIngo Molnar #endif
8915eca1c10SIngo Molnar 
892c6d30853SAndrey Ryabinin #ifdef CONFIG_UBSAN
893c6d30853SAndrey Ryabinin 	unsigned int			in_ubsan;
894c6d30853SAndrey Ryabinin #endif
895408894eeSIngo Molnar 
8965eca1c10SIngo Molnar 	/* Journalling filesystem info: */
8971da177e4SLinus Torvalds 	void				*journal_info;
8981da177e4SLinus Torvalds 
8995eca1c10SIngo Molnar 	/* Stacked block device info: */
900bddd87c7SAkinobu Mita 	struct bio_list			*bio_list;
901d89d8796SNeil Brown 
90273c10101SJens Axboe #ifdef CONFIG_BLOCK
9035eca1c10SIngo Molnar 	/* Stack plugging: */
90473c10101SJens Axboe 	struct blk_plug			*plug;
90573c10101SJens Axboe #endif
90673c10101SJens Axboe 
9075eca1c10SIngo Molnar 	/* VM state: */
9081da177e4SLinus Torvalds 	struct reclaim_state		*reclaim_state;
9091da177e4SLinus Torvalds 
9101da177e4SLinus Torvalds 	struct backing_dev_info		*backing_dev_info;
9111da177e4SLinus Torvalds 
9121da177e4SLinus Torvalds 	struct io_context		*io_context;
9131da177e4SLinus Torvalds 
9145eca1c10SIngo Molnar 	/* Ptrace state: */
9151da177e4SLinus Torvalds 	unsigned long			ptrace_message;
9165eca1c10SIngo Molnar 	siginfo_t			*last_siginfo;
9175eca1c10SIngo Molnar 
9187c3ab738SAndrew Morton 	struct task_io_accounting	ioac;
9195eca1c10SIngo Molnar #ifdef CONFIG_TASK_XACCT
9205eca1c10SIngo Molnar 	/* Accumulated RSS usage: */
9215eca1c10SIngo Molnar 	u64				acct_rss_mem1;
9225eca1c10SIngo Molnar 	/* Accumulated virtual memory usage: */
9235eca1c10SIngo Molnar 	u64				acct_vm_mem1;
9245eca1c10SIngo Molnar 	/* stime + utime since last update: */
9255eca1c10SIngo Molnar 	u64				acct_timexpd;
9261da177e4SLinus Torvalds #endif
9271da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS
9285eca1c10SIngo Molnar 	/* Protected by ->alloc_lock: */
9295eca1c10SIngo Molnar 	nodemask_t			mems_allowed;
9305eca1c10SIngo Molnar 	/* Seqence number to catch updates: */
9315eca1c10SIngo Molnar 	seqcount_t			mems_allowed_seq;
932825a46afSPaul Jackson 	int				cpuset_mem_spread_rotor;
9336adef3ebSJack Steiner 	int				cpuset_slab_spread_rotor;
9341da177e4SLinus Torvalds #endif
935ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS
9365eca1c10SIngo Molnar 	/* Control Group info protected by css_set_lock: */
9372c392b8cSArnd Bergmann 	struct css_set __rcu		*cgroups;
9385eca1c10SIngo Molnar 	/* cg_list protected by css_set_lock and tsk->alloc_lock: */
939817929ecSPaul Menage 	struct list_head		cg_list;
940ddbcc7e8SPaul Menage #endif
941f01d7d51SVikas Shivappa #ifdef CONFIG_INTEL_RDT
9420734ded1SVikas Shivappa 	u32				closid;
943d6aaba61SVikas Shivappa 	u32				rmid;
944e02737d5SFenghua Yu #endif
94542b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX
9460771dfefSIngo Molnar 	struct robust_list_head __user	*robust_list;
94734f192c6SIngo Molnar #ifdef CONFIG_COMPAT
94834f192c6SIngo Molnar 	struct compat_robust_list_head __user *compat_robust_list;
94934f192c6SIngo Molnar #endif
950c87e2837SIngo Molnar 	struct list_head		pi_state_list;
951c87e2837SIngo Molnar 	struct futex_pi_state		*pi_state_cache;
95242b2dd0aSAlexey Dobriyan #endif
953cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS
9548dc85d54SPeter Zijlstra 	struct perf_event_context	*perf_event_ctxp[perf_nr_task_contexts];
955cdd6c482SIngo Molnar 	struct mutex			perf_event_mutex;
956cdd6c482SIngo Molnar 	struct list_head		perf_event_list;
957a63eaf34SPaul Mackerras #endif
9588f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT
9598f47b187SThomas Gleixner 	unsigned long			preempt_disable_ip;
9608f47b187SThomas Gleixner #endif
961c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA
9625eca1c10SIngo Molnar 	/* Protected by alloc_lock: */
9635eca1c10SIngo Molnar 	struct mempolicy		*mempolicy;
96445816682SVlastimil Babka 	short				il_prev;
965207205a2SEric Dumazet 	short				pref_node_fork;
966c7aceabaSRichard Kennedy #endif
967cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING
968cbee9f88SPeter Zijlstra 	int				numa_scan_seq;
969cbee9f88SPeter Zijlstra 	unsigned int			numa_scan_period;
970598f0ec0SMel Gorman 	unsigned int			numa_scan_period_max;
971de1c9ce6SRik van Riel 	int				numa_preferred_nid;
9726b9a7460SMel Gorman 	unsigned long			numa_migrate_retry;
9735eca1c10SIngo Molnar 	/* Migration stamp: */
9745eca1c10SIngo Molnar 	u64				node_stamp;
9757e2703e6SRik van Riel 	u64				last_task_numa_placement;
9767e2703e6SRik van Riel 	u64				last_sum_exec_runtime;
977cbee9f88SPeter Zijlstra 	struct callback_head		numa_work;
978f809ca9aSMel Gorman 
9798c8a743cSPeter Zijlstra 	struct list_head		numa_entry;
9808c8a743cSPeter Zijlstra 	struct numa_group		*numa_group;
9818c8a743cSPeter Zijlstra 
982745d6147SMel Gorman 	/*
98344dba3d5SIulia Manda 	 * numa_faults is an array split into four regions:
98444dba3d5SIulia Manda 	 * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer
98544dba3d5SIulia Manda 	 * in this precise order.
98644dba3d5SIulia Manda 	 *
98744dba3d5SIulia Manda 	 * faults_memory: Exponential decaying average of faults on a per-node
98844dba3d5SIulia Manda 	 * basis. Scheduling placement decisions are made based on these
98944dba3d5SIulia Manda 	 * counts. The values remain static for the duration of a PTE scan.
99044dba3d5SIulia Manda 	 * faults_cpu: Track the nodes the process was running on when a NUMA
99144dba3d5SIulia Manda 	 * hinting fault was incurred.
99244dba3d5SIulia Manda 	 * faults_memory_buffer and faults_cpu_buffer: Record faults per node
99344dba3d5SIulia Manda 	 * during the current scan window. When the scan completes, the counts
99444dba3d5SIulia Manda 	 * in faults_memory and faults_cpu decay and these values are copied.
995745d6147SMel Gorman 	 */
99644dba3d5SIulia Manda 	unsigned long			*numa_faults;
99783e1d2cdSMel Gorman 	unsigned long			total_numa_faults;
998745d6147SMel Gorman 
999745d6147SMel Gorman 	/*
100004bb2f94SRik van Riel 	 * numa_faults_locality tracks if faults recorded during the last
1001074c2381SMel Gorman 	 * scan window were remote/local or failed to migrate. The task scan
1002074c2381SMel Gorman 	 * period is adapted based on the locality of the faults with different
1003074c2381SMel Gorman 	 * weights depending on whether they were shared or private faults
100404bb2f94SRik van Riel 	 */
1005074c2381SMel Gorman 	unsigned long			numa_faults_locality[3];
100604bb2f94SRik van Riel 
1007b32e86b4SIngo Molnar 	unsigned long			numa_pages_migrated;
1008cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */
1009cbee9f88SPeter Zijlstra 
101072b252aeSMel Gorman 	struct tlbflush_unmap_batch	tlb_ubc;
101172b252aeSMel Gorman 
1012e56d0903SIngo Molnar 	struct rcu_head			rcu;
1013b92ce558SJens Axboe 
10145eca1c10SIngo Molnar 	/* Cache last used pipe for splice(): */
1015b92ce558SJens Axboe 	struct pipe_inode_info		*splice_pipe;
10165640f768SEric Dumazet 
10175640f768SEric Dumazet 	struct page_frag		task_frag;
10185640f768SEric Dumazet 
1019ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT
1020ca74e92bSShailabh Nagar 	struct task_delay_info		*delays;
1021ca74e92bSShailabh Nagar #endif
102247913d4eSIngo Molnar 
1023f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION
1024f4f154fdSAkinobu Mita 	int				make_it_fail;
10259049f2f6SAkinobu Mita 	unsigned int			fail_nth;
1026f4f154fdSAkinobu Mita #endif
10279d823e8fSWu Fengguang 	/*
10285eca1c10SIngo Molnar 	 * When (nr_dirtied >= nr_dirtied_pause), it's time to call
10295eca1c10SIngo Molnar 	 * balance_dirty_pages() for a dirty throttling pause:
10309d823e8fSWu Fengguang 	 */
10319d823e8fSWu Fengguang 	int				nr_dirtied;
10329d823e8fSWu Fengguang 	int				nr_dirtied_pause;
10335eca1c10SIngo Molnar 	/* Start of a write-and-pause period: */
10345eca1c10SIngo Molnar 	unsigned long			dirty_paused_when;
10359d823e8fSWu Fengguang 
10369745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP
10379745512cSArjan van de Ven 	int				latency_record_count;
10389745512cSArjan van de Ven 	struct latency_record		latency_record[LT_SAVECOUNT];
10399745512cSArjan van de Ven #endif
10406976675dSArjan van de Ven 	/*
10415eca1c10SIngo Molnar 	 * Time slack values; these are used to round up poll() and
10426976675dSArjan van de Ven 	 * select() etc timeout values. These are in nanoseconds.
10436976675dSArjan van de Ven 	 */
1044da8b44d5SJohn Stultz 	u64				timer_slack_ns;
1045da8b44d5SJohn Stultz 	u64				default_timer_slack_ns;
1046f8d570a4SDavid Miller 
10470b24beccSAndrey Ryabinin #ifdef CONFIG_KASAN
10480b24beccSAndrey Ryabinin 	unsigned int			kasan_depth;
10490b24beccSAndrey Ryabinin #endif
10505eca1c10SIngo Molnar 
1051fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER
10525eca1c10SIngo Molnar 	/* Index of current stored address in ret_stack: */
1053f201ae23SFrederic Weisbecker 	int				curr_ret_stack;
10545eca1c10SIngo Molnar 
10555eca1c10SIngo Molnar 	/* Stack of return addresses for return function tracing: */
1056f201ae23SFrederic Weisbecker 	struct ftrace_ret_stack		*ret_stack;
10575eca1c10SIngo Molnar 
10585eca1c10SIngo Molnar 	/* Timestamp for last schedule: */
10598aef2d28SSteven Rostedt 	unsigned long long		ftrace_timestamp;
10605eca1c10SIngo Molnar 
1061f201ae23SFrederic Weisbecker 	/*
1062f201ae23SFrederic Weisbecker 	 * Number of functions that haven't been traced
10635eca1c10SIngo Molnar 	 * because of depth overrun:
1064f201ae23SFrederic Weisbecker 	 */
1065f201ae23SFrederic Weisbecker 	atomic_t			trace_overrun;
10665eca1c10SIngo Molnar 
10675eca1c10SIngo Molnar 	/* Pause tracing: */
1068380c4b14SFrederic Weisbecker 	atomic_t			tracing_graph_pause;
1069f201ae23SFrederic Weisbecker #endif
10705eca1c10SIngo Molnar 
1071ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING
10725eca1c10SIngo Molnar 	/* State flags for use by tracers: */
1073ea4e2bc4SSteven Rostedt 	unsigned long			trace;
10745eca1c10SIngo Molnar 
10755eca1c10SIngo Molnar 	/* Bitmask and counter of trace recursion: */
1076261842b7SSteven Rostedt 	unsigned long			trace_recursion;
1077261842b7SSteven Rostedt #endif /* CONFIG_TRACING */
10785eca1c10SIngo Molnar 
10795c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV
10805eca1c10SIngo Molnar 	/* Coverage collection mode enabled for this task (0 if disabled): */
10815c9a8750SDmitry Vyukov 	enum kcov_mode			kcov_mode;
10825eca1c10SIngo Molnar 
10835eca1c10SIngo Molnar 	/* Size of the kcov_area: */
10845eca1c10SIngo Molnar 	unsigned int			kcov_size;
10855eca1c10SIngo Molnar 
10865eca1c10SIngo Molnar 	/* Buffer for coverage collection: */
10875c9a8750SDmitry Vyukov 	void				*kcov_area;
10885eca1c10SIngo Molnar 
10895eca1c10SIngo Molnar 	/* KCOV descriptor wired with this task or NULL: */
10905c9a8750SDmitry Vyukov 	struct kcov			*kcov;
10915c9a8750SDmitry Vyukov #endif
10925eca1c10SIngo Molnar 
10936f185c29SVladimir Davydov #ifdef CONFIG_MEMCG
1094626ebc41STejun Heo 	struct mem_cgroup		*memcg_in_oom;
1095626ebc41STejun Heo 	gfp_t				memcg_oom_gfp_mask;
1096626ebc41STejun Heo 	int				memcg_oom_order;
1097b23afb93STejun Heo 
10985eca1c10SIngo Molnar 	/* Number of pages to reclaim on returning to userland: */
1099b23afb93STejun Heo 	unsigned int			memcg_nr_pages_over_high;
1100569b846dSKAMEZAWA Hiroyuki #endif
11015eca1c10SIngo Molnar 
11020326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES
11030326f5a9SSrikar Dronamraju 	struct uprobe_task		*utask;
11040326f5a9SSrikar Dronamraju #endif
1105cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE)
1106cafe5635SKent Overstreet 	unsigned int			sequential_io;
1107cafe5635SKent Overstreet 	unsigned int			sequential_io_avg;
1108cafe5635SKent Overstreet #endif
11098eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
11108eb23b9fSPeter Zijlstra 	unsigned long			task_state_change;
11118eb23b9fSPeter Zijlstra #endif
11128bcbde54SDavid Hildenbrand 	int				pagefault_disabled;
111303049269SMichal Hocko #ifdef CONFIG_MMU
111429c696e1SVladimir Davydov 	struct task_struct		*oom_reaper_list;
111503049269SMichal Hocko #endif
1116ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK
1117ba14a194SAndy Lutomirski 	struct vm_struct		*stack_vm_area;
1118ba14a194SAndy Lutomirski #endif
111968f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
11205eca1c10SIngo Molnar 	/* A live task holds one reference: */
112168f24b08SAndy Lutomirski 	atomic_t			stack_refcount;
112268f24b08SAndy Lutomirski #endif
1123d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH
1124d83a7cb3SJosh Poimboeuf 	int patch_state;
1125d83a7cb3SJosh Poimboeuf #endif
1126e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY
1127e4e55b47STetsuo Handa 	/* Used by LSM modules for access restriction: */
1128e4e55b47STetsuo Handa 	void				*security;
1129e4e55b47STetsuo Handa #endif
113029e48ce8SKees Cook 
113129e48ce8SKees Cook 	/*
113229e48ce8SKees Cook 	 * New fields for task_struct should be added above here, so that
113329e48ce8SKees Cook 	 * they are included in the randomized portion of task_struct.
113429e48ce8SKees Cook 	 */
113529e48ce8SKees Cook 	randomized_struct_fields_end
113629e48ce8SKees Cook 
11375eca1c10SIngo Molnar 	/* CPU-specific state of this task: */
11380c8c0f03SDave Hansen 	struct thread_struct		thread;
11395eca1c10SIngo Molnar 
11400c8c0f03SDave Hansen 	/*
11410c8c0f03SDave Hansen 	 * WARNING: on x86, 'thread_struct' contains a variable-sized
11420c8c0f03SDave Hansen 	 * structure.  It *MUST* be at the end of 'task_struct'.
11430c8c0f03SDave Hansen 	 *
11440c8c0f03SDave Hansen 	 * Do not put anything below here!
11450c8c0f03SDave Hansen 	 */
11461da177e4SLinus Torvalds };
11471da177e4SLinus Torvalds 
1148e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task)
114922c935f4SEric W. Biederman {
115022c935f4SEric W. Biederman 	return task->pids[PIDTYPE_PID].pid;
115122c935f4SEric W. Biederman }
115222c935f4SEric W. Biederman 
1153e868171aSAlexey Dobriyan static inline struct pid *task_tgid(struct task_struct *task)
115422c935f4SEric W. Biederman {
115522c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_PID].pid;
115622c935f4SEric W. Biederman }
115722c935f4SEric W. Biederman 
11586dda81f4SOleg Nesterov /*
11595eca1c10SIngo Molnar  * Without tasklist or RCU lock it is not safe to dereference
11606dda81f4SOleg Nesterov  * the result of task_pgrp/task_session even if task == current,
11616dda81f4SOleg Nesterov  * we can race with another thread doing sys_setsid/sys_setpgid.
11626dda81f4SOleg Nesterov  */
1163e868171aSAlexey Dobriyan static inline struct pid *task_pgrp(struct task_struct *task)
116422c935f4SEric W. Biederman {
116522c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_PGID].pid;
116622c935f4SEric W. Biederman }
116722c935f4SEric W. Biederman 
1168e868171aSAlexey Dobriyan static inline struct pid *task_session(struct task_struct *task)
116922c935f4SEric W. Biederman {
117022c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_SID].pid;
117122c935f4SEric W. Biederman }
117222c935f4SEric W. Biederman 
11737af57294SPavel Emelyanov /*
11747af57294SPavel Emelyanov  * the helpers to get the task's different pids as they are seen
11757af57294SPavel Emelyanov  * from various namespaces
11767af57294SPavel Emelyanov  *
11777af57294SPavel Emelyanov  * task_xid_nr()     : global id, i.e. the id seen from the init namespace;
117844c4e1b2SEric W. Biederman  * task_xid_vnr()    : virtual id, i.e. the id seen from the pid namespace of
117944c4e1b2SEric W. Biederman  *                     current.
11807af57294SPavel Emelyanov  * task_xid_nr_ns()  : id seen from the ns specified;
11817af57294SPavel Emelyanov  *
11827af57294SPavel Emelyanov  * see also pid_nr() etc in include/linux/pid.h
11837af57294SPavel Emelyanov  */
11845eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns);
11857af57294SPavel Emelyanov 
1186e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk)
11877af57294SPavel Emelyanov {
11887af57294SPavel Emelyanov 	return tsk->pid;
11897af57294SPavel Emelyanov }
11907af57294SPavel Emelyanov 
11915eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
119252ee2dfdSOleg Nesterov {
119352ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
119452ee2dfdSOleg Nesterov }
11957af57294SPavel Emelyanov 
11967af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk)
11977af57294SPavel Emelyanov {
119852ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
11997af57294SPavel Emelyanov }
12007af57294SPavel Emelyanov 
12017af57294SPavel Emelyanov 
1202e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk)
12037af57294SPavel Emelyanov {
12047af57294SPavel Emelyanov 	return tsk->tgid;
12057af57294SPavel Emelyanov }
12067af57294SPavel Emelyanov 
12075eca1c10SIngo Molnar /**
12085eca1c10SIngo Molnar  * pid_alive - check that a task structure is not stale
12095eca1c10SIngo Molnar  * @p: Task structure to be checked.
12105eca1c10SIngo Molnar  *
12115eca1c10SIngo Molnar  * Test if a process is not yet dead (at most zombie state)
12125eca1c10SIngo Molnar  * If pid_alive fails, then pointers within the task structure
12135eca1c10SIngo Molnar  * can be stale and must not be dereferenced.
12145eca1c10SIngo Molnar  *
12155eca1c10SIngo Molnar  * Return: 1 if the process is alive. 0 otherwise.
12165eca1c10SIngo Molnar  */
12175eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p)
12185eca1c10SIngo Molnar {
12195eca1c10SIngo Molnar 	return p->pids[PIDTYPE_PID].pid != NULL;
12205eca1c10SIngo Molnar }
12217af57294SPavel Emelyanov 
12225eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
12237af57294SPavel Emelyanov {
122452ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
12257af57294SPavel Emelyanov }
12267af57294SPavel Emelyanov 
12277af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
12287af57294SPavel Emelyanov {
122952ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
12307af57294SPavel Emelyanov }
12317af57294SPavel Emelyanov 
12327af57294SPavel Emelyanov 
12335eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
12347af57294SPavel Emelyanov {
123552ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
12367af57294SPavel Emelyanov }
12377af57294SPavel Emelyanov 
12387af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk)
12397af57294SPavel Emelyanov {
124052ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
12417af57294SPavel Emelyanov }
12427af57294SPavel Emelyanov 
1243dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
1244dd1c1f2fSOleg Nesterov {
1245dd1c1f2fSOleg Nesterov 	return __task_pid_nr_ns(tsk, __PIDTYPE_TGID, ns);
1246dd1c1f2fSOleg Nesterov }
1247dd1c1f2fSOleg Nesterov 
1248dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk)
1249dd1c1f2fSOleg Nesterov {
1250dd1c1f2fSOleg Nesterov 	return __task_pid_nr_ns(tsk, __PIDTYPE_TGID, NULL);
1251dd1c1f2fSOleg Nesterov }
1252dd1c1f2fSOleg Nesterov 
1253dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns)
1254dd1c1f2fSOleg Nesterov {
1255dd1c1f2fSOleg Nesterov 	pid_t pid = 0;
1256dd1c1f2fSOleg Nesterov 
1257dd1c1f2fSOleg Nesterov 	rcu_read_lock();
1258dd1c1f2fSOleg Nesterov 	if (pid_alive(tsk))
1259dd1c1f2fSOleg Nesterov 		pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns);
1260dd1c1f2fSOleg Nesterov 	rcu_read_unlock();
1261dd1c1f2fSOleg Nesterov 
1262dd1c1f2fSOleg Nesterov 	return pid;
1263dd1c1f2fSOleg Nesterov }
1264dd1c1f2fSOleg Nesterov 
1265dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk)
1266dd1c1f2fSOleg Nesterov {
1267dd1c1f2fSOleg Nesterov 	return task_ppid_nr_ns(tsk, &init_pid_ns);
1268dd1c1f2fSOleg Nesterov }
1269dd1c1f2fSOleg Nesterov 
12705eca1c10SIngo Molnar /* Obsolete, do not use: */
12711b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk)
12721b0f7ffdSOleg Nesterov {
12731b0f7ffdSOleg Nesterov 	return task_pgrp_nr_ns(tsk, &init_pid_ns);
12741b0f7ffdSOleg Nesterov }
12757af57294SPavel Emelyanov 
/*
 * TASK_REPORT_IDLE: the reporting value task_state_index() substitutes
 * for tasks whose state is exactly TASK_IDLE.
 * TASK_REPORT_MAX: TASK_REPORT_IDLE shifted left by one; it is checked
 * at build time to be a power of two.
 */
#define TASK_REPORT_IDLE	(TASK_REPORT + 1)
#define TASK_REPORT_MAX		(TASK_REPORT_IDLE << 1)
127806eb6184SPeter Zijlstra 
12791d48b080SPeter Zijlstra static inline unsigned int task_state_index(struct task_struct *tsk)
128020435d84SXie XiuQi {
12811593baabSPeter Zijlstra 	unsigned int tsk_state = READ_ONCE(tsk->state);
12821593baabSPeter Zijlstra 	unsigned int state = (tsk_state | tsk->exit_state) & TASK_REPORT;
128320435d84SXie XiuQi 
128406eb6184SPeter Zijlstra 	BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX);
128506eb6184SPeter Zijlstra 
128606eb6184SPeter Zijlstra 	if (tsk_state == TASK_IDLE)
128706eb6184SPeter Zijlstra 		state = TASK_REPORT_IDLE;
128806eb6184SPeter Zijlstra 
12891593baabSPeter Zijlstra 	return fls(state);
12901593baabSPeter Zijlstra }
129120435d84SXie XiuQi 
12921d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state)
12931593baabSPeter Zijlstra {
12948ef9925bSPeter Zijlstra 	static const char state_char[] = "RSDTtXZPI";
12951593baabSPeter Zijlstra 
129606eb6184SPeter Zijlstra 	BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1);
12971593baabSPeter Zijlstra 
12981593baabSPeter Zijlstra 	return state_char[state];
12991593baabSPeter Zijlstra }
13001593baabSPeter Zijlstra 
/* One-letter state code for @tsk. */
static inline char task_state_to_char(struct task_struct *tsk)
{
	unsigned int idx = task_state_index(tsk);

	return task_index_to_char(idx);
}
130520435d84SXie XiuQi 
/**
 * is_global_init - check whether a task structure belongs to init
 * @tsk: Task structure to be checked.
 *
 * Check if a task structure is the first user space task the kernel
 * created.  Since init is free to have sub-threads, the thread-group id
 * (tgid) is what gets compared.
 *
 * Return: 1 if the task structure is init. 0 otherwise.
 */
static inline int is_global_init(struct task_struct *tsk)
{
	pid_t tgid = task_tgid_nr(tsk);

	return tgid == 1;
}
1319b460cbc5SSerge E. Hallyn 
/*
 * Declared here, defined elsewhere.
 * NOTE(review): presumably the pid signalled on ctrl-alt-del - confirm
 * against the definition.
 */
extern struct pid *cad_pid;
13219ec52099SCedric Le Goater 
/*
 * Per process flags (bit masks for tsk->flags).
 *
 * Bits 0x00000001, 0x01000000, 0x02000000 and 0x10000000 are not
 * assigned in this list.
 */
#define PF_IDLE			0x00000002	/* Task is an idle thread */
#define PF_EXITING		0x00000004	/* Task is getting shut down */
#define PF_EXITPIDONE		0x00000008	/* PI exit done on shut down */
#define PF_VCPU			0x00000010	/* Task is a virtual CPU */
#define PF_WQ_WORKER		0x00000020	/* Task is a workqueue worker */
#define PF_FORKNOEXEC		0x00000040	/* Forked but did not exec */
#define PF_MCE_PROCESS		0x00000080	/* Process policy on mce errors */
#define PF_SUPERPRIV		0x00000100	/* Used super-user privileges */
#define PF_DUMPCORE		0x00000200	/* Dumped core */
#define PF_SIGNALED		0x00000400	/* Killed by a signal */
#define PF_MEMALLOC		0x00000800	/* Allocating memory */
#define PF_NPROC_EXCEEDED	0x00001000	/* set_user() noticed that RLIMIT_NPROC was exceeded */
#define PF_USED_MATH		0x00002000	/* If unset, the fpu must be initialized before use */
#define PF_USED_ASYNC		0x00004000	/* Used async_schedule*(), used by module init */
#define PF_NOFREEZE		0x00008000	/* This thread should not be frozen */
#define PF_FROZEN		0x00010000	/* Frozen for system suspend */
#define PF_KSWAPD		0x00020000	/* Task is kswapd */
#define PF_MEMALLOC_NOFS	0x00040000	/* All allocation requests will inherit GFP_NOFS */
#define PF_MEMALLOC_NOIO	0x00080000	/* All allocation requests will inherit GFP_NOIO */
#define PF_LESS_THROTTLE	0x00100000	/* Throttle this task less: it cleans memory */
#define PF_KTHREAD		0x00200000	/* Task is a kernel thread */
#define PF_RANDOMIZE		0x00400000	/* Randomize virtual address space */
#define PF_SWAPWRITE		0x00800000	/* Allowed to write to swap */
#define PF_NO_SETAFFINITY	0x04000000	/* Userland is not allowed to meddle with cpus_allowed */
#define PF_MCE_EARLY		0x08000000	/* Early kill for mce process policy */
#define PF_MUTEX_TESTER		0x20000000	/* Thread belongs to the rt mutex tester */
#define PF_FREEZER_SKIP		0x40000000	/* Freezer should not count it as freezable */
#define PF_SUSPEND_TASK		0x80000000	/* This thread called freeze_processes() and should not be frozen */
13531da177e4SLinus Torvalds 
/*
 * As a rule only the _current_ task may read and write tsk->flags; other
 * tasks may only read it (for example through tsk_used_math(), as happens
 * during threaded core dumping).
 *
 * ptrace and fork are the exceptions: a ptracer may write the flags of
 * its traced child, and a forking parent may write the flags of its new
 * child, because in both cases the child is guaranteed not to be running
 * and therefore cannot be modifying child->flags concurrently.
 */
#define clear_stopped_child_used_math(child)	\
	do { (child)->flags &= ~PF_USED_MATH; } while (0)
#define set_stopped_child_used_math(child)	\
	do { (child)->flags |= PF_USED_MATH; } while (0)
#define clear_used_math()			clear_stopped_child_used_math(current)
#define set_used_math()				set_stopped_child_used_math(current)

/* Set PF_USED_MATH in @child iff @condition is true, clear it otherwise. */
#define conditional_stopped_child_used_math(condition, child)		\
	do {								\
		(child)->flags &= ~PF_USED_MATH;			\
		(child)->flags |= (condition) ? PF_USED_MATH : 0;	\
	} while (0)

#define conditional_used_math(condition)	conditional_stopped_child_used_math(condition, current)

/* Make @child's PF_USED_MATH bit a copy of current's. */
#define copy_to_stopped_child_used_math(child)				\
	do {								\
		(child)->flags &= ~PF_USED_MATH;			\
		(child)->flags |= current->flags & PF_USED_MATH;	\
	} while (0)

/* NOTE: this evaluates to 0 or PF_USED_MATH, it never evaluates to 1 */
#define tsk_used_math(p)			((p)->flags & PF_USED_MATH)
#define used_math()				tsk_used_math(current)
13811da177e4SLinus Torvalds 
/*
 * True when the current task has PF_NO_SETAFFINITY set and is allowed on
 * exactly one CPU.  Always true when CONFIG_SMP is not set.
 */
static inline bool is_percpu_thread(void)
{
#ifdef CONFIG_SMP
	if (!(current->flags & PF_NO_SETAFFINITY))
		return false;

	return current->nr_cpus_allowed == 1;
#else
	return true;
#endif
}
139162ec05ddSThomas Gleixner 
/*
 * Per-process atomic flags.  These are bit numbers (not masks) used with
 * the bit operations on p->atomic_flags by the TASK_PFA_*() helpers.
 */
#define PFA_NO_NEW_PRIVS		0	/* May not gain new privileges */
#define PFA_SPREAD_PAGE			1	/* Spread page cache over cpuset */
#define PFA_SPREAD_SLAB			2	/* Spread some slab caches over cpuset */
#define PFA_SPEC_SSB_DISABLE		3	/* Speculative Store Bypass disabled */
#define PFA_SPEC_SSB_FORCE_DISABLE	4	/* Speculative Store Bypass force disabled */
13981d4457f9SKees Cook 
/*
 * Generators for the per-flag accessors.  For a flag PFA_<name> and a
 * suffix <func> they emit, respectively:
 *
 *   bool task_<func>(p)        - test_bit() on p->atomic_flags
 *   void task_set_<func>(p)    - set_bit() on p->atomic_flags
 *   void task_clear_<func>(p)  - clear_bit() on p->atomic_flags
 */
#define TASK_PFA_TEST(name, func)					\
	static inline bool task_##func(struct task_struct *p)		\
	{								\
		return test_bit(PFA_##name, &p->atomic_flags);		\
	}

#define TASK_PFA_SET(name, func)					\
	static inline void task_set_##func(struct task_struct *p)	\
	{								\
		set_bit(PFA_##name, &p->atomic_flags);			\
	}

#define TASK_PFA_CLEAR(name, func)					\
	static inline void task_clear_##func(struct task_struct *p)	\
	{								\
		clear_bit(PFA_##name, &p->atomic_flags);		\
	}
14101d4457f9SKees Cook 
1411e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs)
1412e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs)
14131d4457f9SKees Cook 
14142ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page)
14152ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page)
14162ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
14172ad654bcSZefan Li 
14182ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
14192ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab)
14202ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
1421544b2c91STejun Heo 
1422*356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable)
1423*356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable)
1424*356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable)
1425*356e4bffSThomas Gleixner 
1426*356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1427*356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1428*356e4bffSThomas Gleixner 
14295eca1c10SIngo Molnar static inline void
1430717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags)
1431907aed48SMel Gorman {
1432717a94b5SNeilBrown 	current->flags &= ~flags;
1433717a94b5SNeilBrown 	current->flags |= orig_flags & flags;
1434907aed48SMel Gorman }
1435907aed48SMel Gorman 
/* Declared for both SMP and UP builds; defined outside this header. */
int cpuset_cpumask_can_shrink(const struct cpumask *cur,
			      const struct cpumask *trial);
int task_can_attach(struct task_struct *p,
		    const struct cpumask *cs_cpus_allowed);
/*
 * CPU affinity setters.  On SMP these are out-of-line functions.  On UP
 * do_set_cpus_allowed() does nothing and set_cpus_allowed_ptr() only
 * checks that CPU 0 is in @new_mask, returning -EINVAL if it is not.
 */
#ifdef CONFIG_SMP
void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask);
int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask);
#else
static inline void
do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask)
{
}

static inline int
set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask)
{
	return cpumask_test_cpu(0, new_mask) ? 0 : -EINVAL;
}
#endif
1452e0ad9556SRusty Russell 
/* Fall back to cpu_relax() when cpu_relax_yield() is not already defined. */
#ifndef cpu_relax_yield
# define cpu_relax_yield()	cpu_relax()
#endif
14566d0d2878SChristian Borntraeger 
/* Scheduler entry points declared here and defined outside this header. */
int yield_to(struct task_struct *p, bool preempt);
void set_user_nice(struct task_struct *p, long nice);
int task_prio(const struct task_struct *p);
14605eca1c10SIngo Molnar 
1461d0ea0268SDongsheng Yang /**
1462d0ea0268SDongsheng Yang  * task_nice - return the nice value of a given task.
1463d0ea0268SDongsheng Yang  * @p: the task in question.
1464d0ea0268SDongsheng Yang  *
1465d0ea0268SDongsheng Yang  * Return: The nice value [ -20 ... 0 ... 19 ].
1466d0ea0268SDongsheng Yang  */
1467d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p)
1468d0ea0268SDongsheng Yang {
1469d0ea0268SDongsheng Yang 	return PRIO_TO_NICE((p)->static_prio);
1470d0ea0268SDongsheng Yang }
14715eca1c10SIngo Molnar 
/* Priority / policy queries and setters; defined outside this header. */
int can_nice(const struct task_struct *p, const int nice);
int task_curr(const struct task_struct *p);
int idle_cpu(int cpu);
int sched_setscheduler(struct task_struct *, int, const struct sched_param *);
int sched_setscheduler_nocheck(struct task_struct *, int,
			       const struct sched_param *);
int sched_setattr(struct task_struct *, const struct sched_attr *);
int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *);
struct task_struct *idle_task(int cpu);
14805eca1c10SIngo Molnar 
1481c4f30608SPaul E. McKenney /**
1482c4f30608SPaul E. McKenney  * is_idle_task - is the specified task an idle task?
1483fa757281SRandy Dunlap  * @p: the task in question.
1484e69f6186SYacine Belkadi  *
1485e69f6186SYacine Belkadi  * Return: 1 if @p is an idle task. 0 otherwise.
1486c4f30608SPaul E. McKenney  */
14877061ca3bSPaul E. McKenney static inline bool is_idle_task(const struct task_struct *p)
1488c4f30608SPaul E. McKenney {
1489c1de45caSPeter Zijlstra 	return !!(p->flags & PF_IDLE);
1490c4f30608SPaul E. McKenney }
14915eca1c10SIngo Molnar 
/* Declared here, defined outside this header. */
struct task_struct *curr_task(int cpu);
void ia64_set_curr_task(int cpu, struct task_struct *p);

void yield(void);
14961da177e4SLinus Torvalds 
14971da177e4SLinus Torvalds union thread_union {
14980500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK
14990500871fSDavid Howells 	struct task_struct task;
15000500871fSDavid Howells #endif
1501c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK
15021da177e4SLinus Torvalds 	struct thread_info thread_info;
1503c65eacbeSAndy Lutomirski #endif
15041da177e4SLinus Torvalds 	unsigned long stack[THREAD_SIZE/sizeof(long)];
15051da177e4SLinus Torvalds };
15061da177e4SLinus Torvalds 
15070500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK
15080500871fSDavid Howells extern struct thread_info init_thread_info;
15090500871fSDavid Howells #endif
15100500871fSDavid Howells 
15110500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)];
15120500871fSDavid Howells 
/*
 * task_thread_info() - locate the thread_info that belongs to @task.
 *
 * With CONFIG_THREAD_INFO_IN_TASK it is the member embedded in
 * task_struct.  Otherwise, unless __HAVE_THREAD_FUNCTIONS is defined (in
 * which case nothing is provided here), it is task->stack reinterpreted
 * as a struct thread_info pointer.
 */
#ifdef CONFIG_THREAD_INFO_IN_TASK
static inline struct thread_info *task_thread_info(struct task_struct *task)
{
	struct thread_info *ti = &task->thread_info;

	return ti;
}
#elif !defined(__HAVE_THREAD_FUNCTIONS)
# define task_thread_info(task)	((struct thread_info *)(task)->stack)
#endif
1521f3ac6067SIngo Molnar 
/*
 * Look up a task by one of its numerical ids:
 *
 * find_task_by_pid_ns():
 *      finds a task by its pid in the specified namespace
 * find_task_by_vpid():
 *      finds a task by its virtual pid
 *
 * See also find_vpid() etc. in include/linux/pid.h
 */
struct task_struct *find_task_by_vpid(pid_t nr);
struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns);

/*
 * Find a task by its virtual pid and get the task struct.
 */
struct task_struct *find_get_task_by_vpid(pid_t nr);
15402ee08260SMike Rapoport 
/* Task wake-up entry points; defined outside this header. */
int wake_up_state(struct task_struct *tsk, unsigned int state);
int wake_up_process(struct task_struct *tsk);
void wake_up_new_task(struct task_struct *tsk);
15445eca1c10SIngo Molnar 
/* kick_process() is an empty stub unless CONFIG_SMP is set. */
#ifndef CONFIG_SMP
static inline void kick_process(struct task_struct *tsk)
{
}
#else
void kick_process(struct task_struct *tsk);
#endif
15501da177e4SLinus Torvalds 
void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);

/* Set @tsk's comm from @from; calls __set_task_comm() with exec == false. */
static inline void set_task_comm(struct task_struct *tsk, const char *from)
{
	const bool exec = false;

	__set_task_comm(tsk, from, exec);
}
15575eca1c10SIngo Molnar 
char *__get_task_comm(char *to, size_t len, struct task_struct *tsk);

/*
 * get_task_comm() - copy @tsk's comm into @buf via __get_task_comm().
 *
 * sizeof(@buf) must equal TASK_COMM_LEN, otherwise the build fails, so
 * @buf is expected to be a char array of that size rather than a pointer.
 * Evaluates to the return value of __get_task_comm().
 */
#define get_task_comm(buf, tsk)				\
({							\
	BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN);	\
	__get_task_comm(buf, sizeof(buf), tsk);		\
})
15631da177e4SLinus Torvalds 
/*
 * Without CONFIG_SMP scheduler_ipi() is a no-op and wait_task_inactive()
 * returns 1 immediately; with it both are out-of-line.
 */
#ifndef CONFIG_SMP
static inline void scheduler_ipi(void)
{
}

static inline unsigned long
wait_task_inactive(struct task_struct *p, long match_state)
{
	return 1;
}
#else
void scheduler_ipi(void);
unsigned long wait_task_inactive(struct task_struct *, long match_state);
#endif
15741da177e4SLinus Torvalds 
/*
 * Helpers that operate on the thread flags of another task's structure.
 * The available TIF_xxxx flags are listed in asm/thread_info.h.
 */

/* Set thread flag @flag in @tsk's thread_info. */
static inline void
set_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	set_ti_thread_flag(task_thread_info(tsk), flag);
}
15831da177e4SLinus Torvalds 
/* Clear thread flag @flag in @tsk's thread_info. */
static inline void
clear_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	clear_ti_thread_flag(task_thread_info(tsk), flag);
}
15881da177e4SLinus Torvalds 
/*
 * Set thread flag @flag in @tsk's thread_info and return whatever
 * test_and_set_ti_thread_flag() reports.
 */
static inline int
test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	int old = test_and_set_ti_thread_flag(task_thread_info(tsk), flag);

	return old;
}
15931da177e4SLinus Torvalds 
/*
 * Clear thread flag @flag in @tsk's thread_info and return whatever
 * test_and_clear_ti_thread_flag() reports.
 */
static inline int
test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	int old = test_and_clear_ti_thread_flag(task_thread_info(tsk), flag);

	return old;
}
15981da177e4SLinus Torvalds 
/* Test thread flag @flag in @tsk's thread_info. */
static inline int
test_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	int set = test_ti_thread_flag(task_thread_info(tsk), flag);

	return set;
}
16031da177e4SLinus Torvalds 
16041da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk)
16051da177e4SLinus Torvalds {
16061da177e4SLinus Torvalds 	set_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
16071da177e4SLinus Torvalds }
16081da177e4SLinus Torvalds 
16091da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk)
16101da177e4SLinus Torvalds {
16111da177e4SLinus Torvalds 	clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
16121da177e4SLinus Torvalds }
16131da177e4SLinus Torvalds 
16148ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk)
16158ae121acSGregory Haskins {
16168ae121acSGregory Haskins 	return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED));
16178ae121acSGregory Haskins }
16188ae121acSGregory Haskins 
/*
 * cond_resched() and cond_resched_lock() reduce latency by rescheduling
 * explicitly at points where that is safe.  Their return value tells
 * whether a reschedule actually took place.
 * cond_resched_lock() drops the spinlock before scheduling;
 * cond_resched_softirq() enables bhs before scheduling.
 *
 * With CONFIG_PREEMPT, _cond_resched() is a stub that returns 0.
 */
#ifdef CONFIG_PREEMPT
static inline int _cond_resched(void)
{
	return 0;
}
#else
int _cond_resched(void);
#endif

#define cond_resched()				\
({						\
	___might_sleep(__FILE__, __LINE__, 0);	\
	_cond_resched();			\
})
16366f80bd98SFrederic Weisbecker 
1637613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock);
1638613afbf8SFrederic Weisbecker 
1639613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({				\
16403427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\
1641613afbf8SFrederic Weisbecker 	__cond_resched_lock(lock);				\
1642613afbf8SFrederic Weisbecker })
1643613afbf8SFrederic Weisbecker 
int __cond_resched_softirq(void);

/*
 * Run the ___might_sleep() check with a preempt offset of
 * SOFTIRQ_DISABLE_OFFSET, then evaluate to the result of
 * __cond_resched_softirq().
 */
#define cond_resched_softirq()						\
({									\
	___might_sleep(__FILE__, __LINE__, SOFTIRQ_DISABLE_OFFSET);	\
	__cond_resched_softirq();					\
})
16501da177e4SLinus Torvalds 
/*
 * Leave the RCU read-side critical section, give the scheduler a chance
 * via cond_resched(), and re-enter it.  Compiles to nothing when
 * CONFIG_PREEMPT_RCU is set and CONFIG_DEBUG_ATOMIC_SLEEP is not.
 */
static inline void cond_resched_rcu(void)
{
#if !defined(CONFIG_DEBUG_ATOMIC_SLEEP) && defined(CONFIG_PREEMPT_RCU)
	/* nothing to do */
#else
	rcu_read_unlock();
	cond_resched();
	rcu_read_lock();
#endif
}
1659f6f3c437SSimon Horman 
16601da177e4SLinus Torvalds /*
16611da177e4SLinus Torvalds  * Does a critical section need to be broken due to another
166295c354feSNick Piggin  * task waiting?: (technically does not depend on CONFIG_PREEMPT,
166395c354feSNick Piggin  * but a general need for low latency)
16641da177e4SLinus Torvalds  */
166595c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock)
16661da177e4SLinus Torvalds {
166795c354feSNick Piggin #ifdef CONFIG_PREEMPT
166895c354feSNick Piggin 	return spin_is_contended(lock);
166995c354feSNick Piggin #else
16701da177e4SLinus Torvalds 	return 0;
167195c354feSNick Piggin #endif
16721da177e4SLinus Torvalds }
16731da177e4SLinus Torvalds 
167475f93fedSPeter Zijlstra static __always_inline bool need_resched(void)
167575f93fedSPeter Zijlstra {
167675f93fedSPeter Zijlstra 	return unlikely(tif_need_resched());
167775f93fedSPeter Zijlstra }
167875f93fedSPeter Zijlstra 
/*
 * Accessors for the CPU number recorded for a task.  On UP task_cpu() is
 * always 0 and set_task_cpu() does nothing.  On SMP the value lives in
 * task_struct itself with CONFIG_THREAD_INFO_IN_TASK, and in the task's
 * thread_info otherwise.
 */
#ifndef CONFIG_SMP

static inline unsigned int task_cpu(const struct task_struct *p)
{
	return 0;
}

static inline void set_task_cpu(struct task_struct *p, unsigned int cpu)
{
}

#else

static inline unsigned int task_cpu(const struct task_struct *p)
{
#ifndef CONFIG_THREAD_INFO_IN_TASK
	return task_thread_info(p)->cpu;
#else
	return p->cpu;
#endif
}

void set_task_cpu(struct task_struct *p, unsigned int cpu);

#endif /* CONFIG_SMP */
17071da177e4SLinus Torvalds 
/*
 * In order to reduce various lock holder preemption latencies provide an
 * interface to see if a vCPU is currently running or not.
 *
 * This allows us to terminate optimistic spin loops and block, analogous to
 * the native optimistic spin heuristic of testing if the lock owner task is
 * running or not.
 *
 * This is the fallback used when vcpu_is_preempted is not already defined
 * as a macro: it always reports "not preempted".  It is a real function
 * rather than a function-like macro so that the argument is type-checked
 * and counts as used (no unused-variable warnings at call sites whose
 * only use of a 'cpu' variable is this call).
 */
#ifndef vcpu_is_preempted
static inline bool vcpu_is_preempted(int cpu)
{
	return false;
}
#endif
1719d9345c65SPan Xinhui 
/* CPU affinity get/set by pid; defined outside this header. */
long sched_setaffinity(pid_t pid, const struct cpumask *new_mask);
long sched_getaffinity(pid_t pid, struct cpumask *mask);
17225c45bf27SSiddha, Suresh B 
/* Fall back to TASK_SIZE, ignoring @tsk, when TASK_SIZE_OF is not already defined. */
#ifndef TASK_SIZE_OF
# define TASK_SIZE_OF(tsk)	TASK_SIZE
#endif
172682455257SDave Hansen 
17271da177e4SLinus Torvalds #endif
1728