xref: /linux/include/linux/sched.h (revision 050e9baa9dc9fbd9ce2b27f0056990fc9e0a08a0)
1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */
21da177e4SLinus Torvalds #ifndef _LINUX_SCHED_H
31da177e4SLinus Torvalds #define _LINUX_SCHED_H
41da177e4SLinus Torvalds 
55eca1c10SIngo Molnar /*
65eca1c10SIngo Molnar  * Define 'struct task_struct' and provide the main scheduler
75eca1c10SIngo Molnar  * APIs (schedule(), wakeup variants, etc.)
85eca1c10SIngo Molnar  */
95eca1c10SIngo Molnar 
10607ca46eSDavid Howells #include <uapi/linux/sched.h>
11b7b3c76aSDavid Woodhouse 
1270b8157eSIngo Molnar #include <asm/current.h>
1370b8157eSIngo Molnar 
145eca1c10SIngo Molnar #include <linux/pid.h>
155eca1c10SIngo Molnar #include <linux/sem.h>
165eca1c10SIngo Molnar #include <linux/shm.h>
175eca1c10SIngo Molnar #include <linux/kcov.h>
185eca1c10SIngo Molnar #include <linux/mutex.h>
195eca1c10SIngo Molnar #include <linux/plist.h>
205eca1c10SIngo Molnar #include <linux/hrtimer.h>
215eca1c10SIngo Molnar #include <linux/seccomp.h>
225eca1c10SIngo Molnar #include <linux/nodemask.h>
235eca1c10SIngo Molnar #include <linux/rcupdate.h>
245eca1c10SIngo Molnar #include <linux/resource.h>
255eca1c10SIngo Molnar #include <linux/latencytop.h>
265eca1c10SIngo Molnar #include <linux/sched/prio.h>
275eca1c10SIngo Molnar #include <linux/signal_types.h>
285eca1c10SIngo Molnar #include <linux/mm_types_task.h>
295eca1c10SIngo Molnar #include <linux/task_io_accounting.h>
30d7822b1eSMathieu Desnoyers #include <linux/rseq.h>
315eca1c10SIngo Molnar 
/*
 * task_struct member predeclarations (sorted alphabetically).
 *
 * These are incomplete types: this header only needs to name them (e.g. to
 * form pointers), not to know their layout.
 */
struct audit_context;
struct backing_dev_info;
struct bio_list;
struct blk_plug;
struct cfs_rq;
struct fs_struct;
struct futex_pi_state;
struct io_context;
struct mempolicy;
struct nameidata;
struct nsproxy;
struct perf_event_context;
struct pid_namespace;
struct pipe_inode_info;
struct rcu_node;
struct reclaim_state;
struct robust_list_head;
struct sched_attr;
struct sched_param;
struct seq_file;
struct sighand_struct;
struct signal_struct;
struct task_delay_info;
struct task_group;
571da177e4SLinus Torvalds 
/*
 * Task state bitmask. NOTE! These bits are also
 * encoded in fs/proc/array.c: get_task_state().
 *
 * We have two separate sets of flags: task->state
 * is about runnability, while task->exit_state is
 * about the task exiting. Confusing, but this way
 * modifying one set can't modify the other one by
 * mistake.
 */

/* Used in tsk->state: */
#define TASK_RUNNING			0x0000
#define TASK_INTERRUPTIBLE		0x0001
#define TASK_UNINTERRUPTIBLE		0x0002
#define __TASK_STOPPED			0x0004
#define __TASK_TRACED			0x0008
/* Used in tsk->exit_state: */
#define EXIT_DEAD			0x0010
#define EXIT_ZOMBIE			0x0020
#define EXIT_TRACE			(EXIT_ZOMBIE | EXIT_DEAD)
/* Used in tsk->state again: */
#define TASK_PARKED			0x0040
#define TASK_DEAD			0x0080
#define TASK_WAKEKILL			0x0100
#define TASK_WAKING			0x0200
#define TASK_NOLOAD			0x0400
#define TASK_NEW			0x0800
/* One bit above the highest state bit defined here: */
#define TASK_STATE_MAX			0x1000

/* Convenience macros for the sake of set_current_state: */
#define TASK_KILLABLE			(TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
#define TASK_STOPPED			(TASK_WAKEKILL | __TASK_STOPPED)
#define TASK_TRACED			(TASK_WAKEKILL | __TASK_TRACED)

#define TASK_IDLE			(TASK_UNINTERRUPTIBLE | TASK_NOLOAD)

/* Convenience macros for the sake of wake_up(): */
#define TASK_NORMAL			(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)

/* get_task_state(): */
#define TASK_REPORT			(TASK_RUNNING | TASK_INTERRUPTIBLE | \
					 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
					 __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \
					 TASK_PARKED)
10392a1f4bcSMatthew Wilcox 
/*
 * Predicates on a task's state word.
 *
 * @task is a pointer expression whose target has a ->state member (and, for
 * task_contributes_to_load(), a ->flags member). The argument is
 * parenthesized in every expansion so that expressions such as '&t' or
 * 'p + 1' bind as the caller intended.
 *
 * Note that @task is evaluated more than once by the multi-term predicates,
 * so it must not have side effects.
 */
#define task_is_traced(task)		(((task)->state & __TASK_TRACED) != 0)

#define task_is_stopped(task)		(((task)->state & __TASK_STOPPED) != 0)

#define task_is_stopped_or_traced(task)	(((task)->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)

/* True for an uninterruptible task that is neither frozen nor TASK_NOLOAD: */
#define task_contributes_to_load(task)	(((task)->state & TASK_UNINTERRUPTIBLE) != 0 && \
					 ((task)->flags & PF_FROZEN) == 0 && \
					 ((task)->state & TASK_NOLOAD) == 0)
1131da177e4SLinus Torvalds 
#ifdef CONFIG_DEBUG_ATOMIC_SLEEP

/*
 * Special states are those that do not use the normal wait-loop pattern. See
 * the comment with set_special_state().
 */
#define is_special_task_state(state)				\
	((state) & (__TASK_STOPPED | __TASK_TRACED | TASK_DEAD))

/*
 * Debug variants: in addition to storing the new state they record
 * _THIS_IP_ in current->task_state_change, and warn (once) when a special
 * state is set through the regular helpers or a regular state is set through
 * set_special_state().
 *
 * Note that @state_value is evaluated more than once here.
 */
#define __set_current_state(state_value)			\
	do {							\
		WARN_ON_ONCE(is_special_task_state(state_value));\
		current->task_state_change = _THIS_IP_;		\
		current->state = (state_value);			\
	} while (0)

#define set_current_state(state_value)				\
	do {							\
		WARN_ON_ONCE(is_special_task_state(state_value));\
		current->task_state_change = _THIS_IP_;		\
		smp_store_mb(current->state, (state_value));	\
	} while (0)

#define set_special_state(state_value)					\
	do {								\
		unsigned long flags; /* may shadow */			\
		WARN_ON_ONCE(!is_special_task_state(state_value));	\
		raw_spin_lock_irqsave(&current->pi_lock, flags);	\
		current->task_state_change = _THIS_IP_;			\
		current->state = (state_value);				\
		raw_spin_unlock_irqrestore(&current->pi_lock, flags);	\
	} while (0)
#else
/*
 * set_current_state() includes a barrier so that the write of current->state
 * is correctly serialised wrt the caller's subsequent test of whether to
 * actually sleep:
 *
 *   for (;;) {
 *	set_current_state(TASK_UNINTERRUPTIBLE);
 *	if (!need_sleep)
 *		break;
 *
 *	schedule();
 *   }
 *   __set_current_state(TASK_RUNNING);
 *
 * If the caller does not need such serialisation (because, for instance, the
 * condition test and condition change and wakeup are under the same lock) then
 * use __set_current_state().
 *
 * The above is typically ordered against the wakeup, which does:
 *
 *   need_sleep = false;
 *   wake_up_state(p, TASK_UNINTERRUPTIBLE);
 *
 * Where wake_up_state() (and all other wakeup primitives) imply enough
 * barriers to order the store of the variable against wakeup.
 *
 * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is,
 * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a
 * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING).
 *
 * However, with slightly different timing the wakeup TASK_RUNNING store can
 * also collide with the TASK_UNINTERRUPTIBLE store. Losing that store is not
 * a problem either because that will result in one extra go around the loop
 * and our @cond test will save the day.
 *
 * Also see the comments of try_to_wake_up().
 */

/*
 * Plain store, no barrier. Written as a statement (like the
 * CONFIG_DEBUG_ATOMIC_SLEEP variant) so that callers behave the same way in
 * both configurations.
 */
#define __set_current_state(state_value)				\
	do {								\
		current->state = (state_value);				\
	} while (0)

/* Store followed by a full memory barrier, see the comment above. */
#define set_current_state(state_value)					\
	smp_store_mb(current->state, (state_value))

/*
 * set_special_state() should be used for those states when the blocking task
 * can not use the regular condition based wait-loop. In that case we must
 * serialize against wakeups such that any possible in-flight TASK_RUNNING stores
 * will not collide with our state change.
 */
#define set_special_state(state_value)					\
	do {								\
		unsigned long flags; /* may shadow */			\
		raw_spin_lock_irqsave(&current->pi_lock, flags);	\
		current->state = (state_value);				\
		raw_spin_unlock_irqrestore(&current->pi_lock, flags);	\
	} while (0)

#endif
2058eb23b9fSPeter Zijlstra 
/* Task command name length: */
#define TASK_COMM_LEN			16

extern void scheduler_tick(void);

/* Largest value representable in a 'long' timeout argument: */
#define	MAX_SCHEDULE_TIMEOUT		LONG_MAX
2125eca1c10SIngo Molnar 
2135eca1c10SIngo Molnar extern long schedule_timeout(long timeout);
2145eca1c10SIngo Molnar extern long schedule_timeout_interruptible(long timeout);
2155eca1c10SIngo Molnar extern long schedule_timeout_killable(long timeout);
2165eca1c10SIngo Molnar extern long schedule_timeout_uninterruptible(long timeout);
2175eca1c10SIngo Molnar extern long schedule_timeout_idle(long timeout);
2181da177e4SLinus Torvalds asmlinkage void schedule(void);
219c5491ea7SThomas Gleixner extern void schedule_preempt_disabled(void);
2201da177e4SLinus Torvalds 
22110ab5643STejun Heo extern int __must_check io_schedule_prepare(void);
22210ab5643STejun Heo extern void io_schedule_finish(int token);
2239cff8adeSNeilBrown extern long io_schedule_timeout(long timeout);
22410ab5643STejun Heo extern void io_schedule(void);
2259cff8adeSNeilBrown 
226f06febc9SFrank Mayhar /**
2270ba42a59SMasanari Iida  * struct prev_cputime - snapshot of system and user cputime
228d37f761dSFrederic Weisbecker  * @utime: time spent in user mode
229d37f761dSFrederic Weisbecker  * @stime: time spent in system mode
2309d7fb042SPeter Zijlstra  * @lock: protects the above two fields
231d37f761dSFrederic Weisbecker  *
2329d7fb042SPeter Zijlstra  * Stores previous user/system time values such that we can guarantee
2339d7fb042SPeter Zijlstra  * monotonicity.
234d37f761dSFrederic Weisbecker  */
2359d7fb042SPeter Zijlstra struct prev_cputime {
2369d7fb042SPeter Zijlstra #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
2375613fda9SFrederic Weisbecker 	u64				utime;
2385613fda9SFrederic Weisbecker 	u64				stime;
2399d7fb042SPeter Zijlstra 	raw_spinlock_t			lock;
2409d7fb042SPeter Zijlstra #endif
241d37f761dSFrederic Weisbecker };
242d37f761dSFrederic Weisbecker 
243d37f761dSFrederic Weisbecker /**
244f06febc9SFrank Mayhar  * struct task_cputime - collected CPU time counts
2455613fda9SFrederic Weisbecker  * @utime:		time spent in user mode, in nanoseconds
2465613fda9SFrederic Weisbecker  * @stime:		time spent in kernel mode, in nanoseconds
247f06febc9SFrank Mayhar  * @sum_exec_runtime:	total time spent on the CPU, in nanoseconds
248f06febc9SFrank Mayhar  *
2499d7fb042SPeter Zijlstra  * This structure groups together three kinds of CPU time that are tracked for
2509d7fb042SPeter Zijlstra  * threads and thread groups.  Most things considering CPU time want to group
2519d7fb042SPeter Zijlstra  * these counts together and treat all three of them in parallel.
252f06febc9SFrank Mayhar  */
253f06febc9SFrank Mayhar struct task_cputime {
2545613fda9SFrederic Weisbecker 	u64				utime;
2555613fda9SFrederic Weisbecker 	u64				stime;
256f06febc9SFrank Mayhar 	unsigned long long		sum_exec_runtime;
257f06febc9SFrank Mayhar };
2589d7fb042SPeter Zijlstra 
2595eca1c10SIngo Molnar /* Alternate field names when used on cache expirations: */
260f06febc9SFrank Mayhar #define virt_exp			utime
2619d7fb042SPeter Zijlstra #define prof_exp			stime
262f06febc9SFrank Mayhar #define sched_exp			sum_exec_runtime
263f06febc9SFrank Mayhar 
/* Per-task virtual CPU time accounting state: */
enum vtime_state {
	/* Task is sleeping or running in a CPU with VTIME inactive: */
	VTIME_INACTIVE = 0,
	/* Task runs in userspace in a CPU with VTIME active: */
	VTIME_USER,
	/* Task runs in kernelspace in a CPU with VTIME active: */
	VTIME_SYS,
};
272bac5b6b6SFrederic Weisbecker 
273bac5b6b6SFrederic Weisbecker struct vtime {
274bac5b6b6SFrederic Weisbecker 	seqcount_t		seqcount;
275bac5b6b6SFrederic Weisbecker 	unsigned long long	starttime;
276bac5b6b6SFrederic Weisbecker 	enum vtime_state	state;
2772a42eb95SWanpeng Li 	u64			utime;
2782a42eb95SWanpeng Li 	u64			stime;
2792a42eb95SWanpeng Li 	u64			gtime;
280bac5b6b6SFrederic Weisbecker };
281bac5b6b6SFrederic Weisbecker 
/*
 * Per-task scheduling latency information. The structure has no members
 * unless CONFIG_SCHED_INFO is enabled.
 */
struct sched_info {
#ifdef CONFIG_SCHED_INFO
	/* Cumulative counters: */

	/* # of times we have run on this CPU: */
	unsigned long			pcount;

	/* Time spent waiting on a runqueue: */
	unsigned long long		run_delay;

	/* Timestamps: */

	/* When did we last run on a CPU? */
	unsigned long long		last_arrival;

	/* When were we last queued to run? */
	unsigned long long		last_queued;

#endif /* CONFIG_SCHED_INFO */
};
3021da177e4SLinus Torvalds 
/*
 * Integer metrics need fixed point arithmetic, e.g., sched/fair
 * has a few: load, load_avg, util_avg, freq, and capacity.
 *
 * We define a basic fixed point arithmetic range, and then formalize
 * all these metrics based on that basic range.
 *
 * SCHED_FIXEDPOINT_SCALE is 1 << SCHED_FIXEDPOINT_SHIFT, as a long.
 */
# define SCHED_FIXEDPOINT_SHIFT		10
# define SCHED_FIXEDPOINT_SCALE		(1L << SCHED_FIXEDPOINT_SHIFT)
3126ecdd749SYuyang Du 
31320b8a59fSIngo Molnar struct load_weight {
3149dbdb155SPeter Zijlstra 	unsigned long			weight;
3159dbdb155SPeter Zijlstra 	u32				inv_weight;
31620b8a59fSIngo Molnar };
31720b8a59fSIngo Molnar 
/**
 * struct util_est - Estimated utilization of FAIR tasks
 * @enqueued: instantaneous estimated utilization of a task/cpu
 * @ewma:     the Exponential Weighted Moving Average (EWMA)
 *            utilization of a task
 *
 * Support data structure to track an Exponential Weighted Moving Average
 * (EWMA) of a FAIR task's utilization. New samples are added to the moving
 * average each time a task completes an activation. Sample's weight is chosen
 * so that the EWMA will be relatively insensitive to transient changes to the
 * task's workload.
 *
 * The enqueued attribute has a slightly different meaning for tasks and cpus:
 * - task:   the task's util_avg at last task dequeue time
 * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU
 * Thus, the util_est.enqueued of a task represents the contribution on the
 * estimated utilization of the CPU where that task is currently enqueued.
 *
 * Only for tasks we track a moving average of the past instantaneous
 * estimated utilization. This allows to absorb sporadic drops in utilization
 * of an otherwise almost periodic task.
 *
 * The structure is aligned to sizeof(u64).
 */
struct util_est {
	unsigned int			enqueued;
	unsigned int			ewma;
#define UTIL_EST_WEIGHT_SHIFT		2
} __attribute__((__aligned__(sizeof(u64))));
3457f65ea42SPatrick Bellasi 
3469d89c257SYuyang Du /*
3477b595334SYuyang Du  * The load_avg/util_avg accumulates an infinite geometric series
3487b595334SYuyang Du  * (see __update_load_avg() in kernel/sched/fair.c).
3497b595334SYuyang Du  *
3507b595334SYuyang Du  * [load_avg definition]
3517b595334SYuyang Du  *
3527b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load)
3537b595334SYuyang Du  *
3547b595334SYuyang Du  * where runnable% is the time ratio that a sched_entity is runnable.
3557b595334SYuyang Du  * For cfs_rq, it is the aggregated load_avg of all runnable and
3569d89c257SYuyang Du  * blocked sched_entities.
3577b595334SYuyang Du  *
3587b595334SYuyang Du  * load_avg may also take frequency scaling into account:
3597b595334SYuyang Du  *
3607b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load) * freq%
3617b595334SYuyang Du  *
3627b595334SYuyang Du  * where freq% is the CPU frequency normalized to the highest frequency.
3637b595334SYuyang Du  *
3647b595334SYuyang Du  * [util_avg definition]
3657b595334SYuyang Du  *
3667b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE
3677b595334SYuyang Du  *
3687b595334SYuyang Du  * where running% is the time ratio that a sched_entity is running on
3697b595334SYuyang Du  * a CPU. For cfs_rq, it is the aggregated util_avg of all runnable
3707b595334SYuyang Du  * and blocked sched_entities.
3717b595334SYuyang Du  *
3727b595334SYuyang Du  * util_avg may also factor frequency scaling and CPU capacity scaling:
3737b595334SYuyang Du  *
3747b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE * freq% * capacity%
3757b595334SYuyang Du  *
3767b595334SYuyang Du  * where freq% is the same as above, and capacity% is the CPU capacity
3777b595334SYuyang Du  * normalized to the greatest capacity (due to uarch differences, etc).
3787b595334SYuyang Du  *
3797b595334SYuyang Du  * N.B., the above ratios (runnable%, running%, freq%, and capacity%)
3807b595334SYuyang Du  * themselves are in the range of [0, 1]. To do fixed point arithmetics,
3817b595334SYuyang Du  * we therefore scale them to as large a range as necessary. This is for
3827b595334SYuyang Du  * example reflected by util_avg's SCHED_CAPACITY_SCALE.
3837b595334SYuyang Du  *
3847b595334SYuyang Du  * [Overflow issue]
3857b595334SYuyang Du  *
3867b595334SYuyang Du  * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities
3877b595334SYuyang Du  * with the highest load (=88761), always runnable on a single cfs_rq,
3887b595334SYuyang Du  * and should not overflow as the number already hits PID_MAX_LIMIT.
3897b595334SYuyang Du  *
3907b595334SYuyang Du  * For all other cases (including 32-bit kernels), struct load_weight's
3917b595334SYuyang Du  * weight will overflow first before we do, because:
3927b595334SYuyang Du  *
3937b595334SYuyang Du  *    Max(load_avg) <= Max(load.weight)
3947b595334SYuyang Du  *
3957b595334SYuyang Du  * Then it is the load_weight's responsibility to consider overflow
3967b595334SYuyang Du  * issues.
3979d89c257SYuyang Du  */
3989d85f21cSPaul Turner struct sched_avg {
3995eca1c10SIngo Molnar 	u64				last_update_time;
4005eca1c10SIngo Molnar 	u64				load_sum;
4011ea6c46aSPeter Zijlstra 	u64				runnable_load_sum;
4025eca1c10SIngo Molnar 	u32				util_sum;
4035eca1c10SIngo Molnar 	u32				period_contrib;
4045eca1c10SIngo Molnar 	unsigned long			load_avg;
4051ea6c46aSPeter Zijlstra 	unsigned long			runnable_load_avg;
4065eca1c10SIngo Molnar 	unsigned long			util_avg;
4077f65ea42SPatrick Bellasi 	struct util_est			util_est;
408317d359dSPeter Zijlstra } ____cacheline_aligned;
4099d85f21cSPaul Turner 
/*
 * Per-entity scheduler statistics. The structure has no members unless
 * CONFIG_SCHEDSTATS is enabled.
 */
struct sched_statistics {
#ifdef CONFIG_SCHEDSTATS
	/* Waiting: */
	u64				wait_start;
	u64				wait_max;
	u64				wait_count;
	u64				wait_sum;
	u64				iowait_count;
	u64				iowait_sum;

	/* Sleeping: */
	u64				sleep_start;
	u64				sleep_max;
	s64				sum_sleep_runtime;

	/* Blocking and execution: */
	u64				block_start;
	u64				block_max;
	u64				exec_max;
	u64				slice_max;

	/* Migration counters: */
	u64				nr_migrations_cold;
	u64				nr_failed_migrations_affine;
	u64				nr_failed_migrations_running;
	u64				nr_failed_migrations_hot;
	u64				nr_forced_migrations;

	/* Wakeup counters: */
	u64				nr_wakeups;
	u64				nr_wakeups_sync;
	u64				nr_wakeups_migrate;
	u64				nr_wakeups_local;
	u64				nr_wakeups_remote;
	u64				nr_wakeups_affine;
	u64				nr_wakeups_affine_attempts;
	u64				nr_wakeups_passive;
	u64				nr_wakeups_idle;
#endif
};
44541acab88SLucas De Marchi 
44641acab88SLucas De Marchi struct sched_entity {
4475eca1c10SIngo Molnar 	/* For load-balancing: */
4485eca1c10SIngo Molnar 	struct load_weight		load;
4491ea6c46aSPeter Zijlstra 	unsigned long			runnable_weight;
45041acab88SLucas De Marchi 	struct rb_node			run_node;
45141acab88SLucas De Marchi 	struct list_head		group_node;
45241acab88SLucas De Marchi 	unsigned int			on_rq;
45341acab88SLucas De Marchi 
45441acab88SLucas De Marchi 	u64				exec_start;
45541acab88SLucas De Marchi 	u64				sum_exec_runtime;
45641acab88SLucas De Marchi 	u64				vruntime;
45741acab88SLucas De Marchi 	u64				prev_sum_exec_runtime;
45841acab88SLucas De Marchi 
45941acab88SLucas De Marchi 	u64				nr_migrations;
46041acab88SLucas De Marchi 
46141acab88SLucas De Marchi 	struct sched_statistics		statistics;
46294c18227SIngo Molnar 
46320b8a59fSIngo Molnar #ifdef CONFIG_FAIR_GROUP_SCHED
464fed14d45SPeter Zijlstra 	int				depth;
46520b8a59fSIngo Molnar 	struct sched_entity		*parent;
46620b8a59fSIngo Molnar 	/* rq on which this entity is (to be) queued: */
46720b8a59fSIngo Molnar 	struct cfs_rq			*cfs_rq;
46820b8a59fSIngo Molnar 	/* rq "owned" by this entity/group: */
46920b8a59fSIngo Molnar 	struct cfs_rq			*my_q;
47020b8a59fSIngo Molnar #endif
4718bd75c77SClark Williams 
472141965c7SAlex Shi #ifdef CONFIG_SMP
4735a107804SJiri Olsa 	/*
4745a107804SJiri Olsa 	 * Per entity load average tracking.
4755a107804SJiri Olsa 	 *
4765a107804SJiri Olsa 	 * Put into separate cache line so it does not
4775a107804SJiri Olsa 	 * collide with read-mostly values above.
4785a107804SJiri Olsa 	 */
479317d359dSPeter Zijlstra 	struct sched_avg		avg;
4809d85f21cSPaul Turner #endif
48120b8a59fSIngo Molnar };
48270b97a7fSIngo Molnar 
483fa717060SPeter Zijlstra struct sched_rt_entity {
484fa717060SPeter Zijlstra 	struct list_head		run_list;
48578f2c7dbSPeter Zijlstra 	unsigned long			timeout;
48657d2aa00SYing Xue 	unsigned long			watchdog_stamp;
487bee367edSRichard Kennedy 	unsigned int			time_slice;
488ff77e468SPeter Zijlstra 	unsigned short			on_rq;
489ff77e468SPeter Zijlstra 	unsigned short			on_list;
4906f505b16SPeter Zijlstra 
49158d6c2d7SPeter Zijlstra 	struct sched_rt_entity		*back;
492052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED
4936f505b16SPeter Zijlstra 	struct sched_rt_entity		*parent;
4946f505b16SPeter Zijlstra 	/* rq on which this entity is (to be) queued: */
4956f505b16SPeter Zijlstra 	struct rt_rq			*rt_rq;
4966f505b16SPeter Zijlstra 	/* rq "owned" by this entity/group: */
4976f505b16SPeter Zijlstra 	struct rt_rq			*my_q;
4986f505b16SPeter Zijlstra #endif
4993859a271SKees Cook } __randomize_layout;
500fa717060SPeter Zijlstra 
501aab03e05SDario Faggioli struct sched_dl_entity {
502aab03e05SDario Faggioli 	struct rb_node			rb_node;
503aab03e05SDario Faggioli 
504aab03e05SDario Faggioli 	/*
505aab03e05SDario Faggioli 	 * Original scheduling parameters. Copied here from sched_attr
5064027d080Sxiaofeng.yan 	 * during sched_setattr(), they will remain the same until
5074027d080Sxiaofeng.yan 	 * the next sched_setattr().
508aab03e05SDario Faggioli 	 */
5095eca1c10SIngo Molnar 	u64				dl_runtime;	/* Maximum runtime for each instance	*/
5105eca1c10SIngo Molnar 	u64				dl_deadline;	/* Relative deadline of each instance	*/
5115eca1c10SIngo Molnar 	u64				dl_period;	/* Separation of two instances (period) */
51254d6d303SDaniel Bristot de Oliveira 	u64				dl_bw;		/* dl_runtime / dl_period		*/
5133effcb42SDaniel Bristot de Oliveira 	u64				dl_density;	/* dl_runtime / dl_deadline		*/
514aab03e05SDario Faggioli 
515aab03e05SDario Faggioli 	/*
516aab03e05SDario Faggioli 	 * Actual scheduling parameters. Initialized with the values above,
517aab03e05SDario Faggioli 	 * they are continously updated during task execution. Note that
518aab03e05SDario Faggioli 	 * the remaining runtime could be < 0 in case we are in overrun.
519aab03e05SDario Faggioli 	 */
5205eca1c10SIngo Molnar 	s64				runtime;	/* Remaining runtime for this instance	*/
5215eca1c10SIngo Molnar 	u64				deadline;	/* Absolute deadline for this instance	*/
5225eca1c10SIngo Molnar 	unsigned int			flags;		/* Specifying the scheduler behaviour	*/
523aab03e05SDario Faggioli 
524aab03e05SDario Faggioli 	/*
525aab03e05SDario Faggioli 	 * Some bool flags:
526aab03e05SDario Faggioli 	 *
527aab03e05SDario Faggioli 	 * @dl_throttled tells if we exhausted the runtime. If so, the
528aab03e05SDario Faggioli 	 * task has to wait for a replenishment to be performed at the
529aab03e05SDario Faggioli 	 * next firing of dl_timer.
530aab03e05SDario Faggioli 	 *
5312d3d891dSDario Faggioli 	 * @dl_boosted tells if we are boosted due to DI. If so we are
5322d3d891dSDario Faggioli 	 * outside bandwidth enforcement mechanism (but only until we
5335bfd126eSJuri Lelli 	 * exit the critical section);
5345bfd126eSJuri Lelli 	 *
5355eca1c10SIngo Molnar 	 * @dl_yielded tells if task gave up the CPU before consuming
5365bfd126eSJuri Lelli 	 * all its available runtime during the last job.
537209a0cbdSLuca Abeni 	 *
538209a0cbdSLuca Abeni 	 * @dl_non_contending tells if the task is inactive while still
539209a0cbdSLuca Abeni 	 * contributing to the active utilization. In other words, it
540209a0cbdSLuca Abeni 	 * indicates if the inactive timer has been armed and its handler
541209a0cbdSLuca Abeni 	 * has not been executed yet. This flag is useful to avoid race
542209a0cbdSLuca Abeni 	 * conditions between the inactive timer handler and the wakeup
543209a0cbdSLuca Abeni 	 * code.
54434be3930SJuri Lelli 	 *
54534be3930SJuri Lelli 	 * @dl_overrun tells if the task asked to be informed about runtime
54634be3930SJuri Lelli 	 * overruns.
547aab03e05SDario Faggioli 	 */
548aa5222e9SDan Carpenter 	unsigned int			dl_throttled      : 1;
549aa5222e9SDan Carpenter 	unsigned int			dl_boosted        : 1;
550aa5222e9SDan Carpenter 	unsigned int			dl_yielded        : 1;
551aa5222e9SDan Carpenter 	unsigned int			dl_non_contending : 1;
55234be3930SJuri Lelli 	unsigned int			dl_overrun	  : 1;
553aab03e05SDario Faggioli 
554aab03e05SDario Faggioli 	/*
555aab03e05SDario Faggioli 	 * Bandwidth enforcement timer. Each -deadline task has its
556aab03e05SDario Faggioli 	 * own bandwidth to be enforced, thus we need one timer per task.
557aab03e05SDario Faggioli 	 */
558aab03e05SDario Faggioli 	struct hrtimer			dl_timer;
559209a0cbdSLuca Abeni 
560209a0cbdSLuca Abeni 	/*
561209a0cbdSLuca Abeni 	 * Inactive timer, responsible for decreasing the active utilization
562209a0cbdSLuca Abeni 	 * at the "0-lag time". When a -deadline task blocks, it contributes
563209a0cbdSLuca Abeni 	 * to GRUB's active utilization until the "0-lag time", hence a
564209a0cbdSLuca Abeni 	 * timer is needed to decrease the active utilization at the correct
565209a0cbdSLuca Abeni 	 * time.
566209a0cbdSLuca Abeni 	 */
567209a0cbdSLuca Abeni 	struct hrtimer inactive_timer;
568aab03e05SDario Faggioli };
5698bd75c77SClark Williams 
/*
 * Overlay of four byte-sized fields ('b') with one 32-bit word ('s'), so
 * the same storage can be viewed either field by field or as a single value.
 * Embedded in task_struct as 'rcu_read_unlock_special' under
 * CONFIG_PREEMPT_RCU.
 */
5701d082fd0SPaul E. McKenney union rcu_special {
5711d082fd0SPaul E. McKenney 	struct {
5728203d6d0SPaul E. McKenney 		u8			blocked;
5738203d6d0SPaul E. McKenney 		u8			need_qs;
5748203d6d0SPaul E. McKenney 		u8			exp_need_qs;
5755eca1c10SIngo Molnar 
5765eca1c10SIngo Molnar 		/* Otherwise the compiler can store garbage here: */
5775eca1c10SIngo Molnar 		u8			pad;
5788203d6d0SPaul E. McKenney 	} b; /* Bits. */
5798203d6d0SPaul E. McKenney 	u32 s; /* Set of bits. */
5801d082fd0SPaul E. McKenney };
58186848966SPaul E. McKenney 
/*
 * Identifies one of a task's perf event contexts.
 *
 * The valid values start at 0 and perf_nr_task_contexts is their count; it
 * is used as the size of task_struct::perf_event_ctxp[].
 * perf_invalid_context (-1) lies outside that range.
 */
5828dc85d54SPeter Zijlstra enum perf_event_task_context {
5838dc85d54SPeter Zijlstra 	perf_invalid_context = -1,
5848dc85d54SPeter Zijlstra 	perf_hw_context = 0,
58589a1e187SPeter Zijlstra 	perf_sw_context,
5868dc85d54SPeter Zijlstra 	perf_nr_task_contexts,
5878dc85d54SPeter Zijlstra };
5888dc85d54SPeter Zijlstra 
/*
 * Link for a singly-linked chain of wake_q_node entries; task_struct
 * embeds one as its 'wake_q' member.
 */
589eb61baf6SIngo Molnar struct wake_q_node {
590eb61baf6SIngo Molnar 	struct wake_q_node *next;
591eb61baf6SIngo Molnar };
592eb61baf6SIngo Molnar 
/*
 * struct task_struct - the per-task descriptor.
 *
 * Layout constraints spelled out by the comments inside the structure:
 *  - with CONFIG_THREAD_INFO_IN_TASK, 'thread_info' must be the first member;
 *  - members between randomized_struct_fields_start and
 *    randomized_struct_fields_end form the randomizable portion, so new
 *    fields belong inside that region;
 *  - 'thread' must remain the last member.
 */
5931da177e4SLinus Torvalds struct task_struct {
594c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
595c65eacbeSAndy Lutomirski 	/*
596c65eacbeSAndy Lutomirski 	 * For reasons of header soup (see current_thread_info()), this
597c65eacbeSAndy Lutomirski 	 * must be the first element of task_struct.
598c65eacbeSAndy Lutomirski 	 */
599c65eacbeSAndy Lutomirski 	struct thread_info		thread_info;
600c65eacbeSAndy Lutomirski #endif
6015eca1c10SIngo Molnar 	/* -1 unrunnable, 0 runnable, >0 stopped: */
6025eca1c10SIngo Molnar 	volatile long			state;
60329e48ce8SKees Cook 
60429e48ce8SKees Cook 	/*
60529e48ce8SKees Cook 	 * This begins the randomizable portion of task_struct. Only
60629e48ce8SKees Cook 	 * scheduling-critical items should be added above here.
60729e48ce8SKees Cook 	 */
60829e48ce8SKees Cook 	randomized_struct_fields_start
60929e48ce8SKees Cook 
610f7e4217bSRoman Zippel 	void				*stack;
6111da177e4SLinus Torvalds 	atomic_t			usage;
6125eca1c10SIngo Molnar 	/* Per task flags (PF_*), defined further below: */
6135eca1c10SIngo Molnar 	unsigned int			flags;
61497dc32cdSWilliam Cohen 	unsigned int			ptrace;
6151da177e4SLinus Torvalds 
6162dd73a4fSPeter Williams #ifdef CONFIG_SMP
617fa14ff4aSPeter Zijlstra 	struct llist_node		wake_entry;
6183ca7a440SPeter Zijlstra 	int				on_cpu;
619c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
6205eca1c10SIngo Molnar 	/* Current CPU: */
6215eca1c10SIngo Molnar 	unsigned int			cpu;
622c65eacbeSAndy Lutomirski #endif
62363b0e9edSMike Galbraith 	unsigned int			wakee_flips;
62462470419SMichael Wang 	unsigned long			wakee_flip_decay_ts;
62563b0e9edSMike Galbraith 	struct task_struct		*last_wakee;
626ac66f547SPeter Zijlstra 
62732e839ddSMel Gorman 	/*
62832e839ddSMel Gorman 	 * recent_used_cpu is initially set as the last CPU used by a task
62932e839ddSMel Gorman 	 * that wakes affine another task. Waker/wakee relationships can
63032e839ddSMel Gorman 	 * push tasks around a CPU where each wakeup moves to the next one.
63132e839ddSMel Gorman 	 * Tracking a recently used CPU allows a quick search for a recently
63232e839ddSMel Gorman 	 * used CPU that may be idle.
63332e839ddSMel Gorman 	 */
63432e839ddSMel Gorman 	int				recent_used_cpu;
635ac66f547SPeter Zijlstra 	int				wake_cpu;
6364866cde0SNick Piggin #endif /* CONFIG_SMP */
637fd2f4419SPeter Zijlstra 	int				on_rq;
63850e645a8SIngo Molnar 
6395eca1c10SIngo Molnar 	int				prio;
6405eca1c10SIngo Molnar 	int				static_prio;
6415eca1c10SIngo Molnar 	int				normal_prio;
642c7aceabaSRichard Kennedy 	unsigned int			rt_priority;
6435eca1c10SIngo Molnar 
6445522d5d5SIngo Molnar 	const struct sched_class	*sched_class;
64520b8a59fSIngo Molnar 	struct sched_entity		se;
646fa717060SPeter Zijlstra 	struct sched_rt_entity		rt;
6478323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED
6488323f26cSPeter Zijlstra 	struct task_group		*sched_task_group;
6498323f26cSPeter Zijlstra #endif
650aab03e05SDario Faggioli 	struct sched_dl_entity		dl;
6511da177e4SLinus Torvalds 
652e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS
6535eca1c10SIngo Molnar 	/* List of struct preempt_notifier: */
654e107be36SAvi Kivity 	struct hlist_head		preempt_notifiers;
655e107be36SAvi Kivity #endif
656e107be36SAvi Kivity 
6576c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE
6582056a782SJens Axboe 	unsigned int			btrace_seq;
6596c5c9341SAlexey Dobriyan #endif
6601da177e4SLinus Torvalds 
66197dc32cdSWilliam Cohen 	unsigned int			policy;
66229baa747SPeter Zijlstra 	int				nr_cpus_allowed;
6631da177e4SLinus Torvalds 	cpumask_t			cpus_allowed;
6641da177e4SLinus Torvalds 
665a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU
666e260be67SPaul E. McKenney 	int				rcu_read_lock_nesting;
6671d082fd0SPaul E. McKenney 	union rcu_special		rcu_read_unlock_special;
668f41d911fSPaul E. McKenney 	struct list_head		rcu_node_entry;
669a57eb940SPaul E. McKenney 	struct rcu_node			*rcu_blocked_node;
67028f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */
6715eca1c10SIngo Molnar 
6728315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU
6738315f422SPaul E. McKenney 	unsigned long			rcu_tasks_nvcsw;
674ccdd29ffSPaul E. McKenney 	u8				rcu_tasks_holdout;
675ccdd29ffSPaul E. McKenney 	u8				rcu_tasks_idx;
676176f8f7aSPaul E. McKenney 	int				rcu_tasks_idle_cpu;
677ccdd29ffSPaul E. McKenney 	struct list_head		rcu_tasks_holdout_list;
6788315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */
679e260be67SPaul E. McKenney 
6801da177e4SLinus Torvalds 	struct sched_info		sched_info;
6811da177e4SLinus Torvalds 
6821da177e4SLinus Torvalds 	struct list_head		tasks;
683806c09a7SDario Faggioli #ifdef CONFIG_SMP
684917b627dSGregory Haskins 	struct plist_node		pushable_tasks;
6851baca4ceSJuri Lelli 	struct rb_node			pushable_dl_tasks;
686806c09a7SDario Faggioli #endif
6871da177e4SLinus Torvalds 
6885eca1c10SIngo Molnar 	struct mm_struct		*mm;
6895eca1c10SIngo Molnar 	struct mm_struct		*active_mm;
690314ff785SIngo Molnar 
691314ff785SIngo Molnar 	/* Per-thread vma caching: */
692314ff785SIngo Molnar 	struct vmacache			vmacache;
693314ff785SIngo Molnar 
6945eca1c10SIngo Molnar #ifdef SPLIT_RSS_COUNTING
69534e55232SKAMEZAWA Hiroyuki 	struct task_rss_stat		rss_stat;
69634e55232SKAMEZAWA Hiroyuki #endif
69797dc32cdSWilliam Cohen 	int				exit_state;
6985eca1c10SIngo Molnar 	int				exit_code;
6995eca1c10SIngo Molnar 	int				exit_signal;
7005eca1c10SIngo Molnar 	/* The signal sent when the parent dies: */
7015eca1c10SIngo Molnar 	int				pdeath_signal;
7025eca1c10SIngo Molnar 	/* JOBCTL_*, siglock protected: */
7035eca1c10SIngo Molnar 	unsigned long			jobctl;
7049b89f6baSAndrei Epure 
7055eca1c10SIngo Molnar 	/* Used for emulating ABI behavior of previous Linux versions: */
70697dc32cdSWilliam Cohen 	unsigned int			personality;
7079b89f6baSAndrei Epure 
7085eca1c10SIngo Molnar 	/* Scheduler bits, serialized by scheduler locks: */
709ca94c442SLennart Poettering 	unsigned			sched_reset_on_fork:1;
710a8e4f2eaSPeter Zijlstra 	unsigned			sched_contributes_to_load:1;
711ff303e66SPeter Zijlstra 	unsigned			sched_migrated:1;
712b7e7ade3SPeter Zijlstra 	unsigned			sched_remote_wakeup:1;
7135eca1c10SIngo Molnar 	/* Force alignment to the next boundary: */
7145eca1c10SIngo Molnar 	unsigned			:0;
715be958bdcSPeter Zijlstra 
7165eca1c10SIngo Molnar 	/* Unserialized, strictly 'current' */
7175eca1c10SIngo Molnar 
7185eca1c10SIngo Molnar 	/* Bit to tell LSMs we're in execve(): */
7195eca1c10SIngo Molnar 	unsigned			in_execve:1;
720be958bdcSPeter Zijlstra 	unsigned			in_iowait:1;
7215eca1c10SIngo Molnar #ifndef TIF_RESTORE_SIGMASK
7227e781418SAndy Lutomirski 	unsigned			restore_sigmask:1;
7237e781418SAndy Lutomirski #endif
724626ebc41STejun Heo #ifdef CONFIG_MEMCG
725626ebc41STejun Heo 	unsigned			memcg_may_oom:1;
726127424c8SJohannes Weiner #ifndef CONFIG_SLOB
7276f185c29SVladimir Davydov 	unsigned			memcg_kmem_skip_account:1;
7286f185c29SVladimir Davydov #endif /* !CONFIG_SLOB */
729127424c8SJohannes Weiner #endif /* CONFIG_MEMCG */
730ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK
731ff303e66SPeter Zijlstra 	unsigned			brk_randomized:1;
732ff303e66SPeter Zijlstra #endif
73377f88796STejun Heo #ifdef CONFIG_CGROUPS
73477f88796STejun Heo 	/* disallow userland-initiated cgroup migration */
73577f88796STejun Heo 	unsigned			no_cgroup_migration:1;
73677f88796STejun Heo #endif
7376f185c29SVladimir Davydov 
7385eca1c10SIngo Molnar 	unsigned long			atomic_flags; /* Flags requiring atomic access. */
7391d4457f9SKees Cook 
740f56141e3SAndy Lutomirski 	struct restart_block		restart_block;
741f56141e3SAndy Lutomirski 
7421da177e4SLinus Torvalds 	pid_t				pid;
7431da177e4SLinus Torvalds 	pid_t				tgid;
7440a425405SArjan van de Ven 
745*050e9baaSLinus Torvalds #ifdef CONFIG_STACKPROTECTOR
7465eca1c10SIngo Molnar 	/* Canary value for the -fstack-protector GCC feature: */
7470a425405SArjan van de Ven 	unsigned long			stack_canary;
7481314562aSHiroshi Shimamoto #endif
7491da177e4SLinus Torvalds 	/*
7505eca1c10SIngo Molnar 	 * Process relationships: the parent pointers, the children/sibling
7511da177e4SLinus Torvalds 	 * lists and group_leader.  (p->father can be replaced with
752f470021aSRoland McGrath 	 * p->real_parent->pid)
7531da177e4SLinus Torvalds 	 */
7545eca1c10SIngo Molnar 
7555eca1c10SIngo Molnar 	/* Real parent process: */
7565eca1c10SIngo Molnar 	struct task_struct __rcu	*real_parent;
7575eca1c10SIngo Molnar 
7585eca1c10SIngo Molnar 	/* Recipient of SIGCHLD, wait4() reports: */
7595eca1c10SIngo Molnar 	struct task_struct __rcu	*parent;
7601da177e4SLinus Torvalds 
761f470021aSRoland McGrath 	/*
7625eca1c10SIngo Molnar 	 * Children/sibling form the list of natural children:
7635eca1c10SIngo Molnar 	 */
7645eca1c10SIngo Molnar 	struct list_head		children;
7655eca1c10SIngo Molnar 	struct list_head		sibling;
7665eca1c10SIngo Molnar 	struct task_struct		*group_leader;
7675eca1c10SIngo Molnar 
7685eca1c10SIngo Molnar 	/*
7695eca1c10SIngo Molnar 	 * 'ptraced' is the list of tasks this task is using ptrace() on.
7705eca1c10SIngo Molnar 	 *
771f470021aSRoland McGrath 	 * This includes both natural children and PTRACE_ATTACH targets.
7725eca1c10SIngo Molnar 	 * 'ptrace_entry' is this task's link on the p->parent->ptraced list.
773f470021aSRoland McGrath 	 */
774f470021aSRoland McGrath 	struct list_head		ptraced;
775f470021aSRoland McGrath 	struct list_head		ptrace_entry;
776f470021aSRoland McGrath 
7771da177e4SLinus Torvalds 	/* PID/PID hash table linkage. */
77892476d7fSEric W. Biederman 	struct pid_link			pids[PIDTYPE_MAX];
77947e65328SOleg Nesterov 	struct list_head		thread_group;
7800c740d0aSOleg Nesterov 	struct list_head		thread_node;
7811da177e4SLinus Torvalds 
7825eca1c10SIngo Molnar 	struct completion		*vfork_done;
7831da177e4SLinus Torvalds 
7845eca1c10SIngo Molnar 	/* CLONE_CHILD_SETTID: */
7855eca1c10SIngo Molnar 	int __user			*set_child_tid;
7865eca1c10SIngo Molnar 
7875eca1c10SIngo Molnar 	/* CLONE_CHILD_CLEARTID: */
7885eca1c10SIngo Molnar 	int __user			*clear_child_tid;
7895eca1c10SIngo Molnar 
7905eca1c10SIngo Molnar 	u64				utime;
7915eca1c10SIngo Molnar 	u64				stime;
79240565b5aSStanislaw Gruszka #ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME
7935eca1c10SIngo Molnar 	u64				utimescaled;
7945eca1c10SIngo Molnar 	u64				stimescaled;
79540565b5aSStanislaw Gruszka #endif
79616a6d9beSFrederic Weisbecker 	u64				gtime;
7979d7fb042SPeter Zijlstra 	struct prev_cputime		prev_cputime;
7986a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
799bac5b6b6SFrederic Weisbecker 	struct vtime			vtime;
8006a61671bSFrederic Weisbecker #endif
801d027d45dSFrederic Weisbecker 
802d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL
803f009a7a7SFrederic Weisbecker 	atomic_t			tick_dep_mask;
804d027d45dSFrederic Weisbecker #endif
8055eca1c10SIngo Molnar 	/* Context switch counts: */
8065eca1c10SIngo Molnar 	unsigned long			nvcsw;
8075eca1c10SIngo Molnar 	unsigned long			nivcsw;
8085eca1c10SIngo Molnar 
8095eca1c10SIngo Molnar 	/* Monotonic time in nsecs: */
8105eca1c10SIngo Molnar 	u64				start_time;
8115eca1c10SIngo Molnar 
8125eca1c10SIngo Molnar 	/* Boot based time in nsecs: */
8135eca1c10SIngo Molnar 	u64				real_start_time;
8145eca1c10SIngo Molnar 
8155eca1c10SIngo Molnar 	/* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */
8165eca1c10SIngo Molnar 	unsigned long			min_flt;
8175eca1c10SIngo Molnar 	unsigned long			maj_flt;
8181da177e4SLinus Torvalds 
819b18b6a9cSNicolas Pitre #ifdef CONFIG_POSIX_TIMERS
820f06febc9SFrank Mayhar 	struct task_cputime		cputime_expires;
8211da177e4SLinus Torvalds 	struct list_head		cpu_timers[3];
822b18b6a9cSNicolas Pitre #endif
8231da177e4SLinus Torvalds 
8245eca1c10SIngo Molnar 	/* Process credentials: */
8255eca1c10SIngo Molnar 
8265eca1c10SIngo Molnar 	/* Tracer's credentials at attach: */
8275eca1c10SIngo Molnar 	const struct cred __rcu		*ptracer_cred;
8285eca1c10SIngo Molnar 
8295eca1c10SIngo Molnar 	/* Objective and real subjective task credentials (COW): */
8305eca1c10SIngo Molnar 	const struct cred __rcu		*real_cred;
8315eca1c10SIngo Molnar 
8325eca1c10SIngo Molnar 	/* Effective (overridable) subjective task credentials (COW): */
8335eca1c10SIngo Molnar 	const struct cred __rcu		*cred;
8345eca1c10SIngo Molnar 
8355eca1c10SIngo Molnar 	/*
8365eca1c10SIngo Molnar 	 * executable name, excluding path.
8375eca1c10SIngo Molnar 	 *
8385eca1c10SIngo Molnar 	 * - normally initialized by setup_new_exec()
8395eca1c10SIngo Molnar 	 * - access it with [gs]et_task_comm()
8405eca1c10SIngo Molnar 	 * - lock it with task_lock()
8415eca1c10SIngo Molnar 	 */
8425eca1c10SIngo Molnar 	char				comm[TASK_COMM_LEN];
8435eca1c10SIngo Molnar 
844756daf26SNeilBrown 	struct nameidata		*nameidata;
8455eca1c10SIngo Molnar 
8463d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC
8471da177e4SLinus Torvalds 	struct sysv_sem			sysvsem;
848ab602f79SJack Miller 	struct sysv_shm			sysvshm;
8493d5b6fccSAlexey Dobriyan #endif
850e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK
85182a1fcb9SIngo Molnar 	unsigned long			last_switch_count;
85282a1fcb9SIngo Molnar #endif
8535eca1c10SIngo Molnar 	/* Filesystem information: */
8541da177e4SLinus Torvalds 	struct fs_struct		*fs;
8555eca1c10SIngo Molnar 
8565eca1c10SIngo Molnar 	/* Open file information: */
8571da177e4SLinus Torvalds 	struct files_struct		*files;
8585eca1c10SIngo Molnar 
8595eca1c10SIngo Molnar 	/* Namespaces: */
860ab516013SSerge E. Hallyn 	struct nsproxy			*nsproxy;
8615eca1c10SIngo Molnar 
8625eca1c10SIngo Molnar 	/* Signal handlers: */
8631da177e4SLinus Torvalds 	struct signal_struct		*signal;
8641da177e4SLinus Torvalds 	struct sighand_struct		*sighand;
8655eca1c10SIngo Molnar 	sigset_t			blocked;
8665eca1c10SIngo Molnar 	sigset_t			real_blocked;
8675eca1c10SIngo Molnar 	/* Restored if set_restore_sigmask() was used: */
8685eca1c10SIngo Molnar 	sigset_t			saved_sigmask;
8691da177e4SLinus Torvalds 	struct sigpending		pending;
8701da177e4SLinus Torvalds 	unsigned long			sas_ss_sp;
8711da177e4SLinus Torvalds 	size_t				sas_ss_size;
8725eca1c10SIngo Molnar 	unsigned int			sas_ss_flags;
8732e01fabeSOleg Nesterov 
87467d12145SAl Viro 	struct callback_head		*task_works;
875e73f8959SOleg Nesterov 
8761da177e4SLinus Torvalds 	struct audit_context		*audit_context;
877bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL
878e1760bd5SEric W. Biederman 	kuid_t				loginuid;
8794746ec5bSEric Paris 	unsigned int			sessionid;
880bfef93a5SAl Viro #endif
881932ecebbSWill Drewry 	struct seccomp			seccomp;
8821da177e4SLinus Torvalds 
8835eca1c10SIngo Molnar 	/* Thread group tracking: */
8841da177e4SLinus Torvalds 	u32				parent_exec_id;
8851da177e4SLinus Torvalds 	u32				self_exec_id;
8865eca1c10SIngo Molnar 
8875eca1c10SIngo Molnar 	/* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */
8881da177e4SLinus Torvalds 	spinlock_t			alloc_lock;
8891da177e4SLinus Torvalds 
890b29739f9SIngo Molnar 	/* Protection of the PI data structures: */
8911d615482SThomas Gleixner 	raw_spinlock_t			pi_lock;
892b29739f9SIngo Molnar 
89376751049SPeter Zijlstra 	struct wake_q_node		wake_q;
89476751049SPeter Zijlstra 
89523f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES
8965eca1c10SIngo Molnar 	/* PI waiters blocked on a rt_mutex held by this task: */
897a23ba907SDavidlohr Bueso 	struct rb_root_cached		pi_waiters;
898e96a7705SXunlei Pang 	/* Updated under owner's pi_lock and rq lock */
899e96a7705SXunlei Pang 	struct task_struct		*pi_top_task;
9005eca1c10SIngo Molnar 	/* Deadlock detection and priority inheritance handling: */
90123f78d4aSIngo Molnar 	struct rt_mutex_waiter		*pi_blocked_on;
90223f78d4aSIngo Molnar #endif
90323f78d4aSIngo Molnar 
904408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES
9055eca1c10SIngo Molnar 	/* Mutex deadlock detection: */
906408894eeSIngo Molnar 	struct mutex_waiter		*blocked_on;
907408894eeSIngo Molnar #endif
9085eca1c10SIngo Molnar 
909de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS
910de30a2b3SIngo Molnar 	unsigned int			irq_events;
911de30a2b3SIngo Molnar 	unsigned long			hardirq_enable_ip;
912de30a2b3SIngo Molnar 	unsigned long			hardirq_disable_ip;
913fa1452e8SHiroshi Shimamoto 	unsigned int			hardirq_enable_event;
914de30a2b3SIngo Molnar 	unsigned int			hardirq_disable_event;
915fa1452e8SHiroshi Shimamoto 	int				hardirqs_enabled;
916de30a2b3SIngo Molnar 	int				hardirq_context;
917fa1452e8SHiroshi Shimamoto 	unsigned long			softirq_disable_ip;
918fa1452e8SHiroshi Shimamoto 	unsigned long			softirq_enable_ip;
919fa1452e8SHiroshi Shimamoto 	unsigned int			softirq_disable_event;
920fa1452e8SHiroshi Shimamoto 	unsigned int			softirq_enable_event;
921fa1452e8SHiroshi Shimamoto 	int				softirqs_enabled;
922de30a2b3SIngo Molnar 	int				softirq_context;
923de30a2b3SIngo Molnar #endif /* CONFIG_TRACE_IRQFLAGS */
9245eca1c10SIngo Molnar 
925fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP
926bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH			48UL
927fbb9ce95SIngo Molnar 	u64				curr_chain_key;
928fbb9ce95SIngo Molnar 	int				lockdep_depth;
929fbb9ce95SIngo Molnar 	unsigned int			lockdep_recursion;
930c7aceabaSRichard Kennedy 	struct held_lock		held_locks[MAX_LOCK_DEPTH];
931fbb9ce95SIngo Molnar #endif /* CONFIG_LOCKDEP */
9325eca1c10SIngo Molnar 
933c6d30853SAndrey Ryabinin #ifdef CONFIG_UBSAN
934c6d30853SAndrey Ryabinin 	unsigned int			in_ubsan;
935c6d30853SAndrey Ryabinin #endif
936408894eeSIngo Molnar 
9375eca1c10SIngo Molnar 	/* Journalling filesystem info: */
9381da177e4SLinus Torvalds 	void				*journal_info;
9391da177e4SLinus Torvalds 
9405eca1c10SIngo Molnar 	/* Stacked block device info: */
941bddd87c7SAkinobu Mita 	struct bio_list			*bio_list;
942d89d8796SNeil Brown 
94373c10101SJens Axboe #ifdef CONFIG_BLOCK
9445eca1c10SIngo Molnar 	/* Stack plugging: */
94573c10101SJens Axboe 	struct blk_plug			*plug;
94673c10101SJens Axboe #endif
94773c10101SJens Axboe 
9485eca1c10SIngo Molnar 	/* VM state: */
9491da177e4SLinus Torvalds 	struct reclaim_state		*reclaim_state;
9501da177e4SLinus Torvalds 
9511da177e4SLinus Torvalds 	struct backing_dev_info		*backing_dev_info;
9521da177e4SLinus Torvalds 
9531da177e4SLinus Torvalds 	struct io_context		*io_context;
9541da177e4SLinus Torvalds 
9555eca1c10SIngo Molnar 	/* Ptrace state: */
9561da177e4SLinus Torvalds 	unsigned long			ptrace_message;
9575eca1c10SIngo Molnar 	siginfo_t			*last_siginfo;
9585eca1c10SIngo Molnar 
9597c3ab738SAndrew Morton 	struct task_io_accounting	ioac;
9605eca1c10SIngo Molnar #ifdef CONFIG_TASK_XACCT
9615eca1c10SIngo Molnar 	/* Accumulated RSS usage: */
9625eca1c10SIngo Molnar 	u64				acct_rss_mem1;
9635eca1c10SIngo Molnar 	/* Accumulated virtual memory usage: */
9645eca1c10SIngo Molnar 	u64				acct_vm_mem1;
9655eca1c10SIngo Molnar 	/* stime + utime since last update: */
9665eca1c10SIngo Molnar 	u64				acct_timexpd;
9671da177e4SLinus Torvalds #endif
9681da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS
9695eca1c10SIngo Molnar 	/* Protected by ->alloc_lock: */
9705eca1c10SIngo Molnar 	nodemask_t			mems_allowed;
9715eca1c10SIngo Molnar 	/* Sequence number to catch updates: */
9725eca1c10SIngo Molnar 	seqcount_t			mems_allowed_seq;
973825a46afSPaul Jackson 	int				cpuset_mem_spread_rotor;
9746adef3ebSJack Steiner 	int				cpuset_slab_spread_rotor;
9751da177e4SLinus Torvalds #endif
976ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS
9775eca1c10SIngo Molnar 	/* Control Group info protected by css_set_lock: */
9782c392b8cSArnd Bergmann 	struct css_set __rcu		*cgroups;
9795eca1c10SIngo Molnar 	/* cg_list protected by css_set_lock and tsk->alloc_lock: */
980817929ecSPaul Menage 	struct list_head		cg_list;
981ddbcc7e8SPaul Menage #endif
982f01d7d51SVikas Shivappa #ifdef CONFIG_INTEL_RDT
9830734ded1SVikas Shivappa 	u32				closid;
984d6aaba61SVikas Shivappa 	u32				rmid;
985e02737d5SFenghua Yu #endif
98642b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX
9870771dfefSIngo Molnar 	struct robust_list_head __user	*robust_list;
98834f192c6SIngo Molnar #ifdef CONFIG_COMPAT
98934f192c6SIngo Molnar 	struct compat_robust_list_head __user *compat_robust_list;
99034f192c6SIngo Molnar #endif
991c87e2837SIngo Molnar 	struct list_head		pi_state_list;
992c87e2837SIngo Molnar 	struct futex_pi_state		*pi_state_cache;
99342b2dd0aSAlexey Dobriyan #endif
994cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS
	/* One slot per enum perf_event_task_context value (sized by perf_nr_task_contexts): */
9958dc85d54SPeter Zijlstra 	struct perf_event_context	*perf_event_ctxp[perf_nr_task_contexts];
996cdd6c482SIngo Molnar 	struct mutex			perf_event_mutex;
997cdd6c482SIngo Molnar 	struct list_head		perf_event_list;
998a63eaf34SPaul Mackerras #endif
9998f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT
10008f47b187SThomas Gleixner 	unsigned long			preempt_disable_ip;
10018f47b187SThomas Gleixner #endif
1002c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA
10035eca1c10SIngo Molnar 	/* Protected by alloc_lock: */
10045eca1c10SIngo Molnar 	struct mempolicy		*mempolicy;
100545816682SVlastimil Babka 	short				il_prev;
1006207205a2SEric Dumazet 	short				pref_node_fork;
1007c7aceabaSRichard Kennedy #endif
1008cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING
1009cbee9f88SPeter Zijlstra 	int				numa_scan_seq;
1010cbee9f88SPeter Zijlstra 	unsigned int			numa_scan_period;
1011598f0ec0SMel Gorman 	unsigned int			numa_scan_period_max;
1012de1c9ce6SRik van Riel 	int				numa_preferred_nid;
10136b9a7460SMel Gorman 	unsigned long			numa_migrate_retry;
10145eca1c10SIngo Molnar 	/* Migration stamp: */
10155eca1c10SIngo Molnar 	u64				node_stamp;
10167e2703e6SRik van Riel 	u64				last_task_numa_placement;
10177e2703e6SRik van Riel 	u64				last_sum_exec_runtime;
1018cbee9f88SPeter Zijlstra 	struct callback_head		numa_work;
1019f809ca9aSMel Gorman 
10208c8a743cSPeter Zijlstra 	struct list_head		numa_entry;
10218c8a743cSPeter Zijlstra 	struct numa_group		*numa_group;
10228c8a743cSPeter Zijlstra 
1023745d6147SMel Gorman 	/*
102444dba3d5SIulia Manda 	 * numa_faults is an array split into four regions:
102544dba3d5SIulia Manda 	 * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer
102644dba3d5SIulia Manda 	 * in this precise order.
102744dba3d5SIulia Manda 	 *
102844dba3d5SIulia Manda 	 * faults_memory: Exponential decaying average of faults on a per-node
102944dba3d5SIulia Manda 	 * basis. Scheduling placement decisions are made based on these
103044dba3d5SIulia Manda 	 * counts. The values remain static for the duration of a PTE scan.
103144dba3d5SIulia Manda 	 * faults_cpu: Track the nodes the process was running on when a NUMA
103244dba3d5SIulia Manda 	 * hinting fault was incurred.
103344dba3d5SIulia Manda 	 * faults_memory_buffer and faults_cpu_buffer: Record faults per node
103444dba3d5SIulia Manda 	 * during the current scan window. When the scan completes, the counts
103544dba3d5SIulia Manda 	 * in faults_memory and faults_cpu decay and these values are copied.
1036745d6147SMel Gorman 	 */
103744dba3d5SIulia Manda 	unsigned long			*numa_faults;
103883e1d2cdSMel Gorman 	unsigned long			total_numa_faults;
1039745d6147SMel Gorman 
1040745d6147SMel Gorman 	/*
104104bb2f94SRik van Riel 	 * numa_faults_locality tracks if faults recorded during the last
1042074c2381SMel Gorman 	 * scan window were remote/local or failed to migrate. The task scan
1043074c2381SMel Gorman 	 * period is adapted based on the locality of the faults with different
1044074c2381SMel Gorman 	 * weights depending on whether they were shared or private faults
104504bb2f94SRik van Riel 	 */
1046074c2381SMel Gorman 	unsigned long			numa_faults_locality[3];
104704bb2f94SRik van Riel 
1048b32e86b4SIngo Molnar 	unsigned long			numa_pages_migrated;
1049cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */
1050cbee9f88SPeter Zijlstra 
1051d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ
1052d7822b1eSMathieu Desnoyers 	struct rseq __user *rseq;
1053d7822b1eSMathieu Desnoyers 	u32 rseq_len;
1054d7822b1eSMathieu Desnoyers 	u32 rseq_sig;
1055d7822b1eSMathieu Desnoyers 	/*
1056d7822b1eSMathieu Desnoyers 	 * RmW on rseq_event_mask must be performed atomically
1057d7822b1eSMathieu Desnoyers 	 * with respect to preemption.
1058d7822b1eSMathieu Desnoyers 	 */
1059d7822b1eSMathieu Desnoyers 	unsigned long rseq_event_mask;
1060d7822b1eSMathieu Desnoyers #endif
1061d7822b1eSMathieu Desnoyers 
106272b252aeSMel Gorman 	struct tlbflush_unmap_batch	tlb_ubc;
106372b252aeSMel Gorman 
1064e56d0903SIngo Molnar 	struct rcu_head			rcu;
1065b92ce558SJens Axboe 
10665eca1c10SIngo Molnar 	/* Cache last used pipe for splice(): */
1067b92ce558SJens Axboe 	struct pipe_inode_info		*splice_pipe;
10685640f768SEric Dumazet 
10695640f768SEric Dumazet 	struct page_frag		task_frag;
10705640f768SEric Dumazet 
1071ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT
1072ca74e92bSShailabh Nagar 	struct task_delay_info		*delays;
1073ca74e92bSShailabh Nagar #endif
107447913d4eSIngo Molnar 
1075f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION
1076f4f154fdSAkinobu Mita 	int				make_it_fail;
10779049f2f6SAkinobu Mita 	unsigned int			fail_nth;
1078f4f154fdSAkinobu Mita #endif
10799d823e8fSWu Fengguang 	/*
10805eca1c10SIngo Molnar 	 * When (nr_dirtied >= nr_dirtied_pause), it's time to call
10815eca1c10SIngo Molnar 	 * balance_dirty_pages() for a dirty throttling pause:
10829d823e8fSWu Fengguang 	 */
10839d823e8fSWu Fengguang 	int				nr_dirtied;
10849d823e8fSWu Fengguang 	int				nr_dirtied_pause;
10855eca1c10SIngo Molnar 	/* Start of a write-and-pause period: */
10865eca1c10SIngo Molnar 	unsigned long			dirty_paused_when;
10879d823e8fSWu Fengguang 
10889745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP
10899745512cSArjan van de Ven 	int				latency_record_count;
10909745512cSArjan van de Ven 	struct latency_record		latency_record[LT_SAVECOUNT];
10919745512cSArjan van de Ven #endif
10926976675dSArjan van de Ven 	/*
10935eca1c10SIngo Molnar 	 * Time slack values; these are used to round up poll() and
10946976675dSArjan van de Ven 	 * select() etc timeout values. These are in nanoseconds.
10956976675dSArjan van de Ven 	 */
1096da8b44d5SJohn Stultz 	u64				timer_slack_ns;
1097da8b44d5SJohn Stultz 	u64				default_timer_slack_ns;
1098f8d570a4SDavid Miller 
10990b24beccSAndrey Ryabinin #ifdef CONFIG_KASAN
11000b24beccSAndrey Ryabinin 	unsigned int			kasan_depth;
11010b24beccSAndrey Ryabinin #endif
11025eca1c10SIngo Molnar 
1103fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER
11045eca1c10SIngo Molnar 	/* Index of current stored address in ret_stack: */
1105f201ae23SFrederic Weisbecker 	int				curr_ret_stack;
11065eca1c10SIngo Molnar 
11075eca1c10SIngo Molnar 	/* Stack of return addresses for return function tracing: */
1108f201ae23SFrederic Weisbecker 	struct ftrace_ret_stack		*ret_stack;
11095eca1c10SIngo Molnar 
11105eca1c10SIngo Molnar 	/* Timestamp for last schedule: */
11118aef2d28SSteven Rostedt 	unsigned long long		ftrace_timestamp;
11125eca1c10SIngo Molnar 
1113f201ae23SFrederic Weisbecker 	/*
1114f201ae23SFrederic Weisbecker 	 * Number of functions that haven't been traced
11155eca1c10SIngo Molnar 	 * because of depth overrun:
1116f201ae23SFrederic Weisbecker 	 */
1117f201ae23SFrederic Weisbecker 	atomic_t			trace_overrun;
11185eca1c10SIngo Molnar 
11195eca1c10SIngo Molnar 	/* Pause tracing: */
1120380c4b14SFrederic Weisbecker 	atomic_t			tracing_graph_pause;
1121f201ae23SFrederic Weisbecker #endif /* CONFIG_FUNCTION_GRAPH_TRACER */
11225eca1c10SIngo Molnar 
1123ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING
11245eca1c10SIngo Molnar 	/* State flags for use by tracers: */
1125ea4e2bc4SSteven Rostedt 	unsigned long			trace;
11265eca1c10SIngo Molnar 
11275eca1c10SIngo Molnar 	/* Bitmask and counter of trace recursion: */
1128261842b7SSteven Rostedt 	unsigned long			trace_recursion;
1129261842b7SSteven Rostedt #endif /* CONFIG_TRACING */
11305eca1c10SIngo Molnar 
11315c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV
11325eca1c10SIngo Molnar 	/* Coverage collection mode enabled for this task (0 if disabled): */
11335c9a8750SDmitry Vyukov 	enum kcov_mode			kcov_mode;
11345eca1c10SIngo Molnar 
11355eca1c10SIngo Molnar 	/* Size of the kcov_area: */
11365eca1c10SIngo Molnar 	unsigned int			kcov_size;
11375eca1c10SIngo Molnar 
11385eca1c10SIngo Molnar 	/* Buffer for coverage collection: */
11395c9a8750SDmitry Vyukov 	void				*kcov_area;
11405eca1c10SIngo Molnar 
11415eca1c10SIngo Molnar 	/* KCOV descriptor wired with this task or NULL: */
11425c9a8750SDmitry Vyukov 	struct kcov			*kcov;
11435c9a8750SDmitry Vyukov #endif /* CONFIG_KCOV */
11445eca1c10SIngo Molnar 
11456f185c29SVladimir Davydov #ifdef CONFIG_MEMCG
1146626ebc41STejun Heo 	struct mem_cgroup		*memcg_in_oom;
1147626ebc41STejun Heo 	gfp_t				memcg_oom_gfp_mask;
1148626ebc41STejun Heo 	int				memcg_oom_order;
1149b23afb93STejun Heo 
11505eca1c10SIngo Molnar 	/* Number of pages to reclaim on returning to userland: */
1151b23afb93STejun Heo 	unsigned int			memcg_nr_pages_over_high;
1152569b846dSKAMEZAWA Hiroyuki #endif /* CONFIG_MEMCG */
11535eca1c10SIngo Molnar 
11540326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES
11550326f5a9SSrikar Dronamraju 	struct uprobe_task		*utask;
11560326f5a9SSrikar Dronamraju #endif
1157cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE)
1158cafe5635SKent Overstreet 	unsigned int			sequential_io;
1159cafe5635SKent Overstreet 	unsigned int			sequential_io_avg;
1160cafe5635SKent Overstreet #endif
11618eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
11628eb23b9fSPeter Zijlstra 	unsigned long			task_state_change;
11638eb23b9fSPeter Zijlstra #endif
11648bcbde54SDavid Hildenbrand 	int				pagefault_disabled;
116503049269SMichal Hocko #ifdef CONFIG_MMU
116629c696e1SVladimir Davydov 	struct task_struct		*oom_reaper_list;
116703049269SMichal Hocko #endif
1168ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK
1169ba14a194SAndy Lutomirski 	struct vm_struct		*stack_vm_area;
1170ba14a194SAndy Lutomirski #endif
117168f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
11725eca1c10SIngo Molnar 	/* A live task holds one reference: */
117368f24b08SAndy Lutomirski 	atomic_t			stack_refcount;
117468f24b08SAndy Lutomirski #endif
1175d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH
1176d83a7cb3SJosh Poimboeuf 	int patch_state;
1177d83a7cb3SJosh Poimboeuf #endif
1178e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY
1179e4e55b47STetsuo Handa 	/* Used by LSM modules for access restriction: */
1180e4e55b47STetsuo Handa 	void				*security;
1181e4e55b47STetsuo Handa #endif
118229e48ce8SKees Cook 
118329e48ce8SKees Cook 	/*
118429e48ce8SKees Cook 	 * New fields for task_struct should be added above here, so that
118529e48ce8SKees Cook 	 * they are included in the randomized portion of task_struct.
118629e48ce8SKees Cook 	 */
118729e48ce8SKees Cook 	randomized_struct_fields_end
118829e48ce8SKees Cook 
11895eca1c10SIngo Molnar 	/* CPU-specific state of this task: */
11900c8c0f03SDave Hansen 	struct thread_struct		thread;
11915eca1c10SIngo Molnar 
11920c8c0f03SDave Hansen 	/*
11930c8c0f03SDave Hansen 	 * WARNING: on x86, 'thread_struct' contains a variable-sized
11940c8c0f03SDave Hansen 	 * structure.  It *MUST* be at the end of 'task_struct'.
11950c8c0f03SDave Hansen 	 *
11960c8c0f03SDave Hansen 	 * Do not put anything below here!
11970c8c0f03SDave Hansen 	 */
11981da177e4SLinus Torvalds };
11991da177e4SLinus Torvalds 
1200e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task)
120122c935f4SEric W. Biederman {
120222c935f4SEric W. Biederman 	return task->pids[PIDTYPE_PID].pid;
120322c935f4SEric W. Biederman }
120422c935f4SEric W. Biederman 
1205e868171aSAlexey Dobriyan static inline struct pid *task_tgid(struct task_struct *task)
120622c935f4SEric W. Biederman {
120722c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_PID].pid;
120822c935f4SEric W. Biederman }
120922c935f4SEric W. Biederman 
12106dda81f4SOleg Nesterov /*
12115eca1c10SIngo Molnar  * Without tasklist or RCU lock it is not safe to dereference
12126dda81f4SOleg Nesterov  * the result of task_pgrp/task_session even if task == current,
12136dda81f4SOleg Nesterov  * we can race with another thread doing sys_setsid/sys_setpgid.
12146dda81f4SOleg Nesterov  */
1215e868171aSAlexey Dobriyan static inline struct pid *task_pgrp(struct task_struct *task)
121622c935f4SEric W. Biederman {
121722c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_PGID].pid;
121822c935f4SEric W. Biederman }
121922c935f4SEric W. Biederman 
1220e868171aSAlexey Dobriyan static inline struct pid *task_session(struct task_struct *task)
122122c935f4SEric W. Biederman {
122222c935f4SEric W. Biederman 	return task->group_leader->pids[PIDTYPE_SID].pid;
122322c935f4SEric W. Biederman }
122422c935f4SEric W. Biederman 
/*
 * Helpers to get a task's different ids as they are seen from various
 * pid namespaces:
 *
 * task_xid_nr()     : global id, i.e. the id seen from the init namespace;
 * task_xid_vnr()    : virtual id, i.e. the id seen from the pid namespace of
 *                     current;
 * task_xid_nr_ns()  : id seen from the ns specified.
 *
 * See also pid_nr() etc. in include/linux/pid.h
 */
12365eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns);
12377af57294SPavel Emelyanov 
1238e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk)
12397af57294SPavel Emelyanov {
12407af57294SPavel Emelyanov 	return tsk->pid;
12417af57294SPavel Emelyanov }
12427af57294SPavel Emelyanov 
12435eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
124452ee2dfdSOleg Nesterov {
124552ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
124652ee2dfdSOleg Nesterov }
12477af57294SPavel Emelyanov 
12487af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk)
12497af57294SPavel Emelyanov {
125052ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
12517af57294SPavel Emelyanov }
12527af57294SPavel Emelyanov 
12537af57294SPavel Emelyanov 
1254e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk)
12557af57294SPavel Emelyanov {
12567af57294SPavel Emelyanov 	return tsk->tgid;
12577af57294SPavel Emelyanov }
12587af57294SPavel Emelyanov 
12595eca1c10SIngo Molnar /**
12605eca1c10SIngo Molnar  * pid_alive - check that a task structure is not stale
12615eca1c10SIngo Molnar  * @p: Task structure to be checked.
12625eca1c10SIngo Molnar  *
12635eca1c10SIngo Molnar  * Test if a process is not yet dead (at most zombie state)
12645eca1c10SIngo Molnar  * If pid_alive fails, then pointers within the task structure
12655eca1c10SIngo Molnar  * can be stale and must not be dereferenced.
12665eca1c10SIngo Molnar  *
12675eca1c10SIngo Molnar  * Return: 1 if the process is alive. 0 otherwise.
12685eca1c10SIngo Molnar  */
12695eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p)
12705eca1c10SIngo Molnar {
12715eca1c10SIngo Molnar 	return p->pids[PIDTYPE_PID].pid != NULL;
12725eca1c10SIngo Molnar }
12737af57294SPavel Emelyanov 
12745eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
12757af57294SPavel Emelyanov {
127652ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
12777af57294SPavel Emelyanov }
12787af57294SPavel Emelyanov 
12797af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
12807af57294SPavel Emelyanov {
128152ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
12827af57294SPavel Emelyanov }
12837af57294SPavel Emelyanov 
12847af57294SPavel Emelyanov 
12855eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
12867af57294SPavel Emelyanov {
128752ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
12887af57294SPavel Emelyanov }
12897af57294SPavel Emelyanov 
12907af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk)
12917af57294SPavel Emelyanov {
129252ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
12937af57294SPavel Emelyanov }
12947af57294SPavel Emelyanov 
1295dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
1296dd1c1f2fSOleg Nesterov {
1297dd1c1f2fSOleg Nesterov 	return __task_pid_nr_ns(tsk, __PIDTYPE_TGID, ns);
1298dd1c1f2fSOleg Nesterov }
1299dd1c1f2fSOleg Nesterov 
1300dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk)
1301dd1c1f2fSOleg Nesterov {
1302dd1c1f2fSOleg Nesterov 	return __task_pid_nr_ns(tsk, __PIDTYPE_TGID, NULL);
1303dd1c1f2fSOleg Nesterov }
1304dd1c1f2fSOleg Nesterov 
1305dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns)
1306dd1c1f2fSOleg Nesterov {
1307dd1c1f2fSOleg Nesterov 	pid_t pid = 0;
1308dd1c1f2fSOleg Nesterov 
1309dd1c1f2fSOleg Nesterov 	rcu_read_lock();
1310dd1c1f2fSOleg Nesterov 	if (pid_alive(tsk))
1311dd1c1f2fSOleg Nesterov 		pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns);
1312dd1c1f2fSOleg Nesterov 	rcu_read_unlock();
1313dd1c1f2fSOleg Nesterov 
1314dd1c1f2fSOleg Nesterov 	return pid;
1315dd1c1f2fSOleg Nesterov }
1316dd1c1f2fSOleg Nesterov 
1317dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk)
1318dd1c1f2fSOleg Nesterov {
1319dd1c1f2fSOleg Nesterov 	return task_ppid_nr_ns(tsk, &init_pid_ns);
1320dd1c1f2fSOleg Nesterov }
1321dd1c1f2fSOleg Nesterov 
13225eca1c10SIngo Molnar /* Obsolete, do not use: */
13231b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk)
13241b0f7ffdSOleg Nesterov {
13251b0f7ffdSOleg Nesterov 	return task_pgrp_nr_ns(tsk, &init_pid_ns);
13261b0f7ffdSOleg Nesterov }
13277af57294SPavel Emelyanov 
132806eb6184SPeter Zijlstra #define TASK_REPORT_IDLE	(TASK_REPORT + 1)
132906eb6184SPeter Zijlstra #define TASK_REPORT_MAX		(TASK_REPORT_IDLE << 1)
133006eb6184SPeter Zijlstra 
13311d48b080SPeter Zijlstra static inline unsigned int task_state_index(struct task_struct *tsk)
133220435d84SXie XiuQi {
13331593baabSPeter Zijlstra 	unsigned int tsk_state = READ_ONCE(tsk->state);
13341593baabSPeter Zijlstra 	unsigned int state = (tsk_state | tsk->exit_state) & TASK_REPORT;
133520435d84SXie XiuQi 
133606eb6184SPeter Zijlstra 	BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX);
133706eb6184SPeter Zijlstra 
133806eb6184SPeter Zijlstra 	if (tsk_state == TASK_IDLE)
133906eb6184SPeter Zijlstra 		state = TASK_REPORT_IDLE;
134006eb6184SPeter Zijlstra 
13411593baabSPeter Zijlstra 	return fls(state);
13421593baabSPeter Zijlstra }
134320435d84SXie XiuQi 
13441d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state)
13451593baabSPeter Zijlstra {
13468ef9925bSPeter Zijlstra 	static const char state_char[] = "RSDTtXZPI";
13471593baabSPeter Zijlstra 
134806eb6184SPeter Zijlstra 	BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1);
13491593baabSPeter Zijlstra 
13501593baabSPeter Zijlstra 	return state_char[state];
13511593baabSPeter Zijlstra }
13521593baabSPeter Zijlstra 
/* Return the one-letter state code for @tsk's current state. */
static inline char task_state_to_char(struct task_struct *tsk)
{
	unsigned int idx = task_state_index(tsk);

	return task_index_to_char(idx);
}
135720435d84SXie XiuQi 
13581da177e4SLinus Torvalds /**
1359570f5241SSergey Senozhatsky  * is_global_init - check if a task structure is init. Since init
1360570f5241SSergey Senozhatsky  * is free to have sub-threads we need to check tgid.
13613260259fSHenne  * @tsk: Task structure to be checked.
13623260259fSHenne  *
13633260259fSHenne  * Check if a task structure is the first user space task the kernel created.
1364e69f6186SYacine Belkadi  *
1365e69f6186SYacine Belkadi  * Return: 1 if the task structure is init. 0 otherwise.
1366f400e198SSukadev Bhattiprolu  */
1367e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk)
1368b461cc03SPavel Emelyanov {
1369570f5241SSergey Senozhatsky 	return task_tgid_nr(tsk) == 1;
1370b461cc03SPavel Emelyanov }
1371b460cbc5SSerge E. Hallyn 
13729ec52099SCedric Le Goater extern struct pid *cad_pid;
13739ec52099SCedric Le Goater 
/*
 * Per process flags.
 *
 * Each PF_* constant is a single bit. Bits 0x00000001, 0x01000000,
 * 0x02000000 and 0x10000000 have no name in this list.
 */
#define PF_IDLE			0x00000002	/* Task is an IDLE thread */
#define PF_EXITING		0x00000004	/* Task is getting shut down */
#define PF_EXITPIDONE		0x00000008	/* PI exit is done on shut down */
#define PF_VCPU			0x00000010	/* Task is a virtual CPU */
#define PF_WQ_WORKER		0x00000020	/* Task is a workqueue worker */
#define PF_FORKNOEXEC		0x00000040	/* Forked, but has not exec'ed */
#define PF_MCE_PROCESS		0x00000080	/* Process policy on mce errors */
#define PF_SUPERPRIV		0x00000100	/* Has used super-user privileges */
#define PF_DUMPCORE		0x00000200	/* Has dumped core */
#define PF_SIGNALED		0x00000400	/* Was killed by a signal */
#define PF_MEMALLOC		0x00000800	/* Is allocating memory */
#define PF_NPROC_EXCEEDED	0x00001000	/* set_user() saw RLIMIT_NPROC exceeded */
#define PF_USED_MATH		0x00002000	/* When unset, the fpu must be initialized before use */
#define PF_USED_ASYNC		0x00004000	/* Has used async_schedule*(); used by module init */
#define PF_NOFREEZE		0x00008000	/* Thread should not be frozen */
#define PF_FROZEN		0x00010000	/* Frozen for system suspend */
#define PF_KSWAPD		0x00020000	/* Task is kswapd */
#define PF_MEMALLOC_NOFS	0x00040000	/* Every allocation request inherits GFP_NOFS */
#define PF_MEMALLOC_NOIO	0x00080000	/* Every allocation request inherits GFP_NOIO */
#define PF_LESS_THROTTLE	0x00100000	/* Throttle less: task cleans memory */
#define PF_KTHREAD		0x00200000	/* Task is a kernel thread */
#define PF_RANDOMIZE		0x00400000	/* Randomize the virtual address space */
#define PF_SWAPWRITE		0x00800000	/* May write to swap */
#define PF_NO_SETAFFINITY	0x04000000	/* Userland may not meddle with cpus_allowed */
#define PF_MCE_EARLY		0x08000000	/* Early kill for mce process policy */
#define PF_MUTEX_TESTER		0x20000000	/* Thread belongs to the rt mutex tester */
#define PF_FREEZER_SKIP		0x40000000	/* Freezer should not count it as freezable */
#define PF_SUSPEND_TASK		0x80000000	/* Called freeze_processes(); should not be frozen */
14051da177e4SLinus Torvalds 
/*
 * As a rule only the _current_ task reads and writes tsk->flags; other
 * tasks may look at tsk->flags read-only, for example through
 * tsk_used_math() (as happens during threaded core dumping).
 *
 * ptrace and fork are the exceptions: the ptracer may write to the
 * child->flags of its traced child, and a forking parent may write to
 * its child's child->flags, because the child is guaranteed not to be
 * running and therefore cannot be changing child->flags at the same
 * time.
 *
 * Note that every macro below evaluates its 'child' argument more than
 * once where it appears more than once in the expansion.
 */
#define clear_stopped_child_used_math(child)					\
	do {									\
		(child)->flags &= ~PF_USED_MATH;				\
	} while (0)

#define set_stopped_child_used_math(child)					\
	do {									\
		(child)->flags |= PF_USED_MATH;					\
	} while (0)

#define clear_used_math()			clear_stopped_child_used_math(current)
#define set_used_math()				set_stopped_child_used_math(current)

/* Clear PF_USED_MATH, then set it again iff 'condition' is true. */
#define conditional_stopped_child_used_math(condition, child)			\
	do {									\
		(child)->flags &= ~PF_USED_MATH;				\
		(child)->flags |= (condition) ? PF_USED_MATH : 0;		\
	} while (0)

#define conditional_used_math(condition)	conditional_stopped_child_used_math(condition, current)

/* Make the child's PF_USED_MATH bit mirror the one in current->flags. */
#define copy_to_stopped_child_used_math(child)					\
	do {									\
		(child)->flags &= ~PF_USED_MATH;				\
		(child)->flags |= current->flags & PF_USED_MATH;		\
	} while (0)

/* NOTE: this yields 0 or PF_USED_MATH, it never yields 1 */
#define tsk_used_math(p)			((p)->flags & PF_USED_MATH)
#define used_math()				tsk_used_math(current)
14331da177e4SLinus Torvalds 
143462ec05ddSThomas Gleixner static inline bool is_percpu_thread(void)
143562ec05ddSThomas Gleixner {
143662ec05ddSThomas Gleixner #ifdef CONFIG_SMP
143762ec05ddSThomas Gleixner 	return (current->flags & PF_NO_SETAFFINITY) &&
143862ec05ddSThomas Gleixner 		(current->nr_cpus_allowed  == 1);
143962ec05ddSThomas Gleixner #else
144062ec05ddSThomas Gleixner 	return true;
144162ec05ddSThomas Gleixner #endif
144262ec05ddSThomas Gleixner }
144362ec05ddSThomas Gleixner 
/*
 * Per-process atomic flags.
 *
 * These are bit numbers, used with the bit operations on
 * task_struct::atomic_flags by the TASK_PFA_*() helpers below.
 */
#define PFA_NO_NEW_PRIVS		0	/* May not gain new privileges */
#define PFA_SPREAD_PAGE			1	/* Spread page cache over cpuset */
#define PFA_SPREAD_SLAB			2	/* Spread some slab caches over cpuset */
#define PFA_SPEC_SSB_DISABLE		3	/* Speculative Store Bypass disabled */
#define PFA_SPEC_SSB_FORCE_DISABLE	4	/* Speculative Store Bypass force disabled */
14501d4457f9SKees Cook 
1451e0e5070bSZefan Li #define TASK_PFA_TEST(name, func)					\
1452e0e5070bSZefan Li 	static inline bool task_##func(struct task_struct *p)		\
1453e0e5070bSZefan Li 	{ return test_bit(PFA_##name, &p->atomic_flags); }
14545eca1c10SIngo Molnar 
1455e0e5070bSZefan Li #define TASK_PFA_SET(name, func)					\
1456e0e5070bSZefan Li 	static inline void task_set_##func(struct task_struct *p)	\
1457e0e5070bSZefan Li 	{ set_bit(PFA_##name, &p->atomic_flags); }
14585eca1c10SIngo Molnar 
1459e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func)					\
1460e0e5070bSZefan Li 	static inline void task_clear_##func(struct task_struct *p)	\
1461e0e5070bSZefan Li 	{ clear_bit(PFA_##name, &p->atomic_flags); }
14621d4457f9SKees Cook 
1463e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs)
1464e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs)
14651d4457f9SKees Cook 
14662ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page)
14672ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page)
14682ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
14692ad654bcSZefan Li 
14702ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
14712ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab)
14722ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
1473544b2c91STejun Heo 
1474356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable)
1475356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable)
1476356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable)
1477356e4bffSThomas Gleixner 
1478356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1479356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1480356e4bffSThomas Gleixner 
14815eca1c10SIngo Molnar static inline void
1482717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags)
1483907aed48SMel Gorman {
1484717a94b5SNeilBrown 	current->flags &= ~flags;
1485717a94b5SNeilBrown 	current->flags |= orig_flags & flags;
1486907aed48SMel Gorman }
1487907aed48SMel Gorman 
14885eca1c10SIngo Molnar extern int cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial);
14895eca1c10SIngo Molnar extern int task_can_attach(struct task_struct *p, const struct cpumask *cs_cpus_allowed);
14901da177e4SLinus Torvalds #ifdef CONFIG_SMP
14915eca1c10SIngo Molnar extern void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask);
14925eca1c10SIngo Molnar extern int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask);
14931da177e4SLinus Torvalds #else
14945eca1c10SIngo Molnar static inline void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask)
14951e1b6c51SKOSAKI Motohiro {
14961e1b6c51SKOSAKI Motohiro }
14975eca1c10SIngo Molnar static inline int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask)
14981da177e4SLinus Torvalds {
149996f874e2SRusty Russell 	if (!cpumask_test_cpu(0, new_mask))
15001da177e4SLinus Torvalds 		return -EINVAL;
15011da177e4SLinus Torvalds 	return 0;
15021da177e4SLinus Torvalds }
15031da177e4SLinus Torvalds #endif
1504e0ad9556SRusty Russell 
/* Fall back to cpu_relax() when nothing else has defined cpu_relax_yield(). */
#ifndef cpu_relax_yield
# define cpu_relax_yield()	cpu_relax()
#endif
15086d0d2878SChristian Borntraeger 
1509fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt);
151036c8b586SIngo Molnar extern void set_user_nice(struct task_struct *p, long nice);
151136c8b586SIngo Molnar extern int task_prio(const struct task_struct *p);
15125eca1c10SIngo Molnar 
1513d0ea0268SDongsheng Yang /**
1514d0ea0268SDongsheng Yang  * task_nice - return the nice value of a given task.
1515d0ea0268SDongsheng Yang  * @p: the task in question.
1516d0ea0268SDongsheng Yang  *
1517d0ea0268SDongsheng Yang  * Return: The nice value [ -20 ... 0 ... 19 ].
1518d0ea0268SDongsheng Yang  */
1519d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p)
1520d0ea0268SDongsheng Yang {
1521d0ea0268SDongsheng Yang 	return PRIO_TO_NICE((p)->static_prio);
1522d0ea0268SDongsheng Yang }
15235eca1c10SIngo Molnar 
152436c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice);
152536c8b586SIngo Molnar extern int task_curr(const struct task_struct *p);
15261da177e4SLinus Torvalds extern int idle_cpu(int cpu);
1527943d355dSRohit Jain extern int available_idle_cpu(int cpu);
15285eca1c10SIngo Molnar extern int sched_setscheduler(struct task_struct *, int, const struct sched_param *);
15295eca1c10SIngo Molnar extern int sched_setscheduler_nocheck(struct task_struct *, int, const struct sched_param *);
15305eca1c10SIngo Molnar extern int sched_setattr(struct task_struct *, const struct sched_attr *);
1531794a56ebSJuri Lelli extern int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *);
153236c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu);
15335eca1c10SIngo Molnar 
1534c4f30608SPaul E. McKenney /**
1535c4f30608SPaul E. McKenney  * is_idle_task - is the specified task an idle task?
1536fa757281SRandy Dunlap  * @p: the task in question.
1537e69f6186SYacine Belkadi  *
1538e69f6186SYacine Belkadi  * Return: 1 if @p is an idle task. 0 otherwise.
1539c4f30608SPaul E. McKenney  */
15407061ca3bSPaul E. McKenney static inline bool is_idle_task(const struct task_struct *p)
1541c4f30608SPaul E. McKenney {
1542c1de45caSPeter Zijlstra 	return !!(p->flags & PF_IDLE);
1543c4f30608SPaul E. McKenney }
15445eca1c10SIngo Molnar 
154536c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu);
1546a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p);
15471da177e4SLinus Torvalds 
15481da177e4SLinus Torvalds void yield(void);
15491da177e4SLinus Torvalds 
15501da177e4SLinus Torvalds union thread_union {
15510500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK
15520500871fSDavid Howells 	struct task_struct task;
15530500871fSDavid Howells #endif
1554c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK
15551da177e4SLinus Torvalds 	struct thread_info thread_info;
1556c65eacbeSAndy Lutomirski #endif
15571da177e4SLinus Torvalds 	unsigned long stack[THREAD_SIZE/sizeof(long)];
15581da177e4SLinus Torvalds };
15591da177e4SLinus Torvalds 
15600500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK
15610500871fSDavid Howells extern struct thread_info init_thread_info;
15620500871fSDavid Howells #endif
15630500871fSDavid Howells 
15640500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)];
15650500871fSDavid Howells 
/*
 * Locate the thread_info that belongs to a task.
 *
 * With CONFIG_THREAD_INFO_IN_TASK it is a member of task_struct.
 * Otherwise, unless __HAVE_THREAD_FUNCTIONS is defined, the pointer
 * held in task->stack is reinterpreted as the thread_info.
 */
#ifdef CONFIG_THREAD_INFO_IN_TASK
static inline struct thread_info *task_thread_info(struct task_struct *task)
{
	struct thread_info *ti = &task->thread_info;

	return ti;
}
#elif !defined(__HAVE_THREAD_FUNCTIONS)
# define task_thread_info(task)	((struct thread_info *)(task)->stack)
#endif
1574f3ac6067SIngo Molnar 
/*
 * Find a task by one of its numerical ids:
 *
 * find_task_by_pid_ns():
 *      finds a task by its pid in the specified namespace
 * find_task_by_vpid():
 *      finds a task by its virtual pid
 *
 * See also find_vpid() etc. in include/linux/pid.h
 */
1585198fe21bSPavel Emelyanov 
1586228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr);
15875eca1c10SIngo Molnar extern struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns);
1588198fe21bSPavel Emelyanov 
15892ee08260SMike Rapoport /*
15902ee08260SMike Rapoport  * find a task by its virtual pid and get the task struct
15912ee08260SMike Rapoport  */
15922ee08260SMike Rapoport extern struct task_struct *find_get_task_by_vpid(pid_t nr);
15932ee08260SMike Rapoport 
1594b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state);
1595b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk);
15963e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk);
15975eca1c10SIngo Molnar 
#ifdef CONFIG_SMP
extern void kick_process(struct task_struct *tsk);
#else
/* Uniprocessor stub: nothing to do. */
static inline void kick_process(struct task_struct *tsk)
{
}
#endif
16031da177e4SLinus Torvalds 
160482b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);
16055eca1c10SIngo Molnar 
160682b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from)
160782b89778SAdrian Hunter {
160882b89778SAdrian Hunter 	__set_task_comm(tsk, from, false);
160982b89778SAdrian Hunter }
16105eca1c10SIngo Molnar 
16113756f640SArnd Bergmann extern char *__get_task_comm(char *to, size_t len, struct task_struct *tsk);
16123756f640SArnd Bergmann #define get_task_comm(buf, tsk) ({			\
16133756f640SArnd Bergmann 	BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN);	\
16143756f640SArnd Bergmann 	__get_task_comm(buf, sizeof(buf), tsk);		\
16153756f640SArnd Bergmann })
16161da177e4SLinus Torvalds 
#ifdef CONFIG_SMP
void scheduler_ipi(void);
extern unsigned long wait_task_inactive(struct task_struct *p, long match_state);
#else
/* Uniprocessor stub: nothing to do. */
static inline void scheduler_ipi(void)
{
}

/* Uniprocessor stub: always returns 1. */
static inline unsigned long wait_task_inactive(struct task_struct *p, long match_state)
{
	return 1;
}
#endif
16271da177e4SLinus Torvalds 
/*
 * Helpers that manipulate thread flags in another task's structures.
 * The available TIF_xxxx flags are listed in asm/thread_info.h.
 */

/* Set thread flag @flag on @tsk. */
static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	set_ti_thread_flag(ti, flag);
}
16361da177e4SLinus Torvalds 
/* Clear thread flag @flag on @tsk. */
static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	clear_ti_thread_flag(ti, flag);
}
16411da177e4SLinus Torvalds 
164293ee37c2SDave Martin static inline void update_tsk_thread_flag(struct task_struct *tsk, int flag,
164393ee37c2SDave Martin 					  bool value)
164493ee37c2SDave Martin {
164593ee37c2SDave Martin 	update_ti_thread_flag(task_thread_info(tsk), flag, value);
164693ee37c2SDave Martin }
164793ee37c2SDave Martin 
/* Return the result of test_and_set_ti_thread_flag() for @flag on @tsk. */
static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	return test_and_set_ti_thread_flag(ti, flag);
}
16521da177e4SLinus Torvalds 
/* Return the result of test_and_clear_ti_thread_flag() for @flag on @tsk. */
static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	return test_and_clear_ti_thread_flag(ti, flag);
}
16571da177e4SLinus Torvalds 
/* Return the result of test_ti_thread_flag() for @flag on @tsk. */
static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	return test_ti_thread_flag(ti, flag);
}
16621da177e4SLinus Torvalds 
16631da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk)
16641da177e4SLinus Torvalds {
16651da177e4SLinus Torvalds 	set_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
16661da177e4SLinus Torvalds }
16671da177e4SLinus Torvalds 
16681da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk)
16691da177e4SLinus Torvalds {
16701da177e4SLinus Torvalds 	clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
16711da177e4SLinus Torvalds }
16721da177e4SLinus Torvalds 
16738ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk)
16748ae121acSGregory Haskins {
16758ae121acSGregory Haskins 	return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED));
16768ae121acSGregory Haskins }
16778ae121acSGregory Haskins 
/*
 * cond_resched() and cond_resched_lock(): latency reduction via
 * explicit rescheduling in places that are safe. The return
 * value indicates whether a reschedule was done in fact.
 * cond_resched_lock() will drop the spinlock before scheduling.
 *
 * With CONFIG_PREEMPT, _cond_resched() is an inline stub that
 * returns 0.
 */
#ifdef CONFIG_PREEMPT
static inline int _cond_resched(void)
{
	return 0;
}
#else
extern int _cond_resched(void);
#endif
16896f80bd98SFrederic Weisbecker 
/*
 * Call ___might_sleep() with the caller's file and line (offset 0),
 * then evaluate to the result of _cond_resched().
 */
#define cond_resched()						\
({								\
	___might_sleep(__FILE__, __LINE__, 0);			\
	_cond_resched();					\
})
16946f80bd98SFrederic Weisbecker 
1695613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock);
1696613afbf8SFrederic Weisbecker 
1697613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({				\
16983427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\
1699613afbf8SFrederic Weisbecker 	__cond_resched_lock(lock);				\
1700613afbf8SFrederic Weisbecker })
1701613afbf8SFrederic Weisbecker 
/*
 * Leave the RCU read-side critical section, call cond_resched(), and
 * enter it again.
 *
 * Compiles to nothing when CONFIG_PREEMPT_RCU is set and
 * CONFIG_DEBUG_ATOMIC_SLEEP is not.
 */
static inline void cond_resched_rcu(void)
{
#if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU)
	rcu_read_unlock();
	cond_resched();
	rcu_read_lock();
#endif
}
1710f6f3c437SSimon Horman 
17111da177e4SLinus Torvalds /*
17121da177e4SLinus Torvalds  * Does a critical section need to be broken due to another
171395c354feSNick Piggin  * task waiting?: (technically does not depend on CONFIG_PREEMPT,
171495c354feSNick Piggin  * but a general need for low latency)
17151da177e4SLinus Torvalds  */
171695c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock)
17171da177e4SLinus Torvalds {
171895c354feSNick Piggin #ifdef CONFIG_PREEMPT
171995c354feSNick Piggin 	return spin_is_contended(lock);
172095c354feSNick Piggin #else
17211da177e4SLinus Torvalds 	return 0;
172295c354feSNick Piggin #endif
17231da177e4SLinus Torvalds }
17241da177e4SLinus Torvalds 
172575f93fedSPeter Zijlstra static __always_inline bool need_resched(void)
172675f93fedSPeter Zijlstra {
172775f93fedSPeter Zijlstra 	return unlikely(tif_need_resched());
172875f93fedSPeter Zijlstra }
172975f93fedSPeter Zijlstra 
/*
 * Wrappers for p->thread_info->cpu access. No-op on UP.
 */
#ifdef CONFIG_SMP

/*
 * Read the task's CPU number from wherever the configuration keeps
 * it: task_struct itself with CONFIG_THREAD_INFO_IN_TASK, otherwise
 * the task's thread_info.
 */
static inline unsigned int task_cpu(const struct task_struct *p)
{
#ifndef CONFIG_THREAD_INFO_IN_TASK
	return task_thread_info(p)->cpu;
#else
	return p->cpu;
#endif
}

extern void set_task_cpu(struct task_struct *p, unsigned int cpu);

#else

/* Uniprocessor stub: every task is on CPU 0. */
static inline unsigned int task_cpu(const struct task_struct *p)
{
	return 0;
}

/* Uniprocessor stub: nothing to record. */
static inline void set_task_cpu(struct task_struct *p, unsigned int cpu)
{
}

#endif /* CONFIG_SMP */
17581da177e4SLinus Torvalds 
/*
 * vcpu_is_preempted() lets callers ask whether a vCPU is currently running,
 * which helps reduce various lock holder preemption latencies: an
 * optimistic spin loop can stop spinning and block instead, analogous to the
 * native optimistic spin heuristic of testing whether the lock owner task is
 * running.
 *
 * This fallback applies only when vcpu_is_preempted has not already been
 * defined. It does not evaluate @cpu and always yields false.
 */
#ifndef vcpu_is_preempted
#define vcpu_is_preempted(cpu)	false
#endif
1770d9345c65SPan Xinhui 
177196f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask);
177296f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask);
17735c45bf27SSiddha, Suresh B 
/*
 * Fallback TASK_SIZE_OF(): unless a definition already exists, it expands to
 * the global TASK_SIZE and does not evaluate @tsk.
 */
#ifndef TASK_SIZE_OF
#define TASK_SIZE_OF(tsk)	TASK_SIZE
#endif
177782455257SDave Hansen 
1778d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ
1779d7822b1eSMathieu Desnoyers 
1780d7822b1eSMathieu Desnoyers /*
1781d7822b1eSMathieu Desnoyers  * Map the event mask on the user-space ABI enum rseq_cs_flags
1782d7822b1eSMathieu Desnoyers  * for direct mask checks.
1783d7822b1eSMathieu Desnoyers  */
1784d7822b1eSMathieu Desnoyers enum rseq_event_mask_bits {
1785d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_PREEMPT_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_PREEMPT_BIT,
1786d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_SIGNAL_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_SIGNAL_BIT,
1787d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_MIGRATE_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_MIGRATE_BIT,
1788d7822b1eSMathieu Desnoyers };
1789d7822b1eSMathieu Desnoyers 
1790d7822b1eSMathieu Desnoyers enum rseq_event_mask {
1791d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_PREEMPT	= (1U << RSEQ_EVENT_PREEMPT_BIT),
1792d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_SIGNAL	= (1U << RSEQ_EVENT_SIGNAL_BIT),
1793d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_MIGRATE	= (1U << RSEQ_EVENT_MIGRATE_BIT),
1794d7822b1eSMathieu Desnoyers };
1795d7822b1eSMathieu Desnoyers 
1796d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t)
1797d7822b1eSMathieu Desnoyers {
1798d7822b1eSMathieu Desnoyers 	if (t->rseq)
1799d7822b1eSMathieu Desnoyers 		set_tsk_thread_flag(t, TIF_NOTIFY_RESUME);
1800d7822b1eSMathieu Desnoyers }
1801d7822b1eSMathieu Desnoyers 
1802d7822b1eSMathieu Desnoyers void __rseq_handle_notify_resume(struct pt_regs *regs);
1803d7822b1eSMathieu Desnoyers 
1804d7822b1eSMathieu Desnoyers static inline void rseq_handle_notify_resume(struct pt_regs *regs)
1805d7822b1eSMathieu Desnoyers {
1806d7822b1eSMathieu Desnoyers 	if (current->rseq)
1807d7822b1eSMathieu Desnoyers 		__rseq_handle_notify_resume(regs);
1808d7822b1eSMathieu Desnoyers }
1809d7822b1eSMathieu Desnoyers 
1810d7822b1eSMathieu Desnoyers static inline void rseq_signal_deliver(struct pt_regs *regs)
1811d7822b1eSMathieu Desnoyers {
1812d7822b1eSMathieu Desnoyers 	preempt_disable();
1813d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_SIGNAL_BIT, &current->rseq_event_mask);
1814d7822b1eSMathieu Desnoyers 	preempt_enable();
1815d7822b1eSMathieu Desnoyers 	rseq_handle_notify_resume(regs);
1816d7822b1eSMathieu Desnoyers }
1817d7822b1eSMathieu Desnoyers 
1818d7822b1eSMathieu Desnoyers /* rseq_preempt() requires preemption to be disabled. */
1819d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t)
1820d7822b1eSMathieu Desnoyers {
1821d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_PREEMPT_BIT, &t->rseq_event_mask);
1822d7822b1eSMathieu Desnoyers 	rseq_set_notify_resume(t);
1823d7822b1eSMathieu Desnoyers }
1824d7822b1eSMathieu Desnoyers 
1825d7822b1eSMathieu Desnoyers /* rseq_migrate() requires preemption to be disabled. */
1826d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t)
1827d7822b1eSMathieu Desnoyers {
1828d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_MIGRATE_BIT, &t->rseq_event_mask);
1829d7822b1eSMathieu Desnoyers 	rseq_set_notify_resume(t);
1830d7822b1eSMathieu Desnoyers }
1831d7822b1eSMathieu Desnoyers 
1832d7822b1eSMathieu Desnoyers /*
1833d7822b1eSMathieu Desnoyers  * If parent process has a registered restartable sequences area, the
1834d7822b1eSMathieu Desnoyers  * child inherits. Only applies when forking a process, not a thread. In
1835d7822b1eSMathieu Desnoyers  * case a parent fork() in the middle of a restartable sequence, set the
1836d7822b1eSMathieu Desnoyers  * resume notifier to force the child to retry.
1837d7822b1eSMathieu Desnoyers  */
1838d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags)
1839d7822b1eSMathieu Desnoyers {
1840d7822b1eSMathieu Desnoyers 	if (clone_flags & CLONE_THREAD) {
1841d7822b1eSMathieu Desnoyers 		t->rseq = NULL;
1842d7822b1eSMathieu Desnoyers 		t->rseq_len = 0;
1843d7822b1eSMathieu Desnoyers 		t->rseq_sig = 0;
1844d7822b1eSMathieu Desnoyers 		t->rseq_event_mask = 0;
1845d7822b1eSMathieu Desnoyers 	} else {
1846d7822b1eSMathieu Desnoyers 		t->rseq = current->rseq;
1847d7822b1eSMathieu Desnoyers 		t->rseq_len = current->rseq_len;
1848d7822b1eSMathieu Desnoyers 		t->rseq_sig = current->rseq_sig;
1849d7822b1eSMathieu Desnoyers 		t->rseq_event_mask = current->rseq_event_mask;
1850d7822b1eSMathieu Desnoyers 		rseq_preempt(t);
1851d7822b1eSMathieu Desnoyers 	}
1852d7822b1eSMathieu Desnoyers }
1853d7822b1eSMathieu Desnoyers 
1854d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t)
1855d7822b1eSMathieu Desnoyers {
1856d7822b1eSMathieu Desnoyers 	t->rseq = NULL;
1857d7822b1eSMathieu Desnoyers 	t->rseq_len = 0;
1858d7822b1eSMathieu Desnoyers 	t->rseq_sig = 0;
1859d7822b1eSMathieu Desnoyers 	t->rseq_event_mask = 0;
1860d7822b1eSMathieu Desnoyers }
1861d7822b1eSMathieu Desnoyers 
1862d7822b1eSMathieu Desnoyers #else
1863d7822b1eSMathieu Desnoyers 
/*
 * Without CONFIG_RSEQ every rseq hook is an empty inline function, so call
 * sites need no #ifdef of their own.
 */
static inline void rseq_set_notify_resume(struct task_struct *t) { }
static inline void rseq_handle_notify_resume(struct pt_regs *regs) { }
static inline void rseq_signal_deliver(struct pt_regs *regs) { }
static inline void rseq_preempt(struct task_struct *t) { }
static inline void rseq_migrate(struct task_struct *t) { }
static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) { }
static inline void rseq_execve(struct task_struct *t) { }
1885d7822b1eSMathieu Desnoyers 
1886d7822b1eSMathieu Desnoyers #endif
1887d7822b1eSMathieu Desnoyers 
/*
 * rseq_syscall() is a real out-of-line function only with
 * CONFIG_DEBUG_RSEQ; otherwise it is an empty inline stub.
 */
#ifndef CONFIG_DEBUG_RSEQ

static inline void rseq_syscall(struct pt_regs *regs) { }

#else /* CONFIG_DEBUG_RSEQ */

void rseq_syscall(struct pt_regs *regs);

#endif /* CONFIG_DEBUG_RSEQ */
1899d7822b1eSMathieu Desnoyers 
19001da177e4SLinus Torvalds #endif
1901