/* xref: /linux/include/linux/sched.h (revision a1dfb6311c7739e21e160bc4c5575a1b21b48c87) */
/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _LINUX_SCHED_H
#define _LINUX_SCHED_H

/*
 * Define 'struct task_struct' and provide the main scheduler
 * APIs (schedule(), wakeup variants, etc.)
 */

#include <uapi/linux/sched.h>

#include <asm/current.h>

#include <linux/pid.h>
#include <linux/sem.h>
#include <linux/shm.h>
#include <linux/mutex.h>
#include <linux/plist.h>
#include <linux/hrtimer.h>
#include <linux/irqflags.h>
#include <linux/seccomp.h>
#include <linux/nodemask.h>
#include <linux/rcupdate.h>
#include <linux/refcount.h>
#include <linux/resource.h>
#include <linux/latencytop.h>
#include <linux/sched/prio.h>
#include <linux/sched/types.h>
#include <linux/signal_types.h>
#include <linux/syscall_user_dispatch.h>
#include <linux/mm_types_task.h>
#include <linux/task_io_accounting.h>
#include <linux/posix-timers.h>
#include <linux/rseq.h>
#include <linux/seqlock.h>
#include <linux/kcsan.h>
#include <asm/kmap_size.h>

/* task_struct member predeclarations (sorted alphabetically): */
struct audit_context;
struct backing_dev_info;
struct bio_list;
struct blk_plug;
struct bpf_local_storage;
struct capture_control;
struct cfs_rq;
struct fs_struct;
struct futex_pi_state;
struct io_context;
struct io_uring_task;
struct mempolicy;
struct nameidata;
struct nsproxy;
struct perf_event_context;
struct pid_namespace;
struct pipe_inode_info;
struct rcu_node;
struct reclaim_state;
struct robust_list_head;
struct root_domain;
struct rq;
struct sched_attr;
struct sched_param;
struct seq_file;
struct sighand_struct;
struct signal_struct;
struct task_delay_info;
struct task_group;

/*
 * Task state bitmask. NOTE! These bits are also
 * encoded in fs/proc/array.c: get_task_state().
 *
 * We have two separate sets of flags: task->state
 * is about runnability, while task->exit_state is
 * about the task exiting. Confusing, but this way
 * modifying one set can't modify the other one by
 * mistake.
 */

/* Used in tsk->state: */
#define TASK_RUNNING			0x0000
#define TASK_INTERRUPTIBLE		0x0001
#define TASK_UNINTERRUPTIBLE		0x0002
#define __TASK_STOPPED			0x0004
#define __TASK_TRACED			0x0008
/* Used in tsk->exit_state: */
#define EXIT_DEAD			0x0010
#define EXIT_ZOMBIE			0x0020
#define EXIT_TRACE			(EXIT_ZOMBIE | EXIT_DEAD)
/* Used in tsk->state again: */
#define TASK_PARKED			0x0040
#define TASK_DEAD			0x0080
#define TASK_WAKEKILL			0x0100
#define TASK_WAKING			0x0200
#define TASK_NOLOAD			0x0400
#define TASK_NEW			0x0800
#define TASK_STATE_MAX			0x1000

/* Convenience macros for the sake of set_current_state: */
#define TASK_KILLABLE			(TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
#define TASK_STOPPED			(TASK_WAKEKILL | __TASK_STOPPED)
#define TASK_TRACED			(TASK_WAKEKILL | __TASK_TRACED)

#define TASK_IDLE			(TASK_UNINTERRUPTIBLE | TASK_NOLOAD)

/* Convenience macros for the sake of wake_up(): */
#define TASK_NORMAL			(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)

/* get_task_state(): */
#define TASK_REPORT			(TASK_RUNNING | TASK_INTERRUPTIBLE | \
					 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
					 __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \
					 TASK_PARKED)

#define task_is_traced(task)		((task->state & __TASK_TRACED) != 0)

#define task_is_stopped(task)		((task->state & __TASK_STOPPED) != 0)

#define task_is_stopped_or_traced(task)	((task->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)
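
/*
 * Worked example: the composed states above are plain ORed bits, e.g.
 *
 *	TASK_KILLABLE == 0x0100 | 0x0002 == 0x0102
 *	TASK_IDLE     == 0x0002 | 0x0400 == 0x0402
 *
 * which is why the task_is_*() helpers and the TASK_REPORT mask can decode
 * a state word with simple bitwise tests.
 */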
1215eca1c10SIngo Molnar 
1228eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
1238eb23b9fSPeter Zijlstra 
124b5bf9a90SPeter Zijlstra /*
125b5bf9a90SPeter Zijlstra  * Special states are those that do not use the normal wait-loop pattern. See
126b5bf9a90SPeter Zijlstra  * the comment with set_special_state().
127b5bf9a90SPeter Zijlstra  */
128b5bf9a90SPeter Zijlstra #define is_special_task_state(state)				\
1291cef1150SPeter Zijlstra 	((state) & (__TASK_STOPPED | __TASK_TRACED | TASK_PARKED | TASK_DEAD))
130b5bf9a90SPeter Zijlstra 
1318eb23b9fSPeter Zijlstra #define __set_current_state(state_value)			\
1328eb23b9fSPeter Zijlstra 	do {							\
133b5bf9a90SPeter Zijlstra 		WARN_ON_ONCE(is_special_task_state(state_value));\
1348eb23b9fSPeter Zijlstra 		current->task_state_change = _THIS_IP_;		\
1358eb23b9fSPeter Zijlstra 		current->state = (state_value);			\
1368eb23b9fSPeter Zijlstra 	} while (0)
137b5bf9a90SPeter Zijlstra 
1388eb23b9fSPeter Zijlstra #define set_current_state(state_value)				\
1398eb23b9fSPeter Zijlstra 	do {							\
140b5bf9a90SPeter Zijlstra 		WARN_ON_ONCE(is_special_task_state(state_value));\
1418eb23b9fSPeter Zijlstra 		current->task_state_change = _THIS_IP_;		\
142b92b8b35SPeter Zijlstra 		smp_store_mb(current->state, (state_value));	\
1438eb23b9fSPeter Zijlstra 	} while (0)
1448eb23b9fSPeter Zijlstra 
145b5bf9a90SPeter Zijlstra #define set_special_state(state_value)					\
146b5bf9a90SPeter Zijlstra 	do {								\
147b5bf9a90SPeter Zijlstra 		unsigned long flags; /* may shadow */			\
148b5bf9a90SPeter Zijlstra 		WARN_ON_ONCE(!is_special_task_state(state_value));	\
149b5bf9a90SPeter Zijlstra 		raw_spin_lock_irqsave(&current->pi_lock, flags);	\
150b5bf9a90SPeter Zijlstra 		current->task_state_change = _THIS_IP_;			\
151b5bf9a90SPeter Zijlstra 		current->state = (state_value);				\
152b5bf9a90SPeter Zijlstra 		raw_spin_unlock_irqrestore(&current->pi_lock, flags);	\
153b5bf9a90SPeter Zijlstra 	} while (0)
1548eb23b9fSPeter Zijlstra #else
/*
 * set_current_state() includes a barrier so that the write of current->state
 * is correctly serialised wrt the caller's subsequent test of whether to
 * actually sleep:
 *
 *   for (;;) {
 *	set_current_state(TASK_UNINTERRUPTIBLE);
 *	if (CONDITION)
 *	   break;
 *
 *	schedule();
 *   }
 *   __set_current_state(TASK_RUNNING);
 *
 * If the caller does not need such serialisation (because, for instance, the
 * CONDITION test, the condition change and the wakeup are all under the same
 * lock) then use __set_current_state().
 *
 * The above is typically ordered against the wakeup, which does:
 *
 *   CONDITION = 1;
 *   wake_up_state(p, TASK_UNINTERRUPTIBLE);
 *
 * where wake_up_state()/try_to_wake_up() executes a full memory barrier before
 * accessing p->state.
 *
 * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is,
 * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a
 * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING).
 *
 * However, with slightly different timing the wakeup TASK_RUNNING store can
 * also collide with the TASK_UNINTERRUPTIBLE store. Losing that store is not
 * a problem either because that will result in one extra trip around the loop
 * and our CONDITION test will save the day.
 *
 * Also see the comments of try_to_wake_up().
 */
#define __set_current_state(state_value)				\
	current->state = (state_value)

#define set_current_state(state_value)					\
	smp_store_mb(current->state, (state_value))

/*
 * set_special_state() should be used for those states when the blocking task
 * cannot use the regular condition-based wait-loop. In that case we must
 * serialize against wakeups such that any possible in-flight TASK_RUNNING
 * stores will not collide with our state change.
 */
#define set_special_state(state_value)					\
	do {								\
		unsigned long flags; /* may shadow */			\
		raw_spin_lock_irqsave(&current->pi_lock, flags);	\
		current->state = (state_value);				\
		raw_spin_unlock_irqrestore(&current->pi_lock, flags);	\
	} while (0)

#endif

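/*
 * Illustrative sketch only (not a definition in this header): a stop path
 * such as do_signal_stop() transitions through a special state roughly as
 *
 *	set_special_state(TASK_STOPPED);
 *	...
 *	schedule();
 *
 * Because there is no surrounding CONDITION re-check loop, the pi_lock
 * serialization in set_special_state() is what keeps a concurrent wakeup's
 * TASK_RUNNING store from overwriting TASK_STOPPED.
 */
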
/* Task command name length: */
#define TASK_COMM_LEN			16

extern void scheduler_tick(void);

#define	MAX_SCHEDULE_TIMEOUT		LONG_MAX

extern long schedule_timeout(long timeout);
extern long schedule_timeout_interruptible(long timeout);
extern long schedule_timeout_killable(long timeout);
extern long schedule_timeout_uninterruptible(long timeout);
extern long schedule_timeout_idle(long timeout);
asmlinkage void schedule(void);
extern void schedule_preempt_disabled(void);
asmlinkage void preempt_schedule_irq(void);

extern int __must_check io_schedule_prepare(void);
extern void io_schedule_finish(int token);
extern long io_schedule_timeout(long timeout);
extern void io_schedule(void);

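/*
 * Usage sketch (illustrative; event_pending() is a hypothetical predicate):
 * the *_interruptible/_killable/_uninterruptible variants set the matching
 * task state and then call schedule_timeout(), which returns the remaining
 * jiffies (0 on expiry), so a bounded wait can be written as:
 *
 *	long t = msecs_to_jiffies(100);
 *
 *	while (!event_pending() && t)
 *		t = schedule_timeout_interruptible(t);
 */
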
/**
 * struct prev_cputime - snapshot of system and user cputime
 * @utime: time spent in user mode
 * @stime: time spent in system mode
 * @lock: protects the above two fields
 *
 * Stores previous user/system time values such that we can guarantee
 * monotonicity.
 */
struct prev_cputime {
#ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
	u64				utime;
	u64				stime;
	raw_spinlock_t			lock;
#endif
};

enum vtime_state {
	/* Task is sleeping or running in a CPU with VTIME inactive: */
	VTIME_INACTIVE = 0,
	/* Task is idle */
	VTIME_IDLE,
	/* Task runs in kernelspace in a CPU with VTIME active: */
	VTIME_SYS,
	/* Task runs in userspace in a CPU with VTIME active: */
	VTIME_USER,
	/* Task runs as a guest in a CPU with VTIME active: */
	VTIME_GUEST,
};

struct vtime {
	seqcount_t		seqcount;
	unsigned long long	starttime;
	enum vtime_state	state;
	unsigned int		cpu;
	u64			utime;
	u64			stime;
	u64			gtime;
};

/*
 * Utilization clamp constraints.
 * @UCLAMP_MIN:	Minimum utilization
 * @UCLAMP_MAX:	Maximum utilization
 * @UCLAMP_CNT:	Utilization clamp constraints count
 */
enum uclamp_id {
	UCLAMP_MIN = 0,
	UCLAMP_MAX,
	UCLAMP_CNT
};

#ifdef CONFIG_SMP
extern struct root_domain def_root_domain;
extern struct mutex sched_domains_mutex;
#endif

struct sched_info {
#ifdef CONFIG_SCHED_INFO
	/* Cumulative counters: */

	/* # of times we have run on this CPU: */
	unsigned long			pcount;

	/* Time spent waiting on a runqueue: */
	unsigned long long		run_delay;

	/* Timestamps: */

	/* When did we last run on a CPU? */
	unsigned long long		last_arrival;

	/* When were we last queued to run? */
	unsigned long long		last_queued;

#endif /* CONFIG_SCHED_INFO */
};

/*
 * Integer metrics need fixed point arithmetic, e.g., sched/fair
 * has a few: load, load_avg, util_avg, freq, and capacity.
 *
 * We define a basic fixed point arithmetic range, and then formalize
 * all these metrics based on that basic range.
 */
# define SCHED_FIXEDPOINT_SHIFT		10
# define SCHED_FIXEDPOINT_SCALE		(1L << SCHED_FIXEDPOINT_SHIFT)

/* Increase resolution of cpu_capacity calculations */
# define SCHED_CAPACITY_SHIFT		SCHED_FIXEDPOINT_SHIFT
# define SCHED_CAPACITY_SCALE		(1L << SCHED_CAPACITY_SHIFT)

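/*
 * Worked example: with SCHED_FIXEDPOINT_SHIFT == 10 these are 10-bit
 * fixed-point values, so SCHED_CAPACITY_SCALE == 1024 represents 100% of a
 * CPU's capacity and a 50% utilization is stored as
 *
 *	50 * SCHED_CAPACITY_SCALE / 100 == 512
 *
 * while the product of two such ratios needs a >> SCHED_FIXEDPOINT_SHIFT
 * to return to the base range.
 */
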
struct load_weight {
	unsigned long			weight;
	u32				inv_weight;
};

/**
 * struct util_est - Estimated utilization of FAIR tasks
 * @enqueued: instantaneous estimated utilization of a task/cpu
 * @ewma:     the Exponential Weighted Moving Average (EWMA)
 *            utilization of a task
 *
 * Support data structure to track an Exponential Weighted Moving Average
 * (EWMA) of a FAIR task's utilization. New samples are added to the moving
 * average each time a task completes an activation. The sample's weight is
 * chosen so that the EWMA will be relatively insensitive to transient
 * changes to the task's workload.
 *
 * The enqueued attribute has a slightly different meaning for tasks and CPUs:
 * - task:   the task's util_avg at last task dequeue time
 * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU
 * Thus, the util_est.enqueued of a task represents the contribution on the
 * estimated utilization of the CPU where that task is currently enqueued.
 *
 * Only for tasks we track a moving average of the past instantaneous
 * estimated utilization. This makes it possible to absorb sporadic drops in
 * the utilization of an otherwise almost periodic task.
 */
struct util_est {
	unsigned int			enqueued;
	unsigned int			ewma;
#define UTIL_EST_WEIGHT_SHIFT		2
} __attribute__((__aligned__(sizeof(u64))));

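/*
 * Sketch of the update rule (paraphrased from kernel/sched/fair.c, assuming
 * UTIL_EST_WEIGHT_SHIFT == 2 as above): each new sample contributes with
 * weight 1/4, i.e.
 *
 *	ewma += (enqueued - ewma) >> UTIL_EST_WEIGHT_SHIFT;
 *
 * so, e.g., ewma == 400 and a fresh sample of 800 move the average to 500.
 */
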
/*
 * The load/runnable/util_avg accumulates an infinite geometric series
 * (see __update_load_avg_cfs_rq() in kernel/sched/pelt.c).
 *
 * [load_avg definition]
 *
 *   load_avg = runnable% * scale_load_down(load)
 *
 * [runnable_avg definition]
 *
 *   runnable_avg = runnable% * SCHED_CAPACITY_SCALE
 *
 * [util_avg definition]
 *
 *   util_avg = running% * SCHED_CAPACITY_SCALE
 *
 * where runnable% is the time ratio that a sched_entity is runnable and
 * running% the time ratio that a sched_entity is running.
 *
 * For cfs_rq, they are the aggregated values of all runnable and blocked
 * sched_entities.
 *
 * The load/runnable/util_avg doesn't directly factor in frequency scaling
 * and CPU capacity scaling. The scaling is done through the rq_clock_pelt
 * that is used for computing those signals (see update_rq_clock_pelt()).
 *
 * N.B., the above ratios (runnable% and running%) themselves are in the
 * range of [0, 1]. To do fixed point arithmetic, we therefore scale them
 * to as large a range as necessary. This is for example reflected by
 * util_avg's SCHED_CAPACITY_SCALE.
 *
 * [Overflow issue]
 *
 * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities
 * with the highest load (=88761), always runnable on a single cfs_rq,
 * and should not overflow as the number already hits PID_MAX_LIMIT.
 *
 * For all other cases (including 32-bit kernels), struct load_weight's
 * weight will overflow first before we do, because:
 *
 *    Max(load_avg) <= Max(load.weight)
 *
 * Then it is the load_weight's responsibility to consider overflow
 * issues.
 */
struct sched_avg {
	u64				last_update_time;
	u64				load_sum;
	u64				runnable_sum;
	u32				util_sum;
	u32				period_contrib;
	unsigned long			load_avg;
	unsigned long			runnable_avg;
	unsigned long			util_avg;
	struct util_est			util_est;
} ____cacheline_aligned;

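/*
 * For context on the constants in the overflow comment above (as used at
 * this revision): 88761 is the load.weight of a nice -20 task
 * (sched_prio_to_weight[0]) and 47742 is LOAD_AVG_MAX, the limit of the
 * PELT geometric series whose decay satisfies y^32 == 0.5; hence
 * 2^64 / 47742 / 88761 bounds how many maximally-loaded, always-runnable
 * entities can be summed before a u64 load_sum could wrap.
 */
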
struct sched_statistics {
#ifdef CONFIG_SCHEDSTATS
	u64				wait_start;
	u64				wait_max;
	u64				wait_count;
	u64				wait_sum;
	u64				iowait_count;
	u64				iowait_sum;

	u64				sleep_start;
	u64				sleep_max;
	s64				sum_sleep_runtime;

	u64				block_start;
	u64				block_max;
	u64				exec_max;
	u64				slice_max;

	u64				nr_migrations_cold;
	u64				nr_failed_migrations_affine;
	u64				nr_failed_migrations_running;
	u64				nr_failed_migrations_hot;
	u64				nr_forced_migrations;

	u64				nr_wakeups;
	u64				nr_wakeups_sync;
	u64				nr_wakeups_migrate;
	u64				nr_wakeups_local;
	u64				nr_wakeups_remote;
	u64				nr_wakeups_affine;
	u64				nr_wakeups_affine_attempts;
	u64				nr_wakeups_passive;
	u64				nr_wakeups_idle;
#endif
};

struct sched_entity {
	/* For load-balancing: */
	struct load_weight		load;
	struct rb_node			run_node;
	struct list_head		group_node;
	unsigned int			on_rq;

	u64				exec_start;
	u64				sum_exec_runtime;
	u64				vruntime;
	u64				prev_sum_exec_runtime;

	u64				nr_migrations;

	struct sched_statistics		statistics;

#ifdef CONFIG_FAIR_GROUP_SCHED
	int				depth;
	struct sched_entity		*parent;
	/* rq on which this entity is (to be) queued: */
	struct cfs_rq			*cfs_rq;
	/* rq "owned" by this entity/group: */
	struct cfs_rq			*my_q;
	/* cached value of my_q->h_nr_running */
	unsigned long			runnable_weight;
#endif

#ifdef CONFIG_SMP
	/*
	 * Per entity load average tracking.
	 *
	 * Put into separate cache line so it does not
	 * collide with read-mostly values above.
	 */
	struct sched_avg		avg;
#endif
};

struct sched_rt_entity {
	struct list_head		run_list;
	unsigned long			timeout;
	unsigned long			watchdog_stamp;
	unsigned int			time_slice;
	unsigned short			on_rq;
	unsigned short			on_list;

	struct sched_rt_entity		*back;
#ifdef CONFIG_RT_GROUP_SCHED
	struct sched_rt_entity		*parent;
	/* rq on which this entity is (to be) queued: */
	struct rt_rq			*rt_rq;
	/* rq "owned" by this entity/group: */
	struct rt_rq			*my_q;
#endif
} __randomize_layout;

struct sched_dl_entity {
	struct rb_node			rb_node;

	/*
	 * Original scheduling parameters. Copied here from sched_attr
	 * during sched_setattr(), they will remain the same until
	 * the next sched_setattr().
	 */
	u64				dl_runtime;	/* Maximum runtime for each instance	*/
	u64				dl_deadline;	/* Relative deadline of each instance	*/
	u64				dl_period;	/* Separation of two instances (period) */
	u64				dl_bw;		/* dl_runtime / dl_period		*/
	u64				dl_density;	/* dl_runtime / dl_deadline		*/

	/*
	 * Actual scheduling parameters. Initialized with the values above,
	 * they are continuously updated during task execution. Note that
	 * the remaining runtime could be < 0 in case we are in overrun.
	 */
	s64				runtime;	/* Remaining runtime for this instance	*/
	u64				deadline;	/* Absolute deadline for this instance	*/
	unsigned int			flags;		/* Specifying the scheduler behaviour	*/

	/*
	 * Some bool flags:
	 *
	 * @dl_throttled tells if we exhausted the runtime. If so, the
	 * task has to wait for a replenishment to be performed at the
	 * next firing of dl_timer.
	 *
	 * @dl_boosted tells if we are boosted due to deadline inheritance
	 * (DI). If so we are outside the bandwidth enforcement mechanism
	 * (but only until we exit the critical section);
	 *
	 * @dl_yielded tells if the task gave up the CPU before consuming
	 * all its available runtime during the last job.
	 *
	 * @dl_non_contending tells if the task is inactive while still
	 * contributing to the active utilization. In other words, it
	 * indicates if the inactive timer has been armed and its handler
	 * has not been executed yet. This flag is useful to avoid race
	 * conditions between the inactive timer handler and the wakeup
	 * code.
	 *
	 * @dl_overrun tells if the task asked to be informed about runtime
	 * overruns.
	 */
	unsigned int			dl_throttled      : 1;
	unsigned int			dl_yielded        : 1;
	unsigned int			dl_non_contending : 1;
	unsigned int			dl_overrun	  : 1;

	/*
	 * Bandwidth enforcement timer. Each -deadline task has its
	 * own bandwidth to be enforced, thus we need one timer per task.
	 */
	struct hrtimer			dl_timer;

	/*
	 * Inactive timer, responsible for decreasing the active utilization
	 * at the "0-lag time". When a -deadline task blocks, it contributes
	 * to GRUB's active utilization until the "0-lag time", hence a
	 * timer is needed to decrease the active utilization at the correct
	 * time.
	 */
	struct hrtimer			inactive_timer;

#ifdef CONFIG_RT_MUTEXES
	/*
	 * Priority Inheritance. When a DEADLINE scheduling entity is boosted
	 * pi_se points to the donor, otherwise it points to the dl_se it
	 * belongs to (the original one/itself).
	 */
	struct sched_dl_entity		*pi_se;
#endif
};
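
/*
 * Illustrative sketch (userspace side, assuming the sched_setattr(2)
 * syscall and nanosecond units): a task asking for 10ms of runtime every
 * 100ms, with a 30ms relative deadline, would pass
 *
 *	struct sched_attr attr = {
 *		.size		= sizeof(attr),
 *		.sched_policy	= SCHED_DEADLINE,
 *		.sched_runtime	= 10 * 1000 * 1000,
 *		.sched_deadline	= 30 * 1000 * 1000,
 *		.sched_period	= 100 * 1000 * 1000,
 *	};
 *
 * and those values land in dl_runtime/dl_deadline/dl_period above, with
 * the dl_bw and dl_density ratios precomputed as documented alongside
 * their fields.
 */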

#ifdef CONFIG_UCLAMP_TASK
/* Number of utilization clamp buckets (shorter alias) */
#define UCLAMP_BUCKETS CONFIG_UCLAMP_BUCKETS_COUNT

/*
 * Utilization clamp for a scheduling entity
 * @value:		clamp value "assigned" to a se
 * @bucket_id:		bucket index corresponding to the "assigned" value
 * @active:		the se is currently refcounted in a rq's bucket
 * @user_defined:	the requested clamp value comes from user-space
 *
 * The bucket_id is the index of the clamp bucket matching the clamp value
 * which is pre-computed and stored to avoid expensive integer divisions from
 * the fast path.
 *
 * The active bit is set whenever a task has got an "effective" value
 * assigned, which can be different from the clamp value "requested" from
 * user-space. This makes it possible to know that a task is refcounted in
 * the rq's bucket corresponding to the "effective" bucket_id.
 *
 * The user_defined bit is set whenever a task has got a task-specific clamp
 * value requested from userspace, i.e. the system defaults apply to this
 * task just as a restriction. This makes it possible to relax default clamps
 * when a less restrictive task-specific value has been requested, thus
 * implementing a "nice" semantic. For example, a task running with a 20%
 * default boost can still drop its own boosting to 0%.
 */
struct uclamp_se {
	unsigned int value		: bits_per(SCHED_CAPACITY_SCALE);
	unsigned int bucket_id		: bits_per(UCLAMP_BUCKETS);
	unsigned int active		: 1;
	unsigned int user_defined	: 1;
};
#endif /* CONFIG_UCLAMP_TASK */

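/*
 * Example of the pre-computed mapping (assuming the default
 * CONFIG_UCLAMP_BUCKETS_COUNT of 5): the bucket width is roughly
 * SCHED_CAPACITY_SCALE / UCLAMP_BUCKETS == 1024 / 5 ~= 205, so a clamp
 * value of 512 is stored with bucket_id == 512 / 205 == 2 and the fast
 * path never has to redo that division.
 */
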
union rcu_special {
	struct {
		u8			blocked;
		u8			need_qs;
		u8			exp_hint; /* Hint for performance. */
		u8			need_mb; /* Readers need smp_mb(). */
	} b; /* Bits. */
	u32 s; /* Set of bits. */
};

enum perf_event_task_context {
	perf_invalid_context = -1,
	perf_hw_context = 0,
	perf_sw_context,
	perf_nr_task_contexts,
};

struct wake_q_node {
	struct wake_q_node *next;
};

struct kmap_ctrl {
#ifdef CONFIG_KMAP_LOCAL
	int				idx;
	pte_t				pteval[KM_MAX_IDX];
#endif
};

struct task_struct {
#ifdef CONFIG_THREAD_INFO_IN_TASK
	/*
	 * For reasons of header soup (see current_thread_info()), this
	 * must be the first element of task_struct.
	 */
	struct thread_info		thread_info;
#endif
	/* -1 unrunnable, 0 runnable, >0 stopped: */
	volatile long			state;

	/*
	 * This begins the randomizable portion of task_struct. Only
	 * scheduling-critical items should be added above here.
	 */
	randomized_struct_fields_start

	void				*stack;
	refcount_t			usage;
	/* Per task flags (PF_*), defined further below: */
	unsigned int			flags;
	unsigned int			ptrace;

#ifdef CONFIG_SMP
	int				on_cpu;
	struct __call_single_node	wake_entry;
#ifdef CONFIG_THREAD_INFO_IN_TASK
	/* Current CPU: */
	unsigned int			cpu;
#endif
	unsigned int			wakee_flips;
	unsigned long			wakee_flip_decay_ts;
	struct task_struct		*last_wakee;

	/*
	 * recent_used_cpu is initially set as the last CPU used by a task
	 * that performs an affine wakeup of another task. Waker/wakee
	 * relationships can push tasks around a CPU where each wakeup moves
	 * to the next one. Tracking a recently used CPU allows a quick
	 * search for a recently used CPU that may be idle.
	 */
	int				recent_used_cpu;
	int				wake_cpu;
#endif
	int				on_rq;

	int				prio;
	int				static_prio;
	int				normal_prio;
	unsigned int			rt_priority;

	const struct sched_class	*sched_class;
	struct sched_entity		se;
	struct sched_rt_entity		rt;
#ifdef CONFIG_CGROUP_SCHED
	struct task_group		*sched_task_group;
#endif
	struct sched_dl_entity		dl;

#ifdef CONFIG_UCLAMP_TASK
	/*
	 * Clamp values requested for a scheduling entity.
	 * Must be updated with task_rq_lock() held.
	 */
	struct uclamp_se		uclamp_req[UCLAMP_CNT];
	/*
	 * Effective clamp values used for a scheduling entity.
	 * Must be updated with task_rq_lock() held.
	 */
	struct uclamp_se		uclamp[UCLAMP_CNT];
#endif

#ifdef CONFIG_PREEMPT_NOTIFIERS
	/* List of struct preempt_notifier: */
	struct hlist_head		preempt_notifiers;
#endif

#ifdef CONFIG_BLK_DEV_IO_TRACE
	unsigned int			btrace_seq;
#endif

	unsigned int			policy;
	int				nr_cpus_allowed;
	const cpumask_t			*cpus_ptr;
	cpumask_t			cpus_mask;
	void				*migration_pending;
#ifdef CONFIG_SMP
	unsigned short			migration_disabled;
#endif
	unsigned short			migration_flags;

#ifdef CONFIG_PREEMPT_RCU
	int				rcu_read_lock_nesting;
	union rcu_special		rcu_read_unlock_special;
	struct list_head		rcu_node_entry;
	struct rcu_node			*rcu_blocked_node;
#endif /* #ifdef CONFIG_PREEMPT_RCU */

#ifdef CONFIG_TASKS_RCU
	unsigned long			rcu_tasks_nvcsw;
	u8				rcu_tasks_holdout;
	u8				rcu_tasks_idx;
	int				rcu_tasks_idle_cpu;
	struct list_head		rcu_tasks_holdout_list;
#endif /* #ifdef CONFIG_TASKS_RCU */

#ifdef CONFIG_TASKS_TRACE_RCU
	int				trc_reader_nesting;
	int				trc_ipi_to_cpu;
	union rcu_special		trc_reader_special;
	bool				trc_reader_checked;
	struct list_head		trc_holdout_list;
#endif /* #ifdef CONFIG_TASKS_TRACE_RCU */

	struct sched_info		sched_info;

	struct list_head		tasks;
#ifdef CONFIG_SMP
	struct plist_node		pushable_tasks;
	struct rb_node			pushable_dl_tasks;
#endif

	struct mm_struct		*mm;
	struct mm_struct		*active_mm;

	/* Per-thread vma caching: */
	struct vmacache			vmacache;

#ifdef SPLIT_RSS_COUNTING
	struct task_rss_stat		rss_stat;
#endif
	int				exit_state;
	int				exit_code;
	int				exit_signal;
	/* The signal sent when the parent dies: */
	int				pdeath_signal;
	/* JOBCTL_*, siglock protected: */
	unsigned long			jobctl;

	/* Used for emulating ABI behavior of previous Linux versions: */
	unsigned int			personality;

	/* Scheduler bits, serialized by scheduler locks: */
	unsigned			sched_reset_on_fork:1;
	unsigned			sched_contributes_to_load:1;
	unsigned			sched_migrated:1;
#ifdef CONFIG_PSI
	unsigned			sched_psi_wake_requeue:1;
#endif

	/* Force alignment to the next boundary: */
	unsigned			:0;

	/* Unserialized, strictly 'current' */

	/*
	 * This field must not be in the scheduler word above due to wakelist
	 * queueing no longer being serialized by p->on_cpu. However:
	 *
	 * p->XXX = X;			ttwu()
	 * schedule()			  if (p->on_rq && ..) // false
	 *   smp_mb__after_spinlock();	  if (smp_load_acquire(&p->on_cpu) && //true
	 *   deactivate_task()		      ttwu_queue_wakelist())
	 *     p->on_rq = 0;			p->sched_remote_wakeup = Y;
	 *
	 * guarantees all stores of 'current' are visible before
	 * ->sched_remote_wakeup gets used, so it can be in this word.
	 */
	unsigned			sched_remote_wakeup:1;

	/* Bit to tell LSMs we're in execve(): */
	unsigned			in_execve:1;
	unsigned			in_iowait:1;
#ifndef TIF_RESTORE_SIGMASK
	unsigned			restore_sigmask:1;
#endif
#ifdef CONFIG_MEMCG
	unsigned			in_user_fault:1;
#endif
#ifdef CONFIG_COMPAT_BRK
	unsigned			brk_randomized:1;
#endif
#ifdef CONFIG_CGROUPS
	/* disallow userland-initiated cgroup migration */
	unsigned			no_cgroup_migration:1;
	/* task is frozen/stopped (used by the cgroup freezer) */
	unsigned			frozen:1;
#endif
#ifdef CONFIG_BLK_CGROUP
	unsigned			use_memdelay:1;
#endif
#ifdef CONFIG_PSI
	/* Stalled due to lack of memory */
	unsigned			in_memstall:1;
#endif
#ifdef CONFIG_PAGE_OWNER
	/* Used by page_owner=on to detect recursion in page tracking. */
	unsigned			in_page_owner:1;
#endif

	unsigned long			atomic_flags; /* Flags requiring atomic access. */

	struct restart_block		restart_block;

	pid_t				pid;
	pid_t				tgid;

#ifdef CONFIG_STACKPROTECTOR
	/* Canary value for the -fstack-protector GCC feature: */
	unsigned long			stack_canary;
#endif
	/*
	 * Pointers to the (original) parent process, youngest child, younger sibling,
	 * older sibling, respectively.  (p->father can be replaced with
	 * p->real_parent->pid)
	 */

	/* Real parent process: */
	struct task_struct __rcu	*real_parent;

	/* Recipient of SIGCHLD, wait4() reports: */
	struct task_struct __rcu	*parent;

	/*
	 * Children/sibling form the list of natural children:
	 */
	struct list_head		children;
	struct list_head		sibling;
	struct task_struct		*group_leader;

	/*
	 * 'ptraced' is the list of tasks this task is using ptrace() on.
	 *
	 * This includes both natural children and PTRACE_ATTACH targets.
	 * 'ptrace_entry' is this task's link on the p->parent->ptraced list.
	 */
	struct list_head		ptraced;
	struct list_head		ptrace_entry;

	/* PID/PID hash table linkage. */
	struct pid			*thread_pid;
	struct hlist_node		pid_links[PIDTYPE_MAX];
	struct list_head		thread_group;
	struct list_head		thread_node;

	struct completion		*vfork_done;

	/* CLONE_CHILD_SETTID: */
	int __user			*set_child_tid;

	/* CLONE_CHILD_CLEARTID: */
	int __user			*clear_child_tid;

	/* PF_IO_WORKER */
	void				*pf_io_worker;

	u64				utime;
	u64				stime;
#ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME
	u64				utimescaled;
	u64				stimescaled;
#endif
	u64				gtime;
	struct prev_cputime		prev_cputime;
#ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
	struct vtime			vtime;
#endif

#ifdef CONFIG_NO_HZ_FULL
	atomic_t			tick_dep_mask;
#endif
	/* Context switch counts: */
	unsigned long			nvcsw;
	unsigned long			nivcsw;

	/* Monotonic time in nsecs: */
	u64				start_time;

	/* Boot based time in nsecs: */
	u64				start_boottime;

	/* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */
	unsigned long			min_flt;
	unsigned long			maj_flt;

	/* Empty if CONFIG_POSIX_CPUTIMERS=n */
	struct posix_cputimers		posix_cputimers;

#ifdef CONFIG_POSIX_CPU_TIMERS_TASK_WORK
	struct posix_cputimers_work	posix_cputimers_work;
#endif

	/* Process credentials: */

	/* Tracer's credentials at attach: */
	const struct cred __rcu		*ptracer_cred;

	/* Objective and real subjective task credentials (COW): */
	const struct cred __rcu		*real_cred;

	/* Effective (overridable) subjective task credentials (COW): */
	const struct cred __rcu		*cred;

#ifdef CONFIG_KEYS
	/* Cached requested key. */
	struct key			*cached_requested_key;
#endif

	/*
	 * executable name, excluding path.
	 *
	 * - normally initialized by setup_new_exec()
	 * - access it with [gs]et_task_comm()
	 * - lock it with task_lock()
	 */
	char				comm[TASK_COMM_LEN];
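
	/*
	 * For example (illustrative only; get_task_comm() is defined later
	 * in this header), a safe snapshot of the name looks like:
	 *
	 *	char buf[TASK_COMM_LEN];
	 *
	 *	get_task_comm(buf, tsk);
	 *
	 * rather than reading tsk->comm directly, which can race with a
	 * concurrent prctl(PR_SET_NAME).
	 */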

	struct nameidata		*nameidata;

#ifdef CONFIG_SYSVIPC
	struct sysv_sem			sysvsem;
	struct sysv_shm			sysvshm;
#endif
#ifdef CONFIG_DETECT_HUNG_TASK
	unsigned long			last_switch_count;
	unsigned long			last_switch_time;
#endif
	/* Filesystem information: */
	struct fs_struct		*fs;

	/* Open file information: */
	struct files_struct		*files;

#ifdef CONFIG_IO_URING
	struct io_uring_task		*io_uring;
#endif

	/* Namespaces: */
	struct nsproxy			*nsproxy;

	/* Signal handlers: */
	struct signal_struct		*signal;
	struct sighand_struct __rcu	*sighand;
	struct sigqueue			*sigqueue_cache;
	sigset_t			blocked;
	sigset_t			real_blocked;
	/* Restored if set_restore_sigmask() was used: */
	sigset_t			saved_sigmask;
	struct sigpending		pending;
	unsigned long			sas_ss_sp;
	size_t				sas_ss_size;
	unsigned int			sas_ss_flags;

	struct callback_head		*task_works;

#ifdef CONFIG_AUDIT
#ifdef CONFIG_AUDITSYSCALL
	struct audit_context		*audit_context;
#endif
	kuid_t				loginuid;
	unsigned int			sessionid;
#endif
	struct seccomp			seccomp;
	struct syscall_user_dispatch	syscall_dispatch;

	/* Thread group tracking: */
	u64				parent_exec_id;
	u64				self_exec_id;

	/* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */
	spinlock_t			alloc_lock;

	/* Protection of the PI data structures: */
	raw_spinlock_t			pi_lock;

	struct wake_q_node		wake_q;

#ifdef CONFIG_RT_MUTEXES
	/* PI waiters blocked on a rt_mutex held by this task: */
	struct rb_root_cached		pi_waiters;
	/* Updated under owner's pi_lock and rq lock */
	struct task_struct		*pi_top_task;
	/* Deadlock detection and priority inheritance handling: */
	struct rt_mutex_waiter		*pi_blocked_on;
#endif

#ifdef CONFIG_DEBUG_MUTEXES
	/* Mutex deadlock detection: */
	struct mutex_waiter		*blocked_on;
#endif

#ifdef CONFIG_DEBUG_ATOMIC_SLEEP
	int				non_block_count;
#endif

#ifdef CONFIG_TRACE_IRQFLAGS
	struct irqtrace_events		irqtrace;
	unsigned int			hardirq_threaded;
	u64				hardirq_chain_key;
	int				softirqs_enabled;
	int				softirq_context;
	int				irq_config;
#endif
#ifdef CONFIG_PREEMPT_RT
	int				softirq_disable_cnt;
#endif

#ifdef CONFIG_LOCKDEP
# define MAX_LOCK_DEPTH			48UL
	u64				curr_chain_key;
	int				lockdep_depth;
	unsigned int			lockdep_recursion;
	struct held_lock		held_locks[MAX_LOCK_DEPTH];
#endif

#if defined(CONFIG_UBSAN) && !defined(CONFIG_UBSAN_TRAP)
	unsigned int			in_ubsan;
#endif

	/* Journalling filesystem info: */
	void				*journal_info;

	/* Stacked block device info: */
	struct bio_list			*bio_list;

#ifdef CONFIG_BLOCK
	/* Stack plugging: */
	struct blk_plug			*plug;
#endif

	/* VM state: */
	struct reclaim_state		*reclaim_state;

	struct backing_dev_info		*backing_dev_info;

	struct io_context		*io_context;

#ifdef CONFIG_COMPACTION
	struct capture_control		*capture_control;
#endif
	/* Ptrace state: */
	unsigned long			ptrace_message;
	kernel_siginfo_t		*last_siginfo;

	struct task_io_accounting	ioac;
#ifdef CONFIG_PSI
	/* Pressure stall state */
	unsigned int			psi_flags;
#endif
#ifdef CONFIG_TASK_XACCT
	/* Accumulated RSS usage: */
	u64				acct_rss_mem1;
	/* Accumulated virtual memory usage: */
	u64				acct_vm_mem1;
	/* stime + utime since last update: */
	u64				acct_timexpd;
#endif
#ifdef CONFIG_CPUSETS
	/* Protected by ->alloc_lock: */
	nodemask_t			mems_allowed;
	/* Sequence number to catch updates: */
	seqcount_spinlock_t		mems_allowed_seq;
	int				cpuset_mem_spread_rotor;
	int				cpuset_slab_spread_rotor;
#endif
#ifdef CONFIG_CGROUPS
	/* Control Group info protected by css_set_lock: */
	struct css_set __rcu		*cgroups;
	/* cg_list protected by css_set_lock and tsk->alloc_lock: */
	struct list_head		cg_list;
#endif
#ifdef CONFIG_X86_CPU_RESCTRL
	u32				closid;
	u32				rmid;
#endif
#ifdef CONFIG_FUTEX
	struct robust_list_head __user	*robust_list;
112634f192c6SIngo Molnar #ifdef CONFIG_COMPAT
112734f192c6SIngo Molnar 	struct compat_robust_list_head __user *compat_robust_list;
112834f192c6SIngo Molnar #endif
1129c87e2837SIngo Molnar 	struct list_head		pi_state_list;
1130c87e2837SIngo Molnar 	struct futex_pi_state		*pi_state_cache;
11313f186d97SThomas Gleixner 	struct mutex			futex_exit_mutex;
11323d4775dfSThomas Gleixner 	unsigned int			futex_state;
113342b2dd0aSAlexey Dobriyan #endif
1134cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS
11358dc85d54SPeter Zijlstra 	struct perf_event_context	*perf_event_ctxp[perf_nr_task_contexts];
1136cdd6c482SIngo Molnar 	struct mutex			perf_event_mutex;
1137cdd6c482SIngo Molnar 	struct list_head		perf_event_list;
1138a63eaf34SPaul Mackerras #endif
11398f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT
11408f47b187SThomas Gleixner 	unsigned long			preempt_disable_ip;
11418f47b187SThomas Gleixner #endif
1142c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA
11435eca1c10SIngo Molnar 	/* Protected by alloc_lock: */
11445eca1c10SIngo Molnar 	struct mempolicy		*mempolicy;
114545816682SVlastimil Babka 	short				il_prev;
1146207205a2SEric Dumazet 	short				pref_node_fork;
1147c7aceabaSRichard Kennedy #endif
1148cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING
1149cbee9f88SPeter Zijlstra 	int				numa_scan_seq;
1150cbee9f88SPeter Zijlstra 	unsigned int			numa_scan_period;
1151598f0ec0SMel Gorman 	unsigned int			numa_scan_period_max;
1152de1c9ce6SRik van Riel 	int				numa_preferred_nid;
11536b9a7460SMel Gorman 	unsigned long			numa_migrate_retry;
11545eca1c10SIngo Molnar 	/* Migration stamp: */
11555eca1c10SIngo Molnar 	u64				node_stamp;
11567e2703e6SRik van Riel 	u64				last_task_numa_placement;
11577e2703e6SRik van Riel 	u64				last_sum_exec_runtime;
1158cbee9f88SPeter Zijlstra 	struct callback_head		numa_work;
1159f809ca9aSMel Gorman 
1160cb361d8cSJann Horn 	/*
1161cb361d8cSJann Horn 	 * This pointer is only modified for current, in syscall and
1162cb361d8cSJann Horn 	 * page-fault context (and for tasks being destroyed), so it can be
1163cb361d8cSJann Horn 	 * read safely in any of the following ways:
1164cb361d8cSJann Horn 	 *  - inside an RCU read-side critical section
1165cb361d8cSJann Horn 	 *  - via current->numa_group from any context
1166cb361d8cSJann Horn 	 *  - with the task's runqueue locked and the task not running
1167cb361d8cSJann Horn 	 */
1168cb361d8cSJann Horn 	struct numa_group __rcu		*numa_group;
11698c8a743cSPeter Zijlstra 
1170745d6147SMel Gorman 	/*
117144dba3d5SIulia Manda 	 * numa_faults is an array split into four regions:
117244dba3d5SIulia Manda 	 * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer
117344dba3d5SIulia Manda 	 * in this precise order.
117444dba3d5SIulia Manda 	 *
117544dba3d5SIulia Manda 	 * faults_memory: Exponential decaying average of faults on a per-node
117644dba3d5SIulia Manda 	 * basis. Scheduling placement decisions are made based on these
117744dba3d5SIulia Manda 	 * counts. The values remain static for the duration of a PTE scan.
117844dba3d5SIulia Manda 	 * faults_cpu: Track the nodes the process was running on when a NUMA
117944dba3d5SIulia Manda 	 * hinting fault was incurred.
118044dba3d5SIulia Manda 	 * faults_memory_buffer and faults_cpu_buffer: Record faults per node
118144dba3d5SIulia Manda 	 * during the current scan window. When the scan completes, the counts
118244dba3d5SIulia Manda 	 * in faults_memory and faults_cpu decay and these values are copied.
1183745d6147SMel Gorman 	 */
118444dba3d5SIulia Manda 	unsigned long			*numa_faults;
118583e1d2cdSMel Gorman 	unsigned long			total_numa_faults;
1186745d6147SMel Gorman 
1187745d6147SMel Gorman 	/*
118804bb2f94SRik van Riel 	 * numa_faults_locality tracks whether faults recorded during the last
1189074c2381SMel Gorman 	 * scan window were remote/local or failed to migrate. The task scan
1190074c2381SMel Gorman 	 * period is adapted based on the locality of the faults, with
1191074c2381SMel Gorman 	 * different weights depending on whether they were shared or private.
119204bb2f94SRik van Riel 	 */
1193074c2381SMel Gorman 	unsigned long			numa_faults_locality[3];
119404bb2f94SRik van Riel 
1195b32e86b4SIngo Molnar 	unsigned long			numa_pages_migrated;
1196cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */
1197cbee9f88SPeter Zijlstra 
1198d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ
1199d7822b1eSMathieu Desnoyers 	struct rseq __user		*rseq;
1200d7822b1eSMathieu Desnoyers 	u32				rseq_sig;
1201d7822b1eSMathieu Desnoyers 	/*
1202d7822b1eSMathieu Desnoyers 	 * RmW on rseq_event_mask must be performed atomically
1203d7822b1eSMathieu Desnoyers 	 * with respect to preemption.
1204d7822b1eSMathieu Desnoyers 	 */
1205d7822b1eSMathieu Desnoyers 	unsigned long			rseq_event_mask;
1206d7822b1eSMathieu Desnoyers #endif
1207d7822b1eSMathieu Desnoyers 
120872b252aeSMel Gorman 	struct tlbflush_unmap_batch	tlb_ubc;
120972b252aeSMel Gorman 
12103fbd7ee2SEric W. Biederman 	union {
12113fbd7ee2SEric W. Biederman 		refcount_t		rcu_users;
1212e56d0903SIngo Molnar 		struct rcu_head		rcu;
12133fbd7ee2SEric W. Biederman 	};
1214b92ce558SJens Axboe 
12155eca1c10SIngo Molnar 	/* Cache last used pipe for splice(): */
1216b92ce558SJens Axboe 	struct pipe_inode_info		*splice_pipe;
12175640f768SEric Dumazet 
12185640f768SEric Dumazet 	struct page_frag		task_frag;
12195640f768SEric Dumazet 
1220ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT
1221ca74e92bSShailabh Nagar 	struct task_delay_info		*delays;
1222ca74e92bSShailabh Nagar #endif
122347913d4eSIngo Molnar 
1224f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION
1225f4f154fdSAkinobu Mita 	int				make_it_fail;
12269049f2f6SAkinobu Mita 	unsigned int			fail_nth;
1227f4f154fdSAkinobu Mita #endif
12289d823e8fSWu Fengguang 	/*
12295eca1c10SIngo Molnar 	 * When (nr_dirtied >= nr_dirtied_pause), it's time to call
12305eca1c10SIngo Molnar 	 * balance_dirty_pages() for a dirty throttling pause:
12319d823e8fSWu Fengguang 	 */
12329d823e8fSWu Fengguang 	int				nr_dirtied;
12339d823e8fSWu Fengguang 	int				nr_dirtied_pause;
12345eca1c10SIngo Molnar 	/* Start of a write-and-pause period: */
12355eca1c10SIngo Molnar 	unsigned long			dirty_paused_when;
12369d823e8fSWu Fengguang 
12379745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP
12389745512cSArjan van de Ven 	int				latency_record_count;
12399745512cSArjan van de Ven 	struct latency_record		latency_record[LT_SAVECOUNT];
12409745512cSArjan van de Ven #endif
12416976675dSArjan van de Ven 	/*
12425eca1c10SIngo Molnar 	 * Time slack values; these are used to round up poll() and
12436976675dSArjan van de Ven 	 * select() etc. timeout values. These are in nanoseconds.
12446976675dSArjan van de Ven 	 */
1245da8b44d5SJohn Stultz 	u64				timer_slack_ns;
1246da8b44d5SJohn Stultz 	u64				default_timer_slack_ns;
1247f8d570a4SDavid Miller 
1248d73b4936SAndrey Konovalov #if defined(CONFIG_KASAN_GENERIC) || defined(CONFIG_KASAN_SW_TAGS)
12490b24beccSAndrey Ryabinin 	unsigned int			kasan_depth;
12500b24beccSAndrey Ryabinin #endif
125192c209acSMarco Elver 
1252dfd402a4SMarco Elver #ifdef CONFIG_KCSAN
1253dfd402a4SMarco Elver 	struct kcsan_ctx		kcsan_ctx;
125492c209acSMarco Elver #ifdef CONFIG_TRACE_IRQFLAGS
125592c209acSMarco Elver 	struct irqtrace_events		kcsan_save_irqtrace;
125692c209acSMarco Elver #endif
1257dfd402a4SMarco Elver #endif
12585eca1c10SIngo Molnar 
1259393824f6SPatricia Alfonso #if IS_ENABLED(CONFIG_KUNIT)
1260393824f6SPatricia Alfonso 	struct kunit			*kunit_test;
1261393824f6SPatricia Alfonso #endif
1262393824f6SPatricia Alfonso 
1263fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER
12645eca1c10SIngo Molnar 	/* Index of current stored address in ret_stack: */
1265f201ae23SFrederic Weisbecker 	int				curr_ret_stack;
126639eb456dSSteven Rostedt (VMware) 	int				curr_ret_depth;
12675eca1c10SIngo Molnar 
12685eca1c10SIngo Molnar 	/* Stack of return addresses for return function tracing: */
1269f201ae23SFrederic Weisbecker 	struct ftrace_ret_stack		*ret_stack;
12705eca1c10SIngo Molnar 
12715eca1c10SIngo Molnar 	/* Timestamp for last schedule: */
12728aef2d28SSteven Rostedt 	unsigned long long		ftrace_timestamp;
12735eca1c10SIngo Molnar 
1274f201ae23SFrederic Weisbecker 	/*
1275f201ae23SFrederic Weisbecker 	 * Number of functions that haven't been traced
12765eca1c10SIngo Molnar 	 * because of depth overrun:
1277f201ae23SFrederic Weisbecker 	 */
1278f201ae23SFrederic Weisbecker 	atomic_t			trace_overrun;
12795eca1c10SIngo Molnar 
12805eca1c10SIngo Molnar 	/* Pause tracing: */
1281380c4b14SFrederic Weisbecker 	atomic_t			tracing_graph_pause;
1282f201ae23SFrederic Weisbecker #endif
12835eca1c10SIngo Molnar 
1284ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING
12855eca1c10SIngo Molnar 	/* State flags for use by tracers: */
1286ea4e2bc4SSteven Rostedt 	unsigned long			trace;
12875eca1c10SIngo Molnar 
12885eca1c10SIngo Molnar 	/* Bitmask and counter of trace recursion: */
1289261842b7SSteven Rostedt 	unsigned long			trace_recursion;
1290261842b7SSteven Rostedt #endif /* CONFIG_TRACING */
12915eca1c10SIngo Molnar 
12925c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV
1293eec028c9SAndrey Konovalov 	/* See kernel/kcov.c for more details. */
1294eec028c9SAndrey Konovalov 
12955eca1c10SIngo Molnar 	/* Coverage collection mode enabled for this task (0 if disabled): */
12960ed557aaSMark Rutland 	unsigned int			kcov_mode;
12975eca1c10SIngo Molnar 
12985eca1c10SIngo Molnar 	/* Size of the kcov_area: */
12995eca1c10SIngo Molnar 	unsigned int			kcov_size;
13005eca1c10SIngo Molnar 
13015eca1c10SIngo Molnar 	/* Buffer for coverage collection: */
13025c9a8750SDmitry Vyukov 	void				*kcov_area;
13035eca1c10SIngo Molnar 
13045eca1c10SIngo Molnar 	/* KCOV descriptor wired with this task or NULL: */
13055c9a8750SDmitry Vyukov 	struct kcov			*kcov;
1306eec028c9SAndrey Konovalov 
1307eec028c9SAndrey Konovalov 	/* KCOV common handle for remote coverage collection: */
1308eec028c9SAndrey Konovalov 	u64				kcov_handle;
1309eec028c9SAndrey Konovalov 
1310eec028c9SAndrey Konovalov 	/* KCOV sequence number: */
1311eec028c9SAndrey Konovalov 	int				kcov_sequence;
13125ff3b30aSAndrey Konovalov 
13135ff3b30aSAndrey Konovalov 	/* Collect coverage from softirq context: */
13145ff3b30aSAndrey Konovalov 	unsigned int			kcov_softirq;
13155c9a8750SDmitry Vyukov #endif
13165eca1c10SIngo Molnar 
13176f185c29SVladimir Davydov #ifdef CONFIG_MEMCG
1318626ebc41STejun Heo 	struct mem_cgroup		*memcg_in_oom;
1319626ebc41STejun Heo 	gfp_t				memcg_oom_gfp_mask;
1320626ebc41STejun Heo 	int				memcg_oom_order;
1321b23afb93STejun Heo 
13225eca1c10SIngo Molnar 	/* Number of pages to reclaim on returning to userland: */
1323b23afb93STejun Heo 	unsigned int			memcg_nr_pages_over_high;
1324d46eb14bSShakeel Butt 
1325d46eb14bSShakeel Butt 	/* Used by memcontrol for targeted memcg charge: */
1326d46eb14bSShakeel Butt 	struct mem_cgroup		*active_memcg;
1327569b846dSKAMEZAWA Hiroyuki #endif
13285eca1c10SIngo Molnar 
1329d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP
1330d09d8df3SJosef Bacik 	struct request_queue		*throttle_queue;
1331d09d8df3SJosef Bacik #endif
1332d09d8df3SJosef Bacik 
13330326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES
13340326f5a9SSrikar Dronamraju 	struct uprobe_task		*utask;
13350326f5a9SSrikar Dronamraju #endif
1336cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE)
1337cafe5635SKent Overstreet 	unsigned int			sequential_io;
1338cafe5635SKent Overstreet 	unsigned int			sequential_io_avg;
1339cafe5635SKent Overstreet #endif
13405fbda3ecSThomas Gleixner 	struct kmap_ctrl		kmap_ctrl;
13418eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
13428eb23b9fSPeter Zijlstra 	unsigned long			task_state_change;
13438eb23b9fSPeter Zijlstra #endif
13448bcbde54SDavid Hildenbrand 	int				pagefault_disabled;
134503049269SMichal Hocko #ifdef CONFIG_MMU
134629c696e1SVladimir Davydov 	struct task_struct		*oom_reaper_list;
134703049269SMichal Hocko #endif
1348ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK
1349ba14a194SAndy Lutomirski 	struct vm_struct		*stack_vm_area;
1350ba14a194SAndy Lutomirski #endif
135168f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
13525eca1c10SIngo Molnar 	/* A live task holds one reference: */
1353f0b89d39SElena Reshetova 	refcount_t			stack_refcount;
135468f24b08SAndy Lutomirski #endif
1355d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH
1356d83a7cb3SJosh Poimboeuf 	int				patch_state;
1357d83a7cb3SJosh Poimboeuf #endif
1358e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY
1359e4e55b47STetsuo Handa 	/* Used by LSM modules for access restriction: */
1360e4e55b47STetsuo Handa 	void				*security;
1361e4e55b47STetsuo Handa #endif
1362a10787e6SSong Liu #ifdef CONFIG_BPF_SYSCALL
1363a10787e6SSong Liu 	/* Used by BPF task local storage */
1364a10787e6SSong Liu 	struct bpf_local_storage __rcu	*bpf_storage;
1365a10787e6SSong Liu #endif
136629e48ce8SKees Cook 
1367afaef01cSAlexander Popov #ifdef CONFIG_GCC_PLUGIN_STACKLEAK
1368afaef01cSAlexander Popov 	unsigned long			lowest_stack;
1369c8d12627SAlexander Popov 	unsigned long			prev_lowest_stack;
1370afaef01cSAlexander Popov #endif
1371afaef01cSAlexander Popov 
13725567d11cSPeter Zijlstra #ifdef CONFIG_X86_MCE
1373c0ab7ffcSTony Luck 	void __user			*mce_vaddr;
1374c0ab7ffcSTony Luck 	__u64				mce_kflags;
13755567d11cSPeter Zijlstra 	u64				mce_addr;
137617fae129STony Luck 	__u64				mce_ripv : 1,
137717fae129STony Luck 					mce_whole_page : 1,
137817fae129STony Luck 					__mce_reserved : 62;
13795567d11cSPeter Zijlstra 	struct callback_head		mce_kill_me;
13805567d11cSPeter Zijlstra #endif
13815567d11cSPeter Zijlstra 
1382d741bf41SPeter Zijlstra #ifdef CONFIG_KRETPROBES
1383d741bf41SPeter Zijlstra 	struct llist_head               kretprobe_instances;
1384d741bf41SPeter Zijlstra #endif
1385d741bf41SPeter Zijlstra 
138629e48ce8SKees Cook 	/*
138729e48ce8SKees Cook 	 * New fields for task_struct should be added above here, so that
138829e48ce8SKees Cook 	 * they are included in the randomized portion of task_struct.
138929e48ce8SKees Cook 	 */
139029e48ce8SKees Cook 	randomized_struct_fields_end
139129e48ce8SKees Cook 
13925eca1c10SIngo Molnar 	/* CPU-specific state of this task: */
13930c8c0f03SDave Hansen 	struct thread_struct		thread;
13945eca1c10SIngo Molnar 
13950c8c0f03SDave Hansen 	/*
13960c8c0f03SDave Hansen 	 * WARNING: on x86, 'thread_struct' contains a variable-sized
13970c8c0f03SDave Hansen 	 * structure.  It *MUST* be at the end of 'task_struct'.
13980c8c0f03SDave Hansen 	 *
13990c8c0f03SDave Hansen 	 * Do not put anything below here!
14000c8c0f03SDave Hansen 	 */
14011da177e4SLinus Torvalds };
14021da177e4SLinus Torvalds 
1403e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task)
140422c935f4SEric W. Biederman {
14052c470475SEric W. Biederman 	return task->thread_pid;
140622c935f4SEric W. Biederman }
140722c935f4SEric W. Biederman 
14087af57294SPavel Emelyanov /*
14097af57294SPavel Emelyanov  * Helpers to get the task's different PIDs as they are seen
14107af57294SPavel Emelyanov  * from various namespaces:
14117af57294SPavel Emelyanov  *
14127af57294SPavel Emelyanov  * task_xid_nr()     : global id, i.e. the id seen from the init namespace;
141344c4e1b2SEric W. Biederman  * task_xid_vnr()    : virtual id, i.e. the id seen from the pid namespace of
141444c4e1b2SEric W. Biederman  *                     current.
14157af57294SPavel Emelyanov  * task_xid_nr_ns()  : id seen from the ns specified;
14167af57294SPavel Emelyanov  *
14177af57294SPavel Emelyanov  * see also pid_nr() etc in include/linux/pid.h
14187af57294SPavel Emelyanov  */
14195eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns);
14207af57294SPavel Emelyanov 
1421e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk)
14227af57294SPavel Emelyanov {
14237af57294SPavel Emelyanov 	return tsk->pid;
14247af57294SPavel Emelyanov }
14257af57294SPavel Emelyanov 
14265eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
142752ee2dfdSOleg Nesterov {
142852ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
142952ee2dfdSOleg Nesterov }
14307af57294SPavel Emelyanov 
14317af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk)
14327af57294SPavel Emelyanov {
143352ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
14347af57294SPavel Emelyanov }
14357af57294SPavel Emelyanov 
14367af57294SPavel Emelyanov 
1437e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk)
14387af57294SPavel Emelyanov {
14397af57294SPavel Emelyanov 	return tsk->tgid;
14407af57294SPavel Emelyanov }
14417af57294SPavel Emelyanov 
14425eca1c10SIngo Molnar /**
14435eca1c10SIngo Molnar  * pid_alive - check that a task structure is not stale
14445eca1c10SIngo Molnar  * @p: Task structure to be checked.
14455eca1c10SIngo Molnar  *
14465eca1c10SIngo Molnar  * Test if a process is not yet dead (at most in zombie state).
14475eca1c10SIngo Molnar  * If pid_alive fails, then pointers within the task structure
14485eca1c10SIngo Molnar  * can be stale and must not be dereferenced.
14495eca1c10SIngo Molnar  *
14505eca1c10SIngo Molnar  * Return: 1 if the process is alive. 0 otherwise.
14515eca1c10SIngo Molnar  */
14525eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p)
14535eca1c10SIngo Molnar {
14542c470475SEric W. Biederman 	return p->thread_pid != NULL;
14555eca1c10SIngo Molnar }
14567af57294SPavel Emelyanov 
14575eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
14587af57294SPavel Emelyanov {
145952ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
14607af57294SPavel Emelyanov }
14617af57294SPavel Emelyanov 
14627af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
14637af57294SPavel Emelyanov {
146452ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
14657af57294SPavel Emelyanov }
14667af57294SPavel Emelyanov 
14677af57294SPavel Emelyanov 
14685eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
14697af57294SPavel Emelyanov {
147052ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
14717af57294SPavel Emelyanov }
14727af57294SPavel Emelyanov 
14737af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk)
14747af57294SPavel Emelyanov {
147552ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
14767af57294SPavel Emelyanov }
14777af57294SPavel Emelyanov 
1478dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
1479dd1c1f2fSOleg Nesterov {
14806883f81aSEric W. Biederman 	return __task_pid_nr_ns(tsk, PIDTYPE_TGID, ns);
1481dd1c1f2fSOleg Nesterov }
1482dd1c1f2fSOleg Nesterov 
1483dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk)
1484dd1c1f2fSOleg Nesterov {
14856883f81aSEric W. Biederman 	return __task_pid_nr_ns(tsk, PIDTYPE_TGID, NULL);
1486dd1c1f2fSOleg Nesterov }
1487dd1c1f2fSOleg Nesterov 
1488dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns)
1489dd1c1f2fSOleg Nesterov {
1490dd1c1f2fSOleg Nesterov 	pid_t pid = 0;
1491dd1c1f2fSOleg Nesterov 
1492dd1c1f2fSOleg Nesterov 	rcu_read_lock();
1493dd1c1f2fSOleg Nesterov 	if (pid_alive(tsk))
1494dd1c1f2fSOleg Nesterov 		pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns);
1495dd1c1f2fSOleg Nesterov 	rcu_read_unlock();
1496dd1c1f2fSOleg Nesterov 
1497dd1c1f2fSOleg Nesterov 	return pid;
1498dd1c1f2fSOleg Nesterov }
1499dd1c1f2fSOleg Nesterov 
1500dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk)
1501dd1c1f2fSOleg Nesterov {
1502dd1c1f2fSOleg Nesterov 	return task_ppid_nr_ns(tsk, &init_pid_ns);
1503dd1c1f2fSOleg Nesterov }
1504dd1c1f2fSOleg Nesterov 
15055eca1c10SIngo Molnar /* Obsolete, do not use: */
15061b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk)
15071b0f7ffdSOleg Nesterov {
15081b0f7ffdSOleg Nesterov 	return task_pgrp_nr_ns(tsk, &init_pid_ns);
15091b0f7ffdSOleg Nesterov }
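
/*
 * Illustrative sketch (not part of the original header): how the *_nr(),
 * *_vnr() and *_nr_ns() helpers above relate. The function name
 * print_pids() is hypothetical; task_active_pid_ns() is declared in
 * <linux/pid_namespace.h>.
 */
static inline void print_pids(struct task_struct *tsk)
{
	/* Global id, as seen from the init PID namespace: */
	pr_info("global pid: %d\n", task_pid_nr(tsk));
	/* Virtual id, as seen from the PID namespace of current: */
	pr_info("virtual pid: %d\n", task_pid_vnr(tsk));
	/* Id as seen from an explicitly specified namespace: */
	pr_info("ns-local pid: %d\n",
		task_pid_nr_ns(tsk, task_active_pid_ns(current)));
}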
15107af57294SPavel Emelyanov 
151106eb6184SPeter Zijlstra #define TASK_REPORT_IDLE	(TASK_REPORT + 1)
151206eb6184SPeter Zijlstra #define TASK_REPORT_MAX		(TASK_REPORT_IDLE << 1)
151306eb6184SPeter Zijlstra 
15141d48b080SPeter Zijlstra static inline unsigned int task_state_index(struct task_struct *tsk)
151520435d84SXie XiuQi {
15161593baabSPeter Zijlstra 	unsigned int tsk_state = READ_ONCE(tsk->state);
15171593baabSPeter Zijlstra 	unsigned int state = (tsk_state | tsk->exit_state) & TASK_REPORT;
151820435d84SXie XiuQi 
151906eb6184SPeter Zijlstra 	BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX);
152006eb6184SPeter Zijlstra 
152106eb6184SPeter Zijlstra 	if (tsk_state == TASK_IDLE)
152206eb6184SPeter Zijlstra 		state = TASK_REPORT_IDLE;
152306eb6184SPeter Zijlstra 
15241593baabSPeter Zijlstra 	return fls(state);
15251593baabSPeter Zijlstra }
152620435d84SXie XiuQi 
15271d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state)
15281593baabSPeter Zijlstra {
15298ef9925bSPeter Zijlstra 	static const char state_char[] = "RSDTtXZPI";
15301593baabSPeter Zijlstra 
153106eb6184SPeter Zijlstra 	BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1);
15321593baabSPeter Zijlstra 
15331593baabSPeter Zijlstra 	return state_char[state];
15341593baabSPeter Zijlstra }
15351593baabSPeter Zijlstra 
15361593baabSPeter Zijlstra static inline char task_state_to_char(struct task_struct *tsk)
15371593baabSPeter Zijlstra {
15381d48b080SPeter Zijlstra 	return task_index_to_char(task_state_index(tsk));
153920435d84SXie XiuQi }
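
/*
 * Illustrative sketch (not part of the original header): these helpers
 * produce the single-letter state shown by tools such as ps(1) ('R'
 * running, 'S' sleeping, 'Z' zombie, 'I' idle, ...). A hypothetical caller:
 */
static inline void report_state(struct task_struct *tsk)
{
	/* E.g. TASK_RUNNING -> 'R', TASK_IDLE -> 'I': */
	pr_info("%s: state %c\n", tsk->comm, task_state_to_char(tsk));
}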
154020435d84SXie XiuQi 
15411da177e4SLinus Torvalds /**
1542570f5241SSergey Senozhatsky  * is_global_init - check if a task structure is init.
1543570f5241SSergey Senozhatsky  * @tsk: Task structure to be checked.
15443260259fSHenne  *
15453260259fSHenne  * Check if a task structure is the first user space task the kernel created.
15463260259fSHenne  * Since init is free to have sub-threads, we need to check the tgid.
1547e69f6186SYacine Belkadi  *
1548e69f6186SYacine Belkadi  * Return: 1 if the task structure is init. 0 otherwise.
1549f400e198SSukadev Bhattiprolu  */
1550e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk)
1551b461cc03SPavel Emelyanov {
1552570f5241SSergey Senozhatsky 	return task_tgid_nr(tsk) == 1;
1553b461cc03SPavel Emelyanov }
1554b460cbc5SSerge E. Hallyn 
15559ec52099SCedric Le Goater extern struct pid *cad_pid;
15569ec52099SCedric Le Goater 
15571da177e4SLinus Torvalds /*
15581da177e4SLinus Torvalds  * Per process flags
15591da177e4SLinus Torvalds  */
156001ccf592SSebastian Andrzej Siewior #define PF_VCPU			0x00000001	/* I'm a virtual CPU */
1561c1de45caSPeter Zijlstra #define PF_IDLE			0x00000002	/* I am an IDLE thread */
15625eca1c10SIngo Molnar #define PF_EXITING		0x00000004	/* Getting shut down */
156301ccf592SSebastian Andrzej Siewior #define PF_IO_WORKER		0x00000010	/* Task is an IO worker */
156421aa9af0STejun Heo #define PF_WQ_WORKER		0x00000020	/* I'm a workqueue worker */
15655eca1c10SIngo Molnar #define PF_FORKNOEXEC		0x00000040	/* Forked but didn't exec */
15665eca1c10SIngo Molnar #define PF_MCE_PROCESS		0x00000080      /* Process policy on mce errors */
15675eca1c10SIngo Molnar #define PF_SUPERPRIV		0x00000100	/* Used super-user privileges */
15685eca1c10SIngo Molnar #define PF_DUMPCORE		0x00000200	/* Dumped core */
15695eca1c10SIngo Molnar #define PF_SIGNALED		0x00000400	/* Killed by a signal */
15701da177e4SLinus Torvalds #define PF_MEMALLOC		0x00000800	/* Allocating memory */
15715eca1c10SIngo Molnar #define PF_NPROC_EXCEEDED	0x00001000	/* set_user() noticed that RLIMIT_NPROC was exceeded */
15725eca1c10SIngo Molnar #define PF_USED_MATH		0x00002000	/* If unset, the FPU must be initialized before use */
15735eca1c10SIngo Molnar #define PF_USED_ASYNC		0x00004000	/* Used async_schedule*(), used by module init */
15745eca1c10SIngo Molnar #define PF_NOFREEZE		0x00008000	/* This thread should not be frozen */
15755eca1c10SIngo Molnar #define PF_FROZEN		0x00010000	/* Frozen for system suspend */
15767dea19f9SMichal Hocko #define PF_KSWAPD		0x00020000	/* I am kswapd */
15777dea19f9SMichal Hocko #define PF_MEMALLOC_NOFS	0x00040000	/* All allocation requests will inherit GFP_NOFS */
15787dea19f9SMichal Hocko #define PF_MEMALLOC_NOIO	0x00080000	/* All allocation requests will inherit GFP_NOIO */
1579a37b0715SNeilBrown #define PF_LOCAL_THROTTLE	0x00100000	/* Throttle writes only against the bdi I write to,
1580a37b0715SNeilBrown 						 * I am cleaning dirty pages from some other bdi. */
1581246bb0b1SOleg Nesterov #define PF_KTHREAD		0x00200000	/* I am a kernel thread */
15825eca1c10SIngo Molnar #define PF_RANDOMIZE		0x00400000	/* Randomize virtual address space */
1583b31dc66aSJens Axboe #define PF_SWAPWRITE		0x00800000	/* Allowed to write to swap */
15843bd37062SSebastian Andrzej Siewior #define PF_NO_SETAFFINITY	0x04000000	/* Userland is not allowed to meddle with cpus_mask */
15854db96cf0SAndi Kleen #define PF_MCE_EARLY		0x08000000      /* Early kill for mce process policy */
15861a08ae36SPavel Tatashin #define PF_MEMALLOC_PIN		0x10000000	/* Allocation context constrained to zones which allow long term pinning. */
158758a69cb4STejun Heo #define PF_FREEZER_SKIP		0x40000000	/* Freezer should not count it as freezable */
15885eca1c10SIngo Molnar #define PF_SUSPEND_TASK		0x80000000      /* This thread called freeze_processes() and should not be frozen */
15891da177e4SLinus Torvalds 
15901da177e4SLinus Torvalds /*
15911da177e4SLinus Torvalds  * Only the _current_ task can read/write to tsk->flags, but other
15921da177e4SLinus Torvalds  * tasks can access tsk->flags in readonly mode, for example
15931da177e4SLinus Torvalds  * with tsk_used_math() (as during threaded core dumping).
15941da177e4SLinus Torvalds  * There is however an exception to this rule during ptrace
15951da177e4SLinus Torvalds  * or during fork: the ptracer task is allowed to write to the
15961da177e4SLinus Torvalds  * child->flags of its traced child (same goes for fork, the parent
15971da177e4SLinus Torvalds  * can write to the child->flags), because we're guaranteed the
15981da177e4SLinus Torvalds  * child is not running and in turn not changing child->flags
15991da177e4SLinus Torvalds  * at the same time the parent does it.
16001da177e4SLinus Torvalds  */
16011da177e4SLinus Torvalds #define clear_stopped_child_used_math(child)	do { (child)->flags &= ~PF_USED_MATH; } while (0)
16021da177e4SLinus Torvalds #define set_stopped_child_used_math(child)	do { (child)->flags |= PF_USED_MATH; } while (0)
16031da177e4SLinus Torvalds #define clear_used_math()			clear_stopped_child_used_math(current)
16041da177e4SLinus Torvalds #define set_used_math()				set_stopped_child_used_math(current)
16055eca1c10SIngo Molnar 
16061da177e4SLinus Torvalds #define conditional_stopped_child_used_math(condition, child) \
16071da177e4SLinus Torvalds 	do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= (condition) ? PF_USED_MATH : 0; } while (0)
16085eca1c10SIngo Molnar 
16095eca1c10SIngo Molnar #define conditional_used_math(condition)	conditional_stopped_child_used_math(condition, current)
16105eca1c10SIngo Molnar 
16111da177e4SLinus Torvalds #define copy_to_stopped_child_used_math(child) \
16121da177e4SLinus Torvalds 	do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= current->flags & PF_USED_MATH; } while (0)
16135eca1c10SIngo Molnar 
16141da177e4SLinus Torvalds /* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */
16151da177e4SLinus Torvalds #define tsk_used_math(p)			((p)->flags & PF_USED_MATH)
16161da177e4SLinus Torvalds #define used_math()				tsk_used_math(current)
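
/*
 * Illustrative sketch (not part of the original header): per the comment
 * above only current may modify its own flags, so a typical FPU setup
 * path looks roughly like this (the function name is hypothetical):
 */
static inline void ensure_fpu_initialized(void)
{
	if (!used_math()) {
		/* ... architecture-specific FPU state initialization ... */
		set_used_math();
	}
}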
16171da177e4SLinus Torvalds 
161862ec05ddSThomas Gleixner static inline bool is_percpu_thread(void)
161962ec05ddSThomas Gleixner {
162062ec05ddSThomas Gleixner #ifdef CONFIG_SMP
162162ec05ddSThomas Gleixner 	return (current->flags & PF_NO_SETAFFINITY) &&
162262ec05ddSThomas Gleixner 		(current->nr_cpus_allowed == 1);
162362ec05ddSThomas Gleixner #else
162462ec05ddSThomas Gleixner 	return true;
162562ec05ddSThomas Gleixner #endif
162662ec05ddSThomas Gleixner }
162762ec05ddSThomas Gleixner 
16281d4457f9SKees Cook /* Per-process atomic flags. */
1629a2b86f77SZefan Li #define PFA_NO_NEW_PRIVS		0	/* May not gain new privileges. */
16302ad654bcSZefan Li #define PFA_SPREAD_PAGE			1	/* Spread page cache over cpuset */
16312ad654bcSZefan Li #define PFA_SPREAD_SLAB			2	/* Spread some slab caches over cpuset */
1632356e4bffSThomas Gleixner #define PFA_SPEC_SSB_DISABLE		3	/* Speculative Store Bypass disabled */
1633356e4bffSThomas Gleixner #define PFA_SPEC_SSB_FORCE_DISABLE	4	/* Speculative Store Bypass force disabled */
16349137bb27SThomas Gleixner #define PFA_SPEC_IB_DISABLE		5	/* Indirect branch speculation restricted */
16359137bb27SThomas Gleixner #define PFA_SPEC_IB_FORCE_DISABLE	6	/* Indirect branch speculation permanently restricted */
163671368af9SWaiman Long #define PFA_SPEC_SSB_NOEXEC		7	/* Speculative Store Bypass clear on execve() */
16371d4457f9SKees Cook 
1638e0e5070bSZefan Li #define TASK_PFA_TEST(name, func)					\
1639e0e5070bSZefan Li 	static inline bool task_##func(struct task_struct *p)		\
1640e0e5070bSZefan Li 	{ return test_bit(PFA_##name, &p->atomic_flags); }
16415eca1c10SIngo Molnar 
1642e0e5070bSZefan Li #define TASK_PFA_SET(name, func)					\
1643e0e5070bSZefan Li 	static inline void task_set_##func(struct task_struct *p)	\
1644e0e5070bSZefan Li 	{ set_bit(PFA_##name, &p->atomic_flags); }
16455eca1c10SIngo Molnar 
1646e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func)					\
1647e0e5070bSZefan Li 	static inline void task_clear_##func(struct task_struct *p)	\
1648e0e5070bSZefan Li 	{ clear_bit(PFA_##name, &p->atomic_flags); }
16491d4457f9SKees Cook 
1650e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs)
1651e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs)
16521d4457f9SKees Cook 
16532ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page)
16542ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page)
16552ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
16562ad654bcSZefan Li 
16572ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
16582ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab)
16592ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
1660544b2c91STejun Heo 
1661356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable)
1662356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable)
1663356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable)
1664356e4bffSThomas Gleixner 
166571368af9SWaiman Long TASK_PFA_TEST(SPEC_SSB_NOEXEC, spec_ssb_noexec)
166671368af9SWaiman Long TASK_PFA_SET(SPEC_SSB_NOEXEC, spec_ssb_noexec)
166771368af9SWaiman Long TASK_PFA_CLEAR(SPEC_SSB_NOEXEC, spec_ssb_noexec)
166871368af9SWaiman Long 
1669356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1670356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1671356e4bffSThomas Gleixner 
16729137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_DISABLE, spec_ib_disable)
16739137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_DISABLE, spec_ib_disable)
16749137bb27SThomas Gleixner TASK_PFA_CLEAR(SPEC_IB_DISABLE, spec_ib_disable)
16759137bb27SThomas Gleixner 
16769137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable)
16779137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable)
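
/*
 * Illustrative expansion (not part of the original header): e.g.
 * TASK_PFA_TEST(SPREAD_PAGE, spread_page) above generates:
 *
 *	static inline bool task_spread_page(struct task_struct *p)
 *	{ return test_bit(PFA_SPREAD_PAGE, &p->atomic_flags); }
 *
 * Note that NO_NEW_PRIVS and the SPEC_*_FORCE_DISABLE flags deliberately
 * get no TASK_PFA_CLEAR() instance: once set, they must never be cleared
 * again for security reasons.
 */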
16789137bb27SThomas Gleixner 
16795eca1c10SIngo Molnar static inline void
1680717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags)
1681907aed48SMel Gorman {
1682717a94b5SNeilBrown 	current->flags &= ~flags;
1683717a94b5SNeilBrown 	current->flags |= orig_flags & flags;
1684907aed48SMel Gorman }
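
/*
 * Illustrative sketch (not part of the original header): the usual
 * save/modify/restore pattern for current->flags. Real callers should
 * prefer wrappers such as memalloc_noio_save()/memalloc_noio_restore();
 * this hypothetical open-coded variant only shows the mechanism:
 */
static inline void do_io_less_work(void)
{
	unsigned long pflags = current->flags;

	current->flags |= PF_MEMALLOC_NOIO;
	/* ... allocations here implicitly behave as if GFP_NOIO ... */
	current_restore_flags(pflags, PF_MEMALLOC_NOIO);
}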
1685907aed48SMel Gorman 
16865eca1c10SIngo Molnar extern int cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial);
16875eca1c10SIngo Molnar extern int task_can_attach(struct task_struct *p, const struct cpumask *cs_cpus_allowed);
16881da177e4SLinus Torvalds #ifdef CONFIG_SMP
16895eca1c10SIngo Molnar extern void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask);
16905eca1c10SIngo Molnar extern int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask);
16911da177e4SLinus Torvalds #else
16925eca1c10SIngo Molnar static inline void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask)
16931e1b6c51SKOSAKI Motohiro {
16941e1b6c51SKOSAKI Motohiro }
16955eca1c10SIngo Molnar static inline int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask)
16961da177e4SLinus Torvalds {
169796f874e2SRusty Russell 	if (!cpumask_test_cpu(0, new_mask))
16981da177e4SLinus Torvalds 		return -EINVAL;
16991da177e4SLinus Torvalds 	return 0;
17001da177e4SLinus Torvalds }
17011da177e4SLinus Torvalds #endif
1702e0ad9556SRusty Russell 
1703fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt);
170436c8b586SIngo Molnar extern void set_user_nice(struct task_struct *p, long nice);
170536c8b586SIngo Molnar extern int task_prio(const struct task_struct *p);
17065eca1c10SIngo Molnar 
1707d0ea0268SDongsheng Yang /**
1708d0ea0268SDongsheng Yang  * task_nice - return the nice value of a given task.
1709d0ea0268SDongsheng Yang  * @p: the task in question.
1710d0ea0268SDongsheng Yang  *
1711d0ea0268SDongsheng Yang  * Return: The nice value [ -20 ... 0 ... 19 ].
1712d0ea0268SDongsheng Yang  */
1713d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p)
1714d0ea0268SDongsheng Yang {
1715d0ea0268SDongsheng Yang 	return PRIO_TO_NICE((p)->static_prio);
1716d0ea0268SDongsheng Yang }
17175eca1c10SIngo Molnar 
171836c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice);
171936c8b586SIngo Molnar extern int task_curr(const struct task_struct *p);
17201da177e4SLinus Torvalds extern int idle_cpu(int cpu);
1721943d355dSRohit Jain extern int available_idle_cpu(int cpu);
17225eca1c10SIngo Molnar extern int sched_setscheduler(struct task_struct *, int, const struct sched_param *);
17235eca1c10SIngo Molnar extern int sched_setscheduler_nocheck(struct task_struct *, int, const struct sched_param *);
17248b700983SPeter Zijlstra extern void sched_set_fifo(struct task_struct *p);
17258b700983SPeter Zijlstra extern void sched_set_fifo_low(struct task_struct *p);
17268b700983SPeter Zijlstra extern void sched_set_normal(struct task_struct *p, int nice);
17275eca1c10SIngo Molnar extern int sched_setattr(struct task_struct *, const struct sched_attr *);
1728794a56ebSJuri Lelli extern int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *);
172936c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu);
17305eca1c10SIngo Molnar 
1731c4f30608SPaul E. McKenney /**
1732c4f30608SPaul E. McKenney  * is_idle_task - is the specified task an idle task?
1733fa757281SRandy Dunlap  * @p: the task in question.
1734e69f6186SYacine Belkadi  *
1735e69f6186SYacine Belkadi  * Return: 1 if @p is an idle task. 0 otherwise.
1736c4f30608SPaul E. McKenney  */
1737c94a88f3SMarco Elver static __always_inline bool is_idle_task(const struct task_struct *p)
1738c4f30608SPaul E. McKenney {
1739c1de45caSPeter Zijlstra 	return !!(p->flags & PF_IDLE);
1740c4f30608SPaul E. McKenney }
17415eca1c10SIngo Molnar 
174236c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu);
1743a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p);
17441da177e4SLinus Torvalds 
17451da177e4SLinus Torvalds void yield(void);
17461da177e4SLinus Torvalds 
17471da177e4SLinus Torvalds union thread_union {
17480500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK
17490500871fSDavid Howells 	struct task_struct task;
17500500871fSDavid Howells #endif
1751c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK
17521da177e4SLinus Torvalds 	struct thread_info thread_info;
1753c65eacbeSAndy Lutomirski #endif
17541da177e4SLinus Torvalds 	unsigned long stack[THREAD_SIZE/sizeof(long)];
17551da177e4SLinus Torvalds };
17561da177e4SLinus Torvalds 
17570500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK
17580500871fSDavid Howells extern struct thread_info init_thread_info;
17590500871fSDavid Howells #endif
17600500871fSDavid Howells 
17610500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)];
17620500871fSDavid Howells 
1763f3ac6067SIngo Molnar #ifdef CONFIG_THREAD_INFO_IN_TASK
1764f3ac6067SIngo Molnar static inline struct thread_info *task_thread_info(struct task_struct *task)
1765f3ac6067SIngo Molnar {
1766f3ac6067SIngo Molnar 	return &task->thread_info;
1767f3ac6067SIngo Molnar }
1768f3ac6067SIngo Molnar #elif !defined(__HAVE_THREAD_FUNCTIONS)
1769f3ac6067SIngo Molnar # define task_thread_info(task)	((struct thread_info *)(task)->stack)
1770f3ac6067SIngo Molnar #endif
1771f3ac6067SIngo Molnar 
1772198fe21bSPavel Emelyanov /*
1773198fe21bSPavel Emelyanov  * find a task by one of its numerical ids
1774198fe21bSPavel Emelyanov  *
1775198fe21bSPavel Emelyanov  * find_task_by_pid_ns():
1776198fe21bSPavel Emelyanov  *      finds a task by its pid in the specified namespace
1777228ebcbeSPavel Emelyanov  * find_task_by_vpid():
1778228ebcbeSPavel Emelyanov  *      finds a task by its virtual pid
1779198fe21bSPavel Emelyanov  *
1780e49859e7SPavel Emelyanov  * see also find_vpid() etc in include/linux/pid.h
1781198fe21bSPavel Emelyanov  */
1782198fe21bSPavel Emelyanov 
1783228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr);
17845eca1c10SIngo Molnar extern struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns);
1785198fe21bSPavel Emelyanov 
17862ee08260SMike Rapoport /*
17872ee08260SMike Rapoport  * find a task by its virtual pid and get the task struct
17882ee08260SMike Rapoport  */
17892ee08260SMike Rapoport extern struct task_struct *find_get_task_by_vpid(pid_t nr);
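
/*
 * Illustrative sketch (not part of the original header): the plain
 * find_task_by_vpid() requires an RCU read-side critical section, while
 * the _get_ variant takes a reference for the caller. put_task_struct()
 * is declared in <linux/sched/task.h>; the function name is hypothetical.
 */
static inline void lookup_example(pid_t nr)
{
	struct task_struct *tsk = find_get_task_by_vpid(nr);

	if (tsk) {
		/* ... tsk is safe to use here, a reference is held ... */
		put_task_struct(tsk);
	}
}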
17902ee08260SMike Rapoport 
1791b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state);
1792b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk);
17933e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk);
17945eca1c10SIngo Molnar 
17951da177e4SLinus Torvalds #ifdef CONFIG_SMP
17961da177e4SLinus Torvalds extern void kick_process(struct task_struct *tsk);
17971da177e4SLinus Torvalds #else
17981da177e4SLinus Torvalds static inline void kick_process(struct task_struct *tsk) { }
17991da177e4SLinus Torvalds #endif
18001da177e4SLinus Torvalds 
180182b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);
18025eca1c10SIngo Molnar 
180382b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from)
180482b89778SAdrian Hunter {
180582b89778SAdrian Hunter 	__set_task_comm(tsk, from, false);
180682b89778SAdrian Hunter }
18075eca1c10SIngo Molnar 
18083756f640SArnd Bergmann extern char *__get_task_comm(char *to, size_t len, struct task_struct *tsk);
18093756f640SArnd Bergmann #define get_task_comm(buf, tsk) ({			\
18103756f640SArnd Bergmann 	BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN);	\
18113756f640SArnd Bergmann 	__get_task_comm(buf, sizeof(buf), tsk);		\
18123756f640SArnd Bergmann })
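
/*
 * Illustrative sketch (not part of the original header): get_task_comm()
 * insists on a buffer of exactly TASK_COMM_LEN bytes, enforced by the
 * BUILD_BUG_ON() above, so a hypothetical caller looks like:
 */
static inline void show_comm(struct task_struct *tsk)
{
	char comm[TASK_COMM_LEN];

	get_task_comm(comm, tsk);
	pr_info("task name: %s\n", comm);
}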
18131da177e4SLinus Torvalds 
18141da177e4SLinus Torvalds #ifdef CONFIG_SMP
18152a0a24ebSThomas Gleixner static __always_inline void scheduler_ipi(void)
18162a0a24ebSThomas Gleixner {
18172a0a24ebSThomas Gleixner 	/*
18182a0a24ebSThomas Gleixner 	 * Fold TIF_NEED_RESCHED into the preempt_count; anybody setting
18192a0a24ebSThomas Gleixner 	 * TIF_NEED_RESCHED remotely (for the first time) will also send
18202a0a24ebSThomas Gleixner 	 * this IPI.
18212a0a24ebSThomas Gleixner 	 */
18222a0a24ebSThomas Gleixner 	preempt_fold_need_resched();
18232a0a24ebSThomas Gleixner }
182485ba2d86SRoland McGrath extern unsigned long wait_task_inactive(struct task_struct *, long match_state);
18251da177e4SLinus Torvalds #else
1826184748ccSPeter Zijlstra static inline void scheduler_ipi(void) { }
18275eca1c10SIngo Molnar static inline unsigned long wait_task_inactive(struct task_struct *p, long match_state)
182885ba2d86SRoland McGrath {
182985ba2d86SRoland McGrath 	return 1;
183085ba2d86SRoland McGrath }
18311da177e4SLinus Torvalds #endif
18321da177e4SLinus Torvalds 
18335eca1c10SIngo Molnar /*
18345eca1c10SIngo Molnar  * Set thread flags in another task's structure.
18355eca1c10SIngo Molnar  * See asm/thread_info.h for TIF_xxxx flags available:
18361da177e4SLinus Torvalds  */
18371da177e4SLinus Torvalds static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag)
18381da177e4SLinus Torvalds {
1839a1261f54SAl Viro 	set_ti_thread_flag(task_thread_info(tsk), flag);
18401da177e4SLinus Torvalds }
18411da177e4SLinus Torvalds 
18421da177e4SLinus Torvalds static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag)
18431da177e4SLinus Torvalds {
1844a1261f54SAl Viro 	clear_ti_thread_flag(task_thread_info(tsk), flag);
18451da177e4SLinus Torvalds }
18461da177e4SLinus Torvalds 
184793ee37c2SDave Martin static inline void update_tsk_thread_flag(struct task_struct *tsk, int flag,
184893ee37c2SDave Martin 					  bool value)
184993ee37c2SDave Martin {
185093ee37c2SDave Martin 	update_ti_thread_flag(task_thread_info(tsk), flag, value);
185193ee37c2SDave Martin }
185293ee37c2SDave Martin 
18531da177e4SLinus Torvalds static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag)
18541da177e4SLinus Torvalds {
1855a1261f54SAl Viro 	return test_and_set_ti_thread_flag(task_thread_info(tsk), flag);
18561da177e4SLinus Torvalds }
18571da177e4SLinus Torvalds 
18581da177e4SLinus Torvalds static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag)
18591da177e4SLinus Torvalds {
1860a1261f54SAl Viro 	return test_and_clear_ti_thread_flag(task_thread_info(tsk), flag);
18611da177e4SLinus Torvalds }
18621da177e4SLinus Torvalds 
18631da177e4SLinus Torvalds static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag)
18641da177e4SLinus Torvalds {
1865a1261f54SAl Viro 	return test_ti_thread_flag(task_thread_info(tsk), flag);
18661da177e4SLinus Torvalds }
18671da177e4SLinus Torvalds 
18681da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk)
18691da177e4SLinus Torvalds {
18701da177e4SLinus Torvalds 	set_tsk_thread_flag(tsk, TIF_NEED_RESCHED);
18711da177e4SLinus Torvalds }
18721da177e4SLinus Torvalds 
18731da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk)
18741da177e4SLinus Torvalds {
18751da177e4SLinus Torvalds 	clear_tsk_thread_flag(tsk, TIF_NEED_RESCHED);
18761da177e4SLinus Torvalds }
18771da177e4SLinus Torvalds 
18788ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk)
18798ae121acSGregory Haskins {
18808ae121acSGregory Haskins 	return unlikely(test_tsk_thread_flag(tsk, TIF_NEED_RESCHED));
18818ae121acSGregory Haskins }
18828ae121acSGregory Haskins 
18831da177e4SLinus Torvalds /*
18841da177e4SLinus Torvalds  * cond_resched() and cond_resched_lock(): latency reduction via
18851da177e4SLinus Torvalds  * explicit rescheduling in places that are safe. The return
18861da177e4SLinus Torvalds  * value indicates whether a reschedule was in fact done.
18871da177e4SLinus Torvalds  * cond_resched_lock() will drop the spinlock before scheduling.
18881da177e4SLinus Torvalds  */
1889b965f1ddSPeter Zijlstra (Intel) #if !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC)
1890b965f1ddSPeter Zijlstra (Intel) extern int __cond_resched(void);
1891b965f1ddSPeter Zijlstra (Intel) 
1892b965f1ddSPeter Zijlstra (Intel) #ifdef CONFIG_PREEMPT_DYNAMIC
1893b965f1ddSPeter Zijlstra (Intel) 
1894b965f1ddSPeter Zijlstra (Intel) DECLARE_STATIC_CALL(cond_resched, __cond_resched);
1895b965f1ddSPeter Zijlstra (Intel) 
1896b965f1ddSPeter Zijlstra (Intel) static __always_inline int _cond_resched(void)
1897b965f1ddSPeter Zijlstra (Intel) {
1898ef72661eSPeter Zijlstra 	return static_call_mod(cond_resched)();
1899b965f1ddSPeter Zijlstra (Intel) }
1900b965f1ddSPeter Zijlstra (Intel) 
190135a773a0SPeter Zijlstra #else
1902b965f1ddSPeter Zijlstra (Intel) 
1903b965f1ddSPeter Zijlstra (Intel) static inline int _cond_resched(void)
1904b965f1ddSPeter Zijlstra (Intel) {
1905b965f1ddSPeter Zijlstra (Intel) 	return __cond_resched();
1906b965f1ddSPeter Zijlstra (Intel) }
1907b965f1ddSPeter Zijlstra (Intel) 
1908b965f1ddSPeter Zijlstra (Intel) #endif /* CONFIG_PREEMPT_DYNAMIC */
1909b965f1ddSPeter Zijlstra (Intel) 
1910b965f1ddSPeter Zijlstra (Intel) #else
1911b965f1ddSPeter Zijlstra (Intel) 
191235a773a0SPeter Zijlstra static inline int _cond_resched(void) { return 0; }
1913b965f1ddSPeter Zijlstra (Intel) 
1914b965f1ddSPeter Zijlstra (Intel) #endif /* !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC) */
19156f80bd98SFrederic Weisbecker 
1916613afbf8SFrederic Weisbecker #define cond_resched() ({			\
19173427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, 0);	\
1918613afbf8SFrederic Weisbecker 	_cond_resched();			\
1919613afbf8SFrederic Weisbecker })
19206f80bd98SFrederic Weisbecker 
1921613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock);
1922f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_read(rwlock_t *lock);
1923f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_write(rwlock_t *lock);
1924613afbf8SFrederic Weisbecker 
1925613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({				\
19263427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\
1927613afbf8SFrederic Weisbecker 	__cond_resched_lock(lock);				\
1928613afbf8SFrederic Weisbecker })
1929613afbf8SFrederic Weisbecker 
1930f3d4b4b1SBen Gardon #define cond_resched_rwlock_read(lock) ({			\
1931f3d4b4b1SBen Gardon 	__might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);	\
1932f3d4b4b1SBen Gardon 	__cond_resched_rwlock_read(lock);			\
1933f3d4b4b1SBen Gardon })
1934f3d4b4b1SBen Gardon 
1935f3d4b4b1SBen Gardon #define cond_resched_rwlock_write(lock) ({			\
1936f3d4b4b1SBen Gardon 	__might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);	\
1937f3d4b4b1SBen Gardon 	__cond_resched_rwlock_write(lock);			\
1938f3d4b4b1SBen Gardon })
1939f3d4b4b1SBen Gardon 
1940f6f3c437SSimon Horman static inline void cond_resched_rcu(void)
1941f6f3c437SSimon Horman {
1942f6f3c437SSimon Horman #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU)
1943f6f3c437SSimon Horman 	rcu_read_unlock();
1944f6f3c437SSimon Horman 	cond_resched();
1945f6f3c437SSimon Horman 	rcu_read_lock();
1946f6f3c437SSimon Horman #endif
1947f6f3c437SSimon Horman }
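
/*
 * Illustrative sketch (not part of the original header): a long-running
 * kernel loop typically drops in one cond_resched() per iteration so
 * that non-preemptible kernels do not hog the CPU (the function and its
 * work are hypothetical):
 */
static inline void process_many_items(unsigned long nr_items)
{
	unsigned long i;

	for (i = 0; i < nr_items; i++) {
		/* ... bounded per-item work ... */
		cond_resched();
	}
}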
1948f6f3c437SSimon Horman 
19491da177e4SLinus Torvalds /*
19501da177e4SLinus Torvalds  * Does a critical section need to be broken due to another
1951c1a280b6SThomas Gleixner  * task waiting? (Technically this does not depend on CONFIG_PREEMPTION,
195295c354feSNick Piggin  * but there is a general need for low latency.)
19531da177e4SLinus Torvalds  */
195495c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock)
19551da177e4SLinus Torvalds {
1956c1a280b6SThomas Gleixner #ifdef CONFIG_PREEMPTION
195795c354feSNick Piggin 	return spin_is_contended(lock);
195895c354feSNick Piggin #else
19591da177e4SLinus Torvalds 	return 0;
196095c354feSNick Piggin #endif
19611da177e4SLinus Torvalds }
19621da177e4SLinus Torvalds 
1963a09a689aSBen Gardon /*
1964a09a689aSBen Gardon  * Check if a rwlock is contended.
1965a09a689aSBen Gardon  * Returns non-zero if there is another task waiting on the rwlock.
1966a09a689aSBen Gardon  * Returns zero if the lock is not contended or the system / underlying
1967a09a689aSBen Gardon  * rwlock implementation does not support contention detection.
1968a09a689aSBen Gardon  * Technically this does not depend on CONFIG_PREEMPTION, but there is a
1969a09a689aSBen Gardon  * general need for low latency.
1970a09a689aSBen Gardon  */
1971a09a689aSBen Gardon static inline int rwlock_needbreak(rwlock_t *lock)
1972a09a689aSBen Gardon {
1973a09a689aSBen Gardon #ifdef CONFIG_PREEMPTION
1974a09a689aSBen Gardon 	return rwlock_is_contended(lock);
1975a09a689aSBen Gardon #else
1976a09a689aSBen Gardon 	return 0;
1977a09a689aSBen Gardon #endif
1978a09a689aSBen Gardon }
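
/*
 * Illustrative sketch (not part of the original header): spin_needbreak()
 * pairs with cond_resched_lock() to break up long lock hold times. The
 * function, lock and loop body are hypothetical:
 */
static inline void walk_under_lock(spinlock_t *lock, int nr_steps)
{
	int i;

	spin_lock(lock);
	for (i = 0; i < nr_steps; i++) {
		/* ... one step of work under the lock ... */
		if (spin_needbreak(lock))
			cond_resched_lock(lock); /* may drop and retake lock */
	}
	spin_unlock(lock);
}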
1979a09a689aSBen Gardon 
198075f93fedSPeter Zijlstra static __always_inline bool need_resched(void)
198175f93fedSPeter Zijlstra {
198275f93fedSPeter Zijlstra 	return unlikely(tif_need_resched());
198375f93fedSPeter Zijlstra }
198475f93fedSPeter Zijlstra 
1985ee761f62SThomas Gleixner /*
19861da177e4SLinus Torvalds  * Wrappers for p->thread_info->cpu access. No-op on UP.
19871da177e4SLinus Torvalds  */
19881da177e4SLinus Torvalds #ifdef CONFIG_SMP
19891da177e4SLinus Torvalds 
19901da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p)
19911da177e4SLinus Torvalds {
1992c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
1993c546951dSAndrea Parri 	return READ_ONCE(p->cpu);
1994c65eacbeSAndy Lutomirski #else
1995c546951dSAndrea Parri 	return READ_ONCE(task_thread_info(p)->cpu);
1996c65eacbeSAndy Lutomirski #endif
19971da177e4SLinus Torvalds }
19981da177e4SLinus Torvalds 
1999c65cc870SIngo Molnar extern void set_task_cpu(struct task_struct *p, unsigned int cpu);
20001da177e4SLinus Torvalds 
20011da177e4SLinus Torvalds #else
20021da177e4SLinus Torvalds 
20031da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p)
20041da177e4SLinus Torvalds {
20051da177e4SLinus Torvalds 	return 0;
20061da177e4SLinus Torvalds }
20071da177e4SLinus Torvalds 
20081da177e4SLinus Torvalds static inline void set_task_cpu(struct task_struct *p, unsigned int cpu)
20091da177e4SLinus Torvalds {
20101da177e4SLinus Torvalds }
20111da177e4SLinus Torvalds 
20121da177e4SLinus Torvalds #endif /* CONFIG_SMP */
20131da177e4SLinus Torvalds 
2014*a1dfb631SMarcelo Tosatti extern bool sched_task_on_rq(struct task_struct *p);
2015*a1dfb631SMarcelo Tosatti 
2016d9345c65SPan Xinhui /*
2017d9345c65SPan Xinhui  * In order to reduce various lock holder preemption latencies provide an
2018d9345c65SPan Xinhui  * interface to see if a vCPU is currently running or not.
2019d9345c65SPan Xinhui  *
2020d9345c65SPan Xinhui  * This allows us to terminate optimistic spin loops and block, analogous to
2021d9345c65SPan Xinhui  * the native optimistic spin heuristic of testing if the lock owner task is
2022d9345c65SPan Xinhui  * running or not.
2023d9345c65SPan Xinhui  */
2024d9345c65SPan Xinhui #ifndef vcpu_is_preempted
202542fd8baaSQian Cai static inline bool vcpu_is_preempted(int cpu)
202642fd8baaSQian Cai {
202742fd8baaSQian Cai 	return false;
202842fd8baaSQian Cai }
2029d9345c65SPan Xinhui #endif
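
/*
 * Illustrative sketch (not part of the original header): an optimistic
 * spin loop (e.g. mutex_spin_on_owner() in kernel/locking/mutex.c uses
 * this check) stops spinning once the owner's vCPU is preempted, since
 * spinning on a descheduled owner is wasted work. The helper below is
 * hypothetical:
 */
static inline bool keep_spinning(int owner_cpu)
{
	/* Stop if the lock owner's (v)CPU is not actually running: */
	return !vcpu_is_preempted(owner_cpu);
}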
2030d9345c65SPan Xinhui 
203196f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask);
203296f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask);
20335c45bf27SSiddha, Suresh B 
203482455257SDave Hansen #ifndef TASK_SIZE_OF
203582455257SDave Hansen #define TASK_SIZE_OF(tsk)	TASK_SIZE
203682455257SDave Hansen #endif
203782455257SDave Hansen 
2038a5418be9SViresh Kumar #ifdef CONFIG_SMP
2039a5418be9SViresh Kumar /* Returns effective CPU energy utilization, as seen by the scheduler */
2040a5418be9SViresh Kumar unsigned long sched_cpu_util(int cpu, unsigned long max);
2041a5418be9SViresh Kumar #endif /* CONFIG_SMP */
2042a5418be9SViresh Kumar 
2043d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ
2044d7822b1eSMathieu Desnoyers 
2045d7822b1eSMathieu Desnoyers /*
2046d7822b1eSMathieu Desnoyers  * Map the event mask onto the user-space ABI enum rseq_cs_flags
2047d7822b1eSMathieu Desnoyers  * for direct mask checks.
2048d7822b1eSMathieu Desnoyers  */
2049d7822b1eSMathieu Desnoyers enum rseq_event_mask_bits {
2050d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_PREEMPT_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_PREEMPT_BIT,
2051d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_SIGNAL_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_SIGNAL_BIT,
2052d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_MIGRATE_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_MIGRATE_BIT,
2053d7822b1eSMathieu Desnoyers };
2054d7822b1eSMathieu Desnoyers 
2055d7822b1eSMathieu Desnoyers enum rseq_event_mask {
2056d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_PREEMPT	= (1U << RSEQ_EVENT_PREEMPT_BIT),
2057d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_SIGNAL	= (1U << RSEQ_EVENT_SIGNAL_BIT),
2058d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_MIGRATE	= (1U << RSEQ_EVENT_MIGRATE_BIT),
2059d7822b1eSMathieu Desnoyers };
2060d7822b1eSMathieu Desnoyers 
2061d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t)
2062d7822b1eSMathieu Desnoyers {
2063d7822b1eSMathieu Desnoyers 	if (t->rseq)
2064d7822b1eSMathieu Desnoyers 		set_tsk_thread_flag(t, TIF_NOTIFY_RESUME);
2065d7822b1eSMathieu Desnoyers }
2066d7822b1eSMathieu Desnoyers 
2067784e0300SWill Deacon void __rseq_handle_notify_resume(struct ksignal *sig, struct pt_regs *regs);
2068d7822b1eSMathieu Desnoyers 
2069784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig,
2070784e0300SWill Deacon 					     struct pt_regs *regs)
2071d7822b1eSMathieu Desnoyers {
2072d7822b1eSMathieu Desnoyers 	if (current->rseq)
2073784e0300SWill Deacon 		__rseq_handle_notify_resume(ksig, regs);
2074d7822b1eSMathieu Desnoyers }
2075d7822b1eSMathieu Desnoyers 
2076784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig,
2077784e0300SWill Deacon 				       struct pt_regs *regs)
2078d7822b1eSMathieu Desnoyers {
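	/*
	 * Preemption is disabled so the non-atomic __set_bit() cannot race
	 * with the scheduler setting other bits in this task's event mask.
	 */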
2079d7822b1eSMathieu Desnoyers 	preempt_disable();
2080d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_SIGNAL_BIT, &current->rseq_event_mask);
2081d7822b1eSMathieu Desnoyers 	preempt_enable();
2082784e0300SWill Deacon 	rseq_handle_notify_resume(ksig, regs);
2083d7822b1eSMathieu Desnoyers }
2084d7822b1eSMathieu Desnoyers 
2085d7822b1eSMathieu Desnoyers /* rseq_preempt() requires preemption to be disabled. */
2086d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t)
2087d7822b1eSMathieu Desnoyers {
2088d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_PREEMPT_BIT, &t->rseq_event_mask);
2089d7822b1eSMathieu Desnoyers 	rseq_set_notify_resume(t);
2090d7822b1eSMathieu Desnoyers }
2091d7822b1eSMathieu Desnoyers 
2092d7822b1eSMathieu Desnoyers /* rseq_migrate() requires preemption to be disabled. */
2093d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t)
2094d7822b1eSMathieu Desnoyers {
2095d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_MIGRATE_BIT, &t->rseq_event_mask);
2096d7822b1eSMathieu Desnoyers 	rseq_set_notify_resume(t);
2097d7822b1eSMathieu Desnoyers }
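/*
 * Calling-convention sketch (hypothetical caller): both helpers above
 * use a non-atomic __set_bit() on t->rseq_event_mask, so preemption
 * must be held off across the call, e.g.:
 */
static inline void example_mark_current_preempted(void)
{
	preempt_disable();
	rseq_preempt(current);
	preempt_enable();
}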
2098d7822b1eSMathieu Desnoyers 
2099d7822b1eSMathieu Desnoyers /*
2100d7822b1eSMathieu Desnoyers  * If the parent process has a registered restartable sequences area, the
2101463f550fSMathieu Desnoyers  * child inherits it. Unregister rseq for a clone with CLONE_VM set.
2102d7822b1eSMathieu Desnoyers  */
2103d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags)
2104d7822b1eSMathieu Desnoyers {
2105463f550fSMathieu Desnoyers 	if (clone_flags & CLONE_VM) {
2106d7822b1eSMathieu Desnoyers 		t->rseq = NULL;
2107d7822b1eSMathieu Desnoyers 		t->rseq_sig = 0;
2108d7822b1eSMathieu Desnoyers 		t->rseq_event_mask = 0;
2109d7822b1eSMathieu Desnoyers 	} else {
2110d7822b1eSMathieu Desnoyers 		t->rseq = current->rseq;
2111d7822b1eSMathieu Desnoyers 		t->rseq_sig = current->rseq_sig;
2112d7822b1eSMathieu Desnoyers 		t->rseq_event_mask = current->rseq_event_mask;
2113d7822b1eSMathieu Desnoyers 	}
2114d7822b1eSMathieu Desnoyers }
2115d7822b1eSMathieu Desnoyers 
2116d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t)
2117d7822b1eSMathieu Desnoyers {
2118d7822b1eSMathieu Desnoyers 	t->rseq = NULL;
2119d7822b1eSMathieu Desnoyers 	t->rseq_sig = 0;
2120d7822b1eSMathieu Desnoyers 	t->rseq_event_mask = 0;
2121d7822b1eSMathieu Desnoyers }
2122d7822b1eSMathieu Desnoyers 
2123d7822b1eSMathieu Desnoyers #else
2124d7822b1eSMathieu Desnoyers 
2125d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t)
2126d7822b1eSMathieu Desnoyers {
2127d7822b1eSMathieu Desnoyers }
2128784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig,
2129784e0300SWill Deacon 					     struct pt_regs *regs)
2130d7822b1eSMathieu Desnoyers {
2131d7822b1eSMathieu Desnoyers }
2132784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig,
2133784e0300SWill Deacon 				       struct pt_regs *regs)
2134d7822b1eSMathieu Desnoyers {
2135d7822b1eSMathieu Desnoyers }
2136d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t)
2137d7822b1eSMathieu Desnoyers {
2138d7822b1eSMathieu Desnoyers }
2139d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t)
2140d7822b1eSMathieu Desnoyers {
2141d7822b1eSMathieu Desnoyers }
2142d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags)
2143d7822b1eSMathieu Desnoyers {
2144d7822b1eSMathieu Desnoyers }
2145d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t)
2146d7822b1eSMathieu Desnoyers {
2147d7822b1eSMathieu Desnoyers }
2148d7822b1eSMathieu Desnoyers 
2149d7822b1eSMathieu Desnoyers #endif
2150d7822b1eSMathieu Desnoyers 
2151d7822b1eSMathieu Desnoyers #ifdef CONFIG_DEBUG_RSEQ
2152d7822b1eSMathieu Desnoyers 
2153d7822b1eSMathieu Desnoyers void rseq_syscall(struct pt_regs *regs);
2154d7822b1eSMathieu Desnoyers 
2155d7822b1eSMathieu Desnoyers #else
2156d7822b1eSMathieu Desnoyers 
2157d7822b1eSMathieu Desnoyers static inline void rseq_syscall(struct pt_regs *regs)
2158d7822b1eSMathieu Desnoyers {
2159d7822b1eSMathieu Desnoyers }
2160d7822b1eSMathieu Desnoyers 
2161d7822b1eSMathieu Desnoyers #endif
2162d7822b1eSMathieu Desnoyers 
21633c93a0c0SQais Yousef const struct sched_avg *sched_trace_cfs_rq_avg(struct cfs_rq *cfs_rq);
21643c93a0c0SQais Yousef char *sched_trace_cfs_rq_path(struct cfs_rq *cfs_rq, char *str, int len);
21653c93a0c0SQais Yousef int sched_trace_cfs_rq_cpu(struct cfs_rq *cfs_rq);
21663c93a0c0SQais Yousef 
21673c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_rt(struct rq *rq);
21683c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_dl(struct rq *rq);
21693c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_irq(struct rq *rq);
21703c93a0c0SQais Yousef 
21713c93a0c0SQais Yousef int sched_trace_rq_cpu(struct rq *rq);
217251cf18c9SVincent Donnefort int sched_trace_rq_cpu_capacity(struct rq *rq);
21739d246053SPhil Auld int sched_trace_rq_nr_running(struct rq *rq);
21743c93a0c0SQais Yousef 
21753c93a0c0SQais Yousef const struct cpumask *sched_trace_rd_span(struct root_domain *rd);
21763c93a0c0SQais Yousef 
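/*
 * Consumption sketch (illustrative, module-side): a probe attached to a
 * scheduler PELT tracepoint such as pelt_cfs_tp, which passes a cfs_rq
 * pointer, can decode it with the helpers above. The probe name and
 * buffer size are assumptions.
 */
static void example_probe_pelt_cfs(void *data, struct cfs_rq *cfs_rq)
{
	const struct sched_avg *avg = sched_trace_cfs_rq_avg(cfs_rq);
	char path[64];

	sched_trace_cfs_rq_path(cfs_rq, path, sizeof(path));
	if (avg)
		trace_printk("%s cpu%d util_avg=%lu\n", path,
			     sched_trace_cfs_rq_cpu(cfs_rq), avg->util_avg);
}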
21771da177e4SLinus Torvalds #endif
2178