xref: /linux/include/linux/sched.h (revision ceeadb83aea28372e54857bf88ab7e17af48ab7b)
1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */
21da177e4SLinus Torvalds #ifndef _LINUX_SCHED_H
31da177e4SLinus Torvalds #define _LINUX_SCHED_H
41da177e4SLinus Torvalds 
55eca1c10SIngo Molnar /*
65eca1c10SIngo Molnar  * Define 'struct task_struct' and provide the main scheduler
75eca1c10SIngo Molnar  * APIs (schedule(), wakeup variants, etc.)
85eca1c10SIngo Molnar  */
95eca1c10SIngo Molnar 
10607ca46eSDavid Howells #include <uapi/linux/sched.h>
11b7b3c76aSDavid Woodhouse 
1270b8157eSIngo Molnar #include <asm/current.h>
1370b8157eSIngo Molnar 
145eca1c10SIngo Molnar #include <linux/pid.h>
155eca1c10SIngo Molnar #include <linux/sem.h>
165eca1c10SIngo Molnar #include <linux/shm.h>
175eca1c10SIngo Molnar #include <linux/mutex.h>
185eca1c10SIngo Molnar #include <linux/plist.h>
195eca1c10SIngo Molnar #include <linux/hrtimer.h>
200584df9cSMarco Elver #include <linux/irqflags.h>
215eca1c10SIngo Molnar #include <linux/seccomp.h>
225eca1c10SIngo Molnar #include <linux/nodemask.h>
235eca1c10SIngo Molnar #include <linux/rcupdate.h>
24ec1d2819SElena Reshetova #include <linux/refcount.h>
255eca1c10SIngo Molnar #include <linux/resource.h>
265eca1c10SIngo Molnar #include <linux/latencytop.h>
275eca1c10SIngo Molnar #include <linux/sched/prio.h>
289eacb5c7SThomas Gleixner #include <linux/sched/types.h>
295eca1c10SIngo Molnar #include <linux/signal_types.h>
301446e1dfSGabriel Krisman Bertazi #include <linux/syscall_user_dispatch.h>
315eca1c10SIngo Molnar #include <linux/mm_types_task.h>
325eca1c10SIngo Molnar #include <linux/task_io_accounting.h>
332b69942fSThomas Gleixner #include <linux/posix-timers.h>
34d7822b1eSMathieu Desnoyers #include <linux/rseq.h>
350cd39f46SPeter Zijlstra #include <linux/seqlock.h>
36dfd402a4SMarco Elver #include <linux/kcsan.h>
375fbda3ecSThomas Gleixner #include <asm/kmap_size.h>
385eca1c10SIngo Molnar 
395eca1c10SIngo Molnar /* task_struct member predeclarations (sorted alphabetically): */
40c7af7877SIngo Molnar struct audit_context;
41c7af7877SIngo Molnar struct backing_dev_info;
42c7af7877SIngo Molnar struct bio_list;
43c7af7877SIngo Molnar struct blk_plug;
44a10787e6SSong Liu struct bpf_local_storage;
45c7603cfaSAndrii Nakryiko struct bpf_run_ctx;
463c93a0c0SQais Yousef struct capture_control;
47c7af7877SIngo Molnar struct cfs_rq;
48c7af7877SIngo Molnar struct fs_struct;
49c7af7877SIngo Molnar struct futex_pi_state;
50c7af7877SIngo Molnar struct io_context;
511875dc5bSPeter Oskolkov struct io_uring_task;
52c7af7877SIngo Molnar struct mempolicy;
53c7af7877SIngo Molnar struct nameidata;
54c7af7877SIngo Molnar struct nsproxy;
55c7af7877SIngo Molnar struct perf_event_context;
56c7af7877SIngo Molnar struct pid_namespace;
57c7af7877SIngo Molnar struct pipe_inode_info;
58c7af7877SIngo Molnar struct rcu_node;
59c7af7877SIngo Molnar struct reclaim_state;
60c7af7877SIngo Molnar struct robust_list_head;
613c93a0c0SQais Yousef struct root_domain;
623c93a0c0SQais Yousef struct rq;
63e2d1e2aeSIngo Molnar struct sched_attr;
64e2d1e2aeSIngo Molnar struct sched_param;
6543ae34cbSIngo Molnar struct seq_file;
66c7af7877SIngo Molnar struct sighand_struct;
67c7af7877SIngo Molnar struct signal_struct;
68c7af7877SIngo Molnar struct task_delay_info;
694cf86d77SIngo Molnar struct task_group;
701da177e4SLinus Torvalds 
714a8342d2SLinus Torvalds /*
724a8342d2SLinus Torvalds  * Task state bitmask. NOTE! These bits are also
734a8342d2SLinus Torvalds  * encoded in fs/proc/array.c: get_task_state().
744a8342d2SLinus Torvalds  *
754a8342d2SLinus Torvalds  * We have two separate sets of flags: task->state
764a8342d2SLinus Torvalds  * is about runnability, while task->exit_state are
774a8342d2SLinus Torvalds  * about the task exiting. Confusing, but this way
784a8342d2SLinus Torvalds  * modifying one set can't modify the other one by
794a8342d2SLinus Torvalds  * mistake.
804a8342d2SLinus Torvalds  */
815eca1c10SIngo Molnar 
825eca1c10SIngo Molnar /* Used in tsk->state: */
8392c4bc9fSPeter Zijlstra #define TASK_RUNNING			0x0000
8492c4bc9fSPeter Zijlstra #define TASK_INTERRUPTIBLE		0x0001
8592c4bc9fSPeter Zijlstra #define TASK_UNINTERRUPTIBLE		0x0002
8692c4bc9fSPeter Zijlstra #define __TASK_STOPPED			0x0004
8792c4bc9fSPeter Zijlstra #define __TASK_TRACED			0x0008
885eca1c10SIngo Molnar /* Used in tsk->exit_state: */
8992c4bc9fSPeter Zijlstra #define EXIT_DEAD			0x0010
9092c4bc9fSPeter Zijlstra #define EXIT_ZOMBIE			0x0020
91abd50b39SOleg Nesterov #define EXIT_TRACE			(EXIT_ZOMBIE | EXIT_DEAD)
925eca1c10SIngo Molnar /* Used in tsk->state again: */
938ef9925bSPeter Zijlstra #define TASK_PARKED			0x0040
948ef9925bSPeter Zijlstra #define TASK_DEAD			0x0080
958ef9925bSPeter Zijlstra #define TASK_WAKEKILL			0x0100
968ef9925bSPeter Zijlstra #define TASK_WAKING			0x0200
9792c4bc9fSPeter Zijlstra #define TASK_NOLOAD			0x0400
9892c4bc9fSPeter Zijlstra #define TASK_NEW			0x0800
99cd781d0cSThomas Gleixner /* RT specific auxilliary flag to mark RT lock waiters */
100cd781d0cSThomas Gleixner #define TASK_RTLOCK_WAIT		0x1000
101cd781d0cSThomas Gleixner #define TASK_STATE_MAX			0x2000
102f021a3c2SMatthew Wilcox 
1035eca1c10SIngo Molnar /* Convenience macros for the sake of set_current_state: */
104f021a3c2SMatthew Wilcox #define TASK_KILLABLE			(TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
105f021a3c2SMatthew Wilcox #define TASK_STOPPED			(TASK_WAKEKILL | __TASK_STOPPED)
106f021a3c2SMatthew Wilcox #define TASK_TRACED			(TASK_WAKEKILL | __TASK_TRACED)
1071da177e4SLinus Torvalds 
10880ed87c8SPeter Zijlstra #define TASK_IDLE			(TASK_UNINTERRUPTIBLE | TASK_NOLOAD)
10980ed87c8SPeter Zijlstra 
1105eca1c10SIngo Molnar /* Convenience macros for the sake of wake_up(): */
11192a1f4bcSMatthew Wilcox #define TASK_NORMAL			(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)
11292a1f4bcSMatthew Wilcox 
1135eca1c10SIngo Molnar /* get_task_state(): */
11492a1f4bcSMatthew Wilcox #define TASK_REPORT			(TASK_RUNNING | TASK_INTERRUPTIBLE | \
115f021a3c2SMatthew Wilcox 					 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
1168ef9925bSPeter Zijlstra 					 __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \
1178ef9925bSPeter Zijlstra 					 TASK_PARKED)
11892a1f4bcSMatthew Wilcox 
1192f064a59SPeter Zijlstra #define task_is_running(task)		(READ_ONCE((task)->__state) == TASK_RUNNING)
1205eca1c10SIngo Molnar 
1212f064a59SPeter Zijlstra #define task_is_traced(task)		((READ_ONCE(task->__state) & __TASK_TRACED) != 0)
1225eca1c10SIngo Molnar 
1232f064a59SPeter Zijlstra #define task_is_stopped(task)		((READ_ONCE(task->__state) & __TASK_STOPPED) != 0)
1245eca1c10SIngo Molnar 
1252f064a59SPeter Zijlstra #define task_is_stopped_or_traced(task)	((READ_ONCE(task->__state) & (__TASK_STOPPED | __TASK_TRACED)) != 0)
1265eca1c10SIngo Molnar 
127b5bf9a90SPeter Zijlstra /*
128b5bf9a90SPeter Zijlstra  * Special states are those that do not use the normal wait-loop pattern. See
129b5bf9a90SPeter Zijlstra  * the comment with set_special_state().
130b5bf9a90SPeter Zijlstra  */
131b5bf9a90SPeter Zijlstra #define is_special_task_state(state)				\
1321cef1150SPeter Zijlstra 	((state) & (__TASK_STOPPED | __TASK_TRACED | TASK_PARKED | TASK_DEAD))
133b5bf9a90SPeter Zijlstra 
13485019c16SThomas Gleixner #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
13585019c16SThomas Gleixner # define debug_normal_state_change(state_value)				\
1368eb23b9fSPeter Zijlstra 	do {								\
137b5bf9a90SPeter Zijlstra 		WARN_ON_ONCE(is_special_task_state(state_value));	\
1388eb23b9fSPeter Zijlstra 		current->task_state_change = _THIS_IP_;			\
1398eb23b9fSPeter Zijlstra 	} while (0)
140b5bf9a90SPeter Zijlstra 
14185019c16SThomas Gleixner # define debug_special_state_change(state_value)			\
1428eb23b9fSPeter Zijlstra 	do {								\
143b5bf9a90SPeter Zijlstra 		WARN_ON_ONCE(!is_special_task_state(state_value));	\
144b5bf9a90SPeter Zijlstra 		current->task_state_change = _THIS_IP_;			\
145b5bf9a90SPeter Zijlstra 	} while (0)
14685019c16SThomas Gleixner 
1475f220be2SThomas Gleixner # define debug_rtlock_wait_set_state()					\
1485f220be2SThomas Gleixner 	do {								 \
1495f220be2SThomas Gleixner 		current->saved_state_change = current->task_state_change;\
1505f220be2SThomas Gleixner 		current->task_state_change = _THIS_IP_;			 \
1515f220be2SThomas Gleixner 	} while (0)
1525f220be2SThomas Gleixner 
1535f220be2SThomas Gleixner # define debug_rtlock_wait_restore_state()				\
1545f220be2SThomas Gleixner 	do {								 \
1555f220be2SThomas Gleixner 		current->task_state_change = current->saved_state_change;\
1565f220be2SThomas Gleixner 	} while (0)
1575f220be2SThomas Gleixner 
1588eb23b9fSPeter Zijlstra #else
15985019c16SThomas Gleixner # define debug_normal_state_change(cond)	do { } while (0)
16085019c16SThomas Gleixner # define debug_special_state_change(cond)	do { } while (0)
1615f220be2SThomas Gleixner # define debug_rtlock_wait_set_state()		do { } while (0)
1625f220be2SThomas Gleixner # define debug_rtlock_wait_restore_state()	do { } while (0)
16385019c16SThomas Gleixner #endif
16485019c16SThomas Gleixner 
165498d0c57SAndrew Morton /*
166498d0c57SAndrew Morton  * set_current_state() includes a barrier so that the write of current->state
167498d0c57SAndrew Morton  * is correctly serialised wrt the caller's subsequent test of whether to
168498d0c57SAndrew Morton  * actually sleep:
169498d0c57SAndrew Morton  *
170a2250238SPeter Zijlstra  *   for (;;) {
171498d0c57SAndrew Morton  *	set_current_state(TASK_UNINTERRUPTIBLE);
17258877d34SPeter Zijlstra  *	if (CONDITION)
173a2250238SPeter Zijlstra  *	   break;
174498d0c57SAndrew Morton  *
175a2250238SPeter Zijlstra  *	schedule();
176a2250238SPeter Zijlstra  *   }
177a2250238SPeter Zijlstra  *   __set_current_state(TASK_RUNNING);
178a2250238SPeter Zijlstra  *
179a2250238SPeter Zijlstra  * If the caller does not need such serialisation (because, for instance, the
18058877d34SPeter Zijlstra  * CONDITION test and condition change and wakeup are under the same lock) then
181a2250238SPeter Zijlstra  * use __set_current_state().
182a2250238SPeter Zijlstra  *
183a2250238SPeter Zijlstra  * The above is typically ordered against the wakeup, which does:
184a2250238SPeter Zijlstra  *
18558877d34SPeter Zijlstra  *   CONDITION = 1;
186a2250238SPeter Zijlstra  *   wake_up_state(p, TASK_UNINTERRUPTIBLE);
187a2250238SPeter Zijlstra  *
18858877d34SPeter Zijlstra  * where wake_up_state()/try_to_wake_up() executes a full memory barrier before
18958877d34SPeter Zijlstra  * accessing p->state.
190a2250238SPeter Zijlstra  *
191a2250238SPeter Zijlstra  * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is,
192a2250238SPeter Zijlstra  * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a
193a2250238SPeter Zijlstra  * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING).
194a2250238SPeter Zijlstra  *
195b5bf9a90SPeter Zijlstra  * However, with slightly different timing the wakeup TASK_RUNNING store can
196dfcb245eSIngo Molnar  * also collide with the TASK_UNINTERRUPTIBLE store. Losing that store is not
197b5bf9a90SPeter Zijlstra  * a problem either because that will result in one extra go around the loop
198b5bf9a90SPeter Zijlstra  * and our @cond test will save the day.
199a2250238SPeter Zijlstra  *
200a2250238SPeter Zijlstra  * Also see the comments of try_to_wake_up().
201498d0c57SAndrew Morton  */
202b5bf9a90SPeter Zijlstra #define __set_current_state(state_value)				\
20385019c16SThomas Gleixner 	do {								\
20485019c16SThomas Gleixner 		debug_normal_state_change((state_value));		\
20585019c16SThomas Gleixner 		WRITE_ONCE(current->__state, (state_value));		\
20685019c16SThomas Gleixner 	} while (0)
207b5bf9a90SPeter Zijlstra 
208b5bf9a90SPeter Zijlstra #define set_current_state(state_value)					\
20985019c16SThomas Gleixner 	do {								\
21085019c16SThomas Gleixner 		debug_normal_state_change((state_value));		\
21185019c16SThomas Gleixner 		smp_store_mb(current->__state, (state_value));		\
21285019c16SThomas Gleixner 	} while (0)
213b5bf9a90SPeter Zijlstra 
214b5bf9a90SPeter Zijlstra /*
215b5bf9a90SPeter Zijlstra  * set_special_state() should be used for those states when the blocking task
216b5bf9a90SPeter Zijlstra  * can not use the regular condition based wait-loop. In that case we must
21785019c16SThomas Gleixner  * serialize against wakeups such that any possible in-flight TASK_RUNNING
21885019c16SThomas Gleixner  * stores will not collide with our state change.
219b5bf9a90SPeter Zijlstra  */
220b5bf9a90SPeter Zijlstra #define set_special_state(state_value)					\
221b5bf9a90SPeter Zijlstra 	do {								\
222b5bf9a90SPeter Zijlstra 		unsigned long flags; /* may shadow */			\
22385019c16SThomas Gleixner 									\
224b5bf9a90SPeter Zijlstra 		raw_spin_lock_irqsave(&current->pi_lock, flags);	\
22585019c16SThomas Gleixner 		debug_special_state_change((state_value));		\
2262f064a59SPeter Zijlstra 		WRITE_ONCE(current->__state, (state_value));		\
227b5bf9a90SPeter Zijlstra 		raw_spin_unlock_irqrestore(&current->pi_lock, flags);	\
228b5bf9a90SPeter Zijlstra 	} while (0)
229b5bf9a90SPeter Zijlstra 
2305f220be2SThomas Gleixner /*
2315f220be2SThomas Gleixner  * PREEMPT_RT specific variants for "sleeping" spin/rwlocks
2325f220be2SThomas Gleixner  *
2335f220be2SThomas Gleixner  * RT's spin/rwlock substitutions are state preserving. The state of the
2345f220be2SThomas Gleixner  * task when blocking on the lock is saved in task_struct::saved_state and
2355f220be2SThomas Gleixner  * restored after the lock has been acquired.  These operations are
2365f220be2SThomas Gleixner  * serialized by task_struct::pi_lock against try_to_wake_up(). Any non RT
2375f220be2SThomas Gleixner  * lock related wakeups while the task is blocked on the lock are
2385f220be2SThomas Gleixner  * redirected to operate on task_struct::saved_state to ensure that these
2395f220be2SThomas Gleixner  * are not dropped. On restore task_struct::saved_state is set to
2405f220be2SThomas Gleixner  * TASK_RUNNING so any wakeup attempt redirected to saved_state will fail.
2415f220be2SThomas Gleixner  *
2425f220be2SThomas Gleixner  * The lock operation looks like this:
2435f220be2SThomas Gleixner  *
2445f220be2SThomas Gleixner  *	current_save_and_set_rtlock_wait_state();
2455f220be2SThomas Gleixner  *	for (;;) {
2465f220be2SThomas Gleixner  *		if (try_lock())
2475f220be2SThomas Gleixner  *			break;
2485f220be2SThomas Gleixner  *		raw_spin_unlock_irq(&lock->wait_lock);
2495f220be2SThomas Gleixner  *		schedule_rtlock();
2505f220be2SThomas Gleixner  *		raw_spin_lock_irq(&lock->wait_lock);
2515f220be2SThomas Gleixner  *		set_current_state(TASK_RTLOCK_WAIT);
2525f220be2SThomas Gleixner  *	}
2535f220be2SThomas Gleixner  *	current_restore_rtlock_saved_state();
2545f220be2SThomas Gleixner  */
2555f220be2SThomas Gleixner #define current_save_and_set_rtlock_wait_state()			\
2565f220be2SThomas Gleixner 	do {								\
2575f220be2SThomas Gleixner 		lockdep_assert_irqs_disabled();				\
2585f220be2SThomas Gleixner 		raw_spin_lock(&current->pi_lock);			\
2595f220be2SThomas Gleixner 		current->saved_state = current->__state;		\
2605f220be2SThomas Gleixner 		debug_rtlock_wait_set_state();				\
2615f220be2SThomas Gleixner 		WRITE_ONCE(current->__state, TASK_RTLOCK_WAIT);		\
2625f220be2SThomas Gleixner 		raw_spin_unlock(&current->pi_lock);			\
2635f220be2SThomas Gleixner 	} while (0);
2645f220be2SThomas Gleixner 
2655f220be2SThomas Gleixner #define current_restore_rtlock_saved_state()				\
2665f220be2SThomas Gleixner 	do {								\
2675f220be2SThomas Gleixner 		lockdep_assert_irqs_disabled();				\
2685f220be2SThomas Gleixner 		raw_spin_lock(&current->pi_lock);			\
2695f220be2SThomas Gleixner 		debug_rtlock_wait_restore_state();			\
2705f220be2SThomas Gleixner 		WRITE_ONCE(current->__state, current->saved_state);	\
2715f220be2SThomas Gleixner 		current->saved_state = TASK_RUNNING;			\
2725f220be2SThomas Gleixner 		raw_spin_unlock(&current->pi_lock);			\
2735f220be2SThomas Gleixner 	} while (0);
2748eb23b9fSPeter Zijlstra 
2752f064a59SPeter Zijlstra #define get_current_state()	READ_ONCE(current->__state)
276d6c23bb3SPeter Zijlstra 
2775eca1c10SIngo Molnar /* Task command name length: */
2781da177e4SLinus Torvalds #define TASK_COMM_LEN			16
2791da177e4SLinus Torvalds 
2801da177e4SLinus Torvalds extern void scheduler_tick(void);
2811da177e4SLinus Torvalds 
2821da177e4SLinus Torvalds #define	MAX_SCHEDULE_TIMEOUT		LONG_MAX
2835eca1c10SIngo Molnar 
2845eca1c10SIngo Molnar extern long schedule_timeout(long timeout);
2855eca1c10SIngo Molnar extern long schedule_timeout_interruptible(long timeout);
2865eca1c10SIngo Molnar extern long schedule_timeout_killable(long timeout);
2875eca1c10SIngo Molnar extern long schedule_timeout_uninterruptible(long timeout);
2885eca1c10SIngo Molnar extern long schedule_timeout_idle(long timeout);
2891da177e4SLinus Torvalds asmlinkage void schedule(void);
290c5491ea7SThomas Gleixner extern void schedule_preempt_disabled(void);
29119c95f26SJulien Thierry asmlinkage void preempt_schedule_irq(void);
2926991436cSThomas Gleixner #ifdef CONFIG_PREEMPT_RT
2936991436cSThomas Gleixner  extern void schedule_rtlock(void);
2946991436cSThomas Gleixner #endif
2951da177e4SLinus Torvalds 
29610ab5643STejun Heo extern int __must_check io_schedule_prepare(void);
29710ab5643STejun Heo extern void io_schedule_finish(int token);
2989cff8adeSNeilBrown extern long io_schedule_timeout(long timeout);
29910ab5643STejun Heo extern void io_schedule(void);
3009cff8adeSNeilBrown 
301f06febc9SFrank Mayhar /**
3020ba42a59SMasanari Iida  * struct prev_cputime - snapshot of system and user cputime
303d37f761dSFrederic Weisbecker  * @utime: time spent in user mode
304d37f761dSFrederic Weisbecker  * @stime: time spent in system mode
3059d7fb042SPeter Zijlstra  * @lock: protects the above two fields
306d37f761dSFrederic Weisbecker  *
3079d7fb042SPeter Zijlstra  * Stores previous user/system time values such that we can guarantee
3089d7fb042SPeter Zijlstra  * monotonicity.
309d37f761dSFrederic Weisbecker  */
3109d7fb042SPeter Zijlstra struct prev_cputime {
3119d7fb042SPeter Zijlstra #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
3125613fda9SFrederic Weisbecker 	u64				utime;
3135613fda9SFrederic Weisbecker 	u64				stime;
3149d7fb042SPeter Zijlstra 	raw_spinlock_t			lock;
3159d7fb042SPeter Zijlstra #endif
316d37f761dSFrederic Weisbecker };
317d37f761dSFrederic Weisbecker 
318bac5b6b6SFrederic Weisbecker enum vtime_state {
319bac5b6b6SFrederic Weisbecker 	/* Task is sleeping or running in a CPU with VTIME inactive: */
320bac5b6b6SFrederic Weisbecker 	VTIME_INACTIVE = 0,
32114faf6fcSFrederic Weisbecker 	/* Task is idle */
32214faf6fcSFrederic Weisbecker 	VTIME_IDLE,
323bac5b6b6SFrederic Weisbecker 	/* Task runs in kernelspace in a CPU with VTIME active: */
324bac5b6b6SFrederic Weisbecker 	VTIME_SYS,
32514faf6fcSFrederic Weisbecker 	/* Task runs in userspace in a CPU with VTIME active: */
32614faf6fcSFrederic Weisbecker 	VTIME_USER,
327e6d5bf3eSFrederic Weisbecker 	/* Task runs as guests in a CPU with VTIME active: */
328e6d5bf3eSFrederic Weisbecker 	VTIME_GUEST,
329bac5b6b6SFrederic Weisbecker };
330bac5b6b6SFrederic Weisbecker 
331bac5b6b6SFrederic Weisbecker struct vtime {
332bac5b6b6SFrederic Weisbecker 	seqcount_t		seqcount;
333bac5b6b6SFrederic Weisbecker 	unsigned long long	starttime;
334bac5b6b6SFrederic Weisbecker 	enum vtime_state	state;
335802f4a82SFrederic Weisbecker 	unsigned int		cpu;
3362a42eb95SWanpeng Li 	u64			utime;
3372a42eb95SWanpeng Li 	u64			stime;
3382a42eb95SWanpeng Li 	u64			gtime;
339bac5b6b6SFrederic Weisbecker };
340bac5b6b6SFrederic Weisbecker 
34169842cbaSPatrick Bellasi /*
34269842cbaSPatrick Bellasi  * Utilization clamp constraints.
34369842cbaSPatrick Bellasi  * @UCLAMP_MIN:	Minimum utilization
34469842cbaSPatrick Bellasi  * @UCLAMP_MAX:	Maximum utilization
34569842cbaSPatrick Bellasi  * @UCLAMP_CNT:	Utilization clamp constraints count
34669842cbaSPatrick Bellasi  */
34769842cbaSPatrick Bellasi enum uclamp_id {
34869842cbaSPatrick Bellasi 	UCLAMP_MIN = 0,
34969842cbaSPatrick Bellasi 	UCLAMP_MAX,
35069842cbaSPatrick Bellasi 	UCLAMP_CNT
35169842cbaSPatrick Bellasi };
35269842cbaSPatrick Bellasi 
353f9a25f77SMathieu Poirier #ifdef CONFIG_SMP
354f9a25f77SMathieu Poirier extern struct root_domain def_root_domain;
355f9a25f77SMathieu Poirier extern struct mutex sched_domains_mutex;
356f9a25f77SMathieu Poirier #endif
357f9a25f77SMathieu Poirier 
3581da177e4SLinus Torvalds struct sched_info {
3597f5f8e8dSIngo Molnar #ifdef CONFIG_SCHED_INFO
3605eca1c10SIngo Molnar 	/* Cumulative counters: */
3611da177e4SLinus Torvalds 
3625eca1c10SIngo Molnar 	/* # of times we have run on this CPU: */
3635eca1c10SIngo Molnar 	unsigned long			pcount;
3645eca1c10SIngo Molnar 
3655eca1c10SIngo Molnar 	/* Time spent waiting on a runqueue: */
3665eca1c10SIngo Molnar 	unsigned long long		run_delay;
3675eca1c10SIngo Molnar 
3685eca1c10SIngo Molnar 	/* Timestamps: */
3695eca1c10SIngo Molnar 
3705eca1c10SIngo Molnar 	/* When did we last run on a CPU? */
3715eca1c10SIngo Molnar 	unsigned long long		last_arrival;
3725eca1c10SIngo Molnar 
3735eca1c10SIngo Molnar 	/* When were we last queued to run? */
3745eca1c10SIngo Molnar 	unsigned long long		last_queued;
3755eca1c10SIngo Molnar 
376f6db8347SNaveen N. Rao #endif /* CONFIG_SCHED_INFO */
3777f5f8e8dSIngo Molnar };
3781da177e4SLinus Torvalds 
3791da177e4SLinus Torvalds /*
3806ecdd749SYuyang Du  * Integer metrics need fixed point arithmetic, e.g., sched/fair
3816ecdd749SYuyang Du  * has a few: load, load_avg, util_avg, freq, and capacity.
3826ecdd749SYuyang Du  *
3836ecdd749SYuyang Du  * We define a basic fixed point arithmetic range, and then formalize
3846ecdd749SYuyang Du  * all these metrics based on that basic range.
3856ecdd749SYuyang Du  */
3866ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SHIFT		10
3876ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SCALE		(1L << SCHED_FIXEDPOINT_SHIFT)
3886ecdd749SYuyang Du 
38969842cbaSPatrick Bellasi /* Increase resolution of cpu_capacity calculations */
39069842cbaSPatrick Bellasi # define SCHED_CAPACITY_SHIFT		SCHED_FIXEDPOINT_SHIFT
39169842cbaSPatrick Bellasi # define SCHED_CAPACITY_SCALE		(1L << SCHED_CAPACITY_SHIFT)
39269842cbaSPatrick Bellasi 
39320b8a59fSIngo Molnar struct load_weight {
3949dbdb155SPeter Zijlstra 	unsigned long			weight;
3959dbdb155SPeter Zijlstra 	u32				inv_weight;
39620b8a59fSIngo Molnar };
39720b8a59fSIngo Molnar 
3987f65ea42SPatrick Bellasi /**
3997f65ea42SPatrick Bellasi  * struct util_est - Estimation utilization of FAIR tasks
4007f65ea42SPatrick Bellasi  * @enqueued: instantaneous estimated utilization of a task/cpu
4017f65ea42SPatrick Bellasi  * @ewma:     the Exponential Weighted Moving Average (EWMA)
4027f65ea42SPatrick Bellasi  *            utilization of a task
4037f65ea42SPatrick Bellasi  *
4047f65ea42SPatrick Bellasi  * Support data structure to track an Exponential Weighted Moving Average
4057f65ea42SPatrick Bellasi  * (EWMA) of a FAIR task's utilization. New samples are added to the moving
4067f65ea42SPatrick Bellasi  * average each time a task completes an activation. Sample's weight is chosen
4077f65ea42SPatrick Bellasi  * so that the EWMA will be relatively insensitive to transient changes to the
4087f65ea42SPatrick Bellasi  * task's workload.
4097f65ea42SPatrick Bellasi  *
4107f65ea42SPatrick Bellasi  * The enqueued attribute has a slightly different meaning for tasks and cpus:
4117f65ea42SPatrick Bellasi  * - task:   the task's util_avg at last task dequeue time
4127f65ea42SPatrick Bellasi  * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU
4137f65ea42SPatrick Bellasi  * Thus, the util_est.enqueued of a task represents the contribution on the
4147f65ea42SPatrick Bellasi  * estimated utilization of the CPU where that task is currently enqueued.
4157f65ea42SPatrick Bellasi  *
4167f65ea42SPatrick Bellasi  * Only for tasks we track a moving average of the past instantaneous
4177f65ea42SPatrick Bellasi  * estimated utilization. This allows to absorb sporadic drops in utilization
4187f65ea42SPatrick Bellasi  * of an otherwise almost periodic task.
41968d7a190SDietmar Eggemann  *
42068d7a190SDietmar Eggemann  * The UTIL_AVG_UNCHANGED flag is used to synchronize util_est with util_avg
42168d7a190SDietmar Eggemann  * updates. When a task is dequeued, its util_est should not be updated if its
42268d7a190SDietmar Eggemann  * util_avg has not been updated in the meantime.
42368d7a190SDietmar Eggemann  * This information is mapped into the MSB bit of util_est.enqueued at dequeue
42468d7a190SDietmar Eggemann  * time. Since max value of util_est.enqueued for a task is 1024 (PELT util_avg
42568d7a190SDietmar Eggemann  * for a task) it is safe to use MSB.
4267f65ea42SPatrick Bellasi  */
4277f65ea42SPatrick Bellasi struct util_est {
4287f65ea42SPatrick Bellasi 	unsigned int			enqueued;
4297f65ea42SPatrick Bellasi 	unsigned int			ewma;
4307f65ea42SPatrick Bellasi #define UTIL_EST_WEIGHT_SHIFT		2
43168d7a190SDietmar Eggemann #define UTIL_AVG_UNCHANGED		0x80000000
432317d359dSPeter Zijlstra } __attribute__((__aligned__(sizeof(u64))));
4337f65ea42SPatrick Bellasi 
4349d89c257SYuyang Du /*
4359f683953SVincent Guittot  * The load/runnable/util_avg accumulates an infinite geometric series
4360dacee1bSVincent Guittot  * (see __update_load_avg_cfs_rq() in kernel/sched/pelt.c).
4377b595334SYuyang Du  *
4387b595334SYuyang Du  * [load_avg definition]
4397b595334SYuyang Du  *
4407b595334SYuyang Du  *   load_avg = runnable% * scale_load_down(load)
4417b595334SYuyang Du  *
4429f683953SVincent Guittot  * [runnable_avg definition]
4439f683953SVincent Guittot  *
4449f683953SVincent Guittot  *   runnable_avg = runnable% * SCHED_CAPACITY_SCALE
4457b595334SYuyang Du  *
4467b595334SYuyang Du  * [util_avg definition]
4477b595334SYuyang Du  *
4487b595334SYuyang Du  *   util_avg = running% * SCHED_CAPACITY_SCALE
4497b595334SYuyang Du  *
4509f683953SVincent Guittot  * where runnable% is the time ratio that a sched_entity is runnable and
4519f683953SVincent Guittot  * running% the time ratio that a sched_entity is running.
4527b595334SYuyang Du  *
4539f683953SVincent Guittot  * For cfs_rq, they are the aggregated values of all runnable and blocked
4549f683953SVincent Guittot  * sched_entities.
4559f683953SVincent Guittot  *
456c1b7b8d4S王文虎  * The load/runnable/util_avg doesn't directly factor frequency scaling and CPU
4579f683953SVincent Guittot  * capacity scaling. The scaling is done through the rq_clock_pelt that is used
4589f683953SVincent Guittot  * for computing those signals (see update_rq_clock_pelt())
4597b595334SYuyang Du  *
46023127296SVincent Guittot  * N.B., the above ratios (runnable% and running%) themselves are in the
46123127296SVincent Guittot  * range of [0, 1]. To do fixed point arithmetics, we therefore scale them
46223127296SVincent Guittot  * to as large a range as necessary. This is for example reflected by
46323127296SVincent Guittot  * util_avg's SCHED_CAPACITY_SCALE.
4647b595334SYuyang Du  *
4657b595334SYuyang Du  * [Overflow issue]
4667b595334SYuyang Du  *
4677b595334SYuyang Du  * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities
4687b595334SYuyang Du  * with the highest load (=88761), always runnable on a single cfs_rq,
4697b595334SYuyang Du  * and should not overflow as the number already hits PID_MAX_LIMIT.
4707b595334SYuyang Du  *
4717b595334SYuyang Du  * For all other cases (including 32-bit kernels), struct load_weight's
4727b595334SYuyang Du  * weight will overflow first before we do, because:
4737b595334SYuyang Du  *
4747b595334SYuyang Du  *    Max(load_avg) <= Max(load.weight)
4757b595334SYuyang Du  *
4767b595334SYuyang Du  * Then it is the load_weight's responsibility to consider overflow
4777b595334SYuyang Du  * issues.
4789d89c257SYuyang Du  */
4799d85f21cSPaul Turner struct sched_avg {
4805eca1c10SIngo Molnar 	u64				last_update_time;
4815eca1c10SIngo Molnar 	u64				load_sum;
4829f683953SVincent Guittot 	u64				runnable_sum;
4835eca1c10SIngo Molnar 	u32				util_sum;
4845eca1c10SIngo Molnar 	u32				period_contrib;
4855eca1c10SIngo Molnar 	unsigned long			load_avg;
4869f683953SVincent Guittot 	unsigned long			runnable_avg;
4875eca1c10SIngo Molnar 	unsigned long			util_avg;
4887f65ea42SPatrick Bellasi 	struct util_est			util_est;
489317d359dSPeter Zijlstra } ____cacheline_aligned;
4909d85f21cSPaul Turner 
49141acab88SLucas De Marchi struct sched_statistics {
4927f5f8e8dSIngo Molnar #ifdef CONFIG_SCHEDSTATS
49394c18227SIngo Molnar 	u64				wait_start;
49494c18227SIngo Molnar 	u64				wait_max;
4956d082592SArjan van de Ven 	u64				wait_count;
4966d082592SArjan van de Ven 	u64				wait_sum;
4978f0dfc34SArjan van de Ven 	u64				iowait_count;
4988f0dfc34SArjan van de Ven 	u64				iowait_sum;
49994c18227SIngo Molnar 
50094c18227SIngo Molnar 	u64				sleep_start;
50120b8a59fSIngo Molnar 	u64				sleep_max;
50294c18227SIngo Molnar 	s64				sum_sleep_runtime;
50394c18227SIngo Molnar 
50494c18227SIngo Molnar 	u64				block_start;
50520b8a59fSIngo Molnar 	u64				block_max;
50620b8a59fSIngo Molnar 	u64				exec_max;
507eba1ed4bSIngo Molnar 	u64				slice_max;
508cc367732SIngo Molnar 
509cc367732SIngo Molnar 	u64				nr_migrations_cold;
510cc367732SIngo Molnar 	u64				nr_failed_migrations_affine;
511cc367732SIngo Molnar 	u64				nr_failed_migrations_running;
512cc367732SIngo Molnar 	u64				nr_failed_migrations_hot;
513cc367732SIngo Molnar 	u64				nr_forced_migrations;
514cc367732SIngo Molnar 
515cc367732SIngo Molnar 	u64				nr_wakeups;
516cc367732SIngo Molnar 	u64				nr_wakeups_sync;
517cc367732SIngo Molnar 	u64				nr_wakeups_migrate;
518cc367732SIngo Molnar 	u64				nr_wakeups_local;
519cc367732SIngo Molnar 	u64				nr_wakeups_remote;
520cc367732SIngo Molnar 	u64				nr_wakeups_affine;
521cc367732SIngo Molnar 	u64				nr_wakeups_affine_attempts;
522cc367732SIngo Molnar 	u64				nr_wakeups_passive;
523cc367732SIngo Molnar 	u64				nr_wakeups_idle;
52441acab88SLucas De Marchi #endif
525*ceeadb83SYafang Shao } ____cacheline_aligned;
52641acab88SLucas De Marchi 
52741acab88SLucas De Marchi struct sched_entity {
5285eca1c10SIngo Molnar 	/* For load-balancing: */
5295eca1c10SIngo Molnar 	struct load_weight		load;
53041acab88SLucas De Marchi 	struct rb_node			run_node;
53141acab88SLucas De Marchi 	struct list_head		group_node;
53241acab88SLucas De Marchi 	unsigned int			on_rq;
53341acab88SLucas De Marchi 
53441acab88SLucas De Marchi 	u64				exec_start;
53541acab88SLucas De Marchi 	u64				sum_exec_runtime;
53641acab88SLucas De Marchi 	u64				vruntime;
53741acab88SLucas De Marchi 	u64				prev_sum_exec_runtime;
53841acab88SLucas De Marchi 
53941acab88SLucas De Marchi 	u64				nr_migrations;
54041acab88SLucas De Marchi 
54120b8a59fSIngo Molnar #ifdef CONFIG_FAIR_GROUP_SCHED
542fed14d45SPeter Zijlstra 	int				depth;
54320b8a59fSIngo Molnar 	struct sched_entity		*parent;
54420b8a59fSIngo Molnar 	/* rq on which this entity is (to be) queued: */
54520b8a59fSIngo Molnar 	struct cfs_rq			*cfs_rq;
54620b8a59fSIngo Molnar 	/* rq "owned" by this entity/group: */
54720b8a59fSIngo Molnar 	struct cfs_rq			*my_q;
5489f683953SVincent Guittot 	/* cached value of my_q->h_nr_running */
5499f683953SVincent Guittot 	unsigned long			runnable_weight;
55020b8a59fSIngo Molnar #endif
5518bd75c77SClark Williams 
552141965c7SAlex Shi #ifdef CONFIG_SMP
5535a107804SJiri Olsa 	/*
5545a107804SJiri Olsa 	 * Per entity load average tracking.
5555a107804SJiri Olsa 	 *
5565a107804SJiri Olsa 	 * Put into separate cache line so it does not
5575a107804SJiri Olsa 	 * collide with read-mostly values above.
5585a107804SJiri Olsa 	 */
559317d359dSPeter Zijlstra 	struct sched_avg		avg;
5609d85f21cSPaul Turner #endif
56120b8a59fSIngo Molnar };
56270b97a7fSIngo Molnar 
563fa717060SPeter Zijlstra struct sched_rt_entity {
564fa717060SPeter Zijlstra 	struct list_head		run_list;
56578f2c7dbSPeter Zijlstra 	unsigned long			timeout;
56657d2aa00SYing Xue 	unsigned long			watchdog_stamp;
567bee367edSRichard Kennedy 	unsigned int			time_slice;
568ff77e468SPeter Zijlstra 	unsigned short			on_rq;
569ff77e468SPeter Zijlstra 	unsigned short			on_list;
5706f505b16SPeter Zijlstra 
57158d6c2d7SPeter Zijlstra 	struct sched_rt_entity		*back;
572052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED
5736f505b16SPeter Zijlstra 	struct sched_rt_entity		*parent;
5746f505b16SPeter Zijlstra 	/* rq on which this entity is (to be) queued: */
5756f505b16SPeter Zijlstra 	struct rt_rq			*rt_rq;
5766f505b16SPeter Zijlstra 	/* rq "owned" by this entity/group: */
5776f505b16SPeter Zijlstra 	struct rt_rq			*my_q;
5786f505b16SPeter Zijlstra #endif
5793859a271SKees Cook } __randomize_layout;
580fa717060SPeter Zijlstra 
581aab03e05SDario Faggioli struct sched_dl_entity {
582aab03e05SDario Faggioli 	struct rb_node			rb_node;
583aab03e05SDario Faggioli 
584aab03e05SDario Faggioli 	/*
585aab03e05SDario Faggioli 	 * Original scheduling parameters. Copied here from sched_attr
5864027d080Sxiaofeng.yan 	 * during sched_setattr(), they will remain the same until
5874027d080Sxiaofeng.yan 	 * the next sched_setattr().
588aab03e05SDario Faggioli 	 */
5895eca1c10SIngo Molnar 	u64				dl_runtime;	/* Maximum runtime for each instance	*/
5905eca1c10SIngo Molnar 	u64				dl_deadline;	/* Relative deadline of each instance	*/
5915eca1c10SIngo Molnar 	u64				dl_period;	/* Separation of two instances (period) */
59254d6d303SDaniel Bristot de Oliveira 	u64				dl_bw;		/* dl_runtime / dl_period		*/
5933effcb42SDaniel Bristot de Oliveira 	u64				dl_density;	/* dl_runtime / dl_deadline		*/
594aab03e05SDario Faggioli 
595aab03e05SDario Faggioli 	/*
596aab03e05SDario Faggioli 	 * Actual scheduling parameters. Initialized with the values above,
597dfcb245eSIngo Molnar 	 * they are continuously updated during task execution. Note that
598aab03e05SDario Faggioli 	 * the remaining runtime could be < 0 in case we are in overrun.
599aab03e05SDario Faggioli 	 */
6005eca1c10SIngo Molnar 	s64				runtime;	/* Remaining runtime for this instance	*/
6015eca1c10SIngo Molnar 	u64				deadline;	/* Absolute deadline for this instance	*/
6025eca1c10SIngo Molnar 	unsigned int			flags;		/* Specifying the scheduler behaviour	*/
603aab03e05SDario Faggioli 
604aab03e05SDario Faggioli 	/*
605aab03e05SDario Faggioli 	 * Some bool flags:
606aab03e05SDario Faggioli 	 *
607aab03e05SDario Faggioli 	 * @dl_throttled tells if we exhausted the runtime. If so, the
608aab03e05SDario Faggioli 	 * task has to wait for a replenishment to be performed at the
609aab03e05SDario Faggioli 	 * next firing of dl_timer.
610aab03e05SDario Faggioli 	 *
6112d3d891dSDario Faggioli 	 * @dl_boosted tells if we are boosted due to DI. If so we are
6122d3d891dSDario Faggioli 	 * outside bandwidth enforcement mechanism (but only until we
6135bfd126eSJuri Lelli 	 * exit the critical section);
6145bfd126eSJuri Lelli 	 *
6155eca1c10SIngo Molnar 	 * @dl_yielded tells if task gave up the CPU before consuming
6165bfd126eSJuri Lelli 	 * all its available runtime during the last job.
617209a0cbdSLuca Abeni 	 *
618209a0cbdSLuca Abeni 	 * @dl_non_contending tells if the task is inactive while still
619209a0cbdSLuca Abeni 	 * contributing to the active utilization. In other words, it
620209a0cbdSLuca Abeni 	 * indicates if the inactive timer has been armed and its handler
621209a0cbdSLuca Abeni 	 * has not been executed yet. This flag is useful to avoid race
622209a0cbdSLuca Abeni 	 * conditions between the inactive timer handler and the wakeup
623209a0cbdSLuca Abeni 	 * code.
62434be3930SJuri Lelli 	 *
62534be3930SJuri Lelli 	 * @dl_overrun tells if the task asked to be informed about runtime
62634be3930SJuri Lelli 	 * overruns.
627aab03e05SDario Faggioli 	 */
628aa5222e9SDan Carpenter 	unsigned int			dl_throttled      : 1;
629aa5222e9SDan Carpenter 	unsigned int			dl_yielded        : 1;
630aa5222e9SDan Carpenter 	unsigned int			dl_non_contending : 1;
63134be3930SJuri Lelli 	unsigned int			dl_overrun	  : 1;
632aab03e05SDario Faggioli 
633aab03e05SDario Faggioli 	/*
634aab03e05SDario Faggioli 	 * Bandwidth enforcement timer. Each -deadline task has its
635aab03e05SDario Faggioli 	 * own bandwidth to be enforced, thus we need one timer per task.
636aab03e05SDario Faggioli 	 */
637aab03e05SDario Faggioli 	struct hrtimer			dl_timer;
638209a0cbdSLuca Abeni 
639209a0cbdSLuca Abeni 	/*
640209a0cbdSLuca Abeni 	 * Inactive timer, responsible for decreasing the active utilization
641209a0cbdSLuca Abeni 	 * at the "0-lag time". When a -deadline task blocks, it contributes
642209a0cbdSLuca Abeni 	 * to GRUB's active utilization until the "0-lag time", hence a
643209a0cbdSLuca Abeni 	 * timer is needed to decrease the active utilization at the correct
644209a0cbdSLuca Abeni 	 * time.
645209a0cbdSLuca Abeni 	 */
646209a0cbdSLuca Abeni 	struct hrtimer inactive_timer;
6472279f540SJuri Lelli 
6482279f540SJuri Lelli #ifdef CONFIG_RT_MUTEXES
6492279f540SJuri Lelli 	/*
6502279f540SJuri Lelli 	 * Priority Inheritance. When a DEADLINE scheduling entity is boosted
6512279f540SJuri Lelli 	 * pi_se points to the donor, otherwise points to the dl_se it belongs
6522279f540SJuri Lelli 	 * to (the original one/itself).
6532279f540SJuri Lelli 	 */
6542279f540SJuri Lelli 	struct sched_dl_entity *pi_se;
6552279f540SJuri Lelli #endif
656aab03e05SDario Faggioli };
6578bd75c77SClark Williams 
65869842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK
65969842cbaSPatrick Bellasi /* Number of utilization clamp buckets (shorter alias) */
66069842cbaSPatrick Bellasi #define UCLAMP_BUCKETS CONFIG_UCLAMP_BUCKETS_COUNT
66169842cbaSPatrick Bellasi 
66269842cbaSPatrick Bellasi /*
66369842cbaSPatrick Bellasi  * Utilization clamp for a scheduling entity
66469842cbaSPatrick Bellasi  * @value:		clamp value "assigned" to a se
66569842cbaSPatrick Bellasi  * @bucket_id:		bucket index corresponding to the "assigned" value
666e8f14172SPatrick Bellasi  * @active:		the se is currently refcounted in a rq's bucket
667a509a7cdSPatrick Bellasi  * @user_defined:	the requested clamp value comes from user-space
66869842cbaSPatrick Bellasi  *
66969842cbaSPatrick Bellasi  * The bucket_id is the index of the clamp bucket matching the clamp value
67069842cbaSPatrick Bellasi  * which is pre-computed and stored to avoid expensive integer divisions from
67169842cbaSPatrick Bellasi  * the fast path.
672e8f14172SPatrick Bellasi  *
673e8f14172SPatrick Bellasi  * The active bit is set whenever a task has got an "effective" value assigned,
674e8f14172SPatrick Bellasi  * which can be different from the clamp value "requested" from user-space.
675e8f14172SPatrick Bellasi  * This allows to know a task is refcounted in the rq's bucket corresponding
676e8f14172SPatrick Bellasi  * to the "effective" bucket_id.
677a509a7cdSPatrick Bellasi  *
678a509a7cdSPatrick Bellasi  * The user_defined bit is set whenever a task has got a task-specific clamp
679a509a7cdSPatrick Bellasi  * value requested from userspace, i.e. the system defaults apply to this task
680a509a7cdSPatrick Bellasi  * just as a restriction. This allows to relax default clamps when a less
681a509a7cdSPatrick Bellasi  * restrictive task-specific value has been requested, thus allowing to
682a509a7cdSPatrick Bellasi  * implement a "nice" semantic. For example, a task running with a 20%
683a509a7cdSPatrick Bellasi  * default boost can still drop its own boosting to 0%.
68469842cbaSPatrick Bellasi  */
68569842cbaSPatrick Bellasi struct uclamp_se {
68669842cbaSPatrick Bellasi 	unsigned int value		: bits_per(SCHED_CAPACITY_SCALE);
68769842cbaSPatrick Bellasi 	unsigned int bucket_id		: bits_per(UCLAMP_BUCKETS);
688e8f14172SPatrick Bellasi 	unsigned int active		: 1;
689a509a7cdSPatrick Bellasi 	unsigned int user_defined	: 1;
69069842cbaSPatrick Bellasi };
69169842cbaSPatrick Bellasi #endif /* CONFIG_UCLAMP_TASK */
69269842cbaSPatrick Bellasi 
6931d082fd0SPaul E. McKenney union rcu_special {
6941d082fd0SPaul E. McKenney 	struct {
6958203d6d0SPaul E. McKenney 		u8			blocked;
6968203d6d0SPaul E. McKenney 		u8			need_qs;
69705f41571SPaul E. McKenney 		u8			exp_hint; /* Hint for performance. */
698276c4104SPaul E. McKenney 		u8			need_mb; /* Readers need smp_mb(). */
6998203d6d0SPaul E. McKenney 	} b; /* Bits. */
70005f41571SPaul E. McKenney 	u32 s; /* Set of bits. */
7011d082fd0SPaul E. McKenney };
70286848966SPaul E. McKenney 
7038dc85d54SPeter Zijlstra enum perf_event_task_context {
7048dc85d54SPeter Zijlstra 	perf_invalid_context = -1,
7058dc85d54SPeter Zijlstra 	perf_hw_context = 0,
70689a1e187SPeter Zijlstra 	perf_sw_context,
7078dc85d54SPeter Zijlstra 	perf_nr_task_contexts,
7088dc85d54SPeter Zijlstra };
7098dc85d54SPeter Zijlstra 
710eb61baf6SIngo Molnar struct wake_q_node {
711eb61baf6SIngo Molnar 	struct wake_q_node *next;
712eb61baf6SIngo Molnar };
713eb61baf6SIngo Molnar 
7145fbda3ecSThomas Gleixner struct kmap_ctrl {
7155fbda3ecSThomas Gleixner #ifdef CONFIG_KMAP_LOCAL
7165fbda3ecSThomas Gleixner 	int				idx;
7175fbda3ecSThomas Gleixner 	pte_t				pteval[KM_MAX_IDX];
7185fbda3ecSThomas Gleixner #endif
7195fbda3ecSThomas Gleixner };
7205fbda3ecSThomas Gleixner 
7211da177e4SLinus Torvalds struct task_struct {
722c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
723c65eacbeSAndy Lutomirski 	/*
724c65eacbeSAndy Lutomirski 	 * For reasons of header soup (see current_thread_info()), this
725c65eacbeSAndy Lutomirski 	 * must be the first element of task_struct.
726c65eacbeSAndy Lutomirski 	 */
727c65eacbeSAndy Lutomirski 	struct thread_info		thread_info;
728c65eacbeSAndy Lutomirski #endif
7292f064a59SPeter Zijlstra 	unsigned int			__state;
73029e48ce8SKees Cook 
7315f220be2SThomas Gleixner #ifdef CONFIG_PREEMPT_RT
7325f220be2SThomas Gleixner 	/* saved state for "spinlock sleepers" */
7335f220be2SThomas Gleixner 	unsigned int			saved_state;
7345f220be2SThomas Gleixner #endif
7355f220be2SThomas Gleixner 
73629e48ce8SKees Cook 	/*
73729e48ce8SKees Cook 	 * This begins the randomizable portion of task_struct. Only
73829e48ce8SKees Cook 	 * scheduling-critical items should be added above here.
73929e48ce8SKees Cook 	 */
74029e48ce8SKees Cook 	randomized_struct_fields_start
74129e48ce8SKees Cook 
742f7e4217bSRoman Zippel 	void				*stack;
743ec1d2819SElena Reshetova 	refcount_t			usage;
7445eca1c10SIngo Molnar 	/* Per task flags (PF_*), defined further below: */
7455eca1c10SIngo Molnar 	unsigned int			flags;
74697dc32cdSWilliam Cohen 	unsigned int			ptrace;
7471da177e4SLinus Torvalds 
7482dd73a4fSPeter Williams #ifdef CONFIG_SMP
7493ca7a440SPeter Zijlstra 	int				on_cpu;
7508c4890d1SPeter Zijlstra 	struct __call_single_node	wake_entry;
751c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
7525eca1c10SIngo Molnar 	/* Current CPU: */
7535eca1c10SIngo Molnar 	unsigned int			cpu;
754c65eacbeSAndy Lutomirski #endif
75563b0e9edSMike Galbraith 	unsigned int			wakee_flips;
75662470419SMichael Wang 	unsigned long			wakee_flip_decay_ts;
75763b0e9edSMike Galbraith 	struct task_struct		*last_wakee;
758ac66f547SPeter Zijlstra 
75932e839ddSMel Gorman 	/*
76032e839ddSMel Gorman 	 * recent_used_cpu is initially set as the last CPU used by a task
76132e839ddSMel Gorman 	 * that wakes affine another task. Waker/wakee relationships can
76232e839ddSMel Gorman 	 * push tasks around a CPU where each wakeup moves to the next one.
76332e839ddSMel Gorman 	 * Tracking a recently used CPU allows a quick search for a recently
76432e839ddSMel Gorman 	 * used CPU that may be idle.
76532e839ddSMel Gorman 	 */
76632e839ddSMel Gorman 	int				recent_used_cpu;
767ac66f547SPeter Zijlstra 	int				wake_cpu;
7684866cde0SNick Piggin #endif
769fd2f4419SPeter Zijlstra 	int				on_rq;
77050e645a8SIngo Molnar 
7715eca1c10SIngo Molnar 	int				prio;
7725eca1c10SIngo Molnar 	int				static_prio;
7735eca1c10SIngo Molnar 	int				normal_prio;
774c7aceabaSRichard Kennedy 	unsigned int			rt_priority;
7755eca1c10SIngo Molnar 
7765522d5d5SIngo Molnar 	const struct sched_class	*sched_class;
77720b8a59fSIngo Molnar 	struct sched_entity		se;
778fa717060SPeter Zijlstra 	struct sched_rt_entity		rt;
7798a311c74SPeter Zijlstra 	struct sched_dl_entity		dl;
7808a311c74SPeter Zijlstra 
7818a311c74SPeter Zijlstra #ifdef CONFIG_SCHED_CORE
7828a311c74SPeter Zijlstra 	struct rb_node			core_node;
7838a311c74SPeter Zijlstra 	unsigned long			core_cookie;
784d2dfa17bSPeter Zijlstra 	unsigned int			core_occupation;
7858a311c74SPeter Zijlstra #endif
7868a311c74SPeter Zijlstra 
7878323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED
7888323f26cSPeter Zijlstra 	struct task_group		*sched_task_group;
7898323f26cSPeter Zijlstra #endif
7901da177e4SLinus Torvalds 
79169842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK
79213685c4aSQais Yousef 	/*
79313685c4aSQais Yousef 	 * Clamp values requested for a scheduling entity.
79413685c4aSQais Yousef 	 * Must be updated with task_rq_lock() held.
79513685c4aSQais Yousef 	 */
796e8f14172SPatrick Bellasi 	struct uclamp_se		uclamp_req[UCLAMP_CNT];
79713685c4aSQais Yousef 	/*
79813685c4aSQais Yousef 	 * Effective clamp values used for a scheduling entity.
79913685c4aSQais Yousef 	 * Must be updated with task_rq_lock() held.
80013685c4aSQais Yousef 	 */
80169842cbaSPatrick Bellasi 	struct uclamp_se		uclamp[UCLAMP_CNT];
80269842cbaSPatrick Bellasi #endif
80369842cbaSPatrick Bellasi 
804*ceeadb83SYafang Shao 	struct sched_statistics         stats;
805*ceeadb83SYafang Shao 
806e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS
8075eca1c10SIngo Molnar 	/* List of struct preempt_notifier: */
808e107be36SAvi Kivity 	struct hlist_head		preempt_notifiers;
809e107be36SAvi Kivity #endif
810e107be36SAvi Kivity 
8116c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE
8122056a782SJens Axboe 	unsigned int			btrace_seq;
8136c5c9341SAlexey Dobriyan #endif
8141da177e4SLinus Torvalds 
81597dc32cdSWilliam Cohen 	unsigned int			policy;
81629baa747SPeter Zijlstra 	int				nr_cpus_allowed;
8173bd37062SSebastian Andrzej Siewior 	const cpumask_t			*cpus_ptr;
818b90ca8baSWill Deacon 	cpumask_t			*user_cpus_ptr;
8193bd37062SSebastian Andrzej Siewior 	cpumask_t			cpus_mask;
8206d337eabSPeter Zijlstra 	void				*migration_pending;
82174d862b6SThomas Gleixner #ifdef CONFIG_SMP
822a7c81556SPeter Zijlstra 	unsigned short			migration_disabled;
823af449901SPeter Zijlstra #endif
824a7c81556SPeter Zijlstra 	unsigned short			migration_flags;
8251da177e4SLinus Torvalds 
826a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU
827e260be67SPaul E. McKenney 	int				rcu_read_lock_nesting;
8281d082fd0SPaul E. McKenney 	union rcu_special		rcu_read_unlock_special;
829f41d911fSPaul E. McKenney 	struct list_head		rcu_node_entry;
830a57eb940SPaul E. McKenney 	struct rcu_node			*rcu_blocked_node;
83128f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */
8325eca1c10SIngo Molnar 
8338315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU
8348315f422SPaul E. McKenney 	unsigned long			rcu_tasks_nvcsw;
835ccdd29ffSPaul E. McKenney 	u8				rcu_tasks_holdout;
836ccdd29ffSPaul E. McKenney 	u8				rcu_tasks_idx;
837176f8f7aSPaul E. McKenney 	int				rcu_tasks_idle_cpu;
838ccdd29ffSPaul E. McKenney 	struct list_head		rcu_tasks_holdout_list;
8398315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */
840e260be67SPaul E. McKenney 
841d5f177d3SPaul E. McKenney #ifdef CONFIG_TASKS_TRACE_RCU
842d5f177d3SPaul E. McKenney 	int				trc_reader_nesting;
843d5f177d3SPaul E. McKenney 	int				trc_ipi_to_cpu;
844276c4104SPaul E. McKenney 	union rcu_special		trc_reader_special;
845d5f177d3SPaul E. McKenney 	bool				trc_reader_checked;
846d5f177d3SPaul E. McKenney 	struct list_head		trc_holdout_list;
847d5f177d3SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_TRACE_RCU */
848d5f177d3SPaul E. McKenney 
8491da177e4SLinus Torvalds 	struct sched_info		sched_info;
8501da177e4SLinus Torvalds 
8511da177e4SLinus Torvalds 	struct list_head		tasks;
852806c09a7SDario Faggioli #ifdef CONFIG_SMP
853917b627dSGregory Haskins 	struct plist_node		pushable_tasks;
8541baca4ceSJuri Lelli 	struct rb_node			pushable_dl_tasks;
855806c09a7SDario Faggioli #endif
8561da177e4SLinus Torvalds 
8575eca1c10SIngo Molnar 	struct mm_struct		*mm;
8585eca1c10SIngo Molnar 	struct mm_struct		*active_mm;
859314ff785SIngo Molnar 
860314ff785SIngo Molnar 	/* Per-thread vma caching: */
861314ff785SIngo Molnar 	struct vmacache			vmacache;
862314ff785SIngo Molnar 
8635eca1c10SIngo Molnar #ifdef SPLIT_RSS_COUNTING
86434e55232SKAMEZAWA Hiroyuki 	struct task_rss_stat		rss_stat;
86534e55232SKAMEZAWA Hiroyuki #endif
86697dc32cdSWilliam Cohen 	int				exit_state;
8675eca1c10SIngo Molnar 	int				exit_code;
8685eca1c10SIngo Molnar 	int				exit_signal;
8695eca1c10SIngo Molnar 	/* The signal sent when the parent dies: */
8705eca1c10SIngo Molnar 	int				pdeath_signal;
8715eca1c10SIngo Molnar 	/* JOBCTL_*, siglock protected: */
8725eca1c10SIngo Molnar 	unsigned long			jobctl;
8739b89f6baSAndrei Epure 
8745eca1c10SIngo Molnar 	/* Used for emulating ABI behavior of previous Linux versions: */
87597dc32cdSWilliam Cohen 	unsigned int			personality;
8769b89f6baSAndrei Epure 
8775eca1c10SIngo Molnar 	/* Scheduler bits, serialized by scheduler locks: */
878ca94c442SLennart Poettering 	unsigned			sched_reset_on_fork:1;
879a8e4f2eaSPeter Zijlstra 	unsigned			sched_contributes_to_load:1;
880ff303e66SPeter Zijlstra 	unsigned			sched_migrated:1;
881eb414681SJohannes Weiner #ifdef CONFIG_PSI
882eb414681SJohannes Weiner 	unsigned			sched_psi_wake_requeue:1;
883eb414681SJohannes Weiner #endif
884eb414681SJohannes Weiner 
8855eca1c10SIngo Molnar 	/* Force alignment to the next boundary: */
8865eca1c10SIngo Molnar 	unsigned			:0;
887be958bdcSPeter Zijlstra 
8885eca1c10SIngo Molnar 	/* Unserialized, strictly 'current' */
8895eca1c10SIngo Molnar 
890f97bb527SPeter Zijlstra 	/*
891f97bb527SPeter Zijlstra 	 * This field must not be in the scheduler word above due to wakelist
892f97bb527SPeter Zijlstra 	 * queueing no longer being serialized by p->on_cpu. However:
893f97bb527SPeter Zijlstra 	 *
894f97bb527SPeter Zijlstra 	 * p->XXX = X;			ttwu()
895f97bb527SPeter Zijlstra 	 * schedule()			  if (p->on_rq && ..) // false
896f97bb527SPeter Zijlstra 	 *   smp_mb__after_spinlock();	  if (smp_load_acquire(&p->on_cpu) && //true
897f97bb527SPeter Zijlstra 	 *   deactivate_task()		      ttwu_queue_wakelist())
898f97bb527SPeter Zijlstra 	 *     p->on_rq = 0;			p->sched_remote_wakeup = Y;
899f97bb527SPeter Zijlstra 	 *
900f97bb527SPeter Zijlstra 	 * guarantees all stores of 'current' are visible before
901f97bb527SPeter Zijlstra 	 * ->sched_remote_wakeup gets used, so it can be in this word.
902f97bb527SPeter Zijlstra 	 */
903f97bb527SPeter Zijlstra 	unsigned			sched_remote_wakeup:1;
904f97bb527SPeter Zijlstra 
9055eca1c10SIngo Molnar 	/* Bit to tell LSMs we're in execve(): */
9065eca1c10SIngo Molnar 	unsigned			in_execve:1;
907be958bdcSPeter Zijlstra 	unsigned			in_iowait:1;
9085eca1c10SIngo Molnar #ifndef TIF_RESTORE_SIGMASK
9097e781418SAndy Lutomirski 	unsigned			restore_sigmask:1;
9107e781418SAndy Lutomirski #endif
911626ebc41STejun Heo #ifdef CONFIG_MEMCG
91229ef680aSMichal Hocko 	unsigned			in_user_fault:1;
913127424c8SJohannes Weiner #endif
914ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK
915ff303e66SPeter Zijlstra 	unsigned			brk_randomized:1;
916ff303e66SPeter Zijlstra #endif
91777f88796STejun Heo #ifdef CONFIG_CGROUPS
91877f88796STejun Heo 	/* disallow userland-initiated cgroup migration */
91977f88796STejun Heo 	unsigned			no_cgroup_migration:1;
92076f969e8SRoman Gushchin 	/* task is frozen/stopped (used by the cgroup freezer) */
92176f969e8SRoman Gushchin 	unsigned			frozen:1;
92277f88796STejun Heo #endif
923d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP
924d09d8df3SJosef Bacik 	unsigned			use_memdelay:1;
925d09d8df3SJosef Bacik #endif
9261066d1b6SYafang Shao #ifdef CONFIG_PSI
9271066d1b6SYafang Shao 	/* Stalled due to lack of memory */
9281066d1b6SYafang Shao 	unsigned			in_memstall:1;
9291066d1b6SYafang Shao #endif
9308e9b16c4SSergei Trofimovich #ifdef CONFIG_PAGE_OWNER
9318e9b16c4SSergei Trofimovich 	/* Used by page_owner=on to detect recursion in page tracking. */
9328e9b16c4SSergei Trofimovich 	unsigned			in_page_owner:1;
9338e9b16c4SSergei Trofimovich #endif
934b542e383SThomas Gleixner #ifdef CONFIG_EVENTFD
935b542e383SThomas Gleixner 	/* Recursion prevention for eventfd_signal() */
936b542e383SThomas Gleixner 	unsigned			in_eventfd_signal:1;
937b542e383SThomas Gleixner #endif
9386f185c29SVladimir Davydov 
9395eca1c10SIngo Molnar 	unsigned long			atomic_flags; /* Flags requiring atomic access. */
9401d4457f9SKees Cook 
941f56141e3SAndy Lutomirski 	struct restart_block		restart_block;
942f56141e3SAndy Lutomirski 
9431da177e4SLinus Torvalds 	pid_t				pid;
9441da177e4SLinus Torvalds 	pid_t				tgid;
9450a425405SArjan van de Ven 
946050e9baaSLinus Torvalds #ifdef CONFIG_STACKPROTECTOR
9475eca1c10SIngo Molnar 	/* Canary value for the -fstack-protector GCC feature: */
9480a425405SArjan van de Ven 	unsigned long			stack_canary;
9491314562aSHiroshi Shimamoto #endif
9501da177e4SLinus Torvalds 	/*
9515eca1c10SIngo Molnar 	 * Pointers to the (original) parent process, youngest child, younger sibling,
9521da177e4SLinus Torvalds 	 * older sibling, respectively.  (p->father can be replaced with
953f470021aSRoland McGrath 	 * p->real_parent->pid)
9541da177e4SLinus Torvalds 	 */
9555eca1c10SIngo Molnar 
9565eca1c10SIngo Molnar 	/* Real parent process: */
9575eca1c10SIngo Molnar 	struct task_struct __rcu	*real_parent;
9585eca1c10SIngo Molnar 
9595eca1c10SIngo Molnar 	/* Recipient of SIGCHLD, wait4() reports: */
9605eca1c10SIngo Molnar 	struct task_struct __rcu	*parent;
9611da177e4SLinus Torvalds 
962f470021aSRoland McGrath 	/*
9635eca1c10SIngo Molnar 	 * Children/sibling form the list of natural children:
9645eca1c10SIngo Molnar 	 */
9655eca1c10SIngo Molnar 	struct list_head		children;
9665eca1c10SIngo Molnar 	struct list_head		sibling;
9675eca1c10SIngo Molnar 	struct task_struct		*group_leader;
9685eca1c10SIngo Molnar 
9695eca1c10SIngo Molnar 	/*
9705eca1c10SIngo Molnar 	 * 'ptraced' is the list of tasks this task is using ptrace() on.
9715eca1c10SIngo Molnar 	 *
972f470021aSRoland McGrath 	 * This includes both natural children and PTRACE_ATTACH targets.
9735eca1c10SIngo Molnar 	 * 'ptrace_entry' is this task's link on the p->parent->ptraced list.
974f470021aSRoland McGrath 	 */
975f470021aSRoland McGrath 	struct list_head		ptraced;
976f470021aSRoland McGrath 	struct list_head		ptrace_entry;
977f470021aSRoland McGrath 
9781da177e4SLinus Torvalds 	/* PID/PID hash table linkage. */
9792c470475SEric W. Biederman 	struct pid			*thread_pid;
9802c470475SEric W. Biederman 	struct hlist_node		pid_links[PIDTYPE_MAX];
98147e65328SOleg Nesterov 	struct list_head		thread_group;
9820c740d0aSOleg Nesterov 	struct list_head		thread_node;
9831da177e4SLinus Torvalds 
9845eca1c10SIngo Molnar 	struct completion		*vfork_done;
9851da177e4SLinus Torvalds 
9865eca1c10SIngo Molnar 	/* CLONE_CHILD_SETTID: */
9875eca1c10SIngo Molnar 	int __user			*set_child_tid;
9885eca1c10SIngo Molnar 
9895eca1c10SIngo Molnar 	/* CLONE_CHILD_CLEARTID: */
9905eca1c10SIngo Molnar 	int __user			*clear_child_tid;
9915eca1c10SIngo Molnar 
9923bfe6106SJens Axboe 	/* PF_IO_WORKER */
9933bfe6106SJens Axboe 	void				*pf_io_worker;
9943bfe6106SJens Axboe 
9955eca1c10SIngo Molnar 	u64				utime;
9965eca1c10SIngo Molnar 	u64				stime;
99740565b5aSStanislaw Gruszka #ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME
9985eca1c10SIngo Molnar 	u64				utimescaled;
9995eca1c10SIngo Molnar 	u64				stimescaled;
100040565b5aSStanislaw Gruszka #endif
100116a6d9beSFrederic Weisbecker 	u64				gtime;
10029d7fb042SPeter Zijlstra 	struct prev_cputime		prev_cputime;
10036a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
1004bac5b6b6SFrederic Weisbecker 	struct vtime			vtime;
10056a61671bSFrederic Weisbecker #endif
1006d027d45dSFrederic Weisbecker 
1007d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL
1008f009a7a7SFrederic Weisbecker 	atomic_t			tick_dep_mask;
1009d027d45dSFrederic Weisbecker #endif
10105eca1c10SIngo Molnar 	/* Context switch counts: */
10115eca1c10SIngo Molnar 	unsigned long			nvcsw;
10125eca1c10SIngo Molnar 	unsigned long			nivcsw;
10135eca1c10SIngo Molnar 
10145eca1c10SIngo Molnar 	/* Monotonic time in nsecs: */
10155eca1c10SIngo Molnar 	u64				start_time;
10165eca1c10SIngo Molnar 
10175eca1c10SIngo Molnar 	/* Boot based time in nsecs: */
1018cf25e24dSPeter Zijlstra 	u64				start_boottime;
10195eca1c10SIngo Molnar 
10205eca1c10SIngo Molnar 	/* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */
10215eca1c10SIngo Molnar 	unsigned long			min_flt;
10225eca1c10SIngo Molnar 	unsigned long			maj_flt;
10231da177e4SLinus Torvalds 
10242b69942fSThomas Gleixner 	/* Empty if CONFIG_POSIX_CPUTIMERS=n */
10252b69942fSThomas Gleixner 	struct posix_cputimers		posix_cputimers;
10261da177e4SLinus Torvalds 
10271fb497ddSThomas Gleixner #ifdef CONFIG_POSIX_CPU_TIMERS_TASK_WORK
10281fb497ddSThomas Gleixner 	struct posix_cputimers_work	posix_cputimers_work;
10291fb497ddSThomas Gleixner #endif
10301fb497ddSThomas Gleixner 
10315eca1c10SIngo Molnar 	/* Process credentials: */
10325eca1c10SIngo Molnar 
10335eca1c10SIngo Molnar 	/* Tracer's credentials at attach: */
10345eca1c10SIngo Molnar 	const struct cred __rcu		*ptracer_cred;
10355eca1c10SIngo Molnar 
10365eca1c10SIngo Molnar 	/* Objective and real subjective task credentials (COW): */
10375eca1c10SIngo Molnar 	const struct cred __rcu		*real_cred;
10385eca1c10SIngo Molnar 
10395eca1c10SIngo Molnar 	/* Effective (overridable) subjective task credentials (COW): */
10405eca1c10SIngo Molnar 	const struct cred __rcu		*cred;
10415eca1c10SIngo Molnar 
10427743c48eSDavid Howells #ifdef CONFIG_KEYS
10437743c48eSDavid Howells 	/* Cached requested key. */
10447743c48eSDavid Howells 	struct key			*cached_requested_key;
10457743c48eSDavid Howells #endif
10467743c48eSDavid Howells 
10475eca1c10SIngo Molnar 	/*
10485eca1c10SIngo Molnar 	 * executable name, excluding path.
10495eca1c10SIngo Molnar 	 *
10505eca1c10SIngo Molnar 	 * - normally initialized setup_new_exec()
10515eca1c10SIngo Molnar 	 * - access it with [gs]et_task_comm()
10525eca1c10SIngo Molnar 	 * - lock it with task_lock()
10535eca1c10SIngo Molnar 	 */
10545eca1c10SIngo Molnar 	char				comm[TASK_COMM_LEN];
10555eca1c10SIngo Molnar 
1056756daf26SNeilBrown 	struct nameidata		*nameidata;
10575eca1c10SIngo Molnar 
10583d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC
10591da177e4SLinus Torvalds 	struct sysv_sem			sysvsem;
1060ab602f79SJack Miller 	struct sysv_shm			sysvshm;
10613d5b6fccSAlexey Dobriyan #endif
1062e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK
106382a1fcb9SIngo Molnar 	unsigned long			last_switch_count;
1064a2e51445SDmitry Vyukov 	unsigned long			last_switch_time;
106582a1fcb9SIngo Molnar #endif
10665eca1c10SIngo Molnar 	/* Filesystem information: */
10671da177e4SLinus Torvalds 	struct fs_struct		*fs;
10685eca1c10SIngo Molnar 
10695eca1c10SIngo Molnar 	/* Open file information: */
10701da177e4SLinus Torvalds 	struct files_struct		*files;
10715eca1c10SIngo Molnar 
10720f212204SJens Axboe #ifdef CONFIG_IO_URING
10730f212204SJens Axboe 	struct io_uring_task		*io_uring;
10740f212204SJens Axboe #endif
10750f212204SJens Axboe 
10765eca1c10SIngo Molnar 	/* Namespaces: */
1077ab516013SSerge E. Hallyn 	struct nsproxy			*nsproxy;
10785eca1c10SIngo Molnar 
10795eca1c10SIngo Molnar 	/* Signal handlers: */
10801da177e4SLinus Torvalds 	struct signal_struct		*signal;
1081913292c9SMadhuparna Bhowmik 	struct sighand_struct __rcu		*sighand;
10825eca1c10SIngo Molnar 	sigset_t			blocked;
10835eca1c10SIngo Molnar 	sigset_t			real_blocked;
10845eca1c10SIngo Molnar 	/* Restored if set_restore_sigmask() was used: */
10855eca1c10SIngo Molnar 	sigset_t			saved_sigmask;
10861da177e4SLinus Torvalds 	struct sigpending		pending;
10871da177e4SLinus Torvalds 	unsigned long			sas_ss_sp;
10881da177e4SLinus Torvalds 	size_t				sas_ss_size;
10895eca1c10SIngo Molnar 	unsigned int			sas_ss_flags;
10902e01fabeSOleg Nesterov 
109167d12145SAl Viro 	struct callback_head		*task_works;
1092e73f8959SOleg Nesterov 
10934b7d248bSRichard Guy Briggs #ifdef CONFIG_AUDIT
1094bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL
10955f3d544fSRichard Guy Briggs 	struct audit_context		*audit_context;
10965f3d544fSRichard Guy Briggs #endif
1097e1760bd5SEric W. Biederman 	kuid_t				loginuid;
10984746ec5bSEric Paris 	unsigned int			sessionid;
1099bfef93a5SAl Viro #endif
1100932ecebbSWill Drewry 	struct seccomp			seccomp;
11011446e1dfSGabriel Krisman Bertazi 	struct syscall_user_dispatch	syscall_dispatch;
11021da177e4SLinus Torvalds 
11035eca1c10SIngo Molnar 	/* Thread group tracking: */
1104d1e7fd64SEric W. Biederman 	u64				parent_exec_id;
1105d1e7fd64SEric W. Biederman 	u64				self_exec_id;
11065eca1c10SIngo Molnar 
11075eca1c10SIngo Molnar 	/* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */
11081da177e4SLinus Torvalds 	spinlock_t			alloc_lock;
11091da177e4SLinus Torvalds 
1110b29739f9SIngo Molnar 	/* Protection of the PI data structures: */
11111d615482SThomas Gleixner 	raw_spinlock_t			pi_lock;
1112b29739f9SIngo Molnar 
111376751049SPeter Zijlstra 	struct wake_q_node		wake_q;
111476751049SPeter Zijlstra 
111523f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES
11165eca1c10SIngo Molnar 	/* PI waiters blocked on a rt_mutex held by this task: */
1117a23ba907SDavidlohr Bueso 	struct rb_root_cached		pi_waiters;
1118e96a7705SXunlei Pang 	/* Updated under owner's pi_lock and rq lock */
1119e96a7705SXunlei Pang 	struct task_struct		*pi_top_task;
11205eca1c10SIngo Molnar 	/* Deadlock detection and priority inheritance handling: */
112123f78d4aSIngo Molnar 	struct rt_mutex_waiter		*pi_blocked_on;
112223f78d4aSIngo Molnar #endif
112323f78d4aSIngo Molnar 
1124408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES
11255eca1c10SIngo Molnar 	/* Mutex deadlock detection: */
1126408894eeSIngo Molnar 	struct mutex_waiter		*blocked_on;
1127408894eeSIngo Molnar #endif
11285eca1c10SIngo Molnar 
1129312364f3SDaniel Vetter #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
1130312364f3SDaniel Vetter 	int				non_block_count;
1131312364f3SDaniel Vetter #endif
1132312364f3SDaniel Vetter 
1133de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS
11340584df9cSMarco Elver 	struct irqtrace_events		irqtrace;
1135de8f5e4fSPeter Zijlstra 	unsigned int			hardirq_threaded;
1136c86e9b98SPeter Zijlstra 	u64				hardirq_chain_key;
1137fa1452e8SHiroshi Shimamoto 	int				softirqs_enabled;
1138de30a2b3SIngo Molnar 	int				softirq_context;
113940db1739SSebastian Andrzej Siewior 	int				irq_config;
1140de30a2b3SIngo Molnar #endif
1141728b478dSThomas Gleixner #ifdef CONFIG_PREEMPT_RT
1142728b478dSThomas Gleixner 	int				softirq_disable_cnt;
1143728b478dSThomas Gleixner #endif
11445eca1c10SIngo Molnar 
1145fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP
1146bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH			48UL
1147fbb9ce95SIngo Molnar 	u64				curr_chain_key;
1148fbb9ce95SIngo Molnar 	int				lockdep_depth;
1149fbb9ce95SIngo Molnar 	unsigned int			lockdep_recursion;
1150c7aceabaSRichard Kennedy 	struct held_lock		held_locks[MAX_LOCK_DEPTH];
1151fbb9ce95SIngo Molnar #endif
11525eca1c10SIngo Molnar 
11535cf53f3cSElena Petrova #if defined(CONFIG_UBSAN) && !defined(CONFIG_UBSAN_TRAP)
1154c6d30853SAndrey Ryabinin 	unsigned int			in_ubsan;
1155c6d30853SAndrey Ryabinin #endif
1156408894eeSIngo Molnar 
11575eca1c10SIngo Molnar 	/* Journalling filesystem info: */
11581da177e4SLinus Torvalds 	void				*journal_info;
11591da177e4SLinus Torvalds 
11605eca1c10SIngo Molnar 	/* Stacked block device info: */
1161bddd87c7SAkinobu Mita 	struct bio_list			*bio_list;
1162d89d8796SNeil Brown 
116373c10101SJens Axboe #ifdef CONFIG_BLOCK
11645eca1c10SIngo Molnar 	/* Stack plugging: */
116573c10101SJens Axboe 	struct blk_plug			*plug;
116673c10101SJens Axboe #endif
116773c10101SJens Axboe 
11685eca1c10SIngo Molnar 	/* VM state: */
11691da177e4SLinus Torvalds 	struct reclaim_state		*reclaim_state;
11701da177e4SLinus Torvalds 
11711da177e4SLinus Torvalds 	struct backing_dev_info		*backing_dev_info;
11721da177e4SLinus Torvalds 
11731da177e4SLinus Torvalds 	struct io_context		*io_context;
11741da177e4SLinus Torvalds 
11755e1f0f09SMel Gorman #ifdef CONFIG_COMPACTION
11765e1f0f09SMel Gorman 	struct capture_control		*capture_control;
11775e1f0f09SMel Gorman #endif
11785eca1c10SIngo Molnar 	/* Ptrace state: */
11791da177e4SLinus Torvalds 	unsigned long			ptrace_message;
1180ae7795bcSEric W. Biederman 	kernel_siginfo_t		*last_siginfo;
11815eca1c10SIngo Molnar 
11827c3ab738SAndrew Morton 	struct task_io_accounting	ioac;
1183eb414681SJohannes Weiner #ifdef CONFIG_PSI
1184eb414681SJohannes Weiner 	/* Pressure stall state */
1185eb414681SJohannes Weiner 	unsigned int			psi_flags;
1186eb414681SJohannes Weiner #endif
11875eca1c10SIngo Molnar #ifdef CONFIG_TASK_XACCT
11885eca1c10SIngo Molnar 	/* Accumulated RSS usage: */
11895eca1c10SIngo Molnar 	u64				acct_rss_mem1;
11905eca1c10SIngo Molnar 	/* Accumulated virtual memory usage: */
11915eca1c10SIngo Molnar 	u64				acct_vm_mem1;
11925eca1c10SIngo Molnar 	/* stime + utime since last update: */
11935eca1c10SIngo Molnar 	u64				acct_timexpd;
11941da177e4SLinus Torvalds #endif
11951da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS
11965eca1c10SIngo Molnar 	/* Protected by ->alloc_lock: */
11975eca1c10SIngo Molnar 	nodemask_t			mems_allowed;
11983b03706fSIngo Molnar 	/* Sequence number to catch updates: */
1199b7505861SAhmed S. Darwish 	seqcount_spinlock_t		mems_allowed_seq;
1200825a46afSPaul Jackson 	int				cpuset_mem_spread_rotor;
12016adef3ebSJack Steiner 	int				cpuset_slab_spread_rotor;
12021da177e4SLinus Torvalds #endif
1203ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS
12045eca1c10SIngo Molnar 	/* Control Group info protected by css_set_lock: */
12052c392b8cSArnd Bergmann 	struct css_set __rcu		*cgroups;
12065eca1c10SIngo Molnar 	/* cg_list protected by css_set_lock and tsk->alloc_lock: */
1207817929ecSPaul Menage 	struct list_head		cg_list;
1208ddbcc7e8SPaul Menage #endif
1209e6d42931SJohannes Weiner #ifdef CONFIG_X86_CPU_RESCTRL
12100734ded1SVikas Shivappa 	u32				closid;
1211d6aaba61SVikas Shivappa 	u32				rmid;
1212e02737d5SFenghua Yu #endif
121342b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX
12140771dfefSIngo Molnar 	struct robust_list_head __user	*robust_list;
121534f192c6SIngo Molnar #ifdef CONFIG_COMPAT
121634f192c6SIngo Molnar 	struct compat_robust_list_head __user *compat_robust_list;
121734f192c6SIngo Molnar #endif
1218c87e2837SIngo Molnar 	struct list_head		pi_state_list;
1219c87e2837SIngo Molnar 	struct futex_pi_state		*pi_state_cache;
12203f186d97SThomas Gleixner 	struct mutex			futex_exit_mutex;
12213d4775dfSThomas Gleixner 	unsigned int			futex_state;
122242b2dd0aSAlexey Dobriyan #endif
1223cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS
12248dc85d54SPeter Zijlstra 	struct perf_event_context	*perf_event_ctxp[perf_nr_task_contexts];
1225cdd6c482SIngo Molnar 	struct mutex			perf_event_mutex;
1226cdd6c482SIngo Molnar 	struct list_head		perf_event_list;
1227a63eaf34SPaul Mackerras #endif
12288f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT
12298f47b187SThomas Gleixner 	unsigned long			preempt_disable_ip;
12308f47b187SThomas Gleixner #endif
1231c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA
12325eca1c10SIngo Molnar 	/* Protected by alloc_lock: */
12335eca1c10SIngo Molnar 	struct mempolicy		*mempolicy;
123445816682SVlastimil Babka 	short				il_prev;
1235207205a2SEric Dumazet 	short				pref_node_fork;
1236c7aceabaSRichard Kennedy #endif
1237cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING
1238cbee9f88SPeter Zijlstra 	int				numa_scan_seq;
1239cbee9f88SPeter Zijlstra 	unsigned int			numa_scan_period;
1240598f0ec0SMel Gorman 	unsigned int			numa_scan_period_max;
1241de1c9ce6SRik van Riel 	int				numa_preferred_nid;
12426b9a7460SMel Gorman 	unsigned long			numa_migrate_retry;
12435eca1c10SIngo Molnar 	/* Migration stamp: */
12445eca1c10SIngo Molnar 	u64				node_stamp;
12457e2703e6SRik van Riel 	u64				last_task_numa_placement;
12467e2703e6SRik van Riel 	u64				last_sum_exec_runtime;
1247cbee9f88SPeter Zijlstra 	struct callback_head		numa_work;
1248f809ca9aSMel Gorman 
1249cb361d8cSJann Horn 	/*
1250cb361d8cSJann Horn 	 * This pointer is only modified for current in syscall and
1251cb361d8cSJann Horn 	 * pagefault context (and for tasks being destroyed), so it can be read
1252cb361d8cSJann Horn 	 * from any of the following contexts:
1253cb361d8cSJann Horn 	 *  - RCU read-side critical section
1254cb361d8cSJann Horn 	 *  - current->numa_group from everywhere
1255cb361d8cSJann Horn 	 *  - task's runqueue locked, task not running
1256cb361d8cSJann Horn 	 */
1257cb361d8cSJann Horn 	struct numa_group __rcu		*numa_group;
12588c8a743cSPeter Zijlstra 
1259745d6147SMel Gorman 	/*
126044dba3d5SIulia Manda 	 * numa_faults is an array split into four regions:
126144dba3d5SIulia Manda 	 * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer
126244dba3d5SIulia Manda 	 * in this precise order.
126344dba3d5SIulia Manda 	 *
126444dba3d5SIulia Manda 	 * faults_memory: Exponential decaying average of faults on a per-node
126544dba3d5SIulia Manda 	 * basis. Scheduling placement decisions are made based on these
126644dba3d5SIulia Manda 	 * counts. The values remain static for the duration of a PTE scan.
126744dba3d5SIulia Manda 	 * faults_cpu: Track the nodes the process was running on when a NUMA
126844dba3d5SIulia Manda 	 * hinting fault was incurred.
126944dba3d5SIulia Manda 	 * faults_memory_buffer and faults_cpu_buffer: Record faults per node
127044dba3d5SIulia Manda 	 * during the current scan window. When the scan completes, the counts
127144dba3d5SIulia Manda 	 * in faults_memory and faults_cpu decay and these values are copied.
1272745d6147SMel Gorman 	 */
127344dba3d5SIulia Manda 	unsigned long			*numa_faults;
127483e1d2cdSMel Gorman 	unsigned long			total_numa_faults;
1275745d6147SMel Gorman 
1276745d6147SMel Gorman 	/*
127704bb2f94SRik van Riel 	 * numa_faults_locality tracks if faults recorded during the last
1278074c2381SMel Gorman 	 * scan window were remote/local or failed to migrate. The task scan
1279074c2381SMel Gorman 	 * period is adapted based on the locality of the faults with different
1280074c2381SMel Gorman 	 * weights depending on whether they were shared or private faults
128104bb2f94SRik van Riel 	 */
1282074c2381SMel Gorman 	unsigned long			numa_faults_locality[3];
128304bb2f94SRik van Riel 
1284b32e86b4SIngo Molnar 	unsigned long			numa_pages_migrated;
1285cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */
1286cbee9f88SPeter Zijlstra 
1287d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ
1288d7822b1eSMathieu Desnoyers 	struct rseq __user *rseq;
1289d7822b1eSMathieu Desnoyers 	u32 rseq_sig;
1290d7822b1eSMathieu Desnoyers 	/*
1291d7822b1eSMathieu Desnoyers 	 * RmW on rseq_event_mask must be performed atomically
1292d7822b1eSMathieu Desnoyers 	 * with respect to preemption.
1293d7822b1eSMathieu Desnoyers 	 */
1294d7822b1eSMathieu Desnoyers 	unsigned long rseq_event_mask;
1295d7822b1eSMathieu Desnoyers #endif
1296d7822b1eSMathieu Desnoyers 
129772b252aeSMel Gorman 	struct tlbflush_unmap_batch	tlb_ubc;
129872b252aeSMel Gorman 
12993fbd7ee2SEric W. Biederman 	union {
13003fbd7ee2SEric W. Biederman 		refcount_t		rcu_users;
1301e56d0903SIngo Molnar 		struct rcu_head		rcu;
13023fbd7ee2SEric W. Biederman 	};
1303b92ce558SJens Axboe 
13045eca1c10SIngo Molnar 	/* Cache last used pipe for splice(): */
1305b92ce558SJens Axboe 	struct pipe_inode_info		*splice_pipe;
13065640f768SEric Dumazet 
13075640f768SEric Dumazet 	struct page_frag		task_frag;
13085640f768SEric Dumazet 
1309ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT
1310ca74e92bSShailabh Nagar 	struct task_delay_info		*delays;
1311ca74e92bSShailabh Nagar #endif
131247913d4eSIngo Molnar 
1313f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION
1314f4f154fdSAkinobu Mita 	int				make_it_fail;
13159049f2f6SAkinobu Mita 	unsigned int			fail_nth;
1316f4f154fdSAkinobu Mita #endif
13179d823e8fSWu Fengguang 	/*
13185eca1c10SIngo Molnar 	 * When (nr_dirtied >= nr_dirtied_pause), it's time to call
13195eca1c10SIngo Molnar 	 * balance_dirty_pages() for a dirty throttling pause:
13209d823e8fSWu Fengguang 	 */
13219d823e8fSWu Fengguang 	int				nr_dirtied;
13229d823e8fSWu Fengguang 	int				nr_dirtied_pause;
13235eca1c10SIngo Molnar 	/* Start of a write-and-pause period: */
13245eca1c10SIngo Molnar 	unsigned long			dirty_paused_when;
13259d823e8fSWu Fengguang 
13269745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP
13279745512cSArjan van de Ven 	int				latency_record_count;
13289745512cSArjan van de Ven 	struct latency_record		latency_record[LT_SAVECOUNT];
13299745512cSArjan van de Ven #endif
13306976675dSArjan van de Ven 	/*
13315eca1c10SIngo Molnar 	 * Time slack values; these are used to round up poll() and
13326976675dSArjan van de Ven 	 * select() etc timeout values. These are in nanoseconds.
13336976675dSArjan van de Ven 	 */
1334da8b44d5SJohn Stultz 	u64				timer_slack_ns;
1335da8b44d5SJohn Stultz 	u64				default_timer_slack_ns;
1336f8d570a4SDavid Miller 
1337d73b4936SAndrey Konovalov #if defined(CONFIG_KASAN_GENERIC) || defined(CONFIG_KASAN_SW_TAGS)
13380b24beccSAndrey Ryabinin 	unsigned int			kasan_depth;
13390b24beccSAndrey Ryabinin #endif
134092c209acSMarco Elver 
1341dfd402a4SMarco Elver #ifdef CONFIG_KCSAN
1342dfd402a4SMarco Elver 	struct kcsan_ctx		kcsan_ctx;
134392c209acSMarco Elver #ifdef CONFIG_TRACE_IRQFLAGS
134492c209acSMarco Elver 	struct irqtrace_events		kcsan_save_irqtrace;
134592c209acSMarco Elver #endif
1346dfd402a4SMarco Elver #endif
13475eca1c10SIngo Molnar 
1348393824f6SPatricia Alfonso #if IS_ENABLED(CONFIG_KUNIT)
1349393824f6SPatricia Alfonso 	struct kunit			*kunit_test;
1350393824f6SPatricia Alfonso #endif
1351393824f6SPatricia Alfonso 
1352fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER
13535eca1c10SIngo Molnar 	/* Index of current stored address in ret_stack: */
1354f201ae23SFrederic Weisbecker 	int				curr_ret_stack;
135539eb456dSSteven Rostedt (VMware) 	int				curr_ret_depth;
13565eca1c10SIngo Molnar 
13575eca1c10SIngo Molnar 	/* Stack of return addresses for return function tracing: */
1358f201ae23SFrederic Weisbecker 	struct ftrace_ret_stack		*ret_stack;
13595eca1c10SIngo Molnar 
13605eca1c10SIngo Molnar 	/* Timestamp for last schedule: */
13618aef2d28SSteven Rostedt 	unsigned long long		ftrace_timestamp;
13625eca1c10SIngo Molnar 
1363f201ae23SFrederic Weisbecker 	/*
1364f201ae23SFrederic Weisbecker 	 * Number of functions that haven't been traced
13655eca1c10SIngo Molnar 	 * because of depth overrun:
1366f201ae23SFrederic Weisbecker 	 */
1367f201ae23SFrederic Weisbecker 	atomic_t			trace_overrun;
13685eca1c10SIngo Molnar 
13695eca1c10SIngo Molnar 	/* Pause tracing: */
1370380c4b14SFrederic Weisbecker 	atomic_t			tracing_graph_pause;
1371f201ae23SFrederic Weisbecker #endif
13725eca1c10SIngo Molnar 
1373ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING
13745eca1c10SIngo Molnar 	/* State flags for use by tracers: */
1375ea4e2bc4SSteven Rostedt 	unsigned long			trace;
13765eca1c10SIngo Molnar 
13775eca1c10SIngo Molnar 	/* Bitmask and counter of trace recursion: */
1378261842b7SSteven Rostedt 	unsigned long			trace_recursion;
1379261842b7SSteven Rostedt #endif /* CONFIG_TRACING */
13805eca1c10SIngo Molnar 
13815c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV
1382eec028c9SAndrey Konovalov 	/* See kernel/kcov.c for more details. */
1383eec028c9SAndrey Konovalov 
13845eca1c10SIngo Molnar 	/* Coverage collection mode enabled for this task (0 if disabled): */
13850ed557aaSMark Rutland 	unsigned int			kcov_mode;
13865eca1c10SIngo Molnar 
13875eca1c10SIngo Molnar 	/* Size of the kcov_area: */
13885eca1c10SIngo Molnar 	unsigned int			kcov_size;
13895eca1c10SIngo Molnar 
13905eca1c10SIngo Molnar 	/* Buffer for coverage collection: */
13915c9a8750SDmitry Vyukov 	void				*kcov_area;
13925eca1c10SIngo Molnar 
13935eca1c10SIngo Molnar 	/* KCOV descriptor wired with this task or NULL: */
13945c9a8750SDmitry Vyukov 	struct kcov			*kcov;
1395eec028c9SAndrey Konovalov 
1396eec028c9SAndrey Konovalov 	/* KCOV common handle for remote coverage collection: */
1397eec028c9SAndrey Konovalov 	u64				kcov_handle;
1398eec028c9SAndrey Konovalov 
1399eec028c9SAndrey Konovalov 	/* KCOV sequence number: */
1400eec028c9SAndrey Konovalov 	int				kcov_sequence;
14015ff3b30aSAndrey Konovalov 
14025ff3b30aSAndrey Konovalov 	/* Collect coverage from softirq context: */
14035ff3b30aSAndrey Konovalov 	unsigned int			kcov_softirq;
14045c9a8750SDmitry Vyukov #endif
14055eca1c10SIngo Molnar 
14066f185c29SVladimir Davydov #ifdef CONFIG_MEMCG
1407626ebc41STejun Heo 	struct mem_cgroup		*memcg_in_oom;
1408626ebc41STejun Heo 	gfp_t				memcg_oom_gfp_mask;
1409626ebc41STejun Heo 	int				memcg_oom_order;
1410b23afb93STejun Heo 
14115eca1c10SIngo Molnar 	/* Number of pages to reclaim on returning to userland: */
1412b23afb93STejun Heo 	unsigned int			memcg_nr_pages_over_high;
1413d46eb14bSShakeel Butt 
1414d46eb14bSShakeel Butt 	/* Used by memcontrol for targeted memcg charge: */
1415d46eb14bSShakeel Butt 	struct mem_cgroup		*active_memcg;
1416569b846dSKAMEZAWA Hiroyuki #endif
14175eca1c10SIngo Molnar 
1418d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP
1419d09d8df3SJosef Bacik 	struct request_queue		*throttle_queue;
1420d09d8df3SJosef Bacik #endif
1421d09d8df3SJosef Bacik 
14220326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES
14230326f5a9SSrikar Dronamraju 	struct uprobe_task		*utask;
14240326f5a9SSrikar Dronamraju #endif
1425cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE)
1426cafe5635SKent Overstreet 	unsigned int			sequential_io;
1427cafe5635SKent Overstreet 	unsigned int			sequential_io_avg;
1428cafe5635SKent Overstreet #endif
14295fbda3ecSThomas Gleixner 	struct kmap_ctrl		kmap_ctrl;
14308eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP
14318eb23b9fSPeter Zijlstra 	unsigned long			task_state_change;
14325f220be2SThomas Gleixner # ifdef CONFIG_PREEMPT_RT
14335f220be2SThomas Gleixner 	unsigned long			saved_state_change;
14345f220be2SThomas Gleixner # endif
14358eb23b9fSPeter Zijlstra #endif
14368bcbde54SDavid Hildenbrand 	int				pagefault_disabled;
143703049269SMichal Hocko #ifdef CONFIG_MMU
143829c696e1SVladimir Davydov 	struct task_struct		*oom_reaper_list;
143903049269SMichal Hocko #endif
1440ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK
1441ba14a194SAndy Lutomirski 	struct vm_struct		*stack_vm_area;
1442ba14a194SAndy Lutomirski #endif
144368f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
14445eca1c10SIngo Molnar 	/* A live task holds one reference: */
1445f0b89d39SElena Reshetova 	refcount_t			stack_refcount;
144668f24b08SAndy Lutomirski #endif
1447d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH
1448d83a7cb3SJosh Poimboeuf 	int patch_state;
1449d83a7cb3SJosh Poimboeuf #endif
1450e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY
1451e4e55b47STetsuo Handa 	/* Used by LSM modules for access restriction: */
1452e4e55b47STetsuo Handa 	void				*security;
1453e4e55b47STetsuo Handa #endif
1454a10787e6SSong Liu #ifdef CONFIG_BPF_SYSCALL
1455a10787e6SSong Liu 	/* Used by BPF task local storage */
1456a10787e6SSong Liu 	struct bpf_local_storage __rcu	*bpf_storage;
1457c7603cfaSAndrii Nakryiko 	/* Used for BPF run context */
1458c7603cfaSAndrii Nakryiko 	struct bpf_run_ctx		*bpf_ctx;
1459a10787e6SSong Liu #endif
146029e48ce8SKees Cook 
1461afaef01cSAlexander Popov #ifdef CONFIG_GCC_PLUGIN_STACKLEAK
1462afaef01cSAlexander Popov 	unsigned long			lowest_stack;
1463c8d12627SAlexander Popov 	unsigned long			prev_lowest_stack;
1464afaef01cSAlexander Popov #endif
1465afaef01cSAlexander Popov 
14665567d11cSPeter Zijlstra #ifdef CONFIG_X86_MCE
1467c0ab7ffcSTony Luck 	void __user			*mce_vaddr;
1468c0ab7ffcSTony Luck 	__u64				mce_kflags;
14695567d11cSPeter Zijlstra 	u64				mce_addr;
147017fae129STony Luck 	__u64				mce_ripv : 1,
147117fae129STony Luck 					mce_whole_page : 1,
147217fae129STony Luck 					__mce_reserved : 62;
14735567d11cSPeter Zijlstra 	struct callback_head		mce_kill_me;
147481065b35STony Luck 	int				mce_count;
14755567d11cSPeter Zijlstra #endif
14765567d11cSPeter Zijlstra 
1477d741bf41SPeter Zijlstra #ifdef CONFIG_KRETPROBES
1478d741bf41SPeter Zijlstra 	struct llist_head               kretprobe_instances;
1479d741bf41SPeter Zijlstra #endif
1480d741bf41SPeter Zijlstra 
148158e106e7SBalbir Singh #ifdef CONFIG_ARCH_HAS_PARANOID_L1D_FLUSH
148258e106e7SBalbir Singh 	/*
148358e106e7SBalbir Singh 	 * If L1D flush is supported on mm context switch
148458e106e7SBalbir Singh 	 * then we use this callback head to queue kill work
148558e106e7SBalbir Singh 	 * to kill tasks that are not running on SMT disabled
148658e106e7SBalbir Singh 	 * cores
148758e106e7SBalbir Singh 	 */
148858e106e7SBalbir Singh 	struct callback_head		l1d_flush_kill;
148958e106e7SBalbir Singh #endif
149058e106e7SBalbir Singh 
149129e48ce8SKees Cook 	/*
149229e48ce8SKees Cook 	 * New fields for task_struct should be added above here, so that
149329e48ce8SKees Cook 	 * they are included in the randomized portion of task_struct.
149429e48ce8SKees Cook 	 */
149529e48ce8SKees Cook 	randomized_struct_fields_end
149629e48ce8SKees Cook 
14975eca1c10SIngo Molnar 	/* CPU-specific state of this task: */
14980c8c0f03SDave Hansen 	struct thread_struct		thread;
14995eca1c10SIngo Molnar 
15000c8c0f03SDave Hansen 	/*
15010c8c0f03SDave Hansen 	 * WARNING: on x86, 'thread_struct' contains a variable-sized
15020c8c0f03SDave Hansen 	 * structure.  It *MUST* be at the end of 'task_struct'.
15030c8c0f03SDave Hansen 	 *
15040c8c0f03SDave Hansen 	 * Do not put anything below here!
15050c8c0f03SDave Hansen 	 */
15061da177e4SLinus Torvalds };
15071da177e4SLinus Torvalds 
1508e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task)
150922c935f4SEric W. Biederman {
15102c470475SEric W. Biederman 	return task->thread_pid;
151122c935f4SEric W. Biederman }
151222c935f4SEric W. Biederman 
15137af57294SPavel Emelyanov /*
15147af57294SPavel Emelyanov  * the helpers to get the task's different pids as they are seen
15157af57294SPavel Emelyanov  * from various namespaces
15167af57294SPavel Emelyanov  *
15177af57294SPavel Emelyanov  * task_xid_nr()     : global id, i.e. the id seen from the init namespace;
151844c4e1b2SEric W. Biederman  * task_xid_vnr()    : virtual id, i.e. the id seen from the pid namespace of
151944c4e1b2SEric W. Biederman  *                     current.
15207af57294SPavel Emelyanov  * task_xid_nr_ns()  : id seen from the ns specified;
15217af57294SPavel Emelyanov  *
15227af57294SPavel Emelyanov  * see also pid_nr() etc in include/linux/pid.h
15237af57294SPavel Emelyanov  */
15245eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns);
15257af57294SPavel Emelyanov 
1526e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk)
15277af57294SPavel Emelyanov {
15287af57294SPavel Emelyanov 	return tsk->pid;
15297af57294SPavel Emelyanov }
15307af57294SPavel Emelyanov 
15315eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
153252ee2dfdSOleg Nesterov {
153352ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
153452ee2dfdSOleg Nesterov }
15357af57294SPavel Emelyanov 
15367af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk)
15377af57294SPavel Emelyanov {
153852ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
15397af57294SPavel Emelyanov }
15407af57294SPavel Emelyanov 
15417af57294SPavel Emelyanov 
1542e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk)
15437af57294SPavel Emelyanov {
15447af57294SPavel Emelyanov 	return tsk->tgid;
15457af57294SPavel Emelyanov }
15467af57294SPavel Emelyanov 
15475eca1c10SIngo Molnar /**
15485eca1c10SIngo Molnar  * pid_alive - check that a task structure is not stale
15495eca1c10SIngo Molnar  * @p: Task structure to be checked.
15505eca1c10SIngo Molnar  *
15515eca1c10SIngo Molnar  * Test if a process is not yet dead (at most zombie state)
15525eca1c10SIngo Molnar  * If pid_alive fails, then pointers within the task structure
15535eca1c10SIngo Molnar  * can be stale and must not be dereferenced.
15545eca1c10SIngo Molnar  *
15555eca1c10SIngo Molnar  * Return: 1 if the process is alive. 0 otherwise.
15565eca1c10SIngo Molnar  */
15575eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p)
15585eca1c10SIngo Molnar {
15592c470475SEric W. Biederman 	return p->thread_pid != NULL;
15605eca1c10SIngo Molnar }
15617af57294SPavel Emelyanov 
15625eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
15637af57294SPavel Emelyanov {
156452ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
15657af57294SPavel Emelyanov }
15667af57294SPavel Emelyanov 
15677af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
15687af57294SPavel Emelyanov {
156952ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
15707af57294SPavel Emelyanov }
15717af57294SPavel Emelyanov 
15727af57294SPavel Emelyanov 
15735eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
15747af57294SPavel Emelyanov {
157552ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
15767af57294SPavel Emelyanov }
15777af57294SPavel Emelyanov 
15787af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk)
15797af57294SPavel Emelyanov {
158052ee2dfdSOleg Nesterov 	return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
15817af57294SPavel Emelyanov }
15827af57294SPavel Emelyanov 
1583dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns)
1584dd1c1f2fSOleg Nesterov {
15856883f81aSEric W. Biederman 	return __task_pid_nr_ns(tsk, PIDTYPE_TGID, ns);
1586dd1c1f2fSOleg Nesterov }
1587dd1c1f2fSOleg Nesterov 
1588dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk)
1589dd1c1f2fSOleg Nesterov {
15906883f81aSEric W. Biederman 	return __task_pid_nr_ns(tsk, PIDTYPE_TGID, NULL);
1591dd1c1f2fSOleg Nesterov }
1592dd1c1f2fSOleg Nesterov 
1593dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns)
1594dd1c1f2fSOleg Nesterov {
1595dd1c1f2fSOleg Nesterov 	pid_t pid = 0;
1596dd1c1f2fSOleg Nesterov 
1597dd1c1f2fSOleg Nesterov 	rcu_read_lock();
1598dd1c1f2fSOleg Nesterov 	if (pid_alive(tsk))
1599dd1c1f2fSOleg Nesterov 		pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns);
1600dd1c1f2fSOleg Nesterov 	rcu_read_unlock();
1601dd1c1f2fSOleg Nesterov 
1602dd1c1f2fSOleg Nesterov 	return pid;
1603dd1c1f2fSOleg Nesterov }
1604dd1c1f2fSOleg Nesterov 
1605dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk)
1606dd1c1f2fSOleg Nesterov {
1607dd1c1f2fSOleg Nesterov 	return task_ppid_nr_ns(tsk, &init_pid_ns);
1608dd1c1f2fSOleg Nesterov }
1609dd1c1f2fSOleg Nesterov 
16105eca1c10SIngo Molnar /* Obsolete, do not use: */
16111b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk)
16121b0f7ffdSOleg Nesterov {
16131b0f7ffdSOleg Nesterov 	return task_pgrp_nr_ns(tsk, &init_pid_ns);
16141b0f7ffdSOleg Nesterov }
16157af57294SPavel Emelyanov 
161606eb6184SPeter Zijlstra #define TASK_REPORT_IDLE	(TASK_REPORT + 1)
161706eb6184SPeter Zijlstra #define TASK_REPORT_MAX		(TASK_REPORT_IDLE << 1)
161806eb6184SPeter Zijlstra 
16191d48b080SPeter Zijlstra static inline unsigned int task_state_index(struct task_struct *tsk)
162020435d84SXie XiuQi {
16212f064a59SPeter Zijlstra 	unsigned int tsk_state = READ_ONCE(tsk->__state);
16221593baabSPeter Zijlstra 	unsigned int state = (tsk_state | tsk->exit_state) & TASK_REPORT;
162320435d84SXie XiuQi 
162406eb6184SPeter Zijlstra 	BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX);
162506eb6184SPeter Zijlstra 
162606eb6184SPeter Zijlstra 	if (tsk_state == TASK_IDLE)
162706eb6184SPeter Zijlstra 		state = TASK_REPORT_IDLE;
162806eb6184SPeter Zijlstra 
16291593baabSPeter Zijlstra 	return fls(state);
16301593baabSPeter Zijlstra }
163120435d84SXie XiuQi 
16321d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state)
16331593baabSPeter Zijlstra {
16348ef9925bSPeter Zijlstra 	static const char state_char[] = "RSDTtXZPI";
16351593baabSPeter Zijlstra 
163606eb6184SPeter Zijlstra 	BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1);
16371593baabSPeter Zijlstra 
16381593baabSPeter Zijlstra 	return state_char[state];
16391593baabSPeter Zijlstra }
16401593baabSPeter Zijlstra 
16411593baabSPeter Zijlstra static inline char task_state_to_char(struct task_struct *tsk)
16421593baabSPeter Zijlstra {
16431d48b080SPeter Zijlstra 	return task_index_to_char(task_state_index(tsk));
164420435d84SXie XiuQi }
164520435d84SXie XiuQi 
16461da177e4SLinus Torvalds /**
1647570f5241SSergey Senozhatsky  * is_global_init - check if a task structure is init. Since init
1648570f5241SSergey Senozhatsky  * is free to have sub-threads we need to check tgid.
16493260259fSHenne  * @tsk: Task structure to be checked.
16503260259fSHenne  *
16513260259fSHenne  * Check if a task structure is the first user space task the kernel created.
1652e69f6186SYacine Belkadi  *
1653e69f6186SYacine Belkadi  * Return: 1 if the task structure is init. 0 otherwise.
1654f400e198SSukadev Bhattiprolu  */
1655e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk)
1656b461cc03SPavel Emelyanov {
1657570f5241SSergey Senozhatsky 	return task_tgid_nr(tsk) == 1;
1658b461cc03SPavel Emelyanov }
1659b460cbc5SSerge E. Hallyn 
16609ec52099SCedric Le Goater extern struct pid *cad_pid;
16619ec52099SCedric Le Goater 
16621da177e4SLinus Torvalds /*
16631da177e4SLinus Torvalds  * Per process flags
16641da177e4SLinus Torvalds  */
166501ccf592SSebastian Andrzej Siewior #define PF_VCPU			0x00000001	/* I'm a virtual CPU */
1666c1de45caSPeter Zijlstra #define PF_IDLE			0x00000002	/* I am an IDLE thread */
16675eca1c10SIngo Molnar #define PF_EXITING		0x00000004	/* Getting shut down */
166801ccf592SSebastian Andrzej Siewior #define PF_IO_WORKER		0x00000010	/* Task is an IO worker */
166921aa9af0STejun Heo #define PF_WQ_WORKER		0x00000020	/* I'm a workqueue worker */
16705eca1c10SIngo Molnar #define PF_FORKNOEXEC		0x00000040	/* Forked but didn't exec */
16715eca1c10SIngo Molnar #define PF_MCE_PROCESS		0x00000080      /* Process policy on mce errors */
16725eca1c10SIngo Molnar #define PF_SUPERPRIV		0x00000100	/* Used super-user privileges */
16735eca1c10SIngo Molnar #define PF_DUMPCORE		0x00000200	/* Dumped core */
16745eca1c10SIngo Molnar #define PF_SIGNALED		0x00000400	/* Killed by a signal */
16751da177e4SLinus Torvalds #define PF_MEMALLOC		0x00000800	/* Allocating memory */
16765eca1c10SIngo Molnar #define PF_NPROC_EXCEEDED	0x00001000	/* set_user() noticed that RLIMIT_NPROC was exceeded */
16775eca1c10SIngo Molnar #define PF_USED_MATH		0x00002000	/* If unset the fpu must be initialized before use */
16785eca1c10SIngo Molnar #define PF_USED_ASYNC		0x00004000	/* Used async_schedule*(), used by module init */
16795eca1c10SIngo Molnar #define PF_NOFREEZE		0x00008000	/* This thread should not be frozen */
16805eca1c10SIngo Molnar #define PF_FROZEN		0x00010000	/* Frozen for system suspend */
16817dea19f9SMichal Hocko #define PF_KSWAPD		0x00020000	/* I am kswapd */
16827dea19f9SMichal Hocko #define PF_MEMALLOC_NOFS	0x00040000	/* All allocation requests will inherit GFP_NOFS */
16837dea19f9SMichal Hocko #define PF_MEMALLOC_NOIO	0x00080000	/* All allocation requests will inherit GFP_NOIO */
1684a37b0715SNeilBrown #define PF_LOCAL_THROTTLE	0x00100000	/* Throttle writes only against the bdi I write to,
1685a37b0715SNeilBrown 						 * I am cleaning dirty pages from some other bdi. */
1686246bb0b1SOleg Nesterov #define PF_KTHREAD		0x00200000	/* I am a kernel thread */
16875eca1c10SIngo Molnar #define PF_RANDOMIZE		0x00400000	/* Randomize virtual address space */
1688b31dc66aSJens Axboe #define PF_SWAPWRITE		0x00800000	/* Allowed to write to swap */
16893bd37062SSebastian Andrzej Siewior #define PF_NO_SETAFFINITY	0x04000000	/* Userland is not allowed to meddle with cpus_mask */
16904db96cf0SAndi Kleen #define PF_MCE_EARLY		0x08000000      /* Early kill for mce process policy */
16911a08ae36SPavel Tatashin #define PF_MEMALLOC_PIN		0x10000000	/* Allocation context constrained to zones which allow long term pinning. */
169258a69cb4STejun Heo #define PF_FREEZER_SKIP		0x40000000	/* Freezer should not count it as freezable */
16935eca1c10SIngo Molnar #define PF_SUSPEND_TASK		0x80000000      /* This thread called freeze_processes() and should not be frozen */
16941da177e4SLinus Torvalds 
16951da177e4SLinus Torvalds /*
16961da177e4SLinus Torvalds  * Only the _current_ task can read/write to tsk->flags, but other
16971da177e4SLinus Torvalds  * tasks can access tsk->flags in readonly mode for example
16981da177e4SLinus Torvalds  * with tsk_used_math (like during threaded core dumping).
16991da177e4SLinus Torvalds  * There is however an exception to this rule during ptrace
17001da177e4SLinus Torvalds  * or during fork: the ptracer task is allowed to write to the
17011da177e4SLinus Torvalds  * child->flags of its traced child (same goes for fork, the parent
17021da177e4SLinus Torvalds  * can write to the child->flags), because we're guaranteed the
17031da177e4SLinus Torvalds  * child is not running and in turn not changing child->flags
17041da177e4SLinus Torvalds  * at the same time the parent does it.
17051da177e4SLinus Torvalds  */
17061da177e4SLinus Torvalds #define clear_stopped_child_used_math(child)	do { (child)->flags &= ~PF_USED_MATH; } while (0)
17071da177e4SLinus Torvalds #define set_stopped_child_used_math(child)	do { (child)->flags |= PF_USED_MATH; } while (0)
17081da177e4SLinus Torvalds #define clear_used_math()			clear_stopped_child_used_math(current)
17091da177e4SLinus Torvalds #define set_used_math()				set_stopped_child_used_math(current)
17105eca1c10SIngo Molnar 
17111da177e4SLinus Torvalds #define conditional_stopped_child_used_math(condition, child) \
17121da177e4SLinus Torvalds 	do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= (condition) ? PF_USED_MATH : 0; } while (0)
17135eca1c10SIngo Molnar 
17145eca1c10SIngo Molnar #define conditional_used_math(condition)	conditional_stopped_child_used_math(condition, current)
17155eca1c10SIngo Molnar 
17161da177e4SLinus Torvalds #define copy_to_stopped_child_used_math(child) \
17171da177e4SLinus Torvalds 	do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= current->flags & PF_USED_MATH; } while (0)
17185eca1c10SIngo Molnar 
17191da177e4SLinus Torvalds /* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */
17201da177e4SLinus Torvalds #define tsk_used_math(p)			((p)->flags & PF_USED_MATH)
17211da177e4SLinus Torvalds #define used_math()				tsk_used_math(current)
17221da177e4SLinus Torvalds 
172383d40a61SPeter Zijlstra static __always_inline bool is_percpu_thread(void)
172462ec05ddSThomas Gleixner {
172562ec05ddSThomas Gleixner #ifdef CONFIG_SMP
172662ec05ddSThomas Gleixner 	return (current->flags & PF_NO_SETAFFINITY) &&
172762ec05ddSThomas Gleixner 		(current->nr_cpus_allowed  == 1);
172862ec05ddSThomas Gleixner #else
172962ec05ddSThomas Gleixner 	return true;
173062ec05ddSThomas Gleixner #endif
173162ec05ddSThomas Gleixner }
173262ec05ddSThomas Gleixner 
17331d4457f9SKees Cook /* Per-process atomic flags. */
1734a2b86f77SZefan Li #define PFA_NO_NEW_PRIVS		0	/* May not gain new privileges. */
17352ad654bcSZefan Li #define PFA_SPREAD_PAGE			1	/* Spread page cache over cpuset */
17362ad654bcSZefan Li #define PFA_SPREAD_SLAB			2	/* Spread some slab caches over cpuset */
1737356e4bffSThomas Gleixner #define PFA_SPEC_SSB_DISABLE		3	/* Speculative Store Bypass disabled */
1738356e4bffSThomas Gleixner #define PFA_SPEC_SSB_FORCE_DISABLE	4	/* Speculative Store Bypass force disabled*/
17399137bb27SThomas Gleixner #define PFA_SPEC_IB_DISABLE		5	/* Indirect branch speculation restricted */
17409137bb27SThomas Gleixner #define PFA_SPEC_IB_FORCE_DISABLE	6	/* Indirect branch speculation permanently restricted */
174171368af9SWaiman Long #define PFA_SPEC_SSB_NOEXEC		7	/* Speculative Store Bypass clear on execve() */
17421d4457f9SKees Cook 
1743e0e5070bSZefan Li #define TASK_PFA_TEST(name, func)					\
1744e0e5070bSZefan Li 	static inline bool task_##func(struct task_struct *p)		\
1745e0e5070bSZefan Li 	{ return test_bit(PFA_##name, &p->atomic_flags); }
17465eca1c10SIngo Molnar 
1747e0e5070bSZefan Li #define TASK_PFA_SET(name, func)					\
1748e0e5070bSZefan Li 	static inline void task_set_##func(struct task_struct *p)	\
1749e0e5070bSZefan Li 	{ set_bit(PFA_##name, &p->atomic_flags); }
17505eca1c10SIngo Molnar 
1751e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func)					\
1752e0e5070bSZefan Li 	static inline void task_clear_##func(struct task_struct *p)	\
1753e0e5070bSZefan Li 	{ clear_bit(PFA_##name, &p->atomic_flags); }
17541d4457f9SKees Cook 
1755e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs)
1756e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs)
17571d4457f9SKees Cook 
17582ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page)
17592ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page)
17602ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
17612ad654bcSZefan Li 
17622ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
17632ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab)
17642ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
1765544b2c91STejun Heo 
1766356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable)
1767356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable)
1768356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable)
1769356e4bffSThomas Gleixner 
177071368af9SWaiman Long TASK_PFA_TEST(SPEC_SSB_NOEXEC, spec_ssb_noexec)
177171368af9SWaiman Long TASK_PFA_SET(SPEC_SSB_NOEXEC, spec_ssb_noexec)
177271368af9SWaiman Long TASK_PFA_CLEAR(SPEC_SSB_NOEXEC, spec_ssb_noexec)
177371368af9SWaiman Long 
1774356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1775356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable)
1776356e4bffSThomas Gleixner 
17779137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_DISABLE, spec_ib_disable)
17789137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_DISABLE, spec_ib_disable)
17799137bb27SThomas Gleixner TASK_PFA_CLEAR(SPEC_IB_DISABLE, spec_ib_disable)
17809137bb27SThomas Gleixner 
17819137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable)
17829137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable)
17839137bb27SThomas Gleixner 
17845eca1c10SIngo Molnar static inline void
1785717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags)
1786907aed48SMel Gorman {
1787717a94b5SNeilBrown 	current->flags &= ~flags;
1788717a94b5SNeilBrown 	current->flags |= orig_flags & flags;
1789907aed48SMel Gorman }
1790907aed48SMel Gorman 
17915eca1c10SIngo Molnar extern int cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial);
17925eca1c10SIngo Molnar extern int task_can_attach(struct task_struct *p, const struct cpumask *cs_cpus_allowed);
17931da177e4SLinus Torvalds #ifdef CONFIG_SMP
17945eca1c10SIngo Molnar extern void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask);
17955eca1c10SIngo Molnar extern int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask);
1796b90ca8baSWill Deacon extern int dup_user_cpus_ptr(struct task_struct *dst, struct task_struct *src, int node);
1797b90ca8baSWill Deacon extern void release_user_cpus_ptr(struct task_struct *p);
1798234b8ab6SWill Deacon extern int dl_task_check_affinity(struct task_struct *p, const struct cpumask *mask);
179907ec77a1SWill Deacon extern void force_compatible_cpus_allowed_ptr(struct task_struct *p);
180007ec77a1SWill Deacon extern void relax_compatible_cpus_allowed_ptr(struct task_struct *p);
18011da177e4SLinus Torvalds #else
18025eca1c10SIngo Molnar static inline void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask)
18031e1b6c51SKOSAKI Motohiro {
18041e1b6c51SKOSAKI Motohiro }
18055eca1c10SIngo Molnar static inline int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask)
18061da177e4SLinus Torvalds {
180796f874e2SRusty Russell 	if (!cpumask_test_cpu(0, new_mask))
18081da177e4SLinus Torvalds 		return -EINVAL;
18091da177e4SLinus Torvalds 	return 0;
18101da177e4SLinus Torvalds }
1811b90ca8baSWill Deacon static inline int dup_user_cpus_ptr(struct task_struct *dst, struct task_struct *src, int node)
1812b90ca8baSWill Deacon {
1813b90ca8baSWill Deacon 	if (src->user_cpus_ptr)
1814b90ca8baSWill Deacon 		return -EINVAL;
1815b90ca8baSWill Deacon 	return 0;
1816b90ca8baSWill Deacon }
1817b90ca8baSWill Deacon static inline void release_user_cpus_ptr(struct task_struct *p)
1818b90ca8baSWill Deacon {
1819b90ca8baSWill Deacon 	WARN_ON(p->user_cpus_ptr);
1820b90ca8baSWill Deacon }
1821234b8ab6SWill Deacon 
1822234b8ab6SWill Deacon static inline int dl_task_check_affinity(struct task_struct *p, const struct cpumask *mask)
1823234b8ab6SWill Deacon {
1824234b8ab6SWill Deacon 	return 0;
1825234b8ab6SWill Deacon }
18261da177e4SLinus Torvalds #endif
1827e0ad9556SRusty Russell 
1828fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt);
182936c8b586SIngo Molnar extern void set_user_nice(struct task_struct *p, long nice);
183036c8b586SIngo Molnar extern int task_prio(const struct task_struct *p);
18315eca1c10SIngo Molnar 
1832d0ea0268SDongsheng Yang /**
1833d0ea0268SDongsheng Yang  * task_nice - return the nice value of a given task.
1834d0ea0268SDongsheng Yang  * @p: the task in question.
1835d0ea0268SDongsheng Yang  *
1836d0ea0268SDongsheng Yang  * Return: The nice value [ -20 ... 0 ... 19 ].
1837d0ea0268SDongsheng Yang  */
1838d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p)
1839d0ea0268SDongsheng Yang {
1840d0ea0268SDongsheng Yang 	return PRIO_TO_NICE((p)->static_prio);
1841d0ea0268SDongsheng Yang }
18425eca1c10SIngo Molnar 
184336c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice);
184436c8b586SIngo Molnar extern int task_curr(const struct task_struct *p);
18451da177e4SLinus Torvalds extern int idle_cpu(int cpu);
1846943d355dSRohit Jain extern int available_idle_cpu(int cpu);
18475eca1c10SIngo Molnar extern int sched_setscheduler(struct task_struct *, int, const struct sched_param *);
18485eca1c10SIngo Molnar extern int sched_setscheduler_nocheck(struct task_struct *, int, const struct sched_param *);
18498b700983SPeter Zijlstra extern void sched_set_fifo(struct task_struct *p);
18508b700983SPeter Zijlstra extern void sched_set_fifo_low(struct task_struct *p);
18518b700983SPeter Zijlstra extern void sched_set_normal(struct task_struct *p, int nice);
18525eca1c10SIngo Molnar extern int sched_setattr(struct task_struct *, const struct sched_attr *);
1853794a56ebSJuri Lelli extern int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *);
185436c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu);
18555eca1c10SIngo Molnar 
1856c4f30608SPaul E. McKenney /**
1857c4f30608SPaul E. McKenney  * is_idle_task - is the specified task an idle task?
1858fa757281SRandy Dunlap  * @p: the task in question.
1859e69f6186SYacine Belkadi  *
1860e69f6186SYacine Belkadi  * Return: 1 if @p is an idle task. 0 otherwise.
1861c4f30608SPaul E. McKenney  */
1862c94a88f3SMarco Elver static __always_inline bool is_idle_task(const struct task_struct *p)
1863c4f30608SPaul E. McKenney {
1864c1de45caSPeter Zijlstra 	return !!(p->flags & PF_IDLE);
1865c4f30608SPaul E. McKenney }
18665eca1c10SIngo Molnar 
186736c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu);
1868a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p);
18691da177e4SLinus Torvalds 
18701da177e4SLinus Torvalds void yield(void);
18711da177e4SLinus Torvalds 
18721da177e4SLinus Torvalds union thread_union {
18730500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK
18740500871fSDavid Howells 	struct task_struct task;
18750500871fSDavid Howells #endif
1876c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK
18771da177e4SLinus Torvalds 	struct thread_info thread_info;
1878c65eacbeSAndy Lutomirski #endif
18791da177e4SLinus Torvalds 	unsigned long stack[THREAD_SIZE/sizeof(long)];
18801da177e4SLinus Torvalds };
18811da177e4SLinus Torvalds 
18820500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK
18830500871fSDavid Howells extern struct thread_info init_thread_info;
18840500871fSDavid Howells #endif
18850500871fSDavid Howells 
18860500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)];
18870500871fSDavid Howells 
1888f3ac6067SIngo Molnar #ifdef CONFIG_THREAD_INFO_IN_TASK
1889f3ac6067SIngo Molnar static inline struct thread_info *task_thread_info(struct task_struct *task)
1890f3ac6067SIngo Molnar {
1891f3ac6067SIngo Molnar 	return &task->thread_info;
1892f3ac6067SIngo Molnar }
1893f3ac6067SIngo Molnar #elif !defined(__HAVE_THREAD_FUNCTIONS)
1894f3ac6067SIngo Molnar # define task_thread_info(task)	((struct thread_info *)(task)->stack)
1895f3ac6067SIngo Molnar #endif
1896f3ac6067SIngo Molnar 
1897198fe21bSPavel Emelyanov /*
1898198fe21bSPavel Emelyanov  * find a task by one of its numerical ids
1899198fe21bSPavel Emelyanov  *
1900198fe21bSPavel Emelyanov  * find_task_by_pid_ns():
1901198fe21bSPavel Emelyanov  *      finds a task by its pid in the specified namespace
1902228ebcbeSPavel Emelyanov  * find_task_by_vpid():
1903228ebcbeSPavel Emelyanov  *      finds a task by its virtual pid
1904198fe21bSPavel Emelyanov  *
1905e49859e7SPavel Emelyanov  * see also find_vpid() etc in include/linux/pid.h
1906198fe21bSPavel Emelyanov  */
1907198fe21bSPavel Emelyanov 
1908228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr);
19095eca1c10SIngo Molnar extern struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns);
1910198fe21bSPavel Emelyanov 
19112ee08260SMike Rapoport /*
19122ee08260SMike Rapoport  * find a task by its virtual pid and get the task struct
19132ee08260SMike Rapoport  */
19142ee08260SMike Rapoport extern struct task_struct *find_get_task_by_vpid(pid_t nr);
19152ee08260SMike Rapoport 
1916b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state);
1917b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk);
19183e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk);
19195eca1c10SIngo Molnar 
19201da177e4SLinus Torvalds #ifdef CONFIG_SMP
19211da177e4SLinus Torvalds extern void kick_process(struct task_struct *tsk);
19221da177e4SLinus Torvalds #else
19231da177e4SLinus Torvalds static inline void kick_process(struct task_struct *tsk) { }
19241da177e4SLinus Torvalds #endif
19251da177e4SLinus Torvalds 
192682b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);
19275eca1c10SIngo Molnar 
192882b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from)
192982b89778SAdrian Hunter {
193082b89778SAdrian Hunter 	__set_task_comm(tsk, from, false);
193182b89778SAdrian Hunter }
19325eca1c10SIngo Molnar 
19333756f640SArnd Bergmann extern char *__get_task_comm(char *to, size_t len, struct task_struct *tsk);
19343756f640SArnd Bergmann #define get_task_comm(buf, tsk) ({			\
19353756f640SArnd Bergmann 	BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN);	\
19363756f640SArnd Bergmann 	__get_task_comm(buf, sizeof(buf), tsk);		\
19373756f640SArnd Bergmann })
19381da177e4SLinus Torvalds 
19391da177e4SLinus Torvalds #ifdef CONFIG_SMP
19402a0a24ebSThomas Gleixner static __always_inline void scheduler_ipi(void)
19412a0a24ebSThomas Gleixner {
19422a0a24ebSThomas Gleixner 	/*
19432a0a24ebSThomas Gleixner 	 * Fold TIF_NEED_RESCHED into the preempt_count; anybody setting
19442a0a24ebSThomas Gleixner 	 * TIF_NEED_RESCHED remotely (for the first time) will also send
19452a0a24ebSThomas Gleixner 	 * this IPI.
19462a0a24ebSThomas Gleixner 	 */
19472a0a24ebSThomas Gleixner 	preempt_fold_need_resched();
19482a0a24ebSThomas Gleixner }
19492f064a59SPeter Zijlstra extern unsigned long wait_task_inactive(struct task_struct *, unsigned int match_state);
19501da177e4SLinus Torvalds #else
1951184748ccSPeter Zijlstra static inline void scheduler_ipi(void) { }
19522f064a59SPeter Zijlstra static inline unsigned long wait_task_inactive(struct task_struct *p, unsigned int match_state)
195385ba2d86SRoland McGrath {
195485ba2d86SRoland McGrath 	return 1;
195585ba2d86SRoland McGrath }
19561da177e4SLinus Torvalds #endif
19571da177e4SLinus Torvalds 
19585eca1c10SIngo Molnar /*
19595eca1c10SIngo Molnar  * Set thread flags in other task's structures.
19605eca1c10SIngo Molnar  * See asm/thread_info.h for TIF_xxxx flags available:
19611da177e4SLinus Torvalds  */
19621da177e4SLinus Torvalds static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag)
19631da177e4SLinus Torvalds {
1964a1261f54SAl Viro 	set_ti_thread_flag(task_thread_info(tsk), flag);
19651da177e4SLinus Torvalds }
19661da177e4SLinus Torvalds 
19671da177e4SLinus Torvalds static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag)
19681da177e4SLinus Torvalds {
1969a1261f54SAl Viro 	clear_ti_thread_flag(task_thread_info(tsk), flag);
19701da177e4SLinus Torvalds }
19711da177e4SLinus Torvalds 
197293ee37c2SDave Martin static inline void update_tsk_thread_flag(struct task_struct *tsk, int flag,
197393ee37c2SDave Martin 					  bool value)
197493ee37c2SDave Martin {
197593ee37c2SDave Martin 	update_ti_thread_flag(task_thread_info(tsk), flag, value);
197693ee37c2SDave Martin }
197793ee37c2SDave Martin 
19781da177e4SLinus Torvalds static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag)
19791da177e4SLinus Torvalds {
1980a1261f54SAl Viro 	return test_and_set_ti_thread_flag(task_thread_info(tsk), flag);
19811da177e4SLinus Torvalds }
19821da177e4SLinus Torvalds 
19831da177e4SLinus Torvalds static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag)
19841da177e4SLinus Torvalds {
1985a1261f54SAl Viro 	return test_and_clear_ti_thread_flag(task_thread_info(tsk), flag);
19861da177e4SLinus Torvalds }
19871da177e4SLinus Torvalds 
19881da177e4SLinus Torvalds static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag)
19891da177e4SLinus Torvalds {
1990a1261f54SAl Viro 	return test_ti_thread_flag(task_thread_info(tsk), flag);
19911da177e4SLinus Torvalds }
19921da177e4SLinus Torvalds 
19931da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk)
19941da177e4SLinus Torvalds {
19951da177e4SLinus Torvalds 	set_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
19961da177e4SLinus Torvalds }
19971da177e4SLinus Torvalds 
19981da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk)
19991da177e4SLinus Torvalds {
20001da177e4SLinus Torvalds 	clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
20011da177e4SLinus Torvalds }
20021da177e4SLinus Torvalds 
20038ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk)
20048ae121acSGregory Haskins {
20058ae121acSGregory Haskins 	return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED));
20068ae121acSGregory Haskins }
20078ae121acSGregory Haskins 
20081da177e4SLinus Torvalds /*
20091da177e4SLinus Torvalds  * cond_resched() and cond_resched_lock(): latency reduction via
20101da177e4SLinus Torvalds  * explicit rescheduling in places that are safe. The return
20111da177e4SLinus Torvalds  * value indicates whether a reschedule was done in fact.
20121da177e4SLinus Torvalds  * cond_resched_lock() will drop the spinlock before scheduling,
20131da177e4SLinus Torvalds  */
2014b965f1ddSPeter Zijlstra (Intel) #if !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC)
2015b965f1ddSPeter Zijlstra (Intel) extern int __cond_resched(void);
2016b965f1ddSPeter Zijlstra (Intel) 
2017b965f1ddSPeter Zijlstra (Intel) #ifdef CONFIG_PREEMPT_DYNAMIC
2018b965f1ddSPeter Zijlstra (Intel) 
2019b965f1ddSPeter Zijlstra (Intel) DECLARE_STATIC_CALL(cond_resched, __cond_resched);
2020b965f1ddSPeter Zijlstra (Intel) 
2021b965f1ddSPeter Zijlstra (Intel) static __always_inline int _cond_resched(void)
2022b965f1ddSPeter Zijlstra (Intel) {
2023ef72661eSPeter Zijlstra 	return static_call_mod(cond_resched)();
2024b965f1ddSPeter Zijlstra (Intel) }
2025b965f1ddSPeter Zijlstra (Intel) 
202635a773a0SPeter Zijlstra #else
2027b965f1ddSPeter Zijlstra (Intel) 
2028b965f1ddSPeter Zijlstra (Intel) static inline int _cond_resched(void)
2029b965f1ddSPeter Zijlstra (Intel) {
2030b965f1ddSPeter Zijlstra (Intel) 	return __cond_resched();
2031b965f1ddSPeter Zijlstra (Intel) }
2032b965f1ddSPeter Zijlstra (Intel) 
2033b965f1ddSPeter Zijlstra (Intel) #endif /* CONFIG_PREEMPT_DYNAMIC */
2034b965f1ddSPeter Zijlstra (Intel) 
2035b965f1ddSPeter Zijlstra (Intel) #else
2036b965f1ddSPeter Zijlstra (Intel) 
203735a773a0SPeter Zijlstra static inline int _cond_resched(void) { return 0; }
2038b965f1ddSPeter Zijlstra (Intel) 
2039b965f1ddSPeter Zijlstra (Intel) #endif /* !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC) */
20406f80bd98SFrederic Weisbecker 
2041613afbf8SFrederic Weisbecker #define cond_resched() ({			\
20423427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, 0);	\
2043613afbf8SFrederic Weisbecker 	_cond_resched();			\
2044613afbf8SFrederic Weisbecker })
20456f80bd98SFrederic Weisbecker 
2046613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock);
2047f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_read(rwlock_t *lock);
2048f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_write(rwlock_t *lock);
2049613afbf8SFrederic Weisbecker 
2050613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({				\
20513427445aSPeter Zijlstra 	___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\
2052613afbf8SFrederic Weisbecker 	__cond_resched_lock(lock);				\
2053613afbf8SFrederic Weisbecker })
2054613afbf8SFrederic Weisbecker 
2055f3d4b4b1SBen Gardon #define cond_resched_rwlock_read(lock) ({			\
2056f3d4b4b1SBen Gardon 	__might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);	\
2057f3d4b4b1SBen Gardon 	__cond_resched_rwlock_read(lock);			\
2058f3d4b4b1SBen Gardon })
2059f3d4b4b1SBen Gardon 
2060f3d4b4b1SBen Gardon #define cond_resched_rwlock_write(lock) ({			\
2061f3d4b4b1SBen Gardon 	__might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);	\
2062f3d4b4b1SBen Gardon 	__cond_resched_rwlock_write(lock);			\
2063f3d4b4b1SBen Gardon })
2064f3d4b4b1SBen Gardon 
2065f6f3c437SSimon Horman static inline void cond_resched_rcu(void)
2066f6f3c437SSimon Horman {
2067f6f3c437SSimon Horman #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU)
2068f6f3c437SSimon Horman 	rcu_read_unlock();
2069f6f3c437SSimon Horman 	cond_resched();
2070f6f3c437SSimon Horman 	rcu_read_lock();
2071f6f3c437SSimon Horman #endif
2072f6f3c437SSimon Horman }
2073f6f3c437SSimon Horman 
20741da177e4SLinus Torvalds /*
20751da177e4SLinus Torvalds  * Does a critical section need to be broken due to another
2076c1a280b6SThomas Gleixner  * task waiting?: (technically does not depend on CONFIG_PREEMPTION,
207795c354feSNick Piggin  * but a general need for low latency)
20781da177e4SLinus Torvalds  */
207995c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock)
20801da177e4SLinus Torvalds {
2081c1a280b6SThomas Gleixner #ifdef CONFIG_PREEMPTION
208295c354feSNick Piggin 	return spin_is_contended(lock);
208395c354feSNick Piggin #else
20841da177e4SLinus Torvalds 	return 0;
208595c354feSNick Piggin #endif
20861da177e4SLinus Torvalds }
20871da177e4SLinus Torvalds 
2088a09a689aSBen Gardon /*
2089a09a689aSBen Gardon  * Check if a rwlock is contended.
2090a09a689aSBen Gardon  * Returns non-zero if there is another task waiting on the rwlock.
2091a09a689aSBen Gardon  * Returns zero if the lock is not contended or the system / underlying
2092a09a689aSBen Gardon  * rwlock implementation does not support contention detection.
2093a09a689aSBen Gardon  * Technically does not depend on CONFIG_PREEMPTION, but a general need
2094a09a689aSBen Gardon  * for low latency.
2095a09a689aSBen Gardon  */
2096a09a689aSBen Gardon static inline int rwlock_needbreak(rwlock_t *lock)
2097a09a689aSBen Gardon {
2098a09a689aSBen Gardon #ifdef CONFIG_PREEMPTION
2099a09a689aSBen Gardon 	return rwlock_is_contended(lock);
2100a09a689aSBen Gardon #else
2101a09a689aSBen Gardon 	return 0;
2102a09a689aSBen Gardon #endif
2103a09a689aSBen Gardon }
2104a09a689aSBen Gardon 
210575f93fedSPeter Zijlstra static __always_inline bool need_resched(void)
210675f93fedSPeter Zijlstra {
210775f93fedSPeter Zijlstra 	return unlikely(tif_need_resched());
210875f93fedSPeter Zijlstra }
210975f93fedSPeter Zijlstra 
2110ee761f62SThomas Gleixner /*
21111da177e4SLinus Torvalds  * Wrappers for p->thread_info->cpu access. No-op on UP.
21121da177e4SLinus Torvalds  */
21131da177e4SLinus Torvalds #ifdef CONFIG_SMP
21141da177e4SLinus Torvalds 
21151da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p)
21161da177e4SLinus Torvalds {
2117c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK
2118c546951dSAndrea Parri 	return READ_ONCE(p->cpu);
2119c65eacbeSAndy Lutomirski #else
2120c546951dSAndrea Parri 	return READ_ONCE(task_thread_info(p)->cpu);
2121c65eacbeSAndy Lutomirski #endif
21221da177e4SLinus Torvalds }
21231da177e4SLinus Torvalds 
2124c65cc870SIngo Molnar extern void set_task_cpu(struct task_struct *p, unsigned int cpu);
21251da177e4SLinus Torvalds 
21261da177e4SLinus Torvalds #else
21271da177e4SLinus Torvalds 
21281da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p)
21291da177e4SLinus Torvalds {
21301da177e4SLinus Torvalds 	return 0;
21311da177e4SLinus Torvalds }
21321da177e4SLinus Torvalds 
21331da177e4SLinus Torvalds static inline void set_task_cpu(struct task_struct *p, unsigned int cpu)
21341da177e4SLinus Torvalds {
21351da177e4SLinus Torvalds }
21361da177e4SLinus Torvalds 
21371da177e4SLinus Torvalds #endif /* CONFIG_SMP */
21381da177e4SLinus Torvalds 
2139a1dfb631SMarcelo Tosatti extern bool sched_task_on_rq(struct task_struct *p);
2140a1dfb631SMarcelo Tosatti 
2141d9345c65SPan Xinhui /*
2142d9345c65SPan Xinhui  * In order to reduce various lock holder preemption latencies provide an
2143d9345c65SPan Xinhui  * interface to see if a vCPU is currently running or not.
2144d9345c65SPan Xinhui  *
2145d9345c65SPan Xinhui  * This allows us to terminate optimistic spin loops and block, analogous to
2146d9345c65SPan Xinhui  * the native optimistic spin heuristic of testing if the lock owner task is
2147d9345c65SPan Xinhui  * running or not.
2148d9345c65SPan Xinhui  */
2149d9345c65SPan Xinhui #ifndef vcpu_is_preempted
215042fd8baaSQian Cai static inline bool vcpu_is_preempted(int cpu)
215142fd8baaSQian Cai {
215242fd8baaSQian Cai 	return false;
215342fd8baaSQian Cai }
2154d9345c65SPan Xinhui #endif
2155d9345c65SPan Xinhui 
215696f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask);
215796f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask);
21585c45bf27SSiddha, Suresh B 
215982455257SDave Hansen #ifndef TASK_SIZE_OF
216082455257SDave Hansen #define TASK_SIZE_OF(tsk)	TASK_SIZE
216182455257SDave Hansen #endif
216282455257SDave Hansen 
2163a5418be9SViresh Kumar #ifdef CONFIG_SMP
2164a5418be9SViresh Kumar /* Returns effective CPU energy utilization, as seen by the scheduler */
2165a5418be9SViresh Kumar unsigned long sched_cpu_util(int cpu, unsigned long max);
2166a5418be9SViresh Kumar #endif /* CONFIG_SMP */
2167a5418be9SViresh Kumar 
2168d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ
2169d7822b1eSMathieu Desnoyers 
2170d7822b1eSMathieu Desnoyers /*
2171d7822b1eSMathieu Desnoyers  * Map the event mask on the user-space ABI enum rseq_cs_flags
2172d7822b1eSMathieu Desnoyers  * for direct mask checks.
2173d7822b1eSMathieu Desnoyers  */
2174d7822b1eSMathieu Desnoyers enum rseq_event_mask_bits {
2175d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_PREEMPT_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_PREEMPT_BIT,
2176d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_SIGNAL_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_SIGNAL_BIT,
2177d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_MIGRATE_BIT	= RSEQ_CS_FLAG_NO_RESTART_ON_MIGRATE_BIT,
2178d7822b1eSMathieu Desnoyers };
2179d7822b1eSMathieu Desnoyers 
2180d7822b1eSMathieu Desnoyers enum rseq_event_mask {
2181d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_PREEMPT	= (1U << RSEQ_EVENT_PREEMPT_BIT),
2182d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_SIGNAL	= (1U << RSEQ_EVENT_SIGNAL_BIT),
2183d7822b1eSMathieu Desnoyers 	RSEQ_EVENT_MIGRATE	= (1U << RSEQ_EVENT_MIGRATE_BIT),
2184d7822b1eSMathieu Desnoyers };
2185d7822b1eSMathieu Desnoyers 
2186d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t)
2187d7822b1eSMathieu Desnoyers {
2188d7822b1eSMathieu Desnoyers 	if (t->rseq)
2189d7822b1eSMathieu Desnoyers 		set_tsk_thread_flag(t, TIF_NOTIFY_RESUME);
2190d7822b1eSMathieu Desnoyers }
2191d7822b1eSMathieu Desnoyers 
2192784e0300SWill Deacon void __rseq_handle_notify_resume(struct ksignal *sig, struct pt_regs *regs);
2193d7822b1eSMathieu Desnoyers 
2194784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig,
2195784e0300SWill Deacon 					     struct pt_regs *regs)
2196d7822b1eSMathieu Desnoyers {
2197d7822b1eSMathieu Desnoyers 	if (current->rseq)
2198784e0300SWill Deacon 		__rseq_handle_notify_resume(ksig, regs);
2199d7822b1eSMathieu Desnoyers }
2200d7822b1eSMathieu Desnoyers 
2201784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig,
2202784e0300SWill Deacon 				       struct pt_regs *regs)
2203d7822b1eSMathieu Desnoyers {
2204d7822b1eSMathieu Desnoyers 	preempt_disable();
2205d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_SIGNAL_BIT, &current->rseq_event_mask);
2206d7822b1eSMathieu Desnoyers 	preempt_enable();
2207784e0300SWill Deacon 	rseq_handle_notify_resume(ksig, regs);
2208d7822b1eSMathieu Desnoyers }
2209d7822b1eSMathieu Desnoyers 
2210d7822b1eSMathieu Desnoyers /* rseq_preempt() requires preemption to be disabled. */
2211d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t)
2212d7822b1eSMathieu Desnoyers {
2213d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_PREEMPT_BIT, &t->rseq_event_mask);
2214d7822b1eSMathieu Desnoyers 	rseq_set_notify_resume(t);
2215d7822b1eSMathieu Desnoyers }
2216d7822b1eSMathieu Desnoyers 
2217d7822b1eSMathieu Desnoyers /* rseq_migrate() requires preemption to be disabled. */
2218d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t)
2219d7822b1eSMathieu Desnoyers {
2220d7822b1eSMathieu Desnoyers 	__set_bit(RSEQ_EVENT_MIGRATE_BIT, &t->rseq_event_mask);
2221d7822b1eSMathieu Desnoyers 	rseq_set_notify_resume(t);
2222d7822b1eSMathieu Desnoyers }
2223d7822b1eSMathieu Desnoyers 
2224d7822b1eSMathieu Desnoyers /*
2225d7822b1eSMathieu Desnoyers  * If parent process has a registered restartable sequences area, the
2226463f550fSMathieu Desnoyers  * child inherits. Unregister rseq for a clone with CLONE_VM set.
2227d7822b1eSMathieu Desnoyers  */
2228d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags)
2229d7822b1eSMathieu Desnoyers {
2230463f550fSMathieu Desnoyers 	if (clone_flags & CLONE_VM) {
2231d7822b1eSMathieu Desnoyers 		t->rseq = NULL;
2232d7822b1eSMathieu Desnoyers 		t->rseq_sig = 0;
2233d7822b1eSMathieu Desnoyers 		t->rseq_event_mask = 0;
2234d7822b1eSMathieu Desnoyers 	} else {
2235d7822b1eSMathieu Desnoyers 		t->rseq = current->rseq;
2236d7822b1eSMathieu Desnoyers 		t->rseq_sig = current->rseq_sig;
2237d7822b1eSMathieu Desnoyers 		t->rseq_event_mask = current->rseq_event_mask;
2238d7822b1eSMathieu Desnoyers 	}
2239d7822b1eSMathieu Desnoyers }
2240d7822b1eSMathieu Desnoyers 
2241d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t)
2242d7822b1eSMathieu Desnoyers {
2243d7822b1eSMathieu Desnoyers 	t->rseq = NULL;
2244d7822b1eSMathieu Desnoyers 	t->rseq_sig = 0;
2245d7822b1eSMathieu Desnoyers 	t->rseq_event_mask = 0;
2246d7822b1eSMathieu Desnoyers }
2247d7822b1eSMathieu Desnoyers 
2248d7822b1eSMathieu Desnoyers #else
2249d7822b1eSMathieu Desnoyers 
2250d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t)
2251d7822b1eSMathieu Desnoyers {
2252d7822b1eSMathieu Desnoyers }
2253784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig,
2254784e0300SWill Deacon 					     struct pt_regs *regs)
2255d7822b1eSMathieu Desnoyers {
2256d7822b1eSMathieu Desnoyers }
2257784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig,
2258784e0300SWill Deacon 				       struct pt_regs *regs)
2259d7822b1eSMathieu Desnoyers {
2260d7822b1eSMathieu Desnoyers }
2261d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t)
2262d7822b1eSMathieu Desnoyers {
2263d7822b1eSMathieu Desnoyers }
2264d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t)
2265d7822b1eSMathieu Desnoyers {
2266d7822b1eSMathieu Desnoyers }
2267d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags)
2268d7822b1eSMathieu Desnoyers {
2269d7822b1eSMathieu Desnoyers }
2270d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t)
2271d7822b1eSMathieu Desnoyers {
2272d7822b1eSMathieu Desnoyers }
2273d7822b1eSMathieu Desnoyers 
2274d7822b1eSMathieu Desnoyers #endif
2275d7822b1eSMathieu Desnoyers 
2276d7822b1eSMathieu Desnoyers #ifdef CONFIG_DEBUG_RSEQ
2277d7822b1eSMathieu Desnoyers 
2278d7822b1eSMathieu Desnoyers void rseq_syscall(struct pt_regs *regs);
2279d7822b1eSMathieu Desnoyers 
2280d7822b1eSMathieu Desnoyers #else
2281d7822b1eSMathieu Desnoyers 
2282d7822b1eSMathieu Desnoyers static inline void rseq_syscall(struct pt_regs *regs)
2283d7822b1eSMathieu Desnoyers {
2284d7822b1eSMathieu Desnoyers }
2285d7822b1eSMathieu Desnoyers 
2286d7822b1eSMathieu Desnoyers #endif
2287d7822b1eSMathieu Desnoyers 
22883c93a0c0SQais Yousef const struct sched_avg *sched_trace_cfs_rq_avg(struct cfs_rq *cfs_rq);
22893c93a0c0SQais Yousef char *sched_trace_cfs_rq_path(struct cfs_rq *cfs_rq, char *str, int len);
22903c93a0c0SQais Yousef int sched_trace_cfs_rq_cpu(struct cfs_rq *cfs_rq);
22913c93a0c0SQais Yousef 
22923c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_rt(struct rq *rq);
22933c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_dl(struct rq *rq);
22943c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_irq(struct rq *rq);
22953c93a0c0SQais Yousef 
22963c93a0c0SQais Yousef int sched_trace_rq_cpu(struct rq *rq);
229751cf18c9SVincent Donnefort int sched_trace_rq_cpu_capacity(struct rq *rq);
22989d246053SPhil Auld int sched_trace_rq_nr_running(struct rq *rq);
22993c93a0c0SQais Yousef 
23003c93a0c0SQais Yousef const struct cpumask *sched_trace_rd_span(struct root_domain *rd);
23013c93a0c0SQais Yousef 
23026e33cad0SPeter Zijlstra #ifdef CONFIG_SCHED_CORE
23036e33cad0SPeter Zijlstra extern void sched_core_free(struct task_struct *tsk);
230485dd3f61SPeter Zijlstra extern void sched_core_fork(struct task_struct *p);
23057ac592aaSChris Hyser extern int sched_core_share_pid(unsigned int cmd, pid_t pid, enum pid_type type,
23067ac592aaSChris Hyser 				unsigned long uaddr);
23076e33cad0SPeter Zijlstra #else
23086e33cad0SPeter Zijlstra static inline void sched_core_free(struct task_struct *tsk) { }
230985dd3f61SPeter Zijlstra static inline void sched_core_fork(struct task_struct *p) { }
23106e33cad0SPeter Zijlstra #endif
23116e33cad0SPeter Zijlstra 
23121da177e4SLinus Torvalds #endif
2313