1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */ 21da177e4SLinus Torvalds #ifndef _LINUX_SCHED_H 31da177e4SLinus Torvalds #define _LINUX_SCHED_H 41da177e4SLinus Torvalds 55eca1c10SIngo Molnar /* 65eca1c10SIngo Molnar * Define 'struct task_struct' and provide the main scheduler 75eca1c10SIngo Molnar * APIs (schedule(), wakeup variants, etc.) 85eca1c10SIngo Molnar */ 95eca1c10SIngo Molnar 10607ca46eSDavid Howells #include <uapi/linux/sched.h> 11b7b3c76aSDavid Woodhouse 1270b8157eSIngo Molnar #include <asm/current.h> 1370b8157eSIngo Molnar 145eca1c10SIngo Molnar #include <linux/pid.h> 155eca1c10SIngo Molnar #include <linux/sem.h> 165eca1c10SIngo Molnar #include <linux/shm.h> 175eca1c10SIngo Molnar #include <linux/mutex.h> 185eca1c10SIngo Molnar #include <linux/plist.h> 195eca1c10SIngo Molnar #include <linux/hrtimer.h> 200584df9cSMarco Elver #include <linux/irqflags.h> 215eca1c10SIngo Molnar #include <linux/seccomp.h> 225eca1c10SIngo Molnar #include <linux/nodemask.h> 235eca1c10SIngo Molnar #include <linux/rcupdate.h> 24ec1d2819SElena Reshetova #include <linux/refcount.h> 255eca1c10SIngo Molnar #include <linux/resource.h> 265eca1c10SIngo Molnar #include <linux/latencytop.h> 275eca1c10SIngo Molnar #include <linux/sched/prio.h> 289eacb5c7SThomas Gleixner #include <linux/sched/types.h> 295eca1c10SIngo Molnar #include <linux/signal_types.h> 301446e1dfSGabriel Krisman Bertazi #include <linux/syscall_user_dispatch.h> 315eca1c10SIngo Molnar #include <linux/mm_types_task.h> 325eca1c10SIngo Molnar #include <linux/task_io_accounting.h> 332b69942fSThomas Gleixner #include <linux/posix-timers.h> 34d7822b1eSMathieu Desnoyers #include <linux/rseq.h> 350cd39f46SPeter Zijlstra #include <linux/seqlock.h> 36dfd402a4SMarco Elver #include <linux/kcsan.h> 37102227b9SDaniel Bristot de Oliveira #include <linux/rv.h> 385fbda3ecSThomas Gleixner #include <asm/kmap_size.h> 395eca1c10SIngo Molnar 405eca1c10SIngo Molnar /* task_struct member predeclarations (sorted 
alphabetically): */ 41c7af7877SIngo Molnar struct audit_context; 42c7af7877SIngo Molnar struct backing_dev_info; 43c7af7877SIngo Molnar struct bio_list; 44c7af7877SIngo Molnar struct blk_plug; 45a10787e6SSong Liu struct bpf_local_storage; 46c7603cfaSAndrii Nakryiko struct bpf_run_ctx; 473c93a0c0SQais Yousef struct capture_control; 48c7af7877SIngo Molnar struct cfs_rq; 49c7af7877SIngo Molnar struct fs_struct; 50c7af7877SIngo Molnar struct futex_pi_state; 51c7af7877SIngo Molnar struct io_context; 521875dc5bSPeter Oskolkov struct io_uring_task; 53c7af7877SIngo Molnar struct mempolicy; 54c7af7877SIngo Molnar struct nameidata; 55c7af7877SIngo Molnar struct nsproxy; 56c7af7877SIngo Molnar struct perf_event_context; 57c7af7877SIngo Molnar struct pid_namespace; 58c7af7877SIngo Molnar struct pipe_inode_info; 59c7af7877SIngo Molnar struct rcu_node; 60c7af7877SIngo Molnar struct reclaim_state; 61c7af7877SIngo Molnar struct robust_list_head; 623c93a0c0SQais Yousef struct root_domain; 633c93a0c0SQais Yousef struct rq; 64e2d1e2aeSIngo Molnar struct sched_attr; 65e2d1e2aeSIngo Molnar struct sched_param; 6643ae34cbSIngo Molnar struct seq_file; 67c7af7877SIngo Molnar struct sighand_struct; 68c7af7877SIngo Molnar struct signal_struct; 69c7af7877SIngo Molnar struct task_delay_info; 704cf86d77SIngo Molnar struct task_group; 711da177e4SLinus Torvalds 724a8342d2SLinus Torvalds /* 734a8342d2SLinus Torvalds * Task state bitmask. NOTE! These bits are also 744a8342d2SLinus Torvalds * encoded in fs/proc/array.c: get_task_state(). 754a8342d2SLinus Torvalds * 764a8342d2SLinus Torvalds * We have two separate sets of flags: task->state 774a8342d2SLinus Torvalds * is about runnability, while task->exit_state are 784a8342d2SLinus Torvalds * about the task exiting. Confusing, but this way 794a8342d2SLinus Torvalds * modifying one set can't modify the other one by 804a8342d2SLinus Torvalds * mistake. 
814a8342d2SLinus Torvalds */ 825eca1c10SIngo Molnar 835eca1c10SIngo Molnar /* Used in tsk->state: */ 8492c4bc9fSPeter Zijlstra #define TASK_RUNNING 0x0000 8592c4bc9fSPeter Zijlstra #define TASK_INTERRUPTIBLE 0x0001 8692c4bc9fSPeter Zijlstra #define TASK_UNINTERRUPTIBLE 0x0002 8792c4bc9fSPeter Zijlstra #define __TASK_STOPPED 0x0004 8892c4bc9fSPeter Zijlstra #define __TASK_TRACED 0x0008 895eca1c10SIngo Molnar /* Used in tsk->exit_state: */ 9092c4bc9fSPeter Zijlstra #define EXIT_DEAD 0x0010 9192c4bc9fSPeter Zijlstra #define EXIT_ZOMBIE 0x0020 92abd50b39SOleg Nesterov #define EXIT_TRACE (EXIT_ZOMBIE | EXIT_DEAD) 935eca1c10SIngo Molnar /* Used in tsk->state again: */ 948ef9925bSPeter Zijlstra #define TASK_PARKED 0x0040 958ef9925bSPeter Zijlstra #define TASK_DEAD 0x0080 968ef9925bSPeter Zijlstra #define TASK_WAKEKILL 0x0100 978ef9925bSPeter Zijlstra #define TASK_WAKING 0x0200 9892c4bc9fSPeter Zijlstra #define TASK_NOLOAD 0x0400 9992c4bc9fSPeter Zijlstra #define TASK_NEW 0x0800 100cd781d0cSThomas Gleixner /* RT specific auxilliary flag to mark RT lock waiters */ 101cd781d0cSThomas Gleixner #define TASK_RTLOCK_WAIT 0x1000 102cd781d0cSThomas Gleixner #define TASK_STATE_MAX 0x2000 103f021a3c2SMatthew Wilcox 1045eca1c10SIngo Molnar /* Convenience macros for the sake of set_current_state: */ 105f021a3c2SMatthew Wilcox #define TASK_KILLABLE (TASK_WAKEKILL | TASK_UNINTERRUPTIBLE) 106f021a3c2SMatthew Wilcox #define TASK_STOPPED (TASK_WAKEKILL | __TASK_STOPPED) 1072500ad1cSEric W. 
Biederman #define TASK_TRACED __TASK_TRACED 1081da177e4SLinus Torvalds 10980ed87c8SPeter Zijlstra #define TASK_IDLE (TASK_UNINTERRUPTIBLE | TASK_NOLOAD) 11080ed87c8SPeter Zijlstra 1115eca1c10SIngo Molnar /* Convenience macros for the sake of wake_up(): */ 11292a1f4bcSMatthew Wilcox #define TASK_NORMAL (TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE) 11392a1f4bcSMatthew Wilcox 1145eca1c10SIngo Molnar /* get_task_state(): */ 11592a1f4bcSMatthew Wilcox #define TASK_REPORT (TASK_RUNNING | TASK_INTERRUPTIBLE | \ 116f021a3c2SMatthew Wilcox TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \ 1178ef9925bSPeter Zijlstra __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \ 1188ef9925bSPeter Zijlstra TASK_PARKED) 11992a1f4bcSMatthew Wilcox 1202f064a59SPeter Zijlstra #define task_is_running(task) (READ_ONCE((task)->__state) == TASK_RUNNING) 1215eca1c10SIngo Molnar 12231cae1eaSPeter Zijlstra #define task_is_traced(task) ((READ_ONCE(task->jobctl) & JOBCTL_TRACED) != 0) 12331cae1eaSPeter Zijlstra #define task_is_stopped(task) ((READ_ONCE(task->jobctl) & JOBCTL_STOPPED) != 0) 12431cae1eaSPeter Zijlstra #define task_is_stopped_or_traced(task) ((READ_ONCE(task->jobctl) & (JOBCTL_STOPPED | JOBCTL_TRACED)) != 0) 1255eca1c10SIngo Molnar 126b5bf9a90SPeter Zijlstra /* 127b5bf9a90SPeter Zijlstra * Special states are those that do not use the normal wait-loop pattern. See 128b5bf9a90SPeter Zijlstra * the comment with set_special_state(). 
129b5bf9a90SPeter Zijlstra */ 130b5bf9a90SPeter Zijlstra #define is_special_task_state(state) \ 1311cef1150SPeter Zijlstra ((state) & (__TASK_STOPPED | __TASK_TRACED | TASK_PARKED | TASK_DEAD)) 132b5bf9a90SPeter Zijlstra 13385019c16SThomas Gleixner #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 13485019c16SThomas Gleixner # define debug_normal_state_change(state_value) \ 1358eb23b9fSPeter Zijlstra do { \ 136b5bf9a90SPeter Zijlstra WARN_ON_ONCE(is_special_task_state(state_value)); \ 1378eb23b9fSPeter Zijlstra current->task_state_change = _THIS_IP_; \ 1388eb23b9fSPeter Zijlstra } while (0) 139b5bf9a90SPeter Zijlstra 14085019c16SThomas Gleixner # define debug_special_state_change(state_value) \ 1418eb23b9fSPeter Zijlstra do { \ 142b5bf9a90SPeter Zijlstra WARN_ON_ONCE(!is_special_task_state(state_value)); \ 143b5bf9a90SPeter Zijlstra current->task_state_change = _THIS_IP_; \ 144b5bf9a90SPeter Zijlstra } while (0) 14585019c16SThomas Gleixner 1465f220be2SThomas Gleixner # define debug_rtlock_wait_set_state() \ 1475f220be2SThomas Gleixner do { \ 1485f220be2SThomas Gleixner current->saved_state_change = current->task_state_change;\ 1495f220be2SThomas Gleixner current->task_state_change = _THIS_IP_; \ 1505f220be2SThomas Gleixner } while (0) 1515f220be2SThomas Gleixner 1525f220be2SThomas Gleixner # define debug_rtlock_wait_restore_state() \ 1535f220be2SThomas Gleixner do { \ 1545f220be2SThomas Gleixner current->task_state_change = current->saved_state_change;\ 1555f220be2SThomas Gleixner } while (0) 1565f220be2SThomas Gleixner 1578eb23b9fSPeter Zijlstra #else 15885019c16SThomas Gleixner # define debug_normal_state_change(cond) do { } while (0) 15985019c16SThomas Gleixner # define debug_special_state_change(cond) do { } while (0) 1605f220be2SThomas Gleixner # define debug_rtlock_wait_set_state() do { } while (0) 1615f220be2SThomas Gleixner # define debug_rtlock_wait_restore_state() do { } while (0) 16285019c16SThomas Gleixner #endif 16385019c16SThomas Gleixner 164498d0c57SAndrew Morton /* 
165498d0c57SAndrew Morton * set_current_state() includes a barrier so that the write of current->state 166498d0c57SAndrew Morton * is correctly serialised wrt the caller's subsequent test of whether to 167498d0c57SAndrew Morton * actually sleep: 168498d0c57SAndrew Morton * 169a2250238SPeter Zijlstra * for (;;) { 170498d0c57SAndrew Morton * set_current_state(TASK_UNINTERRUPTIBLE); 17158877d34SPeter Zijlstra * if (CONDITION) 172a2250238SPeter Zijlstra * break; 173498d0c57SAndrew Morton * 174a2250238SPeter Zijlstra * schedule(); 175a2250238SPeter Zijlstra * } 176a2250238SPeter Zijlstra * __set_current_state(TASK_RUNNING); 177a2250238SPeter Zijlstra * 178a2250238SPeter Zijlstra * If the caller does not need such serialisation (because, for instance, the 17958877d34SPeter Zijlstra * CONDITION test and condition change and wakeup are under the same lock) then 180a2250238SPeter Zijlstra * use __set_current_state(). 181a2250238SPeter Zijlstra * 182a2250238SPeter Zijlstra * The above is typically ordered against the wakeup, which does: 183a2250238SPeter Zijlstra * 18458877d34SPeter Zijlstra * CONDITION = 1; 185a2250238SPeter Zijlstra * wake_up_state(p, TASK_UNINTERRUPTIBLE); 186a2250238SPeter Zijlstra * 18758877d34SPeter Zijlstra * where wake_up_state()/try_to_wake_up() executes a full memory barrier before 18858877d34SPeter Zijlstra * accessing p->state. 189a2250238SPeter Zijlstra * 190a2250238SPeter Zijlstra * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is, 191a2250238SPeter Zijlstra * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a 192a2250238SPeter Zijlstra * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING). 193a2250238SPeter Zijlstra * 194b5bf9a90SPeter Zijlstra * However, with slightly different timing the wakeup TASK_RUNNING store can 195dfcb245eSIngo Molnar * also collide with the TASK_UNINTERRUPTIBLE store. 
Losing that store is not 196b5bf9a90SPeter Zijlstra * a problem either because that will result in one extra go around the loop 197b5bf9a90SPeter Zijlstra * and our @cond test will save the day. 198a2250238SPeter Zijlstra * 199a2250238SPeter Zijlstra * Also see the comments of try_to_wake_up(). 200498d0c57SAndrew Morton */ 201b5bf9a90SPeter Zijlstra #define __set_current_state(state_value) \ 20285019c16SThomas Gleixner do { \ 20385019c16SThomas Gleixner debug_normal_state_change((state_value)); \ 20485019c16SThomas Gleixner WRITE_ONCE(current->__state, (state_value)); \ 20585019c16SThomas Gleixner } while (0) 206b5bf9a90SPeter Zijlstra 207b5bf9a90SPeter Zijlstra #define set_current_state(state_value) \ 20885019c16SThomas Gleixner do { \ 20985019c16SThomas Gleixner debug_normal_state_change((state_value)); \ 21085019c16SThomas Gleixner smp_store_mb(current->__state, (state_value)); \ 21185019c16SThomas Gleixner } while (0) 212b5bf9a90SPeter Zijlstra 213b5bf9a90SPeter Zijlstra /* 214b5bf9a90SPeter Zijlstra * set_special_state() should be used for those states when the blocking task 215b5bf9a90SPeter Zijlstra * can not use the regular condition based wait-loop. In that case we must 21685019c16SThomas Gleixner * serialize against wakeups such that any possible in-flight TASK_RUNNING 21785019c16SThomas Gleixner * stores will not collide with our state change. 
218b5bf9a90SPeter Zijlstra */ 219b5bf9a90SPeter Zijlstra #define set_special_state(state_value) \ 220b5bf9a90SPeter Zijlstra do { \ 221b5bf9a90SPeter Zijlstra unsigned long flags; /* may shadow */ \ 22285019c16SThomas Gleixner \ 223b5bf9a90SPeter Zijlstra raw_spin_lock_irqsave(¤t->pi_lock, flags); \ 22485019c16SThomas Gleixner debug_special_state_change((state_value)); \ 2252f064a59SPeter Zijlstra WRITE_ONCE(current->__state, (state_value)); \ 226b5bf9a90SPeter Zijlstra raw_spin_unlock_irqrestore(¤t->pi_lock, flags); \ 227b5bf9a90SPeter Zijlstra } while (0) 228b5bf9a90SPeter Zijlstra 2295f220be2SThomas Gleixner /* 2305f220be2SThomas Gleixner * PREEMPT_RT specific variants for "sleeping" spin/rwlocks 2315f220be2SThomas Gleixner * 2325f220be2SThomas Gleixner * RT's spin/rwlock substitutions are state preserving. The state of the 2335f220be2SThomas Gleixner * task when blocking on the lock is saved in task_struct::saved_state and 2345f220be2SThomas Gleixner * restored after the lock has been acquired. These operations are 2355f220be2SThomas Gleixner * serialized by task_struct::pi_lock against try_to_wake_up(). Any non RT 2365f220be2SThomas Gleixner * lock related wakeups while the task is blocked on the lock are 2375f220be2SThomas Gleixner * redirected to operate on task_struct::saved_state to ensure that these 2385f220be2SThomas Gleixner * are not dropped. On restore task_struct::saved_state is set to 2395f220be2SThomas Gleixner * TASK_RUNNING so any wakeup attempt redirected to saved_state will fail. 
2405f220be2SThomas Gleixner * 2415f220be2SThomas Gleixner * The lock operation looks like this: 2425f220be2SThomas Gleixner * 2435f220be2SThomas Gleixner * current_save_and_set_rtlock_wait_state(); 2445f220be2SThomas Gleixner * for (;;) { 2455f220be2SThomas Gleixner * if (try_lock()) 2465f220be2SThomas Gleixner * break; 2475f220be2SThomas Gleixner * raw_spin_unlock_irq(&lock->wait_lock); 2485f220be2SThomas Gleixner * schedule_rtlock(); 2495f220be2SThomas Gleixner * raw_spin_lock_irq(&lock->wait_lock); 2505f220be2SThomas Gleixner * set_current_state(TASK_RTLOCK_WAIT); 2515f220be2SThomas Gleixner * } 2525f220be2SThomas Gleixner * current_restore_rtlock_saved_state(); 2535f220be2SThomas Gleixner */ 2545f220be2SThomas Gleixner #define current_save_and_set_rtlock_wait_state() \ 2555f220be2SThomas Gleixner do { \ 2565f220be2SThomas Gleixner lockdep_assert_irqs_disabled(); \ 2575f220be2SThomas Gleixner raw_spin_lock(¤t->pi_lock); \ 2585f220be2SThomas Gleixner current->saved_state = current->__state; \ 2595f220be2SThomas Gleixner debug_rtlock_wait_set_state(); \ 2605f220be2SThomas Gleixner WRITE_ONCE(current->__state, TASK_RTLOCK_WAIT); \ 2615f220be2SThomas Gleixner raw_spin_unlock(¤t->pi_lock); \ 2625f220be2SThomas Gleixner } while (0); 2635f220be2SThomas Gleixner 2645f220be2SThomas Gleixner #define current_restore_rtlock_saved_state() \ 2655f220be2SThomas Gleixner do { \ 2665f220be2SThomas Gleixner lockdep_assert_irqs_disabled(); \ 2675f220be2SThomas Gleixner raw_spin_lock(¤t->pi_lock); \ 2685f220be2SThomas Gleixner debug_rtlock_wait_restore_state(); \ 2695f220be2SThomas Gleixner WRITE_ONCE(current->__state, current->saved_state); \ 2705f220be2SThomas Gleixner current->saved_state = TASK_RUNNING; \ 2715f220be2SThomas Gleixner raw_spin_unlock(¤t->pi_lock); \ 2725f220be2SThomas Gleixner } while (0); 2738eb23b9fSPeter Zijlstra 2742f064a59SPeter Zijlstra #define get_current_state() READ_ONCE(current->__state) 275d6c23bb3SPeter Zijlstra 2763087c61eSYafang Shao /* 
2773087c61eSYafang Shao * Define the task command name length as enum, then it can be visible to 2783087c61eSYafang Shao * BPF programs. 2793087c61eSYafang Shao */ 2803087c61eSYafang Shao enum { 2813087c61eSYafang Shao TASK_COMM_LEN = 16, 2823087c61eSYafang Shao }; 2831da177e4SLinus Torvalds 2841da177e4SLinus Torvalds extern void scheduler_tick(void); 2851da177e4SLinus Torvalds 2861da177e4SLinus Torvalds #define MAX_SCHEDULE_TIMEOUT LONG_MAX 2875eca1c10SIngo Molnar 2885eca1c10SIngo Molnar extern long schedule_timeout(long timeout); 2895eca1c10SIngo Molnar extern long schedule_timeout_interruptible(long timeout); 2905eca1c10SIngo Molnar extern long schedule_timeout_killable(long timeout); 2915eca1c10SIngo Molnar extern long schedule_timeout_uninterruptible(long timeout); 2925eca1c10SIngo Molnar extern long schedule_timeout_idle(long timeout); 2931da177e4SLinus Torvalds asmlinkage void schedule(void); 294c5491ea7SThomas Gleixner extern void schedule_preempt_disabled(void); 29519c95f26SJulien Thierry asmlinkage void preempt_schedule_irq(void); 2966991436cSThomas Gleixner #ifdef CONFIG_PREEMPT_RT 2976991436cSThomas Gleixner extern void schedule_rtlock(void); 2986991436cSThomas Gleixner #endif 2991da177e4SLinus Torvalds 30010ab5643STejun Heo extern int __must_check io_schedule_prepare(void); 30110ab5643STejun Heo extern void io_schedule_finish(int token); 3029cff8adeSNeilBrown extern long io_schedule_timeout(long timeout); 30310ab5643STejun Heo extern void io_schedule(void); 3049cff8adeSNeilBrown 305f06febc9SFrank Mayhar /** 3060ba42a59SMasanari Iida * struct prev_cputime - snapshot of system and user cputime 307d37f761dSFrederic Weisbecker * @utime: time spent in user mode 308d37f761dSFrederic Weisbecker * @stime: time spent in system mode 3099d7fb042SPeter Zijlstra * @lock: protects the above two fields 310d37f761dSFrederic Weisbecker * 3119d7fb042SPeter Zijlstra * Stores previous user/system time values such that we can guarantee 3129d7fb042SPeter Zijlstra * 
monotonicity. 313d37f761dSFrederic Weisbecker */ 3149d7fb042SPeter Zijlstra struct prev_cputime { 3159d7fb042SPeter Zijlstra #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE 3165613fda9SFrederic Weisbecker u64 utime; 3175613fda9SFrederic Weisbecker u64 stime; 3189d7fb042SPeter Zijlstra raw_spinlock_t lock; 3199d7fb042SPeter Zijlstra #endif 320d37f761dSFrederic Weisbecker }; 321d37f761dSFrederic Weisbecker 322bac5b6b6SFrederic Weisbecker enum vtime_state { 323bac5b6b6SFrederic Weisbecker /* Task is sleeping or running in a CPU with VTIME inactive: */ 324bac5b6b6SFrederic Weisbecker VTIME_INACTIVE = 0, 32514faf6fcSFrederic Weisbecker /* Task is idle */ 32614faf6fcSFrederic Weisbecker VTIME_IDLE, 327bac5b6b6SFrederic Weisbecker /* Task runs in kernelspace in a CPU with VTIME active: */ 328bac5b6b6SFrederic Weisbecker VTIME_SYS, 32914faf6fcSFrederic Weisbecker /* Task runs in userspace in a CPU with VTIME active: */ 33014faf6fcSFrederic Weisbecker VTIME_USER, 331e6d5bf3eSFrederic Weisbecker /* Task runs as guests in a CPU with VTIME active: */ 332e6d5bf3eSFrederic Weisbecker VTIME_GUEST, 333bac5b6b6SFrederic Weisbecker }; 334bac5b6b6SFrederic Weisbecker 335bac5b6b6SFrederic Weisbecker struct vtime { 336bac5b6b6SFrederic Weisbecker seqcount_t seqcount; 337bac5b6b6SFrederic Weisbecker unsigned long long starttime; 338bac5b6b6SFrederic Weisbecker enum vtime_state state; 339802f4a82SFrederic Weisbecker unsigned int cpu; 3402a42eb95SWanpeng Li u64 utime; 3412a42eb95SWanpeng Li u64 stime; 3422a42eb95SWanpeng Li u64 gtime; 343bac5b6b6SFrederic Weisbecker }; 344bac5b6b6SFrederic Weisbecker 34569842cbaSPatrick Bellasi /* 34669842cbaSPatrick Bellasi * Utilization clamp constraints. 
34769842cbaSPatrick Bellasi * @UCLAMP_MIN: Minimum utilization 34869842cbaSPatrick Bellasi * @UCLAMP_MAX: Maximum utilization 34969842cbaSPatrick Bellasi * @UCLAMP_CNT: Utilization clamp constraints count 35069842cbaSPatrick Bellasi */ 35169842cbaSPatrick Bellasi enum uclamp_id { 35269842cbaSPatrick Bellasi UCLAMP_MIN = 0, 35369842cbaSPatrick Bellasi UCLAMP_MAX, 35469842cbaSPatrick Bellasi UCLAMP_CNT 35569842cbaSPatrick Bellasi }; 35669842cbaSPatrick Bellasi 357f9a25f77SMathieu Poirier #ifdef CONFIG_SMP 358f9a25f77SMathieu Poirier extern struct root_domain def_root_domain; 359f9a25f77SMathieu Poirier extern struct mutex sched_domains_mutex; 360f9a25f77SMathieu Poirier #endif 361f9a25f77SMathieu Poirier 3621da177e4SLinus Torvalds struct sched_info { 3637f5f8e8dSIngo Molnar #ifdef CONFIG_SCHED_INFO 3645eca1c10SIngo Molnar /* Cumulative counters: */ 3651da177e4SLinus Torvalds 3665eca1c10SIngo Molnar /* # of times we have run on this CPU: */ 3675eca1c10SIngo Molnar unsigned long pcount; 3685eca1c10SIngo Molnar 3695eca1c10SIngo Molnar /* Time spent waiting on a runqueue: */ 3705eca1c10SIngo Molnar unsigned long long run_delay; 3715eca1c10SIngo Molnar 3725eca1c10SIngo Molnar /* Timestamps: */ 3735eca1c10SIngo Molnar 3745eca1c10SIngo Molnar /* When did we last run on a CPU? */ 3755eca1c10SIngo Molnar unsigned long long last_arrival; 3765eca1c10SIngo Molnar 3775eca1c10SIngo Molnar /* When were we last queued to run? */ 3785eca1c10SIngo Molnar unsigned long long last_queued; 3795eca1c10SIngo Molnar 380f6db8347SNaveen N. Rao #endif /* CONFIG_SCHED_INFO */ 3817f5f8e8dSIngo Molnar }; 3821da177e4SLinus Torvalds 3831da177e4SLinus Torvalds /* 3846ecdd749SYuyang Du * Integer metrics need fixed point arithmetic, e.g., sched/fair 3856ecdd749SYuyang Du * has a few: load, load_avg, util_avg, freq, and capacity. 
3866ecdd749SYuyang Du * 3876ecdd749SYuyang Du * We define a basic fixed point arithmetic range, and then formalize 3886ecdd749SYuyang Du * all these metrics based on that basic range. 3896ecdd749SYuyang Du */ 3906ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SHIFT 10 3916ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SCALE (1L << SCHED_FIXEDPOINT_SHIFT) 3926ecdd749SYuyang Du 39369842cbaSPatrick Bellasi /* Increase resolution of cpu_capacity calculations */ 39469842cbaSPatrick Bellasi # define SCHED_CAPACITY_SHIFT SCHED_FIXEDPOINT_SHIFT 39569842cbaSPatrick Bellasi # define SCHED_CAPACITY_SCALE (1L << SCHED_CAPACITY_SHIFT) 39669842cbaSPatrick Bellasi 39720b8a59fSIngo Molnar struct load_weight { 3989dbdb155SPeter Zijlstra unsigned long weight; 3999dbdb155SPeter Zijlstra u32 inv_weight; 40020b8a59fSIngo Molnar }; 40120b8a59fSIngo Molnar 4027f65ea42SPatrick Bellasi /** 4037f65ea42SPatrick Bellasi * struct util_est - Estimation utilization of FAIR tasks 4047f65ea42SPatrick Bellasi * @enqueued: instantaneous estimated utilization of a task/cpu 4057f65ea42SPatrick Bellasi * @ewma: the Exponential Weighted Moving Average (EWMA) 4067f65ea42SPatrick Bellasi * utilization of a task 4077f65ea42SPatrick Bellasi * 4087f65ea42SPatrick Bellasi * Support data structure to track an Exponential Weighted Moving Average 4097f65ea42SPatrick Bellasi * (EWMA) of a FAIR task's utilization. New samples are added to the moving 4107f65ea42SPatrick Bellasi * average each time a task completes an activation. Sample's weight is chosen 4117f65ea42SPatrick Bellasi * so that the EWMA will be relatively insensitive to transient changes to the 4127f65ea42SPatrick Bellasi * task's workload. 
4137f65ea42SPatrick Bellasi * 4147f65ea42SPatrick Bellasi * The enqueued attribute has a slightly different meaning for tasks and cpus: 4157f65ea42SPatrick Bellasi * - task: the task's util_avg at last task dequeue time 4167f65ea42SPatrick Bellasi * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU 4177f65ea42SPatrick Bellasi * Thus, the util_est.enqueued of a task represents the contribution on the 4187f65ea42SPatrick Bellasi * estimated utilization of the CPU where that task is currently enqueued. 4197f65ea42SPatrick Bellasi * 4207f65ea42SPatrick Bellasi * Only for tasks we track a moving average of the past instantaneous 4217f65ea42SPatrick Bellasi * estimated utilization. This allows to absorb sporadic drops in utilization 4227f65ea42SPatrick Bellasi * of an otherwise almost periodic task. 42368d7a190SDietmar Eggemann * 42468d7a190SDietmar Eggemann * The UTIL_AVG_UNCHANGED flag is used to synchronize util_est with util_avg 42568d7a190SDietmar Eggemann * updates. When a task is dequeued, its util_est should not be updated if its 42668d7a190SDietmar Eggemann * util_avg has not been updated in the meantime. 42768d7a190SDietmar Eggemann * This information is mapped into the MSB bit of util_est.enqueued at dequeue 42868d7a190SDietmar Eggemann * time. Since max value of util_est.enqueued for a task is 1024 (PELT util_avg 42968d7a190SDietmar Eggemann * for a task) it is safe to use MSB. 
4307f65ea42SPatrick Bellasi */ 4317f65ea42SPatrick Bellasi struct util_est { 4327f65ea42SPatrick Bellasi unsigned int enqueued; 4337f65ea42SPatrick Bellasi unsigned int ewma; 4347f65ea42SPatrick Bellasi #define UTIL_EST_WEIGHT_SHIFT 2 43568d7a190SDietmar Eggemann #define UTIL_AVG_UNCHANGED 0x80000000 436317d359dSPeter Zijlstra } __attribute__((__aligned__(sizeof(u64)))); 4377f65ea42SPatrick Bellasi 4389d89c257SYuyang Du /* 4399f683953SVincent Guittot * The load/runnable/util_avg accumulates an infinite geometric series 4400dacee1bSVincent Guittot * (see __update_load_avg_cfs_rq() in kernel/sched/pelt.c). 4417b595334SYuyang Du * 4427b595334SYuyang Du * [load_avg definition] 4437b595334SYuyang Du * 4447b595334SYuyang Du * load_avg = runnable% * scale_load_down(load) 4457b595334SYuyang Du * 4469f683953SVincent Guittot * [runnable_avg definition] 4479f683953SVincent Guittot * 4489f683953SVincent Guittot * runnable_avg = runnable% * SCHED_CAPACITY_SCALE 4497b595334SYuyang Du * 4507b595334SYuyang Du * [util_avg definition] 4517b595334SYuyang Du * 4527b595334SYuyang Du * util_avg = running% * SCHED_CAPACITY_SCALE 4537b595334SYuyang Du * 4549f683953SVincent Guittot * where runnable% is the time ratio that a sched_entity is runnable and 4559f683953SVincent Guittot * running% the time ratio that a sched_entity is running. 4567b595334SYuyang Du * 4579f683953SVincent Guittot * For cfs_rq, they are the aggregated values of all runnable and blocked 4589f683953SVincent Guittot * sched_entities. 4599f683953SVincent Guittot * 460c1b7b8d4S王文虎 * The load/runnable/util_avg doesn't directly factor frequency scaling and CPU 4619f683953SVincent Guittot * capacity scaling. The scaling is done through the rq_clock_pelt that is used 4629f683953SVincent Guittot * for computing those signals (see update_rq_clock_pelt()) 4637b595334SYuyang Du * 46423127296SVincent Guittot * N.B., the above ratios (runnable% and running%) themselves are in the 46523127296SVincent Guittot * range of [0, 1]. 
To do fixed point arithmetics, we therefore scale them 46623127296SVincent Guittot * to as large a range as necessary. This is for example reflected by 46723127296SVincent Guittot * util_avg's SCHED_CAPACITY_SCALE. 4687b595334SYuyang Du * 4697b595334SYuyang Du * [Overflow issue] 4707b595334SYuyang Du * 4717b595334SYuyang Du * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities 4727b595334SYuyang Du * with the highest load (=88761), always runnable on a single cfs_rq, 4737b595334SYuyang Du * and should not overflow as the number already hits PID_MAX_LIMIT. 4747b595334SYuyang Du * 4757b595334SYuyang Du * For all other cases (including 32-bit kernels), struct load_weight's 4767b595334SYuyang Du * weight will overflow first before we do, because: 4777b595334SYuyang Du * 4787b595334SYuyang Du * Max(load_avg) <= Max(load.weight) 4797b595334SYuyang Du * 4807b595334SYuyang Du * Then it is the load_weight's responsibility to consider overflow 4817b595334SYuyang Du * issues. 4829d89c257SYuyang Du */ 4839d85f21cSPaul Turner struct sched_avg { 4845eca1c10SIngo Molnar u64 last_update_time; 4855eca1c10SIngo Molnar u64 load_sum; 4869f683953SVincent Guittot u64 runnable_sum; 4875eca1c10SIngo Molnar u32 util_sum; 4885eca1c10SIngo Molnar u32 period_contrib; 4895eca1c10SIngo Molnar unsigned long load_avg; 4909f683953SVincent Guittot unsigned long runnable_avg; 4915eca1c10SIngo Molnar unsigned long util_avg; 4927f65ea42SPatrick Bellasi struct util_est util_est; 493317d359dSPeter Zijlstra } ____cacheline_aligned; 4949d85f21cSPaul Turner 49541acab88SLucas De Marchi struct sched_statistics { 4967f5f8e8dSIngo Molnar #ifdef CONFIG_SCHEDSTATS 49794c18227SIngo Molnar u64 wait_start; 49894c18227SIngo Molnar u64 wait_max; 4996d082592SArjan van de Ven u64 wait_count; 5006d082592SArjan van de Ven u64 wait_sum; 5018f0dfc34SArjan van de Ven u64 iowait_count; 5028f0dfc34SArjan van de Ven u64 iowait_sum; 50394c18227SIngo Molnar 50494c18227SIngo Molnar u64 sleep_start; 
50520b8a59fSIngo Molnar u64 sleep_max; 50694c18227SIngo Molnar s64 sum_sleep_runtime; 50794c18227SIngo Molnar 50894c18227SIngo Molnar u64 block_start; 50920b8a59fSIngo Molnar u64 block_max; 510847fc0cdSYafang Shao s64 sum_block_runtime; 511847fc0cdSYafang Shao 51220b8a59fSIngo Molnar u64 exec_max; 513eba1ed4bSIngo Molnar u64 slice_max; 514cc367732SIngo Molnar 515cc367732SIngo Molnar u64 nr_migrations_cold; 516cc367732SIngo Molnar u64 nr_failed_migrations_affine; 517cc367732SIngo Molnar u64 nr_failed_migrations_running; 518cc367732SIngo Molnar u64 nr_failed_migrations_hot; 519cc367732SIngo Molnar u64 nr_forced_migrations; 520cc367732SIngo Molnar 521cc367732SIngo Molnar u64 nr_wakeups; 522cc367732SIngo Molnar u64 nr_wakeups_sync; 523cc367732SIngo Molnar u64 nr_wakeups_migrate; 524cc367732SIngo Molnar u64 nr_wakeups_local; 525cc367732SIngo Molnar u64 nr_wakeups_remote; 526cc367732SIngo Molnar u64 nr_wakeups_affine; 527cc367732SIngo Molnar u64 nr_wakeups_affine_attempts; 528cc367732SIngo Molnar u64 nr_wakeups_passive; 529cc367732SIngo Molnar u64 nr_wakeups_idle; 5304feee7d1SJosh Don 5314feee7d1SJosh Don #ifdef CONFIG_SCHED_CORE 5324feee7d1SJosh Don u64 core_forceidle_sum; 53341acab88SLucas De Marchi #endif 5344feee7d1SJosh Don #endif /* CONFIG_SCHEDSTATS */ 535ceeadb83SYafang Shao } ____cacheline_aligned; 53641acab88SLucas De Marchi 53741acab88SLucas De Marchi struct sched_entity { 5385eca1c10SIngo Molnar /* For load-balancing: */ 5395eca1c10SIngo Molnar struct load_weight load; 54041acab88SLucas De Marchi struct rb_node run_node; 54141acab88SLucas De Marchi struct list_head group_node; 54241acab88SLucas De Marchi unsigned int on_rq; 54341acab88SLucas De Marchi 54441acab88SLucas De Marchi u64 exec_start; 54541acab88SLucas De Marchi u64 sum_exec_runtime; 54641acab88SLucas De Marchi u64 vruntime; 54741acab88SLucas De Marchi u64 prev_sum_exec_runtime; 54841acab88SLucas De Marchi 54941acab88SLucas De Marchi u64 nr_migrations; 55041acab88SLucas De Marchi 55120b8a59fSIngo 
Molnar #ifdef CONFIG_FAIR_GROUP_SCHED 552fed14d45SPeter Zijlstra int depth; 55320b8a59fSIngo Molnar struct sched_entity *parent; 55420b8a59fSIngo Molnar /* rq on which this entity is (to be) queued: */ 55520b8a59fSIngo Molnar struct cfs_rq *cfs_rq; 55620b8a59fSIngo Molnar /* rq "owned" by this entity/group: */ 55720b8a59fSIngo Molnar struct cfs_rq *my_q; 5589f683953SVincent Guittot /* cached value of my_q->h_nr_running */ 5599f683953SVincent Guittot unsigned long runnable_weight; 56020b8a59fSIngo Molnar #endif 5618bd75c77SClark Williams 562141965c7SAlex Shi #ifdef CONFIG_SMP 5635a107804SJiri Olsa /* 5645a107804SJiri Olsa * Per entity load average tracking. 5655a107804SJiri Olsa * 5665a107804SJiri Olsa * Put into separate cache line so it does not 5675a107804SJiri Olsa * collide with read-mostly values above. 5685a107804SJiri Olsa */ 569317d359dSPeter Zijlstra struct sched_avg avg; 5709d85f21cSPaul Turner #endif 57120b8a59fSIngo Molnar }; 57270b97a7fSIngo Molnar 573fa717060SPeter Zijlstra struct sched_rt_entity { 574fa717060SPeter Zijlstra struct list_head run_list; 57578f2c7dbSPeter Zijlstra unsigned long timeout; 57657d2aa00SYing Xue unsigned long watchdog_stamp; 577bee367edSRichard Kennedy unsigned int time_slice; 578ff77e468SPeter Zijlstra unsigned short on_rq; 579ff77e468SPeter Zijlstra unsigned short on_list; 5806f505b16SPeter Zijlstra 58158d6c2d7SPeter Zijlstra struct sched_rt_entity *back; 582052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED 5836f505b16SPeter Zijlstra struct sched_rt_entity *parent; 5846f505b16SPeter Zijlstra /* rq on which this entity is (to be) queued: */ 5856f505b16SPeter Zijlstra struct rt_rq *rt_rq; 5866f505b16SPeter Zijlstra /* rq "owned" by this entity/group: */ 5876f505b16SPeter Zijlstra struct rt_rq *my_q; 5886f505b16SPeter Zijlstra #endif 5893859a271SKees Cook } __randomize_layout; 590fa717060SPeter Zijlstra 591aab03e05SDario Faggioli struct sched_dl_entity { 592aab03e05SDario Faggioli struct rb_node rb_node; 593aab03e05SDario 
Faggioli 594aab03e05SDario Faggioli /* 595aab03e05SDario Faggioli * Original scheduling parameters. Copied here from sched_attr 5964027d080Sxiaofeng.yan * during sched_setattr(), they will remain the same until 5974027d080Sxiaofeng.yan * the next sched_setattr(). 598aab03e05SDario Faggioli */ 5995eca1c10SIngo Molnar u64 dl_runtime; /* Maximum runtime for each instance */ 6005eca1c10SIngo Molnar u64 dl_deadline; /* Relative deadline of each instance */ 6015eca1c10SIngo Molnar u64 dl_period; /* Separation of two instances (period) */ 60254d6d303SDaniel Bristot de Oliveira u64 dl_bw; /* dl_runtime / dl_period */ 6033effcb42SDaniel Bristot de Oliveira u64 dl_density; /* dl_runtime / dl_deadline */ 604aab03e05SDario Faggioli 605aab03e05SDario Faggioli /* 606aab03e05SDario Faggioli * Actual scheduling parameters. Initialized with the values above, 607dfcb245eSIngo Molnar * they are continuously updated during task execution. Note that 608aab03e05SDario Faggioli * the remaining runtime could be < 0 in case we are in overrun. 609aab03e05SDario Faggioli */ 6105eca1c10SIngo Molnar s64 runtime; /* Remaining runtime for this instance */ 6115eca1c10SIngo Molnar u64 deadline; /* Absolute deadline for this instance */ 6125eca1c10SIngo Molnar unsigned int flags; /* Specifying the scheduler behaviour */ 613aab03e05SDario Faggioli 614aab03e05SDario Faggioli /* 615aab03e05SDario Faggioli * Some bool flags: 616aab03e05SDario Faggioli * 617aab03e05SDario Faggioli * @dl_throttled tells if we exhausted the runtime. If so, the 618aab03e05SDario Faggioli * task has to wait for a replenishment to be performed at the 619aab03e05SDario Faggioli * next firing of dl_timer. 620aab03e05SDario Faggioli * 6215eca1c10SIngo Molnar * @dl_yielded tells if task gave up the CPU before consuming 6225bfd126eSJuri Lelli * all its available runtime during the last job. 
623209a0cbdSLuca Abeni * 624209a0cbdSLuca Abeni * @dl_non_contending tells if the task is inactive while still 625209a0cbdSLuca Abeni * contributing to the active utilization. In other words, it 626209a0cbdSLuca Abeni * indicates if the inactive timer has been armed and its handler 627209a0cbdSLuca Abeni * has not been executed yet. This flag is useful to avoid race 628209a0cbdSLuca Abeni * conditions between the inactive timer handler and the wakeup 629209a0cbdSLuca Abeni * code. 63034be3930SJuri Lelli * 63134be3930SJuri Lelli * @dl_overrun tells if the task asked to be informed about runtime 63234be3930SJuri Lelli * overruns. 633aab03e05SDario Faggioli */ 634aa5222e9SDan Carpenter unsigned int dl_throttled : 1; 635aa5222e9SDan Carpenter unsigned int dl_yielded : 1; 636aa5222e9SDan Carpenter unsigned int dl_non_contending : 1; 63734be3930SJuri Lelli unsigned int dl_overrun : 1; 638aab03e05SDario Faggioli 639aab03e05SDario Faggioli /* 640aab03e05SDario Faggioli * Bandwidth enforcement timer. Each -deadline task has its 641aab03e05SDario Faggioli * own bandwidth to be enforced, thus we need one timer per task. 642aab03e05SDario Faggioli */ 643aab03e05SDario Faggioli struct hrtimer dl_timer; 644209a0cbdSLuca Abeni 645209a0cbdSLuca Abeni /* 646209a0cbdSLuca Abeni * Inactive timer, responsible for decreasing the active utilization 647209a0cbdSLuca Abeni * at the "0-lag time". When a -deadline task blocks, it contributes 648209a0cbdSLuca Abeni * to GRUB's active utilization until the "0-lag time", hence a 649209a0cbdSLuca Abeni * timer is needed to decrease the active utilization at the correct 650209a0cbdSLuca Abeni * time. 651209a0cbdSLuca Abeni */ 652209a0cbdSLuca Abeni struct hrtimer inactive_timer; 6532279f540SJuri Lelli 6542279f540SJuri Lelli #ifdef CONFIG_RT_MUTEXES 6552279f540SJuri Lelli /* 6562279f540SJuri Lelli * Priority Inheritance. 
When a DEADLINE scheduling entity is boosted 6572279f540SJuri Lelli * pi_se points to the donor, otherwise points to the dl_se it belongs 6582279f540SJuri Lelli * to (the original one/itself). 6592279f540SJuri Lelli */ 6602279f540SJuri Lelli struct sched_dl_entity *pi_se; 6612279f540SJuri Lelli #endif 662aab03e05SDario Faggioli }; 6638bd75c77SClark Williams 66469842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 66569842cbaSPatrick Bellasi /* Number of utilization clamp buckets (shorter alias) */ 66669842cbaSPatrick Bellasi #define UCLAMP_BUCKETS CONFIG_UCLAMP_BUCKETS_COUNT 66769842cbaSPatrick Bellasi 66869842cbaSPatrick Bellasi /* 66969842cbaSPatrick Bellasi * Utilization clamp for a scheduling entity 67069842cbaSPatrick Bellasi * @value: clamp value "assigned" to a se 67169842cbaSPatrick Bellasi * @bucket_id: bucket index corresponding to the "assigned" value 672e8f14172SPatrick Bellasi * @active: the se is currently refcounted in a rq's bucket 673a509a7cdSPatrick Bellasi * @user_defined: the requested clamp value comes from user-space 67469842cbaSPatrick Bellasi * 67569842cbaSPatrick Bellasi * The bucket_id is the index of the clamp bucket matching the clamp value 67669842cbaSPatrick Bellasi * which is pre-computed and stored to avoid expensive integer divisions from 67769842cbaSPatrick Bellasi * the fast path. 678e8f14172SPatrick Bellasi * 679e8f14172SPatrick Bellasi * The active bit is set whenever a task has got an "effective" value assigned, 680e8f14172SPatrick Bellasi * which can be different from the clamp value "requested" from user-space. 681e8f14172SPatrick Bellasi * This allows to know a task is refcounted in the rq's bucket corresponding 682e8f14172SPatrick Bellasi * to the "effective" bucket_id. 683a509a7cdSPatrick Bellasi * 684a509a7cdSPatrick Bellasi * The user_defined bit is set whenever a task has got a task-specific clamp 685a509a7cdSPatrick Bellasi * value requested from userspace, i.e. 
the system defaults apply to this task 686a509a7cdSPatrick Bellasi * just as a restriction. This allows to relax default clamps when a less 687a509a7cdSPatrick Bellasi * restrictive task-specific value has been requested, thus allowing to 688a509a7cdSPatrick Bellasi * implement a "nice" semantic. For example, a task running with a 20% 689a509a7cdSPatrick Bellasi * default boost can still drop its own boosting to 0%. 69069842cbaSPatrick Bellasi */ 69169842cbaSPatrick Bellasi struct uclamp_se { 69269842cbaSPatrick Bellasi unsigned int value : bits_per(SCHED_CAPACITY_SCALE); 69369842cbaSPatrick Bellasi unsigned int bucket_id : bits_per(UCLAMP_BUCKETS); 694e8f14172SPatrick Bellasi unsigned int active : 1; 695a509a7cdSPatrick Bellasi unsigned int user_defined : 1; 69669842cbaSPatrick Bellasi }; 69769842cbaSPatrick Bellasi #endif /* CONFIG_UCLAMP_TASK */ 69869842cbaSPatrick Bellasi 6991d082fd0SPaul E. McKenney union rcu_special { 7001d082fd0SPaul E. McKenney struct { 7018203d6d0SPaul E. McKenney u8 blocked; 7028203d6d0SPaul E. McKenney u8 need_qs; 70305f41571SPaul E. McKenney u8 exp_hint; /* Hint for performance. */ 704276c4104SPaul E. McKenney u8 need_mb; /* Readers need smp_mb(). */ 7058203d6d0SPaul E. McKenney } b; /* Bits. */ 70605f41571SPaul E. McKenney u32 s; /* Set of bits. */ 7071d082fd0SPaul E. McKenney }; 70886848966SPaul E. 
McKenney 7098dc85d54SPeter Zijlstra enum perf_event_task_context { 7108dc85d54SPeter Zijlstra perf_invalid_context = -1, 7118dc85d54SPeter Zijlstra perf_hw_context = 0, 71289a1e187SPeter Zijlstra perf_sw_context, 7138dc85d54SPeter Zijlstra perf_nr_task_contexts, 7148dc85d54SPeter Zijlstra }; 7158dc85d54SPeter Zijlstra 716eb61baf6SIngo Molnar struct wake_q_node { 717eb61baf6SIngo Molnar struct wake_q_node *next; 718eb61baf6SIngo Molnar }; 719eb61baf6SIngo Molnar 7205fbda3ecSThomas Gleixner struct kmap_ctrl { 7215fbda3ecSThomas Gleixner #ifdef CONFIG_KMAP_LOCAL 7225fbda3ecSThomas Gleixner int idx; 7235fbda3ecSThomas Gleixner pte_t pteval[KM_MAX_IDX]; 7245fbda3ecSThomas Gleixner #endif 7255fbda3ecSThomas Gleixner }; 7265fbda3ecSThomas Gleixner 7271da177e4SLinus Torvalds struct task_struct { 728c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 729c65eacbeSAndy Lutomirski /* 730c65eacbeSAndy Lutomirski * For reasons of header soup (see current_thread_info()), this 731c65eacbeSAndy Lutomirski * must be the first element of task_struct. 732c65eacbeSAndy Lutomirski */ 733c65eacbeSAndy Lutomirski struct thread_info thread_info; 734c65eacbeSAndy Lutomirski #endif 7352f064a59SPeter Zijlstra unsigned int __state; 73629e48ce8SKees Cook 7375f220be2SThomas Gleixner #ifdef CONFIG_PREEMPT_RT 7385f220be2SThomas Gleixner /* saved state for "spinlock sleepers" */ 7395f220be2SThomas Gleixner unsigned int saved_state; 7405f220be2SThomas Gleixner #endif 7415f220be2SThomas Gleixner 74229e48ce8SKees Cook /* 74329e48ce8SKees Cook * This begins the randomizable portion of task_struct. Only 74429e48ce8SKees Cook * scheduling-critical items should be added above here. 
74529e48ce8SKees Cook */ 74629e48ce8SKees Cook randomized_struct_fields_start 74729e48ce8SKees Cook 748f7e4217bSRoman Zippel void *stack; 749ec1d2819SElena Reshetova refcount_t usage; 7505eca1c10SIngo Molnar /* Per task flags (PF_*), defined further below: */ 7515eca1c10SIngo Molnar unsigned int flags; 75297dc32cdSWilliam Cohen unsigned int ptrace; 7531da177e4SLinus Torvalds 7542dd73a4fSPeter Williams #ifdef CONFIG_SMP 7553ca7a440SPeter Zijlstra int on_cpu; 7568c4890d1SPeter Zijlstra struct __call_single_node wake_entry; 75763b0e9edSMike Galbraith unsigned int wakee_flips; 75862470419SMichael Wang unsigned long wakee_flip_decay_ts; 75963b0e9edSMike Galbraith struct task_struct *last_wakee; 760ac66f547SPeter Zijlstra 76132e839ddSMel Gorman /* 76232e839ddSMel Gorman * recent_used_cpu is initially set as the last CPU used by a task 76332e839ddSMel Gorman * that wakes affine another task. Waker/wakee relationships can 76432e839ddSMel Gorman * push tasks around a CPU where each wakeup moves to the next one. 76532e839ddSMel Gorman * Tracking a recently used CPU allows a quick search for a recently 76632e839ddSMel Gorman * used CPU that may be idle. 
76732e839ddSMel Gorman */ 76832e839ddSMel Gorman int recent_used_cpu; 769ac66f547SPeter Zijlstra int wake_cpu; 7704866cde0SNick Piggin #endif 771fd2f4419SPeter Zijlstra int on_rq; 77250e645a8SIngo Molnar 7735eca1c10SIngo Molnar int prio; 7745eca1c10SIngo Molnar int static_prio; 7755eca1c10SIngo Molnar int normal_prio; 776c7aceabaSRichard Kennedy unsigned int rt_priority; 7775eca1c10SIngo Molnar 77820b8a59fSIngo Molnar struct sched_entity se; 779fa717060SPeter Zijlstra struct sched_rt_entity rt; 7808a311c74SPeter Zijlstra struct sched_dl_entity dl; 781804bccbaSKees Cook const struct sched_class *sched_class; 7828a311c74SPeter Zijlstra 7838a311c74SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 7848a311c74SPeter Zijlstra struct rb_node core_node; 7858a311c74SPeter Zijlstra unsigned long core_cookie; 786d2dfa17bSPeter Zijlstra unsigned int core_occupation; 7878a311c74SPeter Zijlstra #endif 7888a311c74SPeter Zijlstra 7898323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED 7908323f26cSPeter Zijlstra struct task_group *sched_task_group; 7918323f26cSPeter Zijlstra #endif 7921da177e4SLinus Torvalds 79369842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 79413685c4aSQais Yousef /* 79513685c4aSQais Yousef * Clamp values requested for a scheduling entity. 79613685c4aSQais Yousef * Must be updated with task_rq_lock() held. 79713685c4aSQais Yousef */ 798e8f14172SPatrick Bellasi struct uclamp_se uclamp_req[UCLAMP_CNT]; 79913685c4aSQais Yousef /* 80013685c4aSQais Yousef * Effective clamp values used for a scheduling entity. 80113685c4aSQais Yousef * Must be updated with task_rq_lock() held. 
80213685c4aSQais Yousef */ 80369842cbaSPatrick Bellasi struct uclamp_se uclamp[UCLAMP_CNT]; 80469842cbaSPatrick Bellasi #endif 80569842cbaSPatrick Bellasi 806ceeadb83SYafang Shao struct sched_statistics stats; 807ceeadb83SYafang Shao 808e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS 8095eca1c10SIngo Molnar /* List of struct preempt_notifier: */ 810e107be36SAvi Kivity struct hlist_head preempt_notifiers; 811e107be36SAvi Kivity #endif 812e107be36SAvi Kivity 8136c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE 8142056a782SJens Axboe unsigned int btrace_seq; 8156c5c9341SAlexey Dobriyan #endif 8161da177e4SLinus Torvalds 81797dc32cdSWilliam Cohen unsigned int policy; 81829baa747SPeter Zijlstra int nr_cpus_allowed; 8193bd37062SSebastian Andrzej Siewior const cpumask_t *cpus_ptr; 820b90ca8baSWill Deacon cpumask_t *user_cpus_ptr; 8213bd37062SSebastian Andrzej Siewior cpumask_t cpus_mask; 8226d337eabSPeter Zijlstra void *migration_pending; 82374d862b6SThomas Gleixner #ifdef CONFIG_SMP 824a7c81556SPeter Zijlstra unsigned short migration_disabled; 825af449901SPeter Zijlstra #endif 826a7c81556SPeter Zijlstra unsigned short migration_flags; 8271da177e4SLinus Torvalds 828a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU 829e260be67SPaul E. McKenney int rcu_read_lock_nesting; 8301d082fd0SPaul E. McKenney union rcu_special rcu_read_unlock_special; 831f41d911fSPaul E. McKenney struct list_head rcu_node_entry; 832a57eb940SPaul E. McKenney struct rcu_node *rcu_blocked_node; 83328f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */ 8345eca1c10SIngo Molnar 8358315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU 8368315f422SPaul E. McKenney unsigned long rcu_tasks_nvcsw; 837ccdd29ffSPaul E. McKenney u8 rcu_tasks_holdout; 838ccdd29ffSPaul E. McKenney u8 rcu_tasks_idx; 839176f8f7aSPaul E. McKenney int rcu_tasks_idle_cpu; 840ccdd29ffSPaul E. McKenney struct list_head rcu_tasks_holdout_list; 8418315f422SPaul E. 
McKenney #endif /* #ifdef CONFIG_TASKS_RCU */ 842e260be67SPaul E. McKenney 843d5f177d3SPaul E. McKenney #ifdef CONFIG_TASKS_TRACE_RCU 844d5f177d3SPaul E. McKenney int trc_reader_nesting; 845d5f177d3SPaul E. McKenney int trc_ipi_to_cpu; 846276c4104SPaul E. McKenney union rcu_special trc_reader_special; 847d5f177d3SPaul E. McKenney struct list_head trc_holdout_list; 848434c9eefSPaul E. McKenney struct list_head trc_blkd_node; 849434c9eefSPaul E. McKenney int trc_blkd_cpu; 850d5f177d3SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_TRACE_RCU */ 851d5f177d3SPaul E. McKenney 8521da177e4SLinus Torvalds struct sched_info sched_info; 8531da177e4SLinus Torvalds 8541da177e4SLinus Torvalds struct list_head tasks; 855806c09a7SDario Faggioli #ifdef CONFIG_SMP 856917b627dSGregory Haskins struct plist_node pushable_tasks; 8571baca4ceSJuri Lelli struct rb_node pushable_dl_tasks; 858806c09a7SDario Faggioli #endif 8591da177e4SLinus Torvalds 8605eca1c10SIngo Molnar struct mm_struct *mm; 8615eca1c10SIngo Molnar struct mm_struct *active_mm; 862314ff785SIngo Molnar 863314ff785SIngo Molnar /* Per-thread vma caching: */ 864314ff785SIngo Molnar struct vmacache vmacache; 865314ff785SIngo Molnar 8665eca1c10SIngo Molnar #ifdef SPLIT_RSS_COUNTING 86734e55232SKAMEZAWA Hiroyuki struct task_rss_stat rss_stat; 86834e55232SKAMEZAWA Hiroyuki #endif 86997dc32cdSWilliam Cohen int exit_state; 8705eca1c10SIngo Molnar int exit_code; 8715eca1c10SIngo Molnar int exit_signal; 8725eca1c10SIngo Molnar /* The signal sent when the parent dies: */ 8735eca1c10SIngo Molnar int pdeath_signal; 8745eca1c10SIngo Molnar /* JOBCTL_*, siglock protected: */ 8755eca1c10SIngo Molnar unsigned long jobctl; 8769b89f6baSAndrei Epure 8775eca1c10SIngo Molnar /* Used for emulating ABI behavior of previous Linux versions: */ 87897dc32cdSWilliam Cohen unsigned int personality; 8799b89f6baSAndrei Epure 8805eca1c10SIngo Molnar /* Scheduler bits, serialized by scheduler locks: */ 881ca94c442SLennart Poettering unsigned 
sched_reset_on_fork:1; 882a8e4f2eaSPeter Zijlstra unsigned sched_contributes_to_load:1; 883ff303e66SPeter Zijlstra unsigned sched_migrated:1; 884eb414681SJohannes Weiner #ifdef CONFIG_PSI 885eb414681SJohannes Weiner unsigned sched_psi_wake_requeue:1; 886eb414681SJohannes Weiner #endif 887eb414681SJohannes Weiner 8885eca1c10SIngo Molnar /* Force alignment to the next boundary: */ 8895eca1c10SIngo Molnar unsigned :0; 890be958bdcSPeter Zijlstra 8915eca1c10SIngo Molnar /* Unserialized, strictly 'current' */ 8925eca1c10SIngo Molnar 893f97bb527SPeter Zijlstra /* 894f97bb527SPeter Zijlstra * This field must not be in the scheduler word above due to wakelist 895f97bb527SPeter Zijlstra * queueing no longer being serialized by p->on_cpu. However: 896f97bb527SPeter Zijlstra * 897f97bb527SPeter Zijlstra * p->XXX = X; ttwu() 898f97bb527SPeter Zijlstra * schedule() if (p->on_rq && ..) // false 899f97bb527SPeter Zijlstra * smp_mb__after_spinlock(); if (smp_load_acquire(&p->on_cpu) && //true 900f97bb527SPeter Zijlstra * deactivate_task() ttwu_queue_wakelist()) 901f97bb527SPeter Zijlstra * p->on_rq = 0; p->sched_remote_wakeup = Y; 902f97bb527SPeter Zijlstra * 903f97bb527SPeter Zijlstra * guarantees all stores of 'current' are visible before 904f97bb527SPeter Zijlstra * ->sched_remote_wakeup gets used, so it can be in this word. 
905f97bb527SPeter Zijlstra */ 906f97bb527SPeter Zijlstra unsigned sched_remote_wakeup:1; 907f97bb527SPeter Zijlstra 9085eca1c10SIngo Molnar /* Bit to tell LSMs we're in execve(): */ 9095eca1c10SIngo Molnar unsigned in_execve:1; 910be958bdcSPeter Zijlstra unsigned in_iowait:1; 9115eca1c10SIngo Molnar #ifndef TIF_RESTORE_SIGMASK 9127e781418SAndy Lutomirski unsigned restore_sigmask:1; 9137e781418SAndy Lutomirski #endif 914626ebc41STejun Heo #ifdef CONFIG_MEMCG 91529ef680aSMichal Hocko unsigned in_user_fault:1; 916127424c8SJohannes Weiner #endif 917ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK 918ff303e66SPeter Zijlstra unsigned brk_randomized:1; 919ff303e66SPeter Zijlstra #endif 92077f88796STejun Heo #ifdef CONFIG_CGROUPS 92177f88796STejun Heo /* disallow userland-initiated cgroup migration */ 92277f88796STejun Heo unsigned no_cgroup_migration:1; 92376f969e8SRoman Gushchin /* task is frozen/stopped (used by the cgroup freezer) */ 92476f969e8SRoman Gushchin unsigned frozen:1; 92577f88796STejun Heo #endif 926d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP 927d09d8df3SJosef Bacik unsigned use_memdelay:1; 928d09d8df3SJosef Bacik #endif 9291066d1b6SYafang Shao #ifdef CONFIG_PSI 9301066d1b6SYafang Shao /* Stalled due to lack of memory */ 9311066d1b6SYafang Shao unsigned in_memstall:1; 9321066d1b6SYafang Shao #endif 9338e9b16c4SSergei Trofimovich #ifdef CONFIG_PAGE_OWNER 9348e9b16c4SSergei Trofimovich /* Used by page_owner=on to detect recursion in page tracking. 
*/ 9358e9b16c4SSergei Trofimovich unsigned in_page_owner:1; 9368e9b16c4SSergei Trofimovich #endif 937b542e383SThomas Gleixner #ifdef CONFIG_EVENTFD 938b542e383SThomas Gleixner /* Recursion prevention for eventfd_signal() */ 939b542e383SThomas Gleixner unsigned in_eventfd_signal:1; 940b542e383SThomas Gleixner #endif 941a3d29e82SPeter Zijlstra #ifdef CONFIG_IOMMU_SVA 942a3d29e82SPeter Zijlstra unsigned pasid_activated:1; 943a3d29e82SPeter Zijlstra #endif 944b041b525STony Luck #ifdef CONFIG_CPU_SUP_INTEL 945b041b525STony Luck unsigned reported_split_lock:1; 946b041b525STony Luck #endif 947*aa1cf99bSYang Yang #ifdef CONFIG_TASK_DELAY_ACCT 948*aa1cf99bSYang Yang /* delay due to memory thrashing */ 949*aa1cf99bSYang Yang unsigned in_thrashing:1; 950*aa1cf99bSYang Yang #endif 9516f185c29SVladimir Davydov 9525eca1c10SIngo Molnar unsigned long atomic_flags; /* Flags requiring atomic access. */ 9531d4457f9SKees Cook 954f56141e3SAndy Lutomirski struct restart_block restart_block; 955f56141e3SAndy Lutomirski 9561da177e4SLinus Torvalds pid_t pid; 9571da177e4SLinus Torvalds pid_t tgid; 9580a425405SArjan van de Ven 959050e9baaSLinus Torvalds #ifdef CONFIG_STACKPROTECTOR 9605eca1c10SIngo Molnar /* Canary value for the -fstack-protector GCC feature: */ 9610a425405SArjan van de Ven unsigned long stack_canary; 9621314562aSHiroshi Shimamoto #endif 9631da177e4SLinus Torvalds /* 9645eca1c10SIngo Molnar * Pointers to the (original) parent process, youngest child, younger sibling, 9651da177e4SLinus Torvalds * older sibling, respectively. 
(p->father can be replaced with 966f470021aSRoland McGrath * p->real_parent->pid) 9671da177e4SLinus Torvalds */ 9685eca1c10SIngo Molnar 9695eca1c10SIngo Molnar /* Real parent process: */ 9705eca1c10SIngo Molnar struct task_struct __rcu *real_parent; 9715eca1c10SIngo Molnar 9725eca1c10SIngo Molnar /* Recipient of SIGCHLD, wait4() reports: */ 9735eca1c10SIngo Molnar struct task_struct __rcu *parent; 9741da177e4SLinus Torvalds 975f470021aSRoland McGrath /* 9765eca1c10SIngo Molnar * Children/sibling form the list of natural children: 9775eca1c10SIngo Molnar */ 9785eca1c10SIngo Molnar struct list_head children; 9795eca1c10SIngo Molnar struct list_head sibling; 9805eca1c10SIngo Molnar struct task_struct *group_leader; 9815eca1c10SIngo Molnar 9825eca1c10SIngo Molnar /* 9835eca1c10SIngo Molnar * 'ptraced' is the list of tasks this task is using ptrace() on. 9845eca1c10SIngo Molnar * 985f470021aSRoland McGrath * This includes both natural children and PTRACE_ATTACH targets. 9865eca1c10SIngo Molnar * 'ptrace_entry' is this task's link on the p->parent->ptraced list. 987f470021aSRoland McGrath */ 988f470021aSRoland McGrath struct list_head ptraced; 989f470021aSRoland McGrath struct list_head ptrace_entry; 990f470021aSRoland McGrath 9911da177e4SLinus Torvalds /* PID/PID hash table linkage. */ 9922c470475SEric W. Biederman struct pid *thread_pid; 9932c470475SEric W. Biederman struct hlist_node pid_links[PIDTYPE_MAX]; 99447e65328SOleg Nesterov struct list_head thread_group; 9950c740d0aSOleg Nesterov struct list_head thread_node; 9961da177e4SLinus Torvalds 9975eca1c10SIngo Molnar struct completion *vfork_done; 9981da177e4SLinus Torvalds 9995eca1c10SIngo Molnar /* CLONE_CHILD_SETTID: */ 10005eca1c10SIngo Molnar int __user *set_child_tid; 10015eca1c10SIngo Molnar 10025eca1c10SIngo Molnar /* CLONE_CHILD_CLEARTID: */ 10035eca1c10SIngo Molnar int __user *clear_child_tid; 10045eca1c10SIngo Molnar 1005e32cf5dfSEric W. Biederman /* PF_KTHREAD | PF_IO_WORKER */ 1006e32cf5dfSEric W. 
Biederman void *worker_private; 10073bfe6106SJens Axboe 10085eca1c10SIngo Molnar u64 utime; 10095eca1c10SIngo Molnar u64 stime; 101040565b5aSStanislaw Gruszka #ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME 10115eca1c10SIngo Molnar u64 utimescaled; 10125eca1c10SIngo Molnar u64 stimescaled; 101340565b5aSStanislaw Gruszka #endif 101416a6d9beSFrederic Weisbecker u64 gtime; 10159d7fb042SPeter Zijlstra struct prev_cputime prev_cputime; 10166a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN 1017bac5b6b6SFrederic Weisbecker struct vtime vtime; 10186a61671bSFrederic Weisbecker #endif 1019d027d45dSFrederic Weisbecker 1020d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL 1021f009a7a7SFrederic Weisbecker atomic_t tick_dep_mask; 1022d027d45dSFrederic Weisbecker #endif 10235eca1c10SIngo Molnar /* Context switch counts: */ 10245eca1c10SIngo Molnar unsigned long nvcsw; 10255eca1c10SIngo Molnar unsigned long nivcsw; 10265eca1c10SIngo Molnar 10275eca1c10SIngo Molnar /* Monotonic time in nsecs: */ 10285eca1c10SIngo Molnar u64 start_time; 10295eca1c10SIngo Molnar 10305eca1c10SIngo Molnar /* Boot based time in nsecs: */ 1031cf25e24dSPeter Zijlstra u64 start_boottime; 10325eca1c10SIngo Molnar 10335eca1c10SIngo Molnar /* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */ 10345eca1c10SIngo Molnar unsigned long min_flt; 10355eca1c10SIngo Molnar unsigned long maj_flt; 10361da177e4SLinus Torvalds 10372b69942fSThomas Gleixner /* Empty if CONFIG_POSIX_CPUTIMERS=n */ 10382b69942fSThomas Gleixner struct posix_cputimers posix_cputimers; 10391da177e4SLinus Torvalds 10401fb497ddSThomas Gleixner #ifdef CONFIG_POSIX_CPU_TIMERS_TASK_WORK 10411fb497ddSThomas Gleixner struct posix_cputimers_work posix_cputimers_work; 10421fb497ddSThomas Gleixner #endif 10431fb497ddSThomas Gleixner 10445eca1c10SIngo Molnar /* Process credentials: */ 10455eca1c10SIngo Molnar 10465eca1c10SIngo Molnar /* Tracer's credentials at attach: */ 10475eca1c10SIngo Molnar const 
struct cred __rcu *ptracer_cred; 10485eca1c10SIngo Molnar 10495eca1c10SIngo Molnar /* Objective and real subjective task credentials (COW): */ 10505eca1c10SIngo Molnar const struct cred __rcu *real_cred; 10515eca1c10SIngo Molnar 10525eca1c10SIngo Molnar /* Effective (overridable) subjective task credentials (COW): */ 10535eca1c10SIngo Molnar const struct cred __rcu *cred; 10545eca1c10SIngo Molnar 10557743c48eSDavid Howells #ifdef CONFIG_KEYS 10567743c48eSDavid Howells /* Cached requested key. */ 10577743c48eSDavid Howells struct key *cached_requested_key; 10587743c48eSDavid Howells #endif 10597743c48eSDavid Howells 10605eca1c10SIngo Molnar /* 10615eca1c10SIngo Molnar * executable name, excluding path. 10625eca1c10SIngo Molnar * 10635eca1c10SIngo Molnar * - normally initialized setup_new_exec() 10645eca1c10SIngo Molnar * - access it with [gs]et_task_comm() 10655eca1c10SIngo Molnar * - lock it with task_lock() 10665eca1c10SIngo Molnar */ 10675eca1c10SIngo Molnar char comm[TASK_COMM_LEN]; 10685eca1c10SIngo Molnar 1069756daf26SNeilBrown struct nameidata *nameidata; 10705eca1c10SIngo Molnar 10713d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC 10721da177e4SLinus Torvalds struct sysv_sem sysvsem; 1073ab602f79SJack Miller struct sysv_shm sysvshm; 10743d5b6fccSAlexey Dobriyan #endif 1075e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK 107682a1fcb9SIngo Molnar unsigned long last_switch_count; 1077a2e51445SDmitry Vyukov unsigned long last_switch_time; 107882a1fcb9SIngo Molnar #endif 10795eca1c10SIngo Molnar /* Filesystem information: */ 10801da177e4SLinus Torvalds struct fs_struct *fs; 10815eca1c10SIngo Molnar 10825eca1c10SIngo Molnar /* Open file information: */ 10831da177e4SLinus Torvalds struct files_struct *files; 10845eca1c10SIngo Molnar 10850f212204SJens Axboe #ifdef CONFIG_IO_URING 10860f212204SJens Axboe struct io_uring_task *io_uring; 10870f212204SJens Axboe #endif 10880f212204SJens Axboe 10895eca1c10SIngo Molnar /* Namespaces: */ 1090ab516013SSerge E. 
Hallyn struct nsproxy *nsproxy; 10915eca1c10SIngo Molnar 10925eca1c10SIngo Molnar /* Signal handlers: */ 10931da177e4SLinus Torvalds struct signal_struct *signal; 1094913292c9SMadhuparna Bhowmik struct sighand_struct __rcu *sighand; 10955eca1c10SIngo Molnar sigset_t blocked; 10965eca1c10SIngo Molnar sigset_t real_blocked; 10975eca1c10SIngo Molnar /* Restored if set_restore_sigmask() was used: */ 10985eca1c10SIngo Molnar sigset_t saved_sigmask; 10991da177e4SLinus Torvalds struct sigpending pending; 11001da177e4SLinus Torvalds unsigned long sas_ss_sp; 11011da177e4SLinus Torvalds size_t sas_ss_size; 11025eca1c10SIngo Molnar unsigned int sas_ss_flags; 11032e01fabeSOleg Nesterov 110467d12145SAl Viro struct callback_head *task_works; 1105e73f8959SOleg Nesterov 11064b7d248bSRichard Guy Briggs #ifdef CONFIG_AUDIT 1107bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL 11085f3d544fSRichard Guy Briggs struct audit_context *audit_context; 11095f3d544fSRichard Guy Briggs #endif 1110e1760bd5SEric W. Biederman kuid_t loginuid; 11114746ec5bSEric Paris unsigned int sessionid; 1112bfef93a5SAl Viro #endif 1113932ecebbSWill Drewry struct seccomp seccomp; 11141446e1dfSGabriel Krisman Bertazi struct syscall_user_dispatch syscall_dispatch; 11151da177e4SLinus Torvalds 11165eca1c10SIngo Molnar /* Thread group tracking: */ 1117d1e7fd64SEric W. Biederman u64 parent_exec_id; 1118d1e7fd64SEric W. 
Biederman u64 self_exec_id; 11195eca1c10SIngo Molnar 11205eca1c10SIngo Molnar /* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */ 11211da177e4SLinus Torvalds spinlock_t alloc_lock; 11221da177e4SLinus Torvalds 1123b29739f9SIngo Molnar /* Protection of the PI data structures: */ 11241d615482SThomas Gleixner raw_spinlock_t pi_lock; 1125b29739f9SIngo Molnar 112676751049SPeter Zijlstra struct wake_q_node wake_q; 112776751049SPeter Zijlstra 112823f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES 11295eca1c10SIngo Molnar /* PI waiters blocked on a rt_mutex held by this task: */ 1130a23ba907SDavidlohr Bueso struct rb_root_cached pi_waiters; 1131e96a7705SXunlei Pang /* Updated under owner's pi_lock and rq lock */ 1132e96a7705SXunlei Pang struct task_struct *pi_top_task; 11335eca1c10SIngo Molnar /* Deadlock detection and priority inheritance handling: */ 113423f78d4aSIngo Molnar struct rt_mutex_waiter *pi_blocked_on; 113523f78d4aSIngo Molnar #endif 113623f78d4aSIngo Molnar 1137408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES 11385eca1c10SIngo Molnar /* Mutex deadlock detection: */ 1139408894eeSIngo Molnar struct mutex_waiter *blocked_on; 1140408894eeSIngo Molnar #endif 11415eca1c10SIngo Molnar 1142312364f3SDaniel Vetter #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 1143312364f3SDaniel Vetter int non_block_count; 1144312364f3SDaniel Vetter #endif 1145312364f3SDaniel Vetter 1146de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS 11470584df9cSMarco Elver struct irqtrace_events irqtrace; 1148de8f5e4fSPeter Zijlstra unsigned int hardirq_threaded; 1149c86e9b98SPeter Zijlstra u64 hardirq_chain_key; 1150fa1452e8SHiroshi Shimamoto int softirqs_enabled; 1151de30a2b3SIngo Molnar int softirq_context; 115240db1739SSebastian Andrzej Siewior int irq_config; 1153de30a2b3SIngo Molnar #endif 1154728b478dSThomas Gleixner #ifdef CONFIG_PREEMPT_RT 1155728b478dSThomas Gleixner int softirq_disable_cnt; 1156728b478dSThomas Gleixner #endif 11575eca1c10SIngo Molnar 
1158fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP 1159bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH 48UL 1160fbb9ce95SIngo Molnar u64 curr_chain_key; 1161fbb9ce95SIngo Molnar int lockdep_depth; 1162fbb9ce95SIngo Molnar unsigned int lockdep_recursion; 1163c7aceabaSRichard Kennedy struct held_lock held_locks[MAX_LOCK_DEPTH]; 1164fbb9ce95SIngo Molnar #endif 11655eca1c10SIngo Molnar 11665cf53f3cSElena Petrova #if defined(CONFIG_UBSAN) && !defined(CONFIG_UBSAN_TRAP) 1167c6d30853SAndrey Ryabinin unsigned int in_ubsan; 1168c6d30853SAndrey Ryabinin #endif 1169408894eeSIngo Molnar 11705eca1c10SIngo Molnar /* Journalling filesystem info: */ 11711da177e4SLinus Torvalds void *journal_info; 11721da177e4SLinus Torvalds 11735eca1c10SIngo Molnar /* Stacked block device info: */ 1174bddd87c7SAkinobu Mita struct bio_list *bio_list; 1175d89d8796SNeil Brown 11765eca1c10SIngo Molnar /* Stack plugging: */ 117773c10101SJens Axboe struct blk_plug *plug; 117873c10101SJens Axboe 11795eca1c10SIngo Molnar /* VM state: */ 11801da177e4SLinus Torvalds struct reclaim_state *reclaim_state; 11811da177e4SLinus Torvalds 11821da177e4SLinus Torvalds struct backing_dev_info *backing_dev_info; 11831da177e4SLinus Torvalds 11841da177e4SLinus Torvalds struct io_context *io_context; 11851da177e4SLinus Torvalds 11865e1f0f09SMel Gorman #ifdef CONFIG_COMPACTION 11875e1f0f09SMel Gorman struct capture_control *capture_control; 11885e1f0f09SMel Gorman #endif 11895eca1c10SIngo Molnar /* Ptrace state: */ 11901da177e4SLinus Torvalds unsigned long ptrace_message; 1191ae7795bcSEric W. 
Biederman kernel_siginfo_t *last_siginfo; 11925eca1c10SIngo Molnar 11937c3ab738SAndrew Morton struct task_io_accounting ioac; 1194eb414681SJohannes Weiner #ifdef CONFIG_PSI 1195eb414681SJohannes Weiner /* Pressure stall state */ 1196eb414681SJohannes Weiner unsigned int psi_flags; 1197eb414681SJohannes Weiner #endif 11985eca1c10SIngo Molnar #ifdef CONFIG_TASK_XACCT 11995eca1c10SIngo Molnar /* Accumulated RSS usage: */ 12005eca1c10SIngo Molnar u64 acct_rss_mem1; 12015eca1c10SIngo Molnar /* Accumulated virtual memory usage: */ 12025eca1c10SIngo Molnar u64 acct_vm_mem1; 12035eca1c10SIngo Molnar /* stime + utime since last update: */ 12045eca1c10SIngo Molnar u64 acct_timexpd; 12051da177e4SLinus Torvalds #endif 12061da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS 12075eca1c10SIngo Molnar /* Protected by ->alloc_lock: */ 12085eca1c10SIngo Molnar nodemask_t mems_allowed; 12093b03706fSIngo Molnar /* Sequence number to catch updates: */ 1210b7505861SAhmed S. Darwish seqcount_spinlock_t mems_allowed_seq; 1211825a46afSPaul Jackson int cpuset_mem_spread_rotor; 12126adef3ebSJack Steiner int cpuset_slab_spread_rotor; 12131da177e4SLinus Torvalds #endif 1214ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS 12155eca1c10SIngo Molnar /* Control Group info protected by css_set_lock: */ 12162c392b8cSArnd Bergmann struct css_set __rcu *cgroups; 12175eca1c10SIngo Molnar /* cg_list protected by css_set_lock and tsk->alloc_lock: */ 1218817929ecSPaul Menage struct list_head cg_list; 1219ddbcc7e8SPaul Menage #endif 1220e6d42931SJohannes Weiner #ifdef CONFIG_X86_CPU_RESCTRL 12210734ded1SVikas Shivappa u32 closid; 1222d6aaba61SVikas Shivappa u32 rmid; 1223e02737d5SFenghua Yu #endif 122442b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX 12250771dfefSIngo Molnar struct robust_list_head __user *robust_list; 122634f192c6SIngo Molnar #ifdef CONFIG_COMPAT 122734f192c6SIngo Molnar struct compat_robust_list_head __user *compat_robust_list; 122834f192c6SIngo Molnar #endif 1229c87e2837SIngo Molnar struct list_head 
pi_state_list; 1230c87e2837SIngo Molnar struct futex_pi_state *pi_state_cache; 12313f186d97SThomas Gleixner struct mutex futex_exit_mutex; 12323d4775dfSThomas Gleixner unsigned int futex_state; 123342b2dd0aSAlexey Dobriyan #endif 1234cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS 12358dc85d54SPeter Zijlstra struct perf_event_context *perf_event_ctxp[perf_nr_task_contexts]; 1236cdd6c482SIngo Molnar struct mutex perf_event_mutex; 1237cdd6c482SIngo Molnar struct list_head perf_event_list; 1238a63eaf34SPaul Mackerras #endif 12398f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT 12408f47b187SThomas Gleixner unsigned long preempt_disable_ip; 12418f47b187SThomas Gleixner #endif 1242c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA 12435eca1c10SIngo Molnar /* Protected by alloc_lock: */ 12445eca1c10SIngo Molnar struct mempolicy *mempolicy; 124545816682SVlastimil Babka short il_prev; 1246207205a2SEric Dumazet short pref_node_fork; 1247c7aceabaSRichard Kennedy #endif 1248cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING 1249cbee9f88SPeter Zijlstra int numa_scan_seq; 1250cbee9f88SPeter Zijlstra unsigned int numa_scan_period; 1251598f0ec0SMel Gorman unsigned int numa_scan_period_max; 1252de1c9ce6SRik van Riel int numa_preferred_nid; 12536b9a7460SMel Gorman unsigned long numa_migrate_retry; 12545eca1c10SIngo Molnar /* Migration stamp: */ 12555eca1c10SIngo Molnar u64 node_stamp; 12567e2703e6SRik van Riel u64 last_task_numa_placement; 12577e2703e6SRik van Riel u64 last_sum_exec_runtime; 1258cbee9f88SPeter Zijlstra struct callback_head numa_work; 1259f809ca9aSMel Gorman 1260cb361d8cSJann Horn /* 1261cb361d8cSJann Horn * This pointer is only modified for current in syscall and 1262cb361d8cSJann Horn * pagefault context (and for tasks being destroyed), so it can be read 1263cb361d8cSJann Horn * from any of the following contexts: 1264cb361d8cSJann Horn * - RCU read-side critical section 1265cb361d8cSJann Horn * - current->numa_group from everywhere 1266cb361d8cSJann Horn * - task's 
runqueue locked, task not running 1267cb361d8cSJann Horn */ 1268cb361d8cSJann Horn struct numa_group __rcu *numa_group; 12698c8a743cSPeter Zijlstra 1270745d6147SMel Gorman /* 127144dba3d5SIulia Manda * numa_faults is an array split into four regions: 127244dba3d5SIulia Manda * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer 127344dba3d5SIulia Manda * in this precise order. 127444dba3d5SIulia Manda * 127544dba3d5SIulia Manda * faults_memory: Exponential decaying average of faults on a per-node 127644dba3d5SIulia Manda * basis. Scheduling placement decisions are made based on these 127744dba3d5SIulia Manda * counts. The values remain static for the duration of a PTE scan. 127844dba3d5SIulia Manda * faults_cpu: Track the nodes the process was running on when a NUMA 127944dba3d5SIulia Manda * hinting fault was incurred. 128044dba3d5SIulia Manda * faults_memory_buffer and faults_cpu_buffer: Record faults per node 128144dba3d5SIulia Manda * during the current scan window. When the scan completes, the counts 128244dba3d5SIulia Manda * in faults_memory and faults_cpu decay and these values are copied. 1283745d6147SMel Gorman */ 128444dba3d5SIulia Manda unsigned long *numa_faults; 128583e1d2cdSMel Gorman unsigned long total_numa_faults; 1286745d6147SMel Gorman 1287745d6147SMel Gorman /* 128804bb2f94SRik van Riel * numa_faults_locality tracks if faults recorded during the last 1289074c2381SMel Gorman * scan window were remote/local or failed to migrate. 
The task scan 1290074c2381SMel Gorman * period is adapted based on the locality of the faults with different 1291074c2381SMel Gorman * weights depending on whether they were shared or private faults 129204bb2f94SRik van Riel */ 1293074c2381SMel Gorman unsigned long numa_faults_locality[3]; 129404bb2f94SRik van Riel 1295b32e86b4SIngo Molnar unsigned long numa_pages_migrated; 1296cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */ 1297cbee9f88SPeter Zijlstra 1298d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ 1299d7822b1eSMathieu Desnoyers struct rseq __user *rseq; 1300d7822b1eSMathieu Desnoyers u32 rseq_sig; 1301d7822b1eSMathieu Desnoyers /* 1302d7822b1eSMathieu Desnoyers * RmW on rseq_event_mask must be performed atomically 1303d7822b1eSMathieu Desnoyers * with respect to preemption. 1304d7822b1eSMathieu Desnoyers */ 1305d7822b1eSMathieu Desnoyers unsigned long rseq_event_mask; 1306d7822b1eSMathieu Desnoyers #endif 1307d7822b1eSMathieu Desnoyers 130872b252aeSMel Gorman struct tlbflush_unmap_batch tlb_ubc; 130972b252aeSMel Gorman 13103fbd7ee2SEric W. Biederman union { 13113fbd7ee2SEric W. Biederman refcount_t rcu_users; 1312e56d0903SIngo Molnar struct rcu_head rcu; 13133fbd7ee2SEric W. 
Biederman }; 1314b92ce558SJens Axboe 13155eca1c10SIngo Molnar /* Cache last used pipe for splice(): */ 1316b92ce558SJens Axboe struct pipe_inode_info *splice_pipe; 13175640f768SEric Dumazet 13185640f768SEric Dumazet struct page_frag task_frag; 13195640f768SEric Dumazet 1320ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT 1321ca74e92bSShailabh Nagar struct task_delay_info *delays; 1322ca74e92bSShailabh Nagar #endif 132347913d4eSIngo Molnar 1324f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION 1325f4f154fdSAkinobu Mita int make_it_fail; 13269049f2f6SAkinobu Mita unsigned int fail_nth; 1327f4f154fdSAkinobu Mita #endif 13289d823e8fSWu Fengguang /* 13295eca1c10SIngo Molnar * When (nr_dirtied >= nr_dirtied_pause), it's time to call 13305eca1c10SIngo Molnar * balance_dirty_pages() for a dirty throttling pause: 13319d823e8fSWu Fengguang */ 13329d823e8fSWu Fengguang int nr_dirtied; 13339d823e8fSWu Fengguang int nr_dirtied_pause; 13345eca1c10SIngo Molnar /* Start of a write-and-pause period: */ 13355eca1c10SIngo Molnar unsigned long dirty_paused_when; 13369d823e8fSWu Fengguang 13379745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP 13389745512cSArjan van de Ven int latency_record_count; 13399745512cSArjan van de Ven struct latency_record latency_record[LT_SAVECOUNT]; 13409745512cSArjan van de Ven #endif 13416976675dSArjan van de Ven /* 13425eca1c10SIngo Molnar * Time slack values; these are used to round up poll() and 13436976675dSArjan van de Ven * select() etc timeout values. These are in nanoseconds. 
13446976675dSArjan van de Ven */ 1345da8b44d5SJohn Stultz u64 timer_slack_ns; 1346da8b44d5SJohn Stultz u64 default_timer_slack_ns; 1347f8d570a4SDavid Miller 1348d73b4936SAndrey Konovalov #if defined(CONFIG_KASAN_GENERIC) || defined(CONFIG_KASAN_SW_TAGS) 13490b24beccSAndrey Ryabinin unsigned int kasan_depth; 13500b24beccSAndrey Ryabinin #endif 135192c209acSMarco Elver 1352dfd402a4SMarco Elver #ifdef CONFIG_KCSAN 1353dfd402a4SMarco Elver struct kcsan_ctx kcsan_ctx; 135492c209acSMarco Elver #ifdef CONFIG_TRACE_IRQFLAGS 135592c209acSMarco Elver struct irqtrace_events kcsan_save_irqtrace; 135692c209acSMarco Elver #endif 135769562e49SMarco Elver #ifdef CONFIG_KCSAN_WEAK_MEMORY 135869562e49SMarco Elver int kcsan_stack_depth; 135969562e49SMarco Elver #endif 1360dfd402a4SMarco Elver #endif 13615eca1c10SIngo Molnar 1362393824f6SPatricia Alfonso #if IS_ENABLED(CONFIG_KUNIT) 1363393824f6SPatricia Alfonso struct kunit *kunit_test; 1364393824f6SPatricia Alfonso #endif 1365393824f6SPatricia Alfonso 1366fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER 13675eca1c10SIngo Molnar /* Index of current stored address in ret_stack: */ 1368f201ae23SFrederic Weisbecker int curr_ret_stack; 136939eb456dSSteven Rostedt (VMware) int curr_ret_depth; 13705eca1c10SIngo Molnar 13715eca1c10SIngo Molnar /* Stack of return addresses for return function tracing: */ 1372f201ae23SFrederic Weisbecker struct ftrace_ret_stack *ret_stack; 13735eca1c10SIngo Molnar 13745eca1c10SIngo Molnar /* Timestamp for last schedule: */ 13758aef2d28SSteven Rostedt unsigned long long ftrace_timestamp; 13765eca1c10SIngo Molnar 1377f201ae23SFrederic Weisbecker /* 1378f201ae23SFrederic Weisbecker * Number of functions that haven't been traced 13795eca1c10SIngo Molnar * because of depth overrun: 1380f201ae23SFrederic Weisbecker */ 1381f201ae23SFrederic Weisbecker atomic_t trace_overrun; 13825eca1c10SIngo Molnar 13835eca1c10SIngo Molnar /* Pause tracing: */ 1384380c4b14SFrederic Weisbecker atomic_t 
tracing_graph_pause; 1385f201ae23SFrederic Weisbecker #endif 13865eca1c10SIngo Molnar 1387ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING 13885eca1c10SIngo Molnar /* State flags for use by tracers: */ 1389ea4e2bc4SSteven Rostedt unsigned long trace; 13905eca1c10SIngo Molnar 13915eca1c10SIngo Molnar /* Bitmask and counter of trace recursion: */ 1392261842b7SSteven Rostedt unsigned long trace_recursion; 1393261842b7SSteven Rostedt #endif /* CONFIG_TRACING */ 13945eca1c10SIngo Molnar 13955c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV 1396eec028c9SAndrey Konovalov /* See kernel/kcov.c for more details. */ 1397eec028c9SAndrey Konovalov 13985eca1c10SIngo Molnar /* Coverage collection mode enabled for this task (0 if disabled): */ 13990ed557aaSMark Rutland unsigned int kcov_mode; 14005eca1c10SIngo Molnar 14015eca1c10SIngo Molnar /* Size of the kcov_area: */ 14025eca1c10SIngo Molnar unsigned int kcov_size; 14035eca1c10SIngo Molnar 14045eca1c10SIngo Molnar /* Buffer for coverage collection: */ 14055c9a8750SDmitry Vyukov void *kcov_area; 14065eca1c10SIngo Molnar 14075eca1c10SIngo Molnar /* KCOV descriptor wired with this task or NULL: */ 14085c9a8750SDmitry Vyukov struct kcov *kcov; 1409eec028c9SAndrey Konovalov 1410eec028c9SAndrey Konovalov /* KCOV common handle for remote coverage collection: */ 1411eec028c9SAndrey Konovalov u64 kcov_handle; 1412eec028c9SAndrey Konovalov 1413eec028c9SAndrey Konovalov /* KCOV sequence number: */ 1414eec028c9SAndrey Konovalov int kcov_sequence; 14155ff3b30aSAndrey Konovalov 14165ff3b30aSAndrey Konovalov /* Collect coverage from softirq context: */ 14175ff3b30aSAndrey Konovalov unsigned int kcov_softirq; 14185c9a8750SDmitry Vyukov #endif 14195eca1c10SIngo Molnar 14206f185c29SVladimir Davydov #ifdef CONFIG_MEMCG 1421626ebc41STejun Heo struct mem_cgroup *memcg_in_oom; 1422626ebc41STejun Heo gfp_t memcg_oom_gfp_mask; 1423626ebc41STejun Heo int memcg_oom_order; 1424b23afb93STejun Heo 14255eca1c10SIngo Molnar /* Number of pages to reclaim on returning to 
userland: */ 1426b23afb93STejun Heo unsigned int memcg_nr_pages_over_high; 1427d46eb14bSShakeel Butt 1428d46eb14bSShakeel Butt /* Used by memcontrol for targeted memcg charge: */ 1429d46eb14bSShakeel Butt struct mem_cgroup *active_memcg; 1430569b846dSKAMEZAWA Hiroyuki #endif 14315eca1c10SIngo Molnar 1432d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP 1433d09d8df3SJosef Bacik struct request_queue *throttle_queue; 1434d09d8df3SJosef Bacik #endif 1435d09d8df3SJosef Bacik 14360326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES 14370326f5a9SSrikar Dronamraju struct uprobe_task *utask; 14380326f5a9SSrikar Dronamraju #endif 1439cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE) 1440cafe5635SKent Overstreet unsigned int sequential_io; 1441cafe5635SKent Overstreet unsigned int sequential_io_avg; 1442cafe5635SKent Overstreet #endif 14435fbda3ecSThomas Gleixner struct kmap_ctrl kmap_ctrl; 14448eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 14458eb23b9fSPeter Zijlstra unsigned long task_state_change; 14465f220be2SThomas Gleixner # ifdef CONFIG_PREEMPT_RT 14475f220be2SThomas Gleixner unsigned long saved_state_change; 14485f220be2SThomas Gleixner # endif 14498eb23b9fSPeter Zijlstra #endif 14508bcbde54SDavid Hildenbrand int pagefault_disabled; 145103049269SMichal Hocko #ifdef CONFIG_MMU 145229c696e1SVladimir Davydov struct task_struct *oom_reaper_list; 1453e4a38402SNico Pache struct timer_list oom_reaper_timer; 145403049269SMichal Hocko #endif 1455ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK 1456ba14a194SAndy Lutomirski struct vm_struct *stack_vm_area; 1457ba14a194SAndy Lutomirski #endif 145868f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 14595eca1c10SIngo Molnar /* A live task holds one reference: */ 1460f0b89d39SElena Reshetova refcount_t stack_refcount; 146168f24b08SAndy Lutomirski #endif 1462d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH 1463d83a7cb3SJosh Poimboeuf int patch_state; 1464d83a7cb3SJosh Poimboeuf #endif 
1465e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY 1466e4e55b47STetsuo Handa /* Used by LSM modules for access restriction: */ 1467e4e55b47STetsuo Handa void *security; 1468e4e55b47STetsuo Handa #endif 1469a10787e6SSong Liu #ifdef CONFIG_BPF_SYSCALL 1470a10787e6SSong Liu /* Used by BPF task local storage */ 1471a10787e6SSong Liu struct bpf_local_storage __rcu *bpf_storage; 1472c7603cfaSAndrii Nakryiko /* Used for BPF run context */ 1473c7603cfaSAndrii Nakryiko struct bpf_run_ctx *bpf_ctx; 1474a10787e6SSong Liu #endif 147529e48ce8SKees Cook 1476afaef01cSAlexander Popov #ifdef CONFIG_GCC_PLUGIN_STACKLEAK 1477afaef01cSAlexander Popov unsigned long lowest_stack; 1478c8d12627SAlexander Popov unsigned long prev_lowest_stack; 1479afaef01cSAlexander Popov #endif 1480afaef01cSAlexander Popov 14815567d11cSPeter Zijlstra #ifdef CONFIG_X86_MCE 1482c0ab7ffcSTony Luck void __user *mce_vaddr; 1483c0ab7ffcSTony Luck __u64 mce_kflags; 14845567d11cSPeter Zijlstra u64 mce_addr; 148517fae129STony Luck __u64 mce_ripv : 1, 148617fae129STony Luck mce_whole_page : 1, 148717fae129STony Luck __mce_reserved : 62; 14885567d11cSPeter Zijlstra struct callback_head mce_kill_me; 148981065b35STony Luck int mce_count; 14905567d11cSPeter Zijlstra #endif 14915567d11cSPeter Zijlstra 1492d741bf41SPeter Zijlstra #ifdef CONFIG_KRETPROBES 1493d741bf41SPeter Zijlstra struct llist_head kretprobe_instances; 1494d741bf41SPeter Zijlstra #endif 149554ecbe6fSMasami Hiramatsu #ifdef CONFIG_RETHOOK 149654ecbe6fSMasami Hiramatsu struct llist_head rethooks; 149754ecbe6fSMasami Hiramatsu #endif 1498d741bf41SPeter Zijlstra 149958e106e7SBalbir Singh #ifdef CONFIG_ARCH_HAS_PARANOID_L1D_FLUSH 150058e106e7SBalbir Singh /* 150158e106e7SBalbir Singh * If L1D flush is supported on mm context switch 150258e106e7SBalbir Singh * then we use this callback head to queue kill work 150358e106e7SBalbir Singh * to kill tasks that are not running on SMT disabled 150458e106e7SBalbir Singh * cores 150558e106e7SBalbir Singh */ 
150658e106e7SBalbir Singh struct callback_head l1d_flush_kill; 150758e106e7SBalbir Singh #endif 150858e106e7SBalbir Singh 1509102227b9SDaniel Bristot de Oliveira #ifdef CONFIG_RV 1510102227b9SDaniel Bristot de Oliveira /* 1511102227b9SDaniel Bristot de Oliveira * Per-task RV monitor. Nowadays fixed in RV_PER_TASK_MONITORS. 1512102227b9SDaniel Bristot de Oliveira * If we find justification for more monitors, we can think 1513102227b9SDaniel Bristot de Oliveira * about adding more or developing a dynamic method. So far, 1514102227b9SDaniel Bristot de Oliveira * none of these are justified. 1515102227b9SDaniel Bristot de Oliveira */ 1516102227b9SDaniel Bristot de Oliveira union rv_task_monitor rv[RV_PER_TASK_MONITORS]; 1517102227b9SDaniel Bristot de Oliveira #endif 1518102227b9SDaniel Bristot de Oliveira 151929e48ce8SKees Cook /* 152029e48ce8SKees Cook * New fields for task_struct should be added above here, so that 152129e48ce8SKees Cook * they are included in the randomized portion of task_struct. 152229e48ce8SKees Cook */ 152329e48ce8SKees Cook randomized_struct_fields_end 152429e48ce8SKees Cook 15255eca1c10SIngo Molnar /* CPU-specific state of this task: */ 15260c8c0f03SDave Hansen struct thread_struct thread; 15275eca1c10SIngo Molnar 15280c8c0f03SDave Hansen /* 15290c8c0f03SDave Hansen * WARNING: on x86, 'thread_struct' contains a variable-sized 15300c8c0f03SDave Hansen * structure. It *MUST* be at the end of 'task_struct'. 15310c8c0f03SDave Hansen * 15320c8c0f03SDave Hansen * Do not put anything below here! 15330c8c0f03SDave Hansen */ 15341da177e4SLinus Torvalds }; 15351da177e4SLinus Torvalds 1536e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task) 153722c935f4SEric W. Biederman { 15382c470475SEric W. Biederman return task->thread_pid; 153922c935f4SEric W. Biederman } 154022c935f4SEric W. 
Biederman 15417af57294SPavel Emelyanov /* 15427af57294SPavel Emelyanov * the helpers to get the task's different pids as they are seen 15437af57294SPavel Emelyanov * from various namespaces 15447af57294SPavel Emelyanov * 15457af57294SPavel Emelyanov * task_xid_nr() : global id, i.e. the id seen from the init namespace; 154644c4e1b2SEric W. Biederman * task_xid_vnr() : virtual id, i.e. the id seen from the pid namespace of 154744c4e1b2SEric W. Biederman * current. 15487af57294SPavel Emelyanov * task_xid_nr_ns() : id seen from the ns specified; 15497af57294SPavel Emelyanov * 15507af57294SPavel Emelyanov * see also pid_nr() etc in include/linux/pid.h 15517af57294SPavel Emelyanov */ 15525eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns); 15537af57294SPavel Emelyanov 1554e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk) 15557af57294SPavel Emelyanov { 15567af57294SPavel Emelyanov return tsk->pid; 15577af57294SPavel Emelyanov } 15587af57294SPavel Emelyanov 15595eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 156052ee2dfdSOleg Nesterov { 156152ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns); 156252ee2dfdSOleg Nesterov } 15637af57294SPavel Emelyanov 15647af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk) 15657af57294SPavel Emelyanov { 156652ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL); 15677af57294SPavel Emelyanov } 15687af57294SPavel Emelyanov 15697af57294SPavel Emelyanov 1570e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk) 15717af57294SPavel Emelyanov { 15727af57294SPavel Emelyanov return tsk->tgid; 15737af57294SPavel Emelyanov } 15747af57294SPavel Emelyanov 15755eca1c10SIngo Molnar /** 15765eca1c10SIngo Molnar * pid_alive - check that a task structure is not stale 15775eca1c10SIngo Molnar * @p: Task structure to 
be checked. 15785eca1c10SIngo Molnar * 15795eca1c10SIngo Molnar * Test if a process is not yet dead (at most zombie state) 15805eca1c10SIngo Molnar * If pid_alive fails, then pointers within the task structure 15815eca1c10SIngo Molnar * can be stale and must not be dereferenced. 15825eca1c10SIngo Molnar * 15835eca1c10SIngo Molnar * Return: 1 if the process is alive. 0 otherwise. 15845eca1c10SIngo Molnar */ 15855eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p) 15865eca1c10SIngo Molnar { 15872c470475SEric W. Biederman return p->thread_pid != NULL; 15885eca1c10SIngo Molnar } 15897af57294SPavel Emelyanov 15905eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 15917af57294SPavel Emelyanov { 159252ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns); 15937af57294SPavel Emelyanov } 15947af57294SPavel Emelyanov 15957af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk) 15967af57294SPavel Emelyanov { 159752ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL); 15987af57294SPavel Emelyanov } 15997af57294SPavel Emelyanov 16007af57294SPavel Emelyanov 16015eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 16027af57294SPavel Emelyanov { 160352ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns); 16047af57294SPavel Emelyanov } 16057af57294SPavel Emelyanov 16067af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk) 16077af57294SPavel Emelyanov { 160852ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL); 16097af57294SPavel Emelyanov } 16107af57294SPavel Emelyanov 1611dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 1612dd1c1f2fSOleg Nesterov { 16136883f81aSEric W. 
Biederman return __task_pid_nr_ns(tsk, PIDTYPE_TGID, ns); 1614dd1c1f2fSOleg Nesterov } 1615dd1c1f2fSOleg Nesterov 1616dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk) 1617dd1c1f2fSOleg Nesterov { 16186883f81aSEric W. Biederman return __task_pid_nr_ns(tsk, PIDTYPE_TGID, NULL); 1619dd1c1f2fSOleg Nesterov } 1620dd1c1f2fSOleg Nesterov 1621dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns) 1622dd1c1f2fSOleg Nesterov { 1623dd1c1f2fSOleg Nesterov pid_t pid = 0; 1624dd1c1f2fSOleg Nesterov 1625dd1c1f2fSOleg Nesterov rcu_read_lock(); 1626dd1c1f2fSOleg Nesterov if (pid_alive(tsk)) 1627dd1c1f2fSOleg Nesterov pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns); 1628dd1c1f2fSOleg Nesterov rcu_read_unlock(); 1629dd1c1f2fSOleg Nesterov 1630dd1c1f2fSOleg Nesterov return pid; 1631dd1c1f2fSOleg Nesterov } 1632dd1c1f2fSOleg Nesterov 1633dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk) 1634dd1c1f2fSOleg Nesterov { 1635dd1c1f2fSOleg Nesterov return task_ppid_nr_ns(tsk, &init_pid_ns); 1636dd1c1f2fSOleg Nesterov } 1637dd1c1f2fSOleg Nesterov 16385eca1c10SIngo Molnar /* Obsolete, do not use: */ 16391b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk) 16401b0f7ffdSOleg Nesterov { 16411b0f7ffdSOleg Nesterov return task_pgrp_nr_ns(tsk, &init_pid_ns); 16421b0f7ffdSOleg Nesterov } 16437af57294SPavel Emelyanov 164406eb6184SPeter Zijlstra #define TASK_REPORT_IDLE (TASK_REPORT + 1) 164506eb6184SPeter Zijlstra #define TASK_REPORT_MAX (TASK_REPORT_IDLE << 1) 164606eb6184SPeter Zijlstra 1647fa2c3254SValentin Schneider static inline unsigned int __task_state_index(unsigned int tsk_state, 1648fa2c3254SValentin Schneider unsigned int tsk_exit_state) 164920435d84SXie XiuQi { 1650fa2c3254SValentin Schneider unsigned int state = (tsk_state | tsk_exit_state) & TASK_REPORT; 165120435d84SXie XiuQi 165206eb6184SPeter Zijlstra 
BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX); 165306eb6184SPeter Zijlstra 165406eb6184SPeter Zijlstra if (tsk_state == TASK_IDLE) 165506eb6184SPeter Zijlstra state = TASK_REPORT_IDLE; 165606eb6184SPeter Zijlstra 165725795ef6SValentin Schneider /* 165825795ef6SValentin Schneider * We're lying here, but rather than expose a completely new task state 165925795ef6SValentin Schneider * to userspace, we can make this appear as if the task has gone through 166025795ef6SValentin Schneider * a regular rt_mutex_lock() call. 166125795ef6SValentin Schneider */ 166225795ef6SValentin Schneider if (tsk_state == TASK_RTLOCK_WAIT) 166325795ef6SValentin Schneider state = TASK_UNINTERRUPTIBLE; 166425795ef6SValentin Schneider 16651593baabSPeter Zijlstra return fls(state); 16661593baabSPeter Zijlstra } 166720435d84SXie XiuQi 1668fa2c3254SValentin Schneider static inline unsigned int task_state_index(struct task_struct *tsk) 1669fa2c3254SValentin Schneider { 1670fa2c3254SValentin Schneider return __task_state_index(READ_ONCE(tsk->__state), tsk->exit_state); 1671fa2c3254SValentin Schneider } 1672fa2c3254SValentin Schneider 16731d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state) 16741593baabSPeter Zijlstra { 16758ef9925bSPeter Zijlstra static const char state_char[] = "RSDTtXZPI"; 16761593baabSPeter Zijlstra 167706eb6184SPeter Zijlstra BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1); 16781593baabSPeter Zijlstra 16791593baabSPeter Zijlstra return state_char[state]; 16801593baabSPeter Zijlstra } 16811593baabSPeter Zijlstra 16821593baabSPeter Zijlstra static inline char task_state_to_char(struct task_struct *tsk) 16831593baabSPeter Zijlstra { 16841d48b080SPeter Zijlstra return task_index_to_char(task_state_index(tsk)); 168520435d84SXie XiuQi } 168620435d84SXie XiuQi 16871da177e4SLinus Torvalds /** 1688570f5241SSergey Senozhatsky * is_global_init - check if a task structure is init. 
Since init 1689570f5241SSergey Senozhatsky * is free to have sub-threads we need to check tgid. 16903260259fSHenne * @tsk: Task structure to be checked. 16913260259fSHenne * 16923260259fSHenne * Check if a task structure is the first user space task the kernel created. 1693e69f6186SYacine Belkadi * 1694e69f6186SYacine Belkadi * Return: 1 if the task structure is init. 0 otherwise. 1695f400e198SSukadev Bhattiprolu */ 1696e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk) 1697b461cc03SPavel Emelyanov { 1698570f5241SSergey Senozhatsky return task_tgid_nr(tsk) == 1; 1699b461cc03SPavel Emelyanov } 1700b460cbc5SSerge E. Hallyn 17019ec52099SCedric Le Goater extern struct pid *cad_pid; 17029ec52099SCedric Le Goater 17031da177e4SLinus Torvalds /* 17041da177e4SLinus Torvalds * Per process flags 17051da177e4SLinus Torvalds */ 170601ccf592SSebastian Andrzej Siewior #define PF_VCPU 0x00000001 /* I'm a virtual CPU */ 1707c1de45caSPeter Zijlstra #define PF_IDLE 0x00000002 /* I am an IDLE thread */ 17085eca1c10SIngo Molnar #define PF_EXITING 0x00000004 /* Getting shut down */ 170992307383SEric W. 
Biederman #define PF_POSTCOREDUMP 0x00000008 /* Coredumps should ignore this task */ 171001ccf592SSebastian Andrzej Siewior #define PF_IO_WORKER 0x00000010 /* Task is an IO worker */ 171121aa9af0STejun Heo #define PF_WQ_WORKER 0x00000020 /* I'm a workqueue worker */ 17125eca1c10SIngo Molnar #define PF_FORKNOEXEC 0x00000040 /* Forked but didn't exec */ 17135eca1c10SIngo Molnar #define PF_MCE_PROCESS 0x00000080 /* Process policy on mce errors */ 17145eca1c10SIngo Molnar #define PF_SUPERPRIV 0x00000100 /* Used super-user privileges */ 17155eca1c10SIngo Molnar #define PF_DUMPCORE 0x00000200 /* Dumped core */ 17165eca1c10SIngo Molnar #define PF_SIGNALED 0x00000400 /* Killed by a signal */ 17171da177e4SLinus Torvalds #define PF_MEMALLOC 0x00000800 /* Allocating memory */ 17185eca1c10SIngo Molnar #define PF_NPROC_EXCEEDED 0x00001000 /* set_user() noticed that RLIMIT_NPROC was exceeded */ 17195eca1c10SIngo Molnar #define PF_USED_MATH 0x00002000 /* If unset the fpu must be initialized before use */ 17205eca1c10SIngo Molnar #define PF_NOFREEZE 0x00008000 /* This thread should not be frozen */ 17215eca1c10SIngo Molnar #define PF_FROZEN 0x00010000 /* Frozen for system suspend */ 17227dea19f9SMichal Hocko #define PF_KSWAPD 0x00020000 /* I am kswapd */ 17237dea19f9SMichal Hocko #define PF_MEMALLOC_NOFS 0x00040000 /* All allocation requests will inherit GFP_NOFS */ 17247dea19f9SMichal Hocko #define PF_MEMALLOC_NOIO 0x00080000 /* All allocation requests will inherit GFP_NOIO */ 1725a37b0715SNeilBrown #define PF_LOCAL_THROTTLE 0x00100000 /* Throttle writes only against the bdi I write to, 1726a37b0715SNeilBrown * I am cleaning dirty pages from some other bdi. 
*/ 1727246bb0b1SOleg Nesterov #define PF_KTHREAD 0x00200000 /* I am a kernel thread */ 17285eca1c10SIngo Molnar #define PF_RANDOMIZE 0x00400000 /* Randomize virtual address space */ 17293bd37062SSebastian Andrzej Siewior #define PF_NO_SETAFFINITY 0x04000000 /* Userland is not allowed to meddle with cpus_mask */ 17304db96cf0SAndi Kleen #define PF_MCE_EARLY 0x08000000 /* Early kill for mce process policy */ 17311a08ae36SPavel Tatashin #define PF_MEMALLOC_PIN 0x10000000 /* Allocation context constrained to zones which allow long term pinning. */ 173258a69cb4STejun Heo #define PF_FREEZER_SKIP 0x40000000 /* Freezer should not count it as freezable */ 17335eca1c10SIngo Molnar #define PF_SUSPEND_TASK 0x80000000 /* This thread called freeze_processes() and should not be frozen */ 17341da177e4SLinus Torvalds 17351da177e4SLinus Torvalds /* 17361da177e4SLinus Torvalds * Only the _current_ task can read/write to tsk->flags, but other 17371da177e4SLinus Torvalds * tasks can access tsk->flags in readonly mode for example 17381da177e4SLinus Torvalds * with tsk_used_math (like during threaded core dumping). 17391da177e4SLinus Torvalds * There is however an exception to this rule during ptrace 17401da177e4SLinus Torvalds * or during fork: the ptracer task is allowed to write to the 17411da177e4SLinus Torvalds * child->flags of its traced child (same goes for fork, the parent 17421da177e4SLinus Torvalds * can write to the child->flags), because we're guaranteed the 17431da177e4SLinus Torvalds * child is not running and in turn not changing child->flags 17441da177e4SLinus Torvalds * at the same time the parent does it. 
17451da177e4SLinus Torvalds */ 17461da177e4SLinus Torvalds #define clear_stopped_child_used_math(child) do { (child)->flags &= ~PF_USED_MATH; } while (0) 17471da177e4SLinus Torvalds #define set_stopped_child_used_math(child) do { (child)->flags |= PF_USED_MATH; } while (0) 17481da177e4SLinus Torvalds #define clear_used_math() clear_stopped_child_used_math(current) 17491da177e4SLinus Torvalds #define set_used_math() set_stopped_child_used_math(current) 17505eca1c10SIngo Molnar 17511da177e4SLinus Torvalds #define conditional_stopped_child_used_math(condition, child) \ 17521da177e4SLinus Torvalds do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= (condition) ? PF_USED_MATH : 0; } while (0) 17535eca1c10SIngo Molnar 17545eca1c10SIngo Molnar #define conditional_used_math(condition) conditional_stopped_child_used_math(condition, current) 17555eca1c10SIngo Molnar 17561da177e4SLinus Torvalds #define copy_to_stopped_child_used_math(child) \ 17571da177e4SLinus Torvalds do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= current->flags & PF_USED_MATH; } while (0) 17585eca1c10SIngo Molnar 17591da177e4SLinus Torvalds /* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */ 17601da177e4SLinus Torvalds #define tsk_used_math(p) ((p)->flags & PF_USED_MATH) 17611da177e4SLinus Torvalds #define used_math() tsk_used_math(current) 17621da177e4SLinus Torvalds 176383d40a61SPeter Zijlstra static __always_inline bool is_percpu_thread(void) 176462ec05ddSThomas Gleixner { 176562ec05ddSThomas Gleixner #ifdef CONFIG_SMP 176662ec05ddSThomas Gleixner return (current->flags & PF_NO_SETAFFINITY) && 176762ec05ddSThomas Gleixner (current->nr_cpus_allowed == 1); 176862ec05ddSThomas Gleixner #else 176962ec05ddSThomas Gleixner return true; 177062ec05ddSThomas Gleixner #endif 177162ec05ddSThomas Gleixner } 177262ec05ddSThomas Gleixner 17731d4457f9SKees Cook /* Per-process atomic flags. */ 1774a2b86f77SZefan Li #define PFA_NO_NEW_PRIVS 0 /* May not gain new privileges. 
*/ 17752ad654bcSZefan Li #define PFA_SPREAD_PAGE 1 /* Spread page cache over cpuset */ 17762ad654bcSZefan Li #define PFA_SPREAD_SLAB 2 /* Spread some slab caches over cpuset */ 1777356e4bffSThomas Gleixner #define PFA_SPEC_SSB_DISABLE 3 /* Speculative Store Bypass disabled */ 1778356e4bffSThomas Gleixner #define PFA_SPEC_SSB_FORCE_DISABLE 4 /* Speculative Store Bypass force disabled*/ 17799137bb27SThomas Gleixner #define PFA_SPEC_IB_DISABLE 5 /* Indirect branch speculation restricted */ 17809137bb27SThomas Gleixner #define PFA_SPEC_IB_FORCE_DISABLE 6 /* Indirect branch speculation permanently restricted */ 178171368af9SWaiman Long #define PFA_SPEC_SSB_NOEXEC 7 /* Speculative Store Bypass clear on execve() */ 17821d4457f9SKees Cook 1783e0e5070bSZefan Li #define TASK_PFA_TEST(name, func) \ 1784e0e5070bSZefan Li static inline bool task_##func(struct task_struct *p) \ 1785e0e5070bSZefan Li { return test_bit(PFA_##name, &p->atomic_flags); } 17865eca1c10SIngo Molnar 1787e0e5070bSZefan Li #define TASK_PFA_SET(name, func) \ 1788e0e5070bSZefan Li static inline void task_set_##func(struct task_struct *p) \ 1789e0e5070bSZefan Li { set_bit(PFA_##name, &p->atomic_flags); } 17905eca1c10SIngo Molnar 1791e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func) \ 1792e0e5070bSZefan Li static inline void task_clear_##func(struct task_struct *p) \ 1793e0e5070bSZefan Li { clear_bit(PFA_##name, &p->atomic_flags); } 17941d4457f9SKees Cook 1795e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs) 1796e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs) 17971d4457f9SKees Cook 17982ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page) 17992ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page) 18002ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page) 18012ad654bcSZefan Li 18022ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab) 18032ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab) 18042ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab) 1805544b2c91STejun 
Heo 1806356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable) 1807356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable) 1808356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable) 1809356e4bffSThomas Gleixner 181071368af9SWaiman Long TASK_PFA_TEST(SPEC_SSB_NOEXEC, spec_ssb_noexec) 181171368af9SWaiman Long TASK_PFA_SET(SPEC_SSB_NOEXEC, spec_ssb_noexec) 181271368af9SWaiman Long TASK_PFA_CLEAR(SPEC_SSB_NOEXEC, spec_ssb_noexec) 181371368af9SWaiman Long 1814356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable) 1815356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable) 1816356e4bffSThomas Gleixner 18179137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_DISABLE, spec_ib_disable) 18189137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_DISABLE, spec_ib_disable) 18199137bb27SThomas Gleixner TASK_PFA_CLEAR(SPEC_IB_DISABLE, spec_ib_disable) 18209137bb27SThomas Gleixner 18219137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable) 18229137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable) 18239137bb27SThomas Gleixner 18245eca1c10SIngo Molnar static inline void 1825717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags) 1826907aed48SMel Gorman { 1827717a94b5SNeilBrown current->flags &= ~flags; 1828717a94b5SNeilBrown current->flags |= orig_flags & flags; 1829907aed48SMel Gorman } 1830907aed48SMel Gorman 18315eca1c10SIngo Molnar extern int cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial); 1832b6e8d40dSWaiman Long extern int task_can_attach(struct task_struct *p, const struct cpumask *cs_effective_cpus); 18331da177e4SLinus Torvalds #ifdef CONFIG_SMP 18345eca1c10SIngo Molnar extern void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask); 18355eca1c10SIngo Molnar extern int set_cpus_allowed_ptr(struct task_struct *p, const struct 
cpumask *new_mask); 1836b90ca8baSWill Deacon extern int dup_user_cpus_ptr(struct task_struct *dst, struct task_struct *src, int node); 1837b90ca8baSWill Deacon extern void release_user_cpus_ptr(struct task_struct *p); 1838234b8ab6SWill Deacon extern int dl_task_check_affinity(struct task_struct *p, const struct cpumask *mask); 183907ec77a1SWill Deacon extern void force_compatible_cpus_allowed_ptr(struct task_struct *p); 184007ec77a1SWill Deacon extern void relax_compatible_cpus_allowed_ptr(struct task_struct *p); 18411da177e4SLinus Torvalds #else 18425eca1c10SIngo Molnar static inline void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask) 18431e1b6c51SKOSAKI Motohiro { 18441e1b6c51SKOSAKI Motohiro } 18455eca1c10SIngo Molnar static inline int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask) 18461da177e4SLinus Torvalds { 184796f874e2SRusty Russell if (!cpumask_test_cpu(0, new_mask)) 18481da177e4SLinus Torvalds return -EINVAL; 18491da177e4SLinus Torvalds return 0; 18501da177e4SLinus Torvalds } 1851b90ca8baSWill Deacon static inline int dup_user_cpus_ptr(struct task_struct *dst, struct task_struct *src, int node) 1852b90ca8baSWill Deacon { 1853b90ca8baSWill Deacon if (src->user_cpus_ptr) 1854b90ca8baSWill Deacon return -EINVAL; 1855b90ca8baSWill Deacon return 0; 1856b90ca8baSWill Deacon } 1857b90ca8baSWill Deacon static inline void release_user_cpus_ptr(struct task_struct *p) 1858b90ca8baSWill Deacon { 1859b90ca8baSWill Deacon WARN_ON(p->user_cpus_ptr); 1860b90ca8baSWill Deacon } 1861234b8ab6SWill Deacon 1862234b8ab6SWill Deacon static inline int dl_task_check_affinity(struct task_struct *p, const struct cpumask *mask) 1863234b8ab6SWill Deacon { 1864234b8ab6SWill Deacon return 0; 1865234b8ab6SWill Deacon } 18661da177e4SLinus Torvalds #endif 1867e0ad9556SRusty Russell 1868fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt); 186936c8b586SIngo Molnar extern void set_user_nice(struct 
task_struct *p, long nice); 187036c8b586SIngo Molnar extern int task_prio(const struct task_struct *p); 18715eca1c10SIngo Molnar 1872d0ea0268SDongsheng Yang /** 1873d0ea0268SDongsheng Yang * task_nice - return the nice value of a given task. 1874d0ea0268SDongsheng Yang * @p: the task in question. 1875d0ea0268SDongsheng Yang * 1876d0ea0268SDongsheng Yang * Return: The nice value [ -20 ... 0 ... 19 ]. 1877d0ea0268SDongsheng Yang */ 1878d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p) 1879d0ea0268SDongsheng Yang { 1880d0ea0268SDongsheng Yang return PRIO_TO_NICE((p)->static_prio); 1881d0ea0268SDongsheng Yang } 18825eca1c10SIngo Molnar 188336c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice); 188436c8b586SIngo Molnar extern int task_curr(const struct task_struct *p); 18851da177e4SLinus Torvalds extern int idle_cpu(int cpu); 1886943d355dSRohit Jain extern int available_idle_cpu(int cpu); 18875eca1c10SIngo Molnar extern int sched_setscheduler(struct task_struct *, int, const struct sched_param *); 18885eca1c10SIngo Molnar extern int sched_setscheduler_nocheck(struct task_struct *, int, const struct sched_param *); 18898b700983SPeter Zijlstra extern void sched_set_fifo(struct task_struct *p); 18908b700983SPeter Zijlstra extern void sched_set_fifo_low(struct task_struct *p); 18918b700983SPeter Zijlstra extern void sched_set_normal(struct task_struct *p, int nice); 18925eca1c10SIngo Molnar extern int sched_setattr(struct task_struct *, const struct sched_attr *); 1893794a56ebSJuri Lelli extern int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *); 189436c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu); 18955eca1c10SIngo Molnar 1896c4f30608SPaul E. McKenney /** 1897c4f30608SPaul E. McKenney * is_idle_task - is the specified task an idle task? 1898fa757281SRandy Dunlap * @p: the task in question. 
1899e69f6186SYacine Belkadi * 1900e69f6186SYacine Belkadi * Return: 1 if @p is an idle task. 0 otherwise. 1901c4f30608SPaul E. McKenney */ 1902c94a88f3SMarco Elver static __always_inline bool is_idle_task(const struct task_struct *p) 1903c4f30608SPaul E. McKenney { 1904c1de45caSPeter Zijlstra return !!(p->flags & PF_IDLE); 1905c4f30608SPaul E. McKenney } 19065eca1c10SIngo Molnar 190736c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu); 1908a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p); 19091da177e4SLinus Torvalds 19101da177e4SLinus Torvalds void yield(void); 19111da177e4SLinus Torvalds 19121da177e4SLinus Torvalds union thread_union { 19130500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK 19140500871fSDavid Howells struct task_struct task; 19150500871fSDavid Howells #endif 1916c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK 19171da177e4SLinus Torvalds struct thread_info thread_info; 1918c65eacbeSAndy Lutomirski #endif 19191da177e4SLinus Torvalds unsigned long stack[THREAD_SIZE/sizeof(long)]; 19201da177e4SLinus Torvalds }; 19211da177e4SLinus Torvalds 19220500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK 19230500871fSDavid Howells extern struct thread_info init_thread_info; 19240500871fSDavid Howells #endif 19250500871fSDavid Howells 19260500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)]; 19270500871fSDavid Howells 1928f3ac6067SIngo Molnar #ifdef CONFIG_THREAD_INFO_IN_TASK 1929bcf9033eSArd Biesheuvel # define task_thread_info(task) (&(task)->thread_info) 1930f3ac6067SIngo Molnar #elif !defined(__HAVE_THREAD_FUNCTIONS) 1931f3ac6067SIngo Molnar # define task_thread_info(task) ((struct thread_info *)(task)->stack) 1932f3ac6067SIngo Molnar #endif 1933f3ac6067SIngo Molnar 1934198fe21bSPavel Emelyanov /* 1935198fe21bSPavel Emelyanov * find a task by one of its numerical ids 1936198fe21bSPavel Emelyanov * 1937198fe21bSPavel Emelyanov * 
find_task_by_pid_ns(): 1938198fe21bSPavel Emelyanov * finds a task by its pid in the specified namespace 1939228ebcbeSPavel Emelyanov * find_task_by_vpid(): 1940228ebcbeSPavel Emelyanov * finds a task by its virtual pid 1941198fe21bSPavel Emelyanov * 1942e49859e7SPavel Emelyanov * see also find_vpid() etc in include/linux/pid.h 1943198fe21bSPavel Emelyanov */ 1944198fe21bSPavel Emelyanov 1945228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr); 19465eca1c10SIngo Molnar extern struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns); 1947198fe21bSPavel Emelyanov 19482ee08260SMike Rapoport /* 19492ee08260SMike Rapoport * find a task by its virtual pid and get the task struct 19502ee08260SMike Rapoport */ 19512ee08260SMike Rapoport extern struct task_struct *find_get_task_by_vpid(pid_t nr); 19522ee08260SMike Rapoport 1953b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state); 1954b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk); 19553e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk); 19565eca1c10SIngo Molnar 19571da177e4SLinus Torvalds #ifdef CONFIG_SMP 19581da177e4SLinus Torvalds extern void kick_process(struct task_struct *tsk); 19591da177e4SLinus Torvalds #else 19601da177e4SLinus Torvalds static inline void kick_process(struct task_struct *tsk) { } 19611da177e4SLinus Torvalds #endif 19621da177e4SLinus Torvalds 196382b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec); 19645eca1c10SIngo Molnar 196582b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from) 196682b89778SAdrian Hunter { 196782b89778SAdrian Hunter __set_task_comm(tsk, from, false); 196882b89778SAdrian Hunter } 19695eca1c10SIngo Molnar 19703756f640SArnd Bergmann extern char *__get_task_comm(char *to, size_t len, struct task_struct *tsk); 19713756f640SArnd Bergmann #define 
get_task_comm(buf, tsk) ({ \ 19723756f640SArnd Bergmann BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN); \ 19733756f640SArnd Bergmann __get_task_comm(buf, sizeof(buf), tsk); \ 19743756f640SArnd Bergmann }) 19751da177e4SLinus Torvalds 19761da177e4SLinus Torvalds #ifdef CONFIG_SMP 19772a0a24ebSThomas Gleixner static __always_inline void scheduler_ipi(void) 19782a0a24ebSThomas Gleixner { 19792a0a24ebSThomas Gleixner /* 19802a0a24ebSThomas Gleixner * Fold TIF_NEED_RESCHED into the preempt_count; anybody setting 19812a0a24ebSThomas Gleixner * TIF_NEED_RESCHED remotely (for the first time) will also send 19822a0a24ebSThomas Gleixner * this IPI. 19832a0a24ebSThomas Gleixner */ 19842a0a24ebSThomas Gleixner preempt_fold_need_resched(); 19852a0a24ebSThomas Gleixner } 19862f064a59SPeter Zijlstra extern unsigned long wait_task_inactive(struct task_struct *, unsigned int match_state); 19871da177e4SLinus Torvalds #else 1988184748ccSPeter Zijlstra static inline void scheduler_ipi(void) { } 19892f064a59SPeter Zijlstra static inline unsigned long wait_task_inactive(struct task_struct *p, unsigned int match_state) 199085ba2d86SRoland McGrath { 199185ba2d86SRoland McGrath return 1; 199285ba2d86SRoland McGrath } 19931da177e4SLinus Torvalds #endif 19941da177e4SLinus Torvalds 19955eca1c10SIngo Molnar /* 19965eca1c10SIngo Molnar * Set thread flags in other task's structures. 
19975eca1c10SIngo Molnar * See asm/thread_info.h for TIF_xxxx flags available: 19981da177e4SLinus Torvalds */ 19991da177e4SLinus Torvalds static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag) 20001da177e4SLinus Torvalds { 2001a1261f54SAl Viro set_ti_thread_flag(task_thread_info(tsk), flag); 20021da177e4SLinus Torvalds } 20031da177e4SLinus Torvalds 20041da177e4SLinus Torvalds static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag) 20051da177e4SLinus Torvalds { 2006a1261f54SAl Viro clear_ti_thread_flag(task_thread_info(tsk), flag); 20071da177e4SLinus Torvalds } 20081da177e4SLinus Torvalds 200993ee37c2SDave Martin static inline void update_tsk_thread_flag(struct task_struct *tsk, int flag, 201093ee37c2SDave Martin bool value) 201193ee37c2SDave Martin { 201293ee37c2SDave Martin update_ti_thread_flag(task_thread_info(tsk), flag, value); 201393ee37c2SDave Martin } 201493ee37c2SDave Martin 20151da177e4SLinus Torvalds static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag) 20161da177e4SLinus Torvalds { 2017a1261f54SAl Viro return test_and_set_ti_thread_flag(task_thread_info(tsk), flag); 20181da177e4SLinus Torvalds } 20191da177e4SLinus Torvalds 20201da177e4SLinus Torvalds static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag) 20211da177e4SLinus Torvalds { 2022a1261f54SAl Viro return test_and_clear_ti_thread_flag(task_thread_info(tsk), flag); 20231da177e4SLinus Torvalds } 20241da177e4SLinus Torvalds 20251da177e4SLinus Torvalds static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag) 20261da177e4SLinus Torvalds { 2027a1261f54SAl Viro return test_ti_thread_flag(task_thread_info(tsk), flag); 20281da177e4SLinus Torvalds } 20291da177e4SLinus Torvalds 20301da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk) 20311da177e4SLinus Torvalds { 20321da177e4SLinus Torvalds set_tsk_thread_flag(tsk,TIF_NEED_RESCHED); 20331da177e4SLinus Torvalds } 
20341da177e4SLinus Torvalds 20351da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk) 20361da177e4SLinus Torvalds { 20371da177e4SLinus Torvalds clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED); 20381da177e4SLinus Torvalds } 20391da177e4SLinus Torvalds 20408ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk) 20418ae121acSGregory Haskins { 20428ae121acSGregory Haskins return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED)); 20438ae121acSGregory Haskins } 20448ae121acSGregory Haskins 20451da177e4SLinus Torvalds /* 20461da177e4SLinus Torvalds * cond_resched() and cond_resched_lock(): latency reduction via 20471da177e4SLinus Torvalds * explicit rescheduling in places that are safe. The return 20481da177e4SLinus Torvalds * value indicates whether a reschedule was done in fact. 20491da177e4SLinus Torvalds * cond_resched_lock() will drop the spinlock before scheduling, 20501da177e4SLinus Torvalds */ 2051b965f1ddSPeter Zijlstra (Intel) #if !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC) 2052b965f1ddSPeter Zijlstra (Intel) extern int __cond_resched(void); 2053b965f1ddSPeter Zijlstra (Intel) 205499cf983cSMark Rutland #if defined(CONFIG_PREEMPT_DYNAMIC) && defined(CONFIG_HAVE_PREEMPT_DYNAMIC_CALL) 2055b965f1ddSPeter Zijlstra (Intel) 2056b965f1ddSPeter Zijlstra (Intel) DECLARE_STATIC_CALL(cond_resched, __cond_resched); 2057b965f1ddSPeter Zijlstra (Intel) 2058b965f1ddSPeter Zijlstra (Intel) static __always_inline int _cond_resched(void) 2059b965f1ddSPeter Zijlstra (Intel) { 2060ef72661eSPeter Zijlstra return static_call_mod(cond_resched)(); 2061b965f1ddSPeter Zijlstra (Intel) } 2062b965f1ddSPeter Zijlstra (Intel) 206399cf983cSMark Rutland #elif defined(CONFIG_PREEMPT_DYNAMIC) && defined(CONFIG_HAVE_PREEMPT_DYNAMIC_KEY) 206499cf983cSMark Rutland extern int dynamic_cond_resched(void); 206599cf983cSMark Rutland 206699cf983cSMark Rutland static __always_inline int _cond_resched(void) 
206799cf983cSMark Rutland { 206899cf983cSMark Rutland return dynamic_cond_resched(); 206999cf983cSMark Rutland } 207099cf983cSMark Rutland 207135a773a0SPeter Zijlstra #else 2072b965f1ddSPeter Zijlstra (Intel) 2073b965f1ddSPeter Zijlstra (Intel) static inline int _cond_resched(void) 2074b965f1ddSPeter Zijlstra (Intel) { 2075b965f1ddSPeter Zijlstra (Intel) return __cond_resched(); 2076b965f1ddSPeter Zijlstra (Intel) } 2077b965f1ddSPeter Zijlstra (Intel) 2078b965f1ddSPeter Zijlstra (Intel) #endif /* CONFIG_PREEMPT_DYNAMIC */ 2079b965f1ddSPeter Zijlstra (Intel) 2080b965f1ddSPeter Zijlstra (Intel) #else 2081b965f1ddSPeter Zijlstra (Intel) 208235a773a0SPeter Zijlstra static inline int _cond_resched(void) { return 0; } 2083b965f1ddSPeter Zijlstra (Intel) 2084b965f1ddSPeter Zijlstra (Intel) #endif /* !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC) */ 20856f80bd98SFrederic Weisbecker 2086613afbf8SFrederic Weisbecker #define cond_resched() ({ \ 2087874f670eSThomas Gleixner __might_resched(__FILE__, __LINE__, 0); \ 2088613afbf8SFrederic Weisbecker _cond_resched(); \ 2089613afbf8SFrederic Weisbecker }) 20906f80bd98SFrederic Weisbecker 2091613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock); 2092f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_read(rwlock_t *lock); 2093f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_write(rwlock_t *lock); 2094613afbf8SFrederic Weisbecker 209550e081b9SThomas Gleixner #define MIGHT_RESCHED_RCU_SHIFT 8 209650e081b9SThomas Gleixner #define MIGHT_RESCHED_PREEMPT_MASK ((1U << MIGHT_RESCHED_RCU_SHIFT) - 1) 209750e081b9SThomas Gleixner 20983e9cc688SThomas Gleixner #ifndef CONFIG_PREEMPT_RT 20993e9cc688SThomas Gleixner /* 21003e9cc688SThomas Gleixner * Non RT kernels have an elevated preempt count due to the held lock, 21013e9cc688SThomas Gleixner * but are not allowed to be inside a RCU read side critical section 21023e9cc688SThomas Gleixner */ 21033e9cc688SThomas Gleixner # define 
PREEMPT_LOCK_RESCHED_OFFSETS PREEMPT_LOCK_OFFSET 21043e9cc688SThomas Gleixner #else 21053e9cc688SThomas Gleixner /* 21063e9cc688SThomas Gleixner * spin/rw_lock() on RT implies rcu_read_lock(). The might_sleep() check in 21073e9cc688SThomas Gleixner * cond_resched*lock() has to take that into account because it checks for 21083e9cc688SThomas Gleixner * preempt_count() and rcu_preempt_depth(). 21093e9cc688SThomas Gleixner */ 21103e9cc688SThomas Gleixner # define PREEMPT_LOCK_RESCHED_OFFSETS \ 21113e9cc688SThomas Gleixner (PREEMPT_LOCK_OFFSET + (1U << MIGHT_RESCHED_RCU_SHIFT)) 21123e9cc688SThomas Gleixner #endif 21133e9cc688SThomas Gleixner 2114613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({ \ 21153e9cc688SThomas Gleixner __might_resched(__FILE__, __LINE__, PREEMPT_LOCK_RESCHED_OFFSETS); \ 2116613afbf8SFrederic Weisbecker __cond_resched_lock(lock); \ 2117613afbf8SFrederic Weisbecker }) 2118613afbf8SFrederic Weisbecker 2119f3d4b4b1SBen Gardon #define cond_resched_rwlock_read(lock) ({ \ 21203e9cc688SThomas Gleixner __might_resched(__FILE__, __LINE__, PREEMPT_LOCK_RESCHED_OFFSETS); \ 2121f3d4b4b1SBen Gardon __cond_resched_rwlock_read(lock); \ 2122f3d4b4b1SBen Gardon }) 2123f3d4b4b1SBen Gardon 2124f3d4b4b1SBen Gardon #define cond_resched_rwlock_write(lock) ({ \ 21253e9cc688SThomas Gleixner __might_resched(__FILE__, __LINE__, PREEMPT_LOCK_RESCHED_OFFSETS); \ 2126f3d4b4b1SBen Gardon __cond_resched_rwlock_write(lock); \ 2127f3d4b4b1SBen Gardon }) 2128f3d4b4b1SBen Gardon 2129f6f3c437SSimon Horman static inline void cond_resched_rcu(void) 2130f6f3c437SSimon Horman { 2131f6f3c437SSimon Horman #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU) 2132f6f3c437SSimon Horman rcu_read_unlock(); 2133f6f3c437SSimon Horman cond_resched(); 2134f6f3c437SSimon Horman rcu_read_lock(); 2135f6f3c437SSimon Horman #endif 2136f6f3c437SSimon Horman } 2137f6f3c437SSimon Horman 2138cfe43f47SValentin Schneider #ifdef CONFIG_PREEMPT_DYNAMIC 2139cfe43f47SValentin 
Schneider 2140cfe43f47SValentin Schneider extern bool preempt_model_none(void); 2141cfe43f47SValentin Schneider extern bool preempt_model_voluntary(void); 2142cfe43f47SValentin Schneider extern bool preempt_model_full(void); 2143cfe43f47SValentin Schneider 2144cfe43f47SValentin Schneider #else 2145cfe43f47SValentin Schneider 2146cfe43f47SValentin Schneider static inline bool preempt_model_none(void) 2147cfe43f47SValentin Schneider { 2148cfe43f47SValentin Schneider return IS_ENABLED(CONFIG_PREEMPT_NONE); 2149cfe43f47SValentin Schneider } 2150cfe43f47SValentin Schneider static inline bool preempt_model_voluntary(void) 2151cfe43f47SValentin Schneider { 2152cfe43f47SValentin Schneider return IS_ENABLED(CONFIG_PREEMPT_VOLUNTARY); 2153cfe43f47SValentin Schneider } 2154cfe43f47SValentin Schneider static inline bool preempt_model_full(void) 2155cfe43f47SValentin Schneider { 2156cfe43f47SValentin Schneider return IS_ENABLED(CONFIG_PREEMPT); 2157cfe43f47SValentin Schneider } 2158cfe43f47SValentin Schneider 2159cfe43f47SValentin Schneider #endif 2160cfe43f47SValentin Schneider 2161cfe43f47SValentin Schneider static inline bool preempt_model_rt(void) 2162cfe43f47SValentin Schneider { 2163cfe43f47SValentin Schneider return IS_ENABLED(CONFIG_PREEMPT_RT); 2164cfe43f47SValentin Schneider } 2165cfe43f47SValentin Schneider 2166cfe43f47SValentin Schneider /* 2167cfe43f47SValentin Schneider * Does the preemption model allow non-cooperative preemption? 2168cfe43f47SValentin Schneider * 2169cfe43f47SValentin Schneider * For !CONFIG_PREEMPT_DYNAMIC kernels this is an exact match with 2170cfe43f47SValentin Schneider * CONFIG_PREEMPTION; for CONFIG_PREEMPT_DYNAMIC this doesn't work as the 2171cfe43f47SValentin Schneider * kernel is *built* with CONFIG_PREEMPTION=y but may run with e.g. the 2172cfe43f47SValentin Schneider * PREEMPT_NONE model. 
2173cfe43f47SValentin Schneider */ 2174cfe43f47SValentin Schneider static inline bool preempt_model_preemptible(void) 2175cfe43f47SValentin Schneider { 2176cfe43f47SValentin Schneider return preempt_model_full() || preempt_model_rt(); 2177cfe43f47SValentin Schneider } 2178cfe43f47SValentin Schneider 21791da177e4SLinus Torvalds /* 21801da177e4SLinus Torvalds * Does a critical section need to be broken due to another 2181c1a280b6SThomas Gleixner * task waiting?: (technically does not depend on CONFIG_PREEMPTION, 218295c354feSNick Piggin * but a general need for low latency) 21831da177e4SLinus Torvalds */ 218495c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock) 21851da177e4SLinus Torvalds { 2186c1a280b6SThomas Gleixner #ifdef CONFIG_PREEMPTION 218795c354feSNick Piggin return spin_is_contended(lock); 218895c354feSNick Piggin #else 21891da177e4SLinus Torvalds return 0; 219095c354feSNick Piggin #endif 21911da177e4SLinus Torvalds } 21921da177e4SLinus Torvalds 2193a09a689aSBen Gardon /* 2194a09a689aSBen Gardon * Check if a rwlock is contended. 2195a09a689aSBen Gardon * Returns non-zero if there is another task waiting on the rwlock. 2196a09a689aSBen Gardon * Returns zero if the lock is not contended or the system / underlying 2197a09a689aSBen Gardon * rwlock implementation does not support contention detection. 2198a09a689aSBen Gardon * Technically does not depend on CONFIG_PREEMPTION, but a general need 2199a09a689aSBen Gardon * for low latency. 
2200a09a689aSBen Gardon */ 2201a09a689aSBen Gardon static inline int rwlock_needbreak(rwlock_t *lock) 2202a09a689aSBen Gardon { 2203a09a689aSBen Gardon #ifdef CONFIG_PREEMPTION 2204a09a689aSBen Gardon return rwlock_is_contended(lock); 2205a09a689aSBen Gardon #else 2206a09a689aSBen Gardon return 0; 2207a09a689aSBen Gardon #endif 2208a09a689aSBen Gardon } 2209a09a689aSBen Gardon 221075f93fedSPeter Zijlstra static __always_inline bool need_resched(void) 221175f93fedSPeter Zijlstra { 221275f93fedSPeter Zijlstra return unlikely(tif_need_resched()); 221375f93fedSPeter Zijlstra } 221475f93fedSPeter Zijlstra 2215ee761f62SThomas Gleixner /* 22161da177e4SLinus Torvalds * Wrappers for p->thread_info->cpu access. No-op on UP. 22171da177e4SLinus Torvalds */ 22181da177e4SLinus Torvalds #ifdef CONFIG_SMP 22191da177e4SLinus Torvalds 22201da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p) 22211da177e4SLinus Torvalds { 2222c546951dSAndrea Parri return READ_ONCE(task_thread_info(p)->cpu); 22231da177e4SLinus Torvalds } 22241da177e4SLinus Torvalds 2225c65cc870SIngo Molnar extern void set_task_cpu(struct task_struct *p, unsigned int cpu); 22261da177e4SLinus Torvalds 22271da177e4SLinus Torvalds #else 22281da177e4SLinus Torvalds 22291da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p) 22301da177e4SLinus Torvalds { 22311da177e4SLinus Torvalds return 0; 22321da177e4SLinus Torvalds } 22331da177e4SLinus Torvalds 22341da177e4SLinus Torvalds static inline void set_task_cpu(struct task_struct *p, unsigned int cpu) 22351da177e4SLinus Torvalds { 22361da177e4SLinus Torvalds } 22371da177e4SLinus Torvalds 22381da177e4SLinus Torvalds #endif /* CONFIG_SMP */ 22391da177e4SLinus Torvalds 2240a1dfb631SMarcelo Tosatti extern bool sched_task_on_rq(struct task_struct *p); 224142a20f86SKees Cook extern unsigned long get_wchan(struct task_struct *p); 2242e386b672SPaul E. 
McKenney extern struct task_struct *cpu_curr_snapshot(int cpu); 2243a1dfb631SMarcelo Tosatti 2244d9345c65SPan Xinhui /* 2245d9345c65SPan Xinhui * In order to reduce various lock holder preemption latencies provide an 2246d9345c65SPan Xinhui * interface to see if a vCPU is currently running or not. 2247d9345c65SPan Xinhui * 2248d9345c65SPan Xinhui * This allows us to terminate optimistic spin loops and block, analogous to 2249d9345c65SPan Xinhui * the native optimistic spin heuristic of testing if the lock owner task is 2250d9345c65SPan Xinhui * running or not. 2251d9345c65SPan Xinhui */ 2252d9345c65SPan Xinhui #ifndef vcpu_is_preempted 225342fd8baaSQian Cai static inline bool vcpu_is_preempted(int cpu) 225442fd8baaSQian Cai { 225542fd8baaSQian Cai return false; 225642fd8baaSQian Cai } 2257d9345c65SPan Xinhui #endif 2258d9345c65SPan Xinhui 225996f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask); 226096f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask); 22615c45bf27SSiddha, Suresh B 226282455257SDave Hansen #ifndef TASK_SIZE_OF 226382455257SDave Hansen #define TASK_SIZE_OF(tsk) TASK_SIZE 226482455257SDave Hansen #endif 226582455257SDave Hansen 2266a5418be9SViresh Kumar #ifdef CONFIG_SMP 2267c0bed69dSKefeng Wang static inline bool owner_on_cpu(struct task_struct *owner) 2268c0bed69dSKefeng Wang { 2269c0bed69dSKefeng Wang /* 2270c0bed69dSKefeng Wang * As lock holder preemption issue, we both skip spinning if 2271c0bed69dSKefeng Wang * task is not on cpu or its cpu is preempted 2272c0bed69dSKefeng Wang */ 22734cf75fd4SMarco Elver return READ_ONCE(owner->on_cpu) && !vcpu_is_preempted(task_cpu(owner)); 2274c0bed69dSKefeng Wang } 2275c0bed69dSKefeng Wang 2276a5418be9SViresh Kumar /* Returns effective CPU energy utilization, as seen by the scheduler */ 2277bb447999SDietmar Eggemann unsigned long sched_cpu_util(int cpu); 2278a5418be9SViresh Kumar #endif /* CONFIG_SMP */ 2279a5418be9SViresh Kumar 
2280d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ 2281d7822b1eSMathieu Desnoyers 2282d7822b1eSMathieu Desnoyers /* 2283d7822b1eSMathieu Desnoyers * Map the event mask on the user-space ABI enum rseq_cs_flags 2284d7822b1eSMathieu Desnoyers * for direct mask checks. 2285d7822b1eSMathieu Desnoyers */ 2286d7822b1eSMathieu Desnoyers enum rseq_event_mask_bits { 2287d7822b1eSMathieu Desnoyers RSEQ_EVENT_PREEMPT_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_PREEMPT_BIT, 2288d7822b1eSMathieu Desnoyers RSEQ_EVENT_SIGNAL_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_SIGNAL_BIT, 2289d7822b1eSMathieu Desnoyers RSEQ_EVENT_MIGRATE_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_MIGRATE_BIT, 2290d7822b1eSMathieu Desnoyers }; 2291d7822b1eSMathieu Desnoyers 2292d7822b1eSMathieu Desnoyers enum rseq_event_mask { 2293d7822b1eSMathieu Desnoyers RSEQ_EVENT_PREEMPT = (1U << RSEQ_EVENT_PREEMPT_BIT), 2294d7822b1eSMathieu Desnoyers RSEQ_EVENT_SIGNAL = (1U << RSEQ_EVENT_SIGNAL_BIT), 2295d7822b1eSMathieu Desnoyers RSEQ_EVENT_MIGRATE = (1U << RSEQ_EVENT_MIGRATE_BIT), 2296d7822b1eSMathieu Desnoyers }; 2297d7822b1eSMathieu Desnoyers 2298d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t) 2299d7822b1eSMathieu Desnoyers { 2300d7822b1eSMathieu Desnoyers if (t->rseq) 2301d7822b1eSMathieu Desnoyers set_tsk_thread_flag(t, TIF_NOTIFY_RESUME); 2302d7822b1eSMathieu Desnoyers } 2303d7822b1eSMathieu Desnoyers 2304784e0300SWill Deacon void __rseq_handle_notify_resume(struct ksignal *sig, struct pt_regs *regs); 2305d7822b1eSMathieu Desnoyers 2306784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig, 2307784e0300SWill Deacon struct pt_regs *regs) 2308d7822b1eSMathieu Desnoyers { 2309d7822b1eSMathieu Desnoyers if (current->rseq) 2310784e0300SWill Deacon __rseq_handle_notify_resume(ksig, regs); 2311d7822b1eSMathieu Desnoyers } 2312d7822b1eSMathieu Desnoyers 2313784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig, 2314784e0300SWill Deacon struct pt_regs 
*regs) 2315d7822b1eSMathieu Desnoyers { 2316d7822b1eSMathieu Desnoyers preempt_disable(); 2317d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_SIGNAL_BIT, &current->rseq_event_mask); 2318d7822b1eSMathieu Desnoyers preempt_enable(); 2319784e0300SWill Deacon rseq_handle_notify_resume(ksig, regs); 2320d7822b1eSMathieu Desnoyers } 2321d7822b1eSMathieu Desnoyers 2322d7822b1eSMathieu Desnoyers /* rseq_preempt() requires preemption to be disabled. */ 2323d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t) 2324d7822b1eSMathieu Desnoyers { 2325d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_PREEMPT_BIT, &t->rseq_event_mask); 2326d7822b1eSMathieu Desnoyers rseq_set_notify_resume(t); 2327d7822b1eSMathieu Desnoyers } 2328d7822b1eSMathieu Desnoyers 2329d7822b1eSMathieu Desnoyers /* rseq_migrate() requires preemption to be disabled. */ 2330d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t) 2331d7822b1eSMathieu Desnoyers { 2332d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_MIGRATE_BIT, &t->rseq_event_mask); 2333d7822b1eSMathieu Desnoyers rseq_set_notify_resume(t); 2334d7822b1eSMathieu Desnoyers } 2335d7822b1eSMathieu Desnoyers 2336d7822b1eSMathieu Desnoyers /* 2337d7822b1eSMathieu Desnoyers * If parent process has a registered restartable sequences area, the 2338463f550fSMathieu Desnoyers * child inherits. Unregister rseq for a clone with CLONE_VM set. 
2339d7822b1eSMathieu Desnoyers */ 2340d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) 2341d7822b1eSMathieu Desnoyers { 2342463f550fSMathieu Desnoyers if (clone_flags & CLONE_VM) { 2343d7822b1eSMathieu Desnoyers t->rseq = NULL; 2344d7822b1eSMathieu Desnoyers t->rseq_sig = 0; 2345d7822b1eSMathieu Desnoyers t->rseq_event_mask = 0; 2346d7822b1eSMathieu Desnoyers } else { 2347d7822b1eSMathieu Desnoyers t->rseq = current->rseq; 2348d7822b1eSMathieu Desnoyers t->rseq_sig = current->rseq_sig; 2349d7822b1eSMathieu Desnoyers t->rseq_event_mask = current->rseq_event_mask; 2350d7822b1eSMathieu Desnoyers } 2351d7822b1eSMathieu Desnoyers } 2352d7822b1eSMathieu Desnoyers 2353d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t) 2354d7822b1eSMathieu Desnoyers { 2355d7822b1eSMathieu Desnoyers t->rseq = NULL; 2356d7822b1eSMathieu Desnoyers t->rseq_sig = 0; 2357d7822b1eSMathieu Desnoyers t->rseq_event_mask = 0; 2358d7822b1eSMathieu Desnoyers } 2359d7822b1eSMathieu Desnoyers 2360d7822b1eSMathieu Desnoyers #else 2361d7822b1eSMathieu Desnoyers 2362d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t) 2363d7822b1eSMathieu Desnoyers { 2364d7822b1eSMathieu Desnoyers } 2365784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig, 2366784e0300SWill Deacon struct pt_regs *regs) 2367d7822b1eSMathieu Desnoyers { 2368d7822b1eSMathieu Desnoyers } 2369784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig, 2370784e0300SWill Deacon struct pt_regs *regs) 2371d7822b1eSMathieu Desnoyers { 2372d7822b1eSMathieu Desnoyers } 2373d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t) 2374d7822b1eSMathieu Desnoyers { 2375d7822b1eSMathieu Desnoyers } 2376d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t) 2377d7822b1eSMathieu Desnoyers { 2378d7822b1eSMathieu Desnoyers } 
2379d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) 2380d7822b1eSMathieu Desnoyers { 2381d7822b1eSMathieu Desnoyers } 2382d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t) 2383d7822b1eSMathieu Desnoyers { 2384d7822b1eSMathieu Desnoyers } 2385d7822b1eSMathieu Desnoyers 2386d7822b1eSMathieu Desnoyers #endif 2387d7822b1eSMathieu Desnoyers 2388d7822b1eSMathieu Desnoyers #ifdef CONFIG_DEBUG_RSEQ 2389d7822b1eSMathieu Desnoyers 2390d7822b1eSMathieu Desnoyers void rseq_syscall(struct pt_regs *regs); 2391d7822b1eSMathieu Desnoyers 2392d7822b1eSMathieu Desnoyers #else 2393d7822b1eSMathieu Desnoyers 2394d7822b1eSMathieu Desnoyers static inline void rseq_syscall(struct pt_regs *regs) 2395d7822b1eSMathieu Desnoyers { 2396d7822b1eSMathieu Desnoyers } 2397d7822b1eSMathieu Desnoyers 2398d7822b1eSMathieu Desnoyers #endif 2399d7822b1eSMathieu Desnoyers 24006e33cad0SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 24016e33cad0SPeter Zijlstra extern void sched_core_free(struct task_struct *tsk); 240285dd3f61SPeter Zijlstra extern void sched_core_fork(struct task_struct *p); 24037ac592aaSChris Hyser extern int sched_core_share_pid(unsigned int cmd, pid_t pid, enum pid_type type, 24047ac592aaSChris Hyser unsigned long uaddr); 24056e33cad0SPeter Zijlstra #else 24066e33cad0SPeter Zijlstra static inline void sched_core_free(struct task_struct *tsk) { } 240785dd3f61SPeter Zijlstra static inline void sched_core_fork(struct task_struct *p) { } 24086e33cad0SPeter Zijlstra #endif 24096e33cad0SPeter Zijlstra 2410d664e399SThomas Gleixner extern void sched_set_stop_task(int cpu, struct task_struct *stop); 2411d664e399SThomas Gleixner 24121da177e4SLinus Torvalds #endif 2413