1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */ 21da177e4SLinus Torvalds #ifndef _LINUX_SCHED_H 31da177e4SLinus Torvalds #define _LINUX_SCHED_H 41da177e4SLinus Torvalds 55eca1c10SIngo Molnar /* 65eca1c10SIngo Molnar * Define 'struct task_struct' and provide the main scheduler 75eca1c10SIngo Molnar * APIs (schedule(), wakeup variants, etc.) 85eca1c10SIngo Molnar */ 95eca1c10SIngo Molnar 10607ca46eSDavid Howells #include <uapi/linux/sched.h> 11b7b3c76aSDavid Woodhouse 1270b8157eSIngo Molnar #include <asm/current.h> 1370b8157eSIngo Molnar 145eca1c10SIngo Molnar #include <linux/pid.h> 155eca1c10SIngo Molnar #include <linux/sem.h> 165eca1c10SIngo Molnar #include <linux/shm.h> 175eca1c10SIngo Molnar #include <linux/mutex.h> 185eca1c10SIngo Molnar #include <linux/plist.h> 195eca1c10SIngo Molnar #include <linux/hrtimer.h> 200584df9cSMarco Elver #include <linux/irqflags.h> 215eca1c10SIngo Molnar #include <linux/seccomp.h> 225eca1c10SIngo Molnar #include <linux/nodemask.h> 235eca1c10SIngo Molnar #include <linux/rcupdate.h> 24ec1d2819SElena Reshetova #include <linux/refcount.h> 255eca1c10SIngo Molnar #include <linux/resource.h> 265eca1c10SIngo Molnar #include <linux/latencytop.h> 275eca1c10SIngo Molnar #include <linux/sched/prio.h> 289eacb5c7SThomas Gleixner #include <linux/sched/types.h> 295eca1c10SIngo Molnar #include <linux/signal_types.h> 301446e1dfSGabriel Krisman Bertazi #include <linux/syscall_user_dispatch.h> 315eca1c10SIngo Molnar #include <linux/mm_types_task.h> 325eca1c10SIngo Molnar #include <linux/task_io_accounting.h> 332b69942fSThomas Gleixner #include <linux/posix-timers.h> 34d7822b1eSMathieu Desnoyers #include <linux/rseq.h> 350cd39f46SPeter Zijlstra #include <linux/seqlock.h> 36dfd402a4SMarco Elver #include <linux/kcsan.h> 375fbda3ecSThomas Gleixner #include <asm/kmap_size.h> 385eca1c10SIngo Molnar 395eca1c10SIngo Molnar /* task_struct member predeclarations (sorted alphabetically): */ 40c7af7877SIngo Molnar struct audit_context; 41c7af7877SIngo Molnar struct backing_dev_info; 42c7af7877SIngo Molnar struct bio_list; 43c7af7877SIngo Molnar struct blk_plug; 44a10787e6SSong Liu struct bpf_local_storage; 45c7603cfaSAndrii Nakryiko struct bpf_run_ctx; 463c93a0c0SQais Yousef struct capture_control; 47c7af7877SIngo Molnar struct cfs_rq; 48c7af7877SIngo Molnar struct fs_struct; 49c7af7877SIngo Molnar struct futex_pi_state; 50c7af7877SIngo Molnar struct io_context; 511875dc5bSPeter Oskolkov struct io_uring_task; 52c7af7877SIngo Molnar struct mempolicy; 53c7af7877SIngo Molnar struct nameidata; 54c7af7877SIngo Molnar struct nsproxy; 55c7af7877SIngo Molnar struct perf_event_context; 56c7af7877SIngo Molnar struct pid_namespace; 57c7af7877SIngo Molnar struct pipe_inode_info; 58c7af7877SIngo Molnar struct rcu_node; 59c7af7877SIngo Molnar struct reclaim_state; 60c7af7877SIngo Molnar struct robust_list_head; 613c93a0c0SQais Yousef struct root_domain; 623c93a0c0SQais Yousef struct rq; 63e2d1e2aeSIngo Molnar struct sched_attr; 64e2d1e2aeSIngo Molnar struct sched_param; 6543ae34cbSIngo Molnar struct seq_file; 66c7af7877SIngo Molnar struct sighand_struct; 67c7af7877SIngo Molnar struct signal_struct; 68c7af7877SIngo Molnar struct task_delay_info; 694cf86d77SIngo Molnar struct task_group; 701da177e4SLinus Torvalds 714a8342d2SLinus Torvalds /* 724a8342d2SLinus Torvalds * Task state bitmask. NOTE! These bits are also 734a8342d2SLinus Torvalds * encoded in fs/proc/array.c: get_task_state(). 744a8342d2SLinus Torvalds * 754a8342d2SLinus Torvalds * We have two separate sets of flags: task->state 764a8342d2SLinus Torvalds * is about runnability, while task->exit_state are 774a8342d2SLinus Torvalds * about the task exiting. Confusing, but this way 784a8342d2SLinus Torvalds * modifying one set can't modify the other one by 794a8342d2SLinus Torvalds * mistake. 804a8342d2SLinus Torvalds */ 815eca1c10SIngo Molnar 825eca1c10SIngo Molnar /* Used in tsk->state: */ 8392c4bc9fSPeter Zijlstra #define TASK_RUNNING 0x0000 8492c4bc9fSPeter Zijlstra #define TASK_INTERRUPTIBLE 0x0001 8592c4bc9fSPeter Zijlstra #define TASK_UNINTERRUPTIBLE 0x0002 8692c4bc9fSPeter Zijlstra #define __TASK_STOPPED 0x0004 8792c4bc9fSPeter Zijlstra #define __TASK_TRACED 0x0008 885eca1c10SIngo Molnar /* Used in tsk->exit_state: */ 8992c4bc9fSPeter Zijlstra #define EXIT_DEAD 0x0010 9092c4bc9fSPeter Zijlstra #define EXIT_ZOMBIE 0x0020 91abd50b39SOleg Nesterov #define EXIT_TRACE (EXIT_ZOMBIE | EXIT_DEAD) 925eca1c10SIngo Molnar /* Used in tsk->state again: */ 938ef9925bSPeter Zijlstra #define TASK_PARKED 0x0040 948ef9925bSPeter Zijlstra #define TASK_DEAD 0x0080 958ef9925bSPeter Zijlstra #define TASK_WAKEKILL 0x0100 968ef9925bSPeter Zijlstra #define TASK_WAKING 0x0200 9792c4bc9fSPeter Zijlstra #define TASK_NOLOAD 0x0400 9892c4bc9fSPeter Zijlstra #define TASK_NEW 0x0800 99cd781d0cSThomas Gleixner /* RT specific auxilliary flag to mark RT lock waiters */ 100cd781d0cSThomas Gleixner #define TASK_RTLOCK_WAIT 0x1000 101cd781d0cSThomas Gleixner #define TASK_STATE_MAX 0x2000 102f021a3c2SMatthew Wilcox 1035eca1c10SIngo Molnar /* Convenience macros for the sake of set_current_state: */ 104f021a3c2SMatthew Wilcox #define TASK_KILLABLE (TASK_WAKEKILL | TASK_UNINTERRUPTIBLE) 105f021a3c2SMatthew Wilcox #define TASK_STOPPED (TASK_WAKEKILL | __TASK_STOPPED) 106f021a3c2SMatthew Wilcox #define TASK_TRACED (TASK_WAKEKILL | __TASK_TRACED) 1071da177e4SLinus Torvalds 10880ed87c8SPeter Zijlstra #define TASK_IDLE (TASK_UNINTERRUPTIBLE | TASK_NOLOAD) 10980ed87c8SPeter Zijlstra 1105eca1c10SIngo Molnar /* Convenience macros for the sake of wake_up(): */ 11192a1f4bcSMatthew Wilcox #define TASK_NORMAL (TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE) 11292a1f4bcSMatthew Wilcox 1135eca1c10SIngo Molnar /* get_task_state(): */ 11492a1f4bcSMatthew Wilcox #define TASK_REPORT (TASK_RUNNING | TASK_INTERRUPTIBLE | \ 115f021a3c2SMatthew Wilcox TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \ 1168ef9925bSPeter Zijlstra __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \ 1178ef9925bSPeter Zijlstra TASK_PARKED) 11892a1f4bcSMatthew Wilcox 1192f064a59SPeter Zijlstra #define task_is_running(task) (READ_ONCE((task)->__state) == TASK_RUNNING) 1205eca1c10SIngo Molnar 1212f064a59SPeter Zijlstra #define task_is_traced(task) ((READ_ONCE(task->__state) & __TASK_TRACED) != 0) 1225eca1c10SIngo Molnar 1232f064a59SPeter Zijlstra #define task_is_stopped(task) ((READ_ONCE(task->__state) & __TASK_STOPPED) != 0) 1245eca1c10SIngo Molnar 1252f064a59SPeter Zijlstra #define task_is_stopped_or_traced(task) ((READ_ONCE(task->__state) & (__TASK_STOPPED | __TASK_TRACED)) != 0) 1265eca1c10SIngo Molnar 127b5bf9a90SPeter Zijlstra /* 128b5bf9a90SPeter Zijlstra * Special states are those that do not use the normal wait-loop pattern. See 129b5bf9a90SPeter Zijlstra * the comment with set_special_state(). 130b5bf9a90SPeter Zijlstra */ 131b5bf9a90SPeter Zijlstra #define is_special_task_state(state) \ 1321cef1150SPeter Zijlstra ((state) & (__TASK_STOPPED | __TASK_TRACED | TASK_PARKED | TASK_DEAD)) 133b5bf9a90SPeter Zijlstra 13485019c16SThomas Gleixner #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 13585019c16SThomas Gleixner # define debug_normal_state_change(state_value) \ 1368eb23b9fSPeter Zijlstra do { \ 137b5bf9a90SPeter Zijlstra WARN_ON_ONCE(is_special_task_state(state_value)); \ 1388eb23b9fSPeter Zijlstra current->task_state_change = _THIS_IP_; \ 1398eb23b9fSPeter Zijlstra } while (0) 140b5bf9a90SPeter Zijlstra 14185019c16SThomas Gleixner # define debug_special_state_change(state_value) \ 1428eb23b9fSPeter Zijlstra do { \ 143b5bf9a90SPeter Zijlstra WARN_ON_ONCE(!is_special_task_state(state_value)); \ 144b5bf9a90SPeter Zijlstra current->task_state_change = _THIS_IP_; \ 145b5bf9a90SPeter Zijlstra } while (0) 14685019c16SThomas Gleixner 1475f220be2SThomas Gleixner # define debug_rtlock_wait_set_state() \ 1485f220be2SThomas Gleixner do { \ 1495f220be2SThomas Gleixner current->saved_state_change = current->task_state_change;\ 1505f220be2SThomas Gleixner current->task_state_change = _THIS_IP_; \ 1515f220be2SThomas Gleixner } while (0) 1525f220be2SThomas Gleixner 1535f220be2SThomas Gleixner # define debug_rtlock_wait_restore_state() \ 1545f220be2SThomas Gleixner do { \ 1555f220be2SThomas Gleixner current->task_state_change = current->saved_state_change;\ 1565f220be2SThomas Gleixner } while (0) 1575f220be2SThomas Gleixner 1588eb23b9fSPeter Zijlstra #else 15985019c16SThomas Gleixner # define debug_normal_state_change(cond) do { } while (0) 16085019c16SThomas Gleixner # define debug_special_state_change(cond) do { } while (0) 1615f220be2SThomas Gleixner # define debug_rtlock_wait_set_state() do { } while (0) 1625f220be2SThomas Gleixner # define debug_rtlock_wait_restore_state() do { } while (0) 16385019c16SThomas Gleixner #endif 16485019c16SThomas Gleixner 165498d0c57SAndrew Morton /* 166498d0c57SAndrew Morton * set_current_state() includes a barrier so that the write of current->state 167498d0c57SAndrew Morton * is correctly serialised wrt the caller's subsequent test of whether to 168498d0c57SAndrew Morton * actually sleep: 169498d0c57SAndrew Morton * 170a2250238SPeter Zijlstra * for (;;) { 171498d0c57SAndrew Morton * set_current_state(TASK_UNINTERRUPTIBLE); 17258877d34SPeter Zijlstra * if (CONDITION) 173a2250238SPeter Zijlstra * break; 174498d0c57SAndrew Morton * 175a2250238SPeter Zijlstra * schedule(); 176a2250238SPeter Zijlstra * } 177a2250238SPeter Zijlstra * __set_current_state(TASK_RUNNING); 178a2250238SPeter Zijlstra * 179a2250238SPeter Zijlstra * If the caller does not need such serialisation (because, for instance, the 18058877d34SPeter Zijlstra * CONDITION test and condition change and wakeup are under the same lock) then 181a2250238SPeter Zijlstra * use __set_current_state(). 182a2250238SPeter Zijlstra * 183a2250238SPeter Zijlstra * The above is typically ordered against the wakeup, which does: 184a2250238SPeter Zijlstra * 18558877d34SPeter Zijlstra * CONDITION = 1; 186a2250238SPeter Zijlstra * wake_up_state(p, TASK_UNINTERRUPTIBLE); 187a2250238SPeter Zijlstra * 18858877d34SPeter Zijlstra * where wake_up_state()/try_to_wake_up() executes a full memory barrier before 18958877d34SPeter Zijlstra * accessing p->state. 190a2250238SPeter Zijlstra * 191a2250238SPeter Zijlstra * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is, 192a2250238SPeter Zijlstra * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a 193a2250238SPeter Zijlstra * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING). 194a2250238SPeter Zijlstra * 195b5bf9a90SPeter Zijlstra * However, with slightly different timing the wakeup TASK_RUNNING store can 196dfcb245eSIngo Molnar * also collide with the TASK_UNINTERRUPTIBLE store. Losing that store is not 197b5bf9a90SPeter Zijlstra * a problem either because that will result in one extra go around the loop 198b5bf9a90SPeter Zijlstra * and our @cond test will save the day. 199a2250238SPeter Zijlstra * 200a2250238SPeter Zijlstra * Also see the comments of try_to_wake_up(). 201498d0c57SAndrew Morton */ 202b5bf9a90SPeter Zijlstra #define __set_current_state(state_value) \ 20385019c16SThomas Gleixner do { \ 20485019c16SThomas Gleixner debug_normal_state_change((state_value)); \ 20585019c16SThomas Gleixner WRITE_ONCE(current->__state, (state_value)); \ 20685019c16SThomas Gleixner } while (0) 207b5bf9a90SPeter Zijlstra 208b5bf9a90SPeter Zijlstra #define set_current_state(state_value) \ 20985019c16SThomas Gleixner do { \ 21085019c16SThomas Gleixner debug_normal_state_change((state_value)); \ 21185019c16SThomas Gleixner smp_store_mb(current->__state, (state_value)); \ 21285019c16SThomas Gleixner } while (0) 213b5bf9a90SPeter Zijlstra 214b5bf9a90SPeter Zijlstra /* 215b5bf9a90SPeter Zijlstra * set_special_state() should be used for those states when the blocking task 216b5bf9a90SPeter Zijlstra * can not use the regular condition based wait-loop. In that case we must 21785019c16SThomas Gleixner * serialize against wakeups such that any possible in-flight TASK_RUNNING 21885019c16SThomas Gleixner * stores will not collide with our state change. 219b5bf9a90SPeter Zijlstra */ 220b5bf9a90SPeter Zijlstra #define set_special_state(state_value) \ 221b5bf9a90SPeter Zijlstra do { \ 222b5bf9a90SPeter Zijlstra unsigned long flags; /* may shadow */ \ 22385019c16SThomas Gleixner \ 224b5bf9a90SPeter Zijlstra raw_spin_lock_irqsave(¤t->pi_lock, flags); \ 22585019c16SThomas Gleixner debug_special_state_change((state_value)); \ 2262f064a59SPeter Zijlstra WRITE_ONCE(current->__state, (state_value)); \ 227b5bf9a90SPeter Zijlstra raw_spin_unlock_irqrestore(¤t->pi_lock, flags); \ 228b5bf9a90SPeter Zijlstra } while (0) 229b5bf9a90SPeter Zijlstra 2305f220be2SThomas Gleixner /* 2315f220be2SThomas Gleixner * PREEMPT_RT specific variants for "sleeping" spin/rwlocks 2325f220be2SThomas Gleixner * 2335f220be2SThomas Gleixner * RT's spin/rwlock substitutions are state preserving. The state of the 2345f220be2SThomas Gleixner * task when blocking on the lock is saved in task_struct::saved_state and 2355f220be2SThomas Gleixner * restored after the lock has been acquired. These operations are 2365f220be2SThomas Gleixner * serialized by task_struct::pi_lock against try_to_wake_up(). Any non RT 2375f220be2SThomas Gleixner * lock related wakeups while the task is blocked on the lock are 2385f220be2SThomas Gleixner * redirected to operate on task_struct::saved_state to ensure that these 2395f220be2SThomas Gleixner * are not dropped. On restore task_struct::saved_state is set to 2405f220be2SThomas Gleixner * TASK_RUNNING so any wakeup attempt redirected to saved_state will fail. 2415f220be2SThomas Gleixner * 2425f220be2SThomas Gleixner * The lock operation looks like this: 2435f220be2SThomas Gleixner * 2445f220be2SThomas Gleixner * current_save_and_set_rtlock_wait_state(); 2455f220be2SThomas Gleixner * for (;;) { 2465f220be2SThomas Gleixner * if (try_lock()) 2475f220be2SThomas Gleixner * break; 2485f220be2SThomas Gleixner * raw_spin_unlock_irq(&lock->wait_lock); 2495f220be2SThomas Gleixner * schedule_rtlock(); 2505f220be2SThomas Gleixner * raw_spin_lock_irq(&lock->wait_lock); 2515f220be2SThomas Gleixner * set_current_state(TASK_RTLOCK_WAIT); 2525f220be2SThomas Gleixner * } 2535f220be2SThomas Gleixner * current_restore_rtlock_saved_state(); 2545f220be2SThomas Gleixner */ 2555f220be2SThomas Gleixner #define current_save_and_set_rtlock_wait_state() \ 2565f220be2SThomas Gleixner do { \ 2575f220be2SThomas Gleixner lockdep_assert_irqs_disabled(); \ 2585f220be2SThomas Gleixner raw_spin_lock(¤t->pi_lock); \ 2595f220be2SThomas Gleixner current->saved_state = current->__state; \ 2605f220be2SThomas Gleixner debug_rtlock_wait_set_state(); \ 2615f220be2SThomas Gleixner WRITE_ONCE(current->__state, TASK_RTLOCK_WAIT); \ 2625f220be2SThomas Gleixner raw_spin_unlock(¤t->pi_lock); \ 2635f220be2SThomas Gleixner } while (0); 2645f220be2SThomas Gleixner 2655f220be2SThomas Gleixner #define current_restore_rtlock_saved_state() \ 2665f220be2SThomas Gleixner do { \ 2675f220be2SThomas Gleixner lockdep_assert_irqs_disabled(); \ 2685f220be2SThomas Gleixner raw_spin_lock(¤t->pi_lock); \ 2695f220be2SThomas Gleixner debug_rtlock_wait_restore_state(); \ 2705f220be2SThomas Gleixner WRITE_ONCE(current->__state, current->saved_state); \ 2715f220be2SThomas Gleixner current->saved_state = TASK_RUNNING; \ 2725f220be2SThomas Gleixner raw_spin_unlock(¤t->pi_lock); \ 2735f220be2SThomas Gleixner } while (0); 2748eb23b9fSPeter Zijlstra 2752f064a59SPeter Zijlstra #define get_current_state() READ_ONCE(current->__state) 276d6c23bb3SPeter Zijlstra 2775eca1c10SIngo Molnar /* Task command name length: */ 2781da177e4SLinus Torvalds #define TASK_COMM_LEN 16 2791da177e4SLinus Torvalds 2801da177e4SLinus Torvalds extern void scheduler_tick(void); 2811da177e4SLinus Torvalds 2821da177e4SLinus Torvalds #define MAX_SCHEDULE_TIMEOUT LONG_MAX 2835eca1c10SIngo Molnar 2845eca1c10SIngo Molnar extern long schedule_timeout(long timeout); 2855eca1c10SIngo Molnar extern long schedule_timeout_interruptible(long timeout); 2865eca1c10SIngo Molnar extern long schedule_timeout_killable(long timeout); 2875eca1c10SIngo Molnar extern long schedule_timeout_uninterruptible(long timeout); 2885eca1c10SIngo Molnar extern long schedule_timeout_idle(long timeout); 2891da177e4SLinus Torvalds asmlinkage void schedule(void); 290c5491ea7SThomas Gleixner extern void schedule_preempt_disabled(void); 29119c95f26SJulien Thierry asmlinkage void preempt_schedule_irq(void); 2926991436cSThomas Gleixner #ifdef CONFIG_PREEMPT_RT 2936991436cSThomas Gleixner extern void schedule_rtlock(void); 2946991436cSThomas Gleixner #endif 2951da177e4SLinus Torvalds 29610ab5643STejun Heo extern int __must_check io_schedule_prepare(void); 29710ab5643STejun Heo extern void io_schedule_finish(int token); 2989cff8adeSNeilBrown extern long io_schedule_timeout(long timeout); 29910ab5643STejun Heo extern void io_schedule(void); 3009cff8adeSNeilBrown 301f06febc9SFrank Mayhar /** 3020ba42a59SMasanari Iida * struct prev_cputime - snapshot of system and user cputime 303d37f761dSFrederic Weisbecker * @utime: time spent in user mode 304d37f761dSFrederic Weisbecker * @stime: time spent in system mode 3059d7fb042SPeter Zijlstra * @lock: protects the above two fields 306d37f761dSFrederic Weisbecker * 3079d7fb042SPeter Zijlstra * Stores previous user/system time values such that we can guarantee 3089d7fb042SPeter Zijlstra * monotonicity. 309d37f761dSFrederic Weisbecker */ 3109d7fb042SPeter Zijlstra struct prev_cputime { 3119d7fb042SPeter Zijlstra #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE 3125613fda9SFrederic Weisbecker u64 utime; 3135613fda9SFrederic Weisbecker u64 stime; 3149d7fb042SPeter Zijlstra raw_spinlock_t lock; 3159d7fb042SPeter Zijlstra #endif 316d37f761dSFrederic Weisbecker }; 317d37f761dSFrederic Weisbecker 318bac5b6b6SFrederic Weisbecker enum vtime_state { 319bac5b6b6SFrederic Weisbecker /* Task is sleeping or running in a CPU with VTIME inactive: */ 320bac5b6b6SFrederic Weisbecker VTIME_INACTIVE = 0, 32114faf6fcSFrederic Weisbecker /* Task is idle */ 32214faf6fcSFrederic Weisbecker VTIME_IDLE, 323bac5b6b6SFrederic Weisbecker /* Task runs in kernelspace in a CPU with VTIME active: */ 324bac5b6b6SFrederic Weisbecker VTIME_SYS, 32514faf6fcSFrederic Weisbecker /* Task runs in userspace in a CPU with VTIME active: */ 32614faf6fcSFrederic Weisbecker VTIME_USER, 327e6d5bf3eSFrederic Weisbecker /* Task runs as guests in a CPU with VTIME active: */ 328e6d5bf3eSFrederic Weisbecker VTIME_GUEST, 329bac5b6b6SFrederic Weisbecker }; 330bac5b6b6SFrederic Weisbecker 331bac5b6b6SFrederic Weisbecker struct vtime { 332bac5b6b6SFrederic Weisbecker seqcount_t seqcount; 333bac5b6b6SFrederic Weisbecker unsigned long long starttime; 334bac5b6b6SFrederic Weisbecker enum vtime_state state; 335802f4a82SFrederic Weisbecker unsigned int cpu; 3362a42eb95SWanpeng Li u64 utime; 3372a42eb95SWanpeng Li u64 stime; 3382a42eb95SWanpeng Li u64 gtime; 339bac5b6b6SFrederic Weisbecker }; 340bac5b6b6SFrederic Weisbecker 34169842cbaSPatrick Bellasi /* 34269842cbaSPatrick Bellasi * Utilization clamp constraints. 34369842cbaSPatrick Bellasi * @UCLAMP_MIN: Minimum utilization 34469842cbaSPatrick Bellasi * @UCLAMP_MAX: Maximum utilization 34569842cbaSPatrick Bellasi * @UCLAMP_CNT: Utilization clamp constraints count 34669842cbaSPatrick Bellasi */ 34769842cbaSPatrick Bellasi enum uclamp_id { 34869842cbaSPatrick Bellasi UCLAMP_MIN = 0, 34969842cbaSPatrick Bellasi UCLAMP_MAX, 35069842cbaSPatrick Bellasi UCLAMP_CNT 35169842cbaSPatrick Bellasi }; 35269842cbaSPatrick Bellasi 353f9a25f77SMathieu Poirier #ifdef CONFIG_SMP 354f9a25f77SMathieu Poirier extern struct root_domain def_root_domain; 355f9a25f77SMathieu Poirier extern struct mutex sched_domains_mutex; 356f9a25f77SMathieu Poirier #endif 357f9a25f77SMathieu Poirier 3581da177e4SLinus Torvalds struct sched_info { 3597f5f8e8dSIngo Molnar #ifdef CONFIG_SCHED_INFO 3605eca1c10SIngo Molnar /* Cumulative counters: */ 3611da177e4SLinus Torvalds 3625eca1c10SIngo Molnar /* # of times we have run on this CPU: */ 3635eca1c10SIngo Molnar unsigned long pcount; 3645eca1c10SIngo Molnar 3655eca1c10SIngo Molnar /* Time spent waiting on a runqueue: */ 3665eca1c10SIngo Molnar unsigned long long run_delay; 3675eca1c10SIngo Molnar 3685eca1c10SIngo Molnar /* Timestamps: */ 3695eca1c10SIngo Molnar 3705eca1c10SIngo Molnar /* When did we last run on a CPU? */ 3715eca1c10SIngo Molnar unsigned long long last_arrival; 3725eca1c10SIngo Molnar 3735eca1c10SIngo Molnar /* When were we last queued to run? */ 3745eca1c10SIngo Molnar unsigned long long last_queued; 3755eca1c10SIngo Molnar 376f6db8347SNaveen N. Rao #endif /* CONFIG_SCHED_INFO */ 3777f5f8e8dSIngo Molnar }; 3781da177e4SLinus Torvalds 3791da177e4SLinus Torvalds /* 3806ecdd749SYuyang Du * Integer metrics need fixed point arithmetic, e.g., sched/fair 3816ecdd749SYuyang Du * has a few: load, load_avg, util_avg, freq, and capacity. 3826ecdd749SYuyang Du * 3836ecdd749SYuyang Du * We define a basic fixed point arithmetic range, and then formalize 3846ecdd749SYuyang Du * all these metrics based on that basic range. 3856ecdd749SYuyang Du */ 3866ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SHIFT 10 3876ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SCALE (1L << SCHED_FIXEDPOINT_SHIFT) 3886ecdd749SYuyang Du 38969842cbaSPatrick Bellasi /* Increase resolution of cpu_capacity calculations */ 39069842cbaSPatrick Bellasi # define SCHED_CAPACITY_SHIFT SCHED_FIXEDPOINT_SHIFT 39169842cbaSPatrick Bellasi # define SCHED_CAPACITY_SCALE (1L << SCHED_CAPACITY_SHIFT) 39269842cbaSPatrick Bellasi 39320b8a59fSIngo Molnar struct load_weight { 3949dbdb155SPeter Zijlstra unsigned long weight; 3959dbdb155SPeter Zijlstra u32 inv_weight; 39620b8a59fSIngo Molnar }; 39720b8a59fSIngo Molnar 3987f65ea42SPatrick Bellasi /** 3997f65ea42SPatrick Bellasi * struct util_est - Estimation utilization of FAIR tasks 4007f65ea42SPatrick Bellasi * @enqueued: instantaneous estimated utilization of a task/cpu 4017f65ea42SPatrick Bellasi * @ewma: the Exponential Weighted Moving Average (EWMA) 4027f65ea42SPatrick Bellasi * utilization of a task 4037f65ea42SPatrick Bellasi * 4047f65ea42SPatrick Bellasi * Support data structure to track an Exponential Weighted Moving Average 4057f65ea42SPatrick Bellasi * (EWMA) of a FAIR task's utilization. New samples are added to the moving 4067f65ea42SPatrick Bellasi * average each time a task completes an activation. Sample's weight is chosen 4077f65ea42SPatrick Bellasi * so that the EWMA will be relatively insensitive to transient changes to the 4087f65ea42SPatrick Bellasi * task's workload. 4097f65ea42SPatrick Bellasi * 4107f65ea42SPatrick Bellasi * The enqueued attribute has a slightly different meaning for tasks and cpus: 4117f65ea42SPatrick Bellasi * - task: the task's util_avg at last task dequeue time 4127f65ea42SPatrick Bellasi * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU 4137f65ea42SPatrick Bellasi * Thus, the util_est.enqueued of a task represents the contribution on the 4147f65ea42SPatrick Bellasi * estimated utilization of the CPU where that task is currently enqueued. 4157f65ea42SPatrick Bellasi * 4167f65ea42SPatrick Bellasi * Only for tasks we track a moving average of the past instantaneous 4177f65ea42SPatrick Bellasi * estimated utilization. This allows to absorb sporadic drops in utilization 4187f65ea42SPatrick Bellasi * of an otherwise almost periodic task. 41968d7a190SDietmar Eggemann * 42068d7a190SDietmar Eggemann * The UTIL_AVG_UNCHANGED flag is used to synchronize util_est with util_avg 42168d7a190SDietmar Eggemann * updates. When a task is dequeued, its util_est should not be updated if its 42268d7a190SDietmar Eggemann * util_avg has not been updated in the meantime. 42368d7a190SDietmar Eggemann * This information is mapped into the MSB bit of util_est.enqueued at dequeue 42468d7a190SDietmar Eggemann * time. Since max value of util_est.enqueued for a task is 1024 (PELT util_avg 42568d7a190SDietmar Eggemann * for a task) it is safe to use MSB. 4267f65ea42SPatrick Bellasi */ 4277f65ea42SPatrick Bellasi struct util_est { 4287f65ea42SPatrick Bellasi unsigned int enqueued; 4297f65ea42SPatrick Bellasi unsigned int ewma; 4307f65ea42SPatrick Bellasi #define UTIL_EST_WEIGHT_SHIFT 2 43168d7a190SDietmar Eggemann #define UTIL_AVG_UNCHANGED 0x80000000 432317d359dSPeter Zijlstra } __attribute__((__aligned__(sizeof(u64)))); 4337f65ea42SPatrick Bellasi 4349d89c257SYuyang Du /* 4359f683953SVincent Guittot * The load/runnable/util_avg accumulates an infinite geometric series 4360dacee1bSVincent Guittot * (see __update_load_avg_cfs_rq() in kernel/sched/pelt.c). 4377b595334SYuyang Du * 4387b595334SYuyang Du * [load_avg definition] 4397b595334SYuyang Du * 4407b595334SYuyang Du * load_avg = runnable% * scale_load_down(load) 4417b595334SYuyang Du * 4429f683953SVincent Guittot * [runnable_avg definition] 4439f683953SVincent Guittot * 4449f683953SVincent Guittot * runnable_avg = runnable% * SCHED_CAPACITY_SCALE 4457b595334SYuyang Du * 4467b595334SYuyang Du * [util_avg definition] 4477b595334SYuyang Du * 4487b595334SYuyang Du * util_avg = running% * SCHED_CAPACITY_SCALE 4497b595334SYuyang Du * 4509f683953SVincent Guittot * where runnable% is the time ratio that a sched_entity is runnable and 4519f683953SVincent Guittot * running% the time ratio that a sched_entity is running. 4527b595334SYuyang Du * 4539f683953SVincent Guittot * For cfs_rq, they are the aggregated values of all runnable and blocked 4549f683953SVincent Guittot * sched_entities. 4559f683953SVincent Guittot * 456c1b7b8d4S王文虎 * The load/runnable/util_avg doesn't directly factor frequency scaling and CPU 4579f683953SVincent Guittot * capacity scaling. The scaling is done through the rq_clock_pelt that is used 4589f683953SVincent Guittot * for computing those signals (see update_rq_clock_pelt()) 4597b595334SYuyang Du * 46023127296SVincent Guittot * N.B., the above ratios (runnable% and running%) themselves are in the 46123127296SVincent Guittot * range of [0, 1]. To do fixed point arithmetics, we therefore scale them 46223127296SVincent Guittot * to as large a range as necessary. This is for example reflected by 46323127296SVincent Guittot * util_avg's SCHED_CAPACITY_SCALE. 4647b595334SYuyang Du * 4657b595334SYuyang Du * [Overflow issue] 4667b595334SYuyang Du * 4677b595334SYuyang Du * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities 4687b595334SYuyang Du * with the highest load (=88761), always runnable on a single cfs_rq, 4697b595334SYuyang Du * and should not overflow as the number already hits PID_MAX_LIMIT. 4707b595334SYuyang Du * 4717b595334SYuyang Du * For all other cases (including 32-bit kernels), struct load_weight's 4727b595334SYuyang Du * weight will overflow first before we do, because: 4737b595334SYuyang Du * 4747b595334SYuyang Du * Max(load_avg) <= Max(load.weight) 4757b595334SYuyang Du * 4767b595334SYuyang Du * Then it is the load_weight's responsibility to consider overflow 4777b595334SYuyang Du * issues. 4789d89c257SYuyang Du */ 4799d85f21cSPaul Turner struct sched_avg { 4805eca1c10SIngo Molnar u64 last_update_time; 4815eca1c10SIngo Molnar u64 load_sum; 4829f683953SVincent Guittot u64 runnable_sum; 4835eca1c10SIngo Molnar u32 util_sum; 4845eca1c10SIngo Molnar u32 period_contrib; 4855eca1c10SIngo Molnar unsigned long load_avg; 4869f683953SVincent Guittot unsigned long runnable_avg; 4875eca1c10SIngo Molnar unsigned long util_avg; 4887f65ea42SPatrick Bellasi struct util_est util_est; 489317d359dSPeter Zijlstra } ____cacheline_aligned; 4909d85f21cSPaul Turner 49141acab88SLucas De Marchi struct sched_statistics { 4927f5f8e8dSIngo Molnar #ifdef CONFIG_SCHEDSTATS 49394c18227SIngo Molnar u64 wait_start; 49494c18227SIngo Molnar u64 wait_max; 4956d082592SArjan van de Ven u64 wait_count; 4966d082592SArjan van de Ven u64 wait_sum; 4978f0dfc34SArjan van de Ven u64 iowait_count; 4988f0dfc34SArjan van de Ven u64 iowait_sum; 49994c18227SIngo Molnar 50094c18227SIngo Molnar u64 sleep_start; 50120b8a59fSIngo Molnar u64 sleep_max; 50294c18227SIngo Molnar s64 sum_sleep_runtime; 50394c18227SIngo Molnar 50494c18227SIngo Molnar u64 block_start; 50520b8a59fSIngo Molnar u64 block_max; 506847fc0cdSYafang Shao s64 sum_block_runtime; 507847fc0cdSYafang Shao 50820b8a59fSIngo Molnar u64 exec_max; 509eba1ed4bSIngo Molnar u64 slice_max; 510cc367732SIngo Molnar 511cc367732SIngo Molnar u64 nr_migrations_cold; 512cc367732SIngo Molnar u64 nr_failed_migrations_affine; 513cc367732SIngo Molnar u64 nr_failed_migrations_running; 514cc367732SIngo Molnar u64 nr_failed_migrations_hot; 515cc367732SIngo Molnar u64 nr_forced_migrations; 516cc367732SIngo Molnar 517cc367732SIngo Molnar u64 nr_wakeups; 518cc367732SIngo Molnar u64 nr_wakeups_sync; 519cc367732SIngo Molnar u64 nr_wakeups_migrate; 520cc367732SIngo Molnar u64 nr_wakeups_local; 521cc367732SIngo Molnar u64 nr_wakeups_remote; 522cc367732SIngo Molnar u64 nr_wakeups_affine; 523cc367732SIngo Molnar u64 nr_wakeups_affine_attempts; 524cc367732SIngo Molnar u64 nr_wakeups_passive; 525cc367732SIngo Molnar u64 nr_wakeups_idle; 52641acab88SLucas De Marchi #endif 527ceeadb83SYafang Shao } ____cacheline_aligned; 52841acab88SLucas De Marchi 52941acab88SLucas De Marchi struct sched_entity { 5305eca1c10SIngo Molnar /* For load-balancing: */ 5315eca1c10SIngo Molnar struct load_weight load; 53241acab88SLucas De Marchi struct rb_node run_node; 53341acab88SLucas De Marchi struct list_head group_node; 53441acab88SLucas De Marchi unsigned int on_rq; 53541acab88SLucas De Marchi 53641acab88SLucas De Marchi u64 exec_start; 53741acab88SLucas De Marchi u64 sum_exec_runtime; 53841acab88SLucas De Marchi u64 vruntime; 53941acab88SLucas De Marchi u64 prev_sum_exec_runtime; 54041acab88SLucas De Marchi 54141acab88SLucas De Marchi u64 nr_migrations; 54241acab88SLucas De Marchi 54320b8a59fSIngo Molnar #ifdef CONFIG_FAIR_GROUP_SCHED 544fed14d45SPeter Zijlstra int depth; 54520b8a59fSIngo Molnar struct sched_entity *parent; 54620b8a59fSIngo Molnar /* rq on which this entity is (to be) queued: */ 54720b8a59fSIngo Molnar struct cfs_rq *cfs_rq; 54820b8a59fSIngo Molnar /* rq "owned" by this entity/group: */ 54920b8a59fSIngo Molnar struct cfs_rq *my_q; 5509f683953SVincent Guittot /* cached value of my_q->h_nr_running */ 5519f683953SVincent Guittot unsigned long runnable_weight; 55220b8a59fSIngo Molnar #endif 5538bd75c77SClark Williams 554141965c7SAlex Shi #ifdef CONFIG_SMP 5555a107804SJiri Olsa /* 5565a107804SJiri Olsa * Per entity load average tracking. 5575a107804SJiri Olsa * 5585a107804SJiri Olsa * Put into separate cache line so it does not 5595a107804SJiri Olsa * collide with read-mostly values above. 5605a107804SJiri Olsa */ 561317d359dSPeter Zijlstra struct sched_avg avg; 5629d85f21cSPaul Turner #endif 56320b8a59fSIngo Molnar }; 56470b97a7fSIngo Molnar 565fa717060SPeter Zijlstra struct sched_rt_entity { 566fa717060SPeter Zijlstra struct list_head run_list; 56778f2c7dbSPeter Zijlstra unsigned long timeout; 56857d2aa00SYing Xue unsigned long watchdog_stamp; 569bee367edSRichard Kennedy unsigned int time_slice; 570ff77e468SPeter Zijlstra unsigned short on_rq; 571ff77e468SPeter Zijlstra unsigned short on_list; 5726f505b16SPeter Zijlstra 57358d6c2d7SPeter Zijlstra struct sched_rt_entity *back; 574052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED 5756f505b16SPeter Zijlstra struct sched_rt_entity *parent; 5766f505b16SPeter Zijlstra /* rq on which this entity is (to be) queued: */ 5776f505b16SPeter Zijlstra struct rt_rq *rt_rq; 5786f505b16SPeter Zijlstra /* rq "owned" by this entity/group: */ 5796f505b16SPeter Zijlstra struct rt_rq *my_q; 5806f505b16SPeter Zijlstra #endif 5813859a271SKees Cook } __randomize_layout; 582fa717060SPeter Zijlstra 583aab03e05SDario Faggioli struct sched_dl_entity { 584aab03e05SDario Faggioli struct rb_node rb_node; 585aab03e05SDario Faggioli 586aab03e05SDario Faggioli /* 587aab03e05SDario Faggioli * Original scheduling parameters. Copied here from sched_attr 5884027d080Sxiaofeng.yan * during sched_setattr(), they will remain the same until 5894027d080Sxiaofeng.yan * the next sched_setattr(). 590aab03e05SDario Faggioli */ 5915eca1c10SIngo Molnar u64 dl_runtime; /* Maximum runtime for each instance */ 5925eca1c10SIngo Molnar u64 dl_deadline; /* Relative deadline of each instance */ 5935eca1c10SIngo Molnar u64 dl_period; /* Separation of two instances (period) */ 59454d6d303SDaniel Bristot de Oliveira u64 dl_bw; /* dl_runtime / dl_period */ 5953effcb42SDaniel Bristot de Oliveira u64 dl_density; /* dl_runtime / dl_deadline */ 596aab03e05SDario Faggioli 597aab03e05SDario Faggioli /* 598aab03e05SDario Faggioli * Actual scheduling parameters. Initialized with the values above, 599dfcb245eSIngo Molnar * they are continuously updated during task execution. Note that 600aab03e05SDario Faggioli * the remaining runtime could be < 0 in case we are in overrun. 601aab03e05SDario Faggioli */ 6025eca1c10SIngo Molnar s64 runtime; /* Remaining runtime for this instance */ 6035eca1c10SIngo Molnar u64 deadline; /* Absolute deadline for this instance */ 6045eca1c10SIngo Molnar unsigned int flags; /* Specifying the scheduler behaviour */ 605aab03e05SDario Faggioli 606aab03e05SDario Faggioli /* 607aab03e05SDario Faggioli * Some bool flags: 608aab03e05SDario Faggioli * 609aab03e05SDario Faggioli * @dl_throttled tells if we exhausted the runtime. If so, the 610aab03e05SDario Faggioli * task has to wait for a replenishment to be performed at the 611aab03e05SDario Faggioli * next firing of dl_timer. 612aab03e05SDario Faggioli * 6132d3d891dSDario Faggioli * @dl_boosted tells if we are boosted due to DI. If so we are 6142d3d891dSDario Faggioli * outside bandwidth enforcement mechanism (but only until we 6155bfd126eSJuri Lelli * exit the critical section); 6165bfd126eSJuri Lelli * 6175eca1c10SIngo Molnar * @dl_yielded tells if task gave up the CPU before consuming 6185bfd126eSJuri Lelli * all its available runtime during the last job. 619209a0cbdSLuca Abeni * 620209a0cbdSLuca Abeni * @dl_non_contending tells if the task is inactive while still 621209a0cbdSLuca Abeni * contributing to the active utilization. In other words, it 622209a0cbdSLuca Abeni * indicates if the inactive timer has been armed and its handler 623209a0cbdSLuca Abeni * has not been executed yet. This flag is useful to avoid race 624209a0cbdSLuca Abeni * conditions between the inactive timer handler and the wakeup 625209a0cbdSLuca Abeni * code. 62634be3930SJuri Lelli * 62734be3930SJuri Lelli * @dl_overrun tells if the task asked to be informed about runtime 62834be3930SJuri Lelli * overruns. 629aab03e05SDario Faggioli */ 630aa5222e9SDan Carpenter unsigned int dl_throttled : 1; 631aa5222e9SDan Carpenter unsigned int dl_yielded : 1; 632aa5222e9SDan Carpenter unsigned int dl_non_contending : 1; 63334be3930SJuri Lelli unsigned int dl_overrun : 1; 634aab03e05SDario Faggioli 635aab03e05SDario Faggioli /* 636aab03e05SDario Faggioli * Bandwidth enforcement timer. Each -deadline task has its 637aab03e05SDario Faggioli * own bandwidth to be enforced, thus we need one timer per task. 638aab03e05SDario Faggioli */ 639aab03e05SDario Faggioli struct hrtimer dl_timer; 640209a0cbdSLuca Abeni 641209a0cbdSLuca Abeni /* 642209a0cbdSLuca Abeni * Inactive timer, responsible for decreasing the active utilization 643209a0cbdSLuca Abeni * at the "0-lag time". When a -deadline task blocks, it contributes 644209a0cbdSLuca Abeni * to GRUB's active utilization until the "0-lag time", hence a 645209a0cbdSLuca Abeni * timer is needed to decrease the active utilization at the correct 646209a0cbdSLuca Abeni * time. 647209a0cbdSLuca Abeni */ 648209a0cbdSLuca Abeni struct hrtimer inactive_timer; 6492279f540SJuri Lelli 6502279f540SJuri Lelli #ifdef CONFIG_RT_MUTEXES 6512279f540SJuri Lelli /* 6522279f540SJuri Lelli * Priority Inheritance. When a DEADLINE scheduling entity is boosted 6532279f540SJuri Lelli * pi_se points to the donor, otherwise points to the dl_se it belongs 6542279f540SJuri Lelli * to (the original one/itself). 6552279f540SJuri Lelli */ 6562279f540SJuri Lelli struct sched_dl_entity *pi_se; 6572279f540SJuri Lelli #endif 658aab03e05SDario Faggioli }; 6598bd75c77SClark Williams 66069842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 66169842cbaSPatrick Bellasi /* Number of utilization clamp buckets (shorter alias) */ 66269842cbaSPatrick Bellasi #define UCLAMP_BUCKETS CONFIG_UCLAMP_BUCKETS_COUNT 66369842cbaSPatrick Bellasi 66469842cbaSPatrick Bellasi /* 66569842cbaSPatrick Bellasi * Utilization clamp for a scheduling entity 66669842cbaSPatrick Bellasi * @value: clamp value "assigned" to a se 66769842cbaSPatrick Bellasi * @bucket_id: bucket index corresponding to the "assigned" value 668e8f14172SPatrick Bellasi * @active: the se is currently refcounted in a rq's bucket 669a509a7cdSPatrick Bellasi * @user_defined: the requested clamp value comes from user-space 67069842cbaSPatrick Bellasi * 67169842cbaSPatrick Bellasi * The bucket_id is the index of the clamp bucket matching the clamp value 67269842cbaSPatrick Bellasi * which is pre-computed and stored to avoid expensive integer divisions from 67369842cbaSPatrick Bellasi * the fast path. 674e8f14172SPatrick Bellasi * 675e8f14172SPatrick Bellasi * The active bit is set whenever a task has got an "effective" value assigned, 676e8f14172SPatrick Bellasi * which can be different from the clamp value "requested" from user-space. 677e8f14172SPatrick Bellasi * This allows to know a task is refcounted in the rq's bucket corresponding 678e8f14172SPatrick Bellasi * to the "effective" bucket_id. 679a509a7cdSPatrick Bellasi * 680a509a7cdSPatrick Bellasi * The user_defined bit is set whenever a task has got a task-specific clamp 681a509a7cdSPatrick Bellasi * value requested from userspace, i.e. the system defaults apply to this task 682a509a7cdSPatrick Bellasi * just as a restriction. This allows to relax default clamps when a less 683a509a7cdSPatrick Bellasi * restrictive task-specific value has been requested, thus allowing to 684a509a7cdSPatrick Bellasi * implement a "nice" semantic. For example, a task running with a 20% 685a509a7cdSPatrick Bellasi * default boost can still drop its own boosting to 0%. 68669842cbaSPatrick Bellasi */ 68769842cbaSPatrick Bellasi struct uclamp_se { 68869842cbaSPatrick Bellasi unsigned int value : bits_per(SCHED_CAPACITY_SCALE); 68969842cbaSPatrick Bellasi unsigned int bucket_id : bits_per(UCLAMP_BUCKETS); 690e8f14172SPatrick Bellasi unsigned int active : 1; 691a509a7cdSPatrick Bellasi unsigned int user_defined : 1; 69269842cbaSPatrick Bellasi }; 69369842cbaSPatrick Bellasi #endif /* CONFIG_UCLAMP_TASK */ 69469842cbaSPatrick Bellasi 6951d082fd0SPaul E. McKenney union rcu_special { 6961d082fd0SPaul E. McKenney struct { 6978203d6d0SPaul E. McKenney u8 blocked; 6988203d6d0SPaul E. McKenney u8 need_qs; 69905f41571SPaul E. McKenney u8 exp_hint; /* Hint for performance. */ 700276c4104SPaul E. McKenney u8 need_mb; /* Readers need smp_mb(). */ 7018203d6d0SPaul E. McKenney } b; /* Bits. */ 70205f41571SPaul E. McKenney u32 s; /* Set of bits. */ 7031d082fd0SPaul E. McKenney }; 70486848966SPaul E. McKenney 7058dc85d54SPeter Zijlstra enum perf_event_task_context { 7068dc85d54SPeter Zijlstra perf_invalid_context = -1, 7078dc85d54SPeter Zijlstra perf_hw_context = 0, 70889a1e187SPeter Zijlstra perf_sw_context, 7098dc85d54SPeter Zijlstra perf_nr_task_contexts, 7108dc85d54SPeter Zijlstra }; 7118dc85d54SPeter Zijlstra 712eb61baf6SIngo Molnar struct wake_q_node { 713eb61baf6SIngo Molnar struct wake_q_node *next; 714eb61baf6SIngo Molnar }; 715eb61baf6SIngo Molnar 7165fbda3ecSThomas Gleixner struct kmap_ctrl { 7175fbda3ecSThomas Gleixner #ifdef CONFIG_KMAP_LOCAL 7185fbda3ecSThomas Gleixner int idx; 7195fbda3ecSThomas Gleixner pte_t pteval[KM_MAX_IDX]; 7205fbda3ecSThomas Gleixner #endif 7215fbda3ecSThomas Gleixner }; 7225fbda3ecSThomas Gleixner 7231da177e4SLinus Torvalds struct task_struct { 724c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 725c65eacbeSAndy Lutomirski /* 726c65eacbeSAndy Lutomirski * For reasons of header soup (see current_thread_info()), this 727c65eacbeSAndy Lutomirski * must be the first element of task_struct. 728c65eacbeSAndy Lutomirski */ 729c65eacbeSAndy Lutomirski struct thread_info thread_info; 730c65eacbeSAndy Lutomirski #endif 7312f064a59SPeter Zijlstra unsigned int __state; 73229e48ce8SKees Cook 7335f220be2SThomas Gleixner #ifdef CONFIG_PREEMPT_RT 7345f220be2SThomas Gleixner /* saved state for "spinlock sleepers" */ 7355f220be2SThomas Gleixner unsigned int saved_state; 7365f220be2SThomas Gleixner #endif 7375f220be2SThomas Gleixner 73829e48ce8SKees Cook /* 73929e48ce8SKees Cook * This begins the randomizable portion of task_struct. Only 74029e48ce8SKees Cook * scheduling-critical items should be added above here. 74129e48ce8SKees Cook */ 74229e48ce8SKees Cook randomized_struct_fields_start 74329e48ce8SKees Cook 744f7e4217bSRoman Zippel void *stack; 745ec1d2819SElena Reshetova refcount_t usage; 7465eca1c10SIngo Molnar /* Per task flags (PF_*), defined further below: */ 7475eca1c10SIngo Molnar unsigned int flags; 74897dc32cdSWilliam Cohen unsigned int ptrace; 7491da177e4SLinus Torvalds 7502dd73a4fSPeter Williams #ifdef CONFIG_SMP 7513ca7a440SPeter Zijlstra int on_cpu; 7528c4890d1SPeter Zijlstra struct __call_single_node wake_entry; 753c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 7545eca1c10SIngo Molnar /* Current CPU: */ 7555eca1c10SIngo Molnar unsigned int cpu; 756c65eacbeSAndy Lutomirski #endif 75763b0e9edSMike Galbraith unsigned int wakee_flips; 75862470419SMichael Wang unsigned long wakee_flip_decay_ts; 75963b0e9edSMike Galbraith struct task_struct *last_wakee; 760ac66f547SPeter Zijlstra 76132e839ddSMel Gorman /* 76232e839ddSMel Gorman * recent_used_cpu is initially set as the last CPU used by a task 76332e839ddSMel Gorman * that wakes affine another task. Waker/wakee relationships can 76432e839ddSMel Gorman * push tasks around a CPU where each wakeup moves to the next one. 76532e839ddSMel Gorman * Tracking a recently used CPU allows a quick search for a recently 76632e839ddSMel Gorman * used CPU that may be idle. 76732e839ddSMel Gorman */ 76832e839ddSMel Gorman int recent_used_cpu; 769ac66f547SPeter Zijlstra int wake_cpu; 7704866cde0SNick Piggin #endif 771fd2f4419SPeter Zijlstra int on_rq; 77250e645a8SIngo Molnar 7735eca1c10SIngo Molnar int prio; 7745eca1c10SIngo Molnar int static_prio; 7755eca1c10SIngo Molnar int normal_prio; 776c7aceabaSRichard Kennedy unsigned int rt_priority; 7775eca1c10SIngo Molnar 77820b8a59fSIngo Molnar struct sched_entity se; 779fa717060SPeter Zijlstra struct sched_rt_entity rt; 7808a311c74SPeter Zijlstra struct sched_dl_entity dl; 781*804bccbaSKees Cook const struct sched_class *sched_class; 7828a311c74SPeter Zijlstra 7838a311c74SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 7848a311c74SPeter Zijlstra struct rb_node core_node; 7858a311c74SPeter Zijlstra unsigned long core_cookie; 786d2dfa17bSPeter Zijlstra unsigned int core_occupation; 7878a311c74SPeter Zijlstra #endif 7888a311c74SPeter Zijlstra 7898323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED 7908323f26cSPeter Zijlstra struct task_group *sched_task_group; 7918323f26cSPeter Zijlstra #endif 7921da177e4SLinus Torvalds 79369842cbaSPatrick Bellasi #ifdef CONFIG_UCLAMP_TASK 79413685c4aSQais Yousef /* 79513685c4aSQais Yousef * Clamp values requested for a scheduling entity. 79613685c4aSQais Yousef * Must be updated with task_rq_lock() held. 79713685c4aSQais Yousef */ 798e8f14172SPatrick Bellasi struct uclamp_se uclamp_req[UCLAMP_CNT]; 79913685c4aSQais Yousef /* 80013685c4aSQais Yousef * Effective clamp values used for a scheduling entity. 80113685c4aSQais Yousef * Must be updated with task_rq_lock() held. 80213685c4aSQais Yousef */ 80369842cbaSPatrick Bellasi struct uclamp_se uclamp[UCLAMP_CNT]; 80469842cbaSPatrick Bellasi #endif 80569842cbaSPatrick Bellasi 806ceeadb83SYafang Shao struct sched_statistics stats; 807ceeadb83SYafang Shao 808e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS 8095eca1c10SIngo Molnar /* List of struct preempt_notifier: */ 810e107be36SAvi Kivity struct hlist_head preempt_notifiers; 811e107be36SAvi Kivity #endif 812e107be36SAvi Kivity 8136c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE 8142056a782SJens Axboe unsigned int btrace_seq; 8156c5c9341SAlexey Dobriyan #endif 8161da177e4SLinus Torvalds 81797dc32cdSWilliam Cohen unsigned int policy; 81829baa747SPeter Zijlstra int nr_cpus_allowed; 8193bd37062SSebastian Andrzej Siewior const cpumask_t *cpus_ptr; 820b90ca8baSWill Deacon cpumask_t *user_cpus_ptr; 8213bd37062SSebastian Andrzej Siewior cpumask_t cpus_mask; 8226d337eabSPeter Zijlstra void *migration_pending; 82374d862b6SThomas Gleixner #ifdef CONFIG_SMP 824a7c81556SPeter Zijlstra unsigned short migration_disabled; 825af449901SPeter Zijlstra #endif 826a7c81556SPeter Zijlstra unsigned short migration_flags; 8271da177e4SLinus Torvalds 828a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU 829e260be67SPaul E. McKenney int rcu_read_lock_nesting; 8301d082fd0SPaul E. McKenney union rcu_special rcu_read_unlock_special; 831f41d911fSPaul E. McKenney struct list_head rcu_node_entry; 832a57eb940SPaul E. McKenney struct rcu_node *rcu_blocked_node; 83328f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */ 8345eca1c10SIngo Molnar 8358315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU 8368315f422SPaul E. McKenney unsigned long rcu_tasks_nvcsw; 837ccdd29ffSPaul E. McKenney u8 rcu_tasks_holdout; 838ccdd29ffSPaul E. McKenney u8 rcu_tasks_idx; 839176f8f7aSPaul E. McKenney int rcu_tasks_idle_cpu; 840ccdd29ffSPaul E. McKenney struct list_head rcu_tasks_holdout_list; 8418315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */ 842e260be67SPaul E. McKenney 843d5f177d3SPaul E. McKenney #ifdef CONFIG_TASKS_TRACE_RCU 844d5f177d3SPaul E. McKenney int trc_reader_nesting; 845d5f177d3SPaul E. McKenney int trc_ipi_to_cpu; 846276c4104SPaul E. McKenney union rcu_special trc_reader_special; 847d5f177d3SPaul E. McKenney bool trc_reader_checked; 848d5f177d3SPaul E. McKenney struct list_head trc_holdout_list; 849d5f177d3SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_TRACE_RCU */ 850d5f177d3SPaul E. McKenney 8511da177e4SLinus Torvalds struct sched_info sched_info; 8521da177e4SLinus Torvalds 8531da177e4SLinus Torvalds struct list_head tasks; 854806c09a7SDario Faggioli #ifdef CONFIG_SMP 855917b627dSGregory Haskins struct plist_node pushable_tasks; 8561baca4ceSJuri Lelli struct rb_node pushable_dl_tasks; 857806c09a7SDario Faggioli #endif 8581da177e4SLinus Torvalds 8595eca1c10SIngo Molnar struct mm_struct *mm; 8605eca1c10SIngo Molnar struct mm_struct *active_mm; 861314ff785SIngo Molnar 862314ff785SIngo Molnar /* Per-thread vma caching: */ 863314ff785SIngo Molnar struct vmacache vmacache; 864314ff785SIngo Molnar 8655eca1c10SIngo Molnar #ifdef SPLIT_RSS_COUNTING 86634e55232SKAMEZAWA Hiroyuki struct task_rss_stat rss_stat; 86734e55232SKAMEZAWA Hiroyuki #endif 86897dc32cdSWilliam Cohen int exit_state; 8695eca1c10SIngo Molnar int exit_code; 8705eca1c10SIngo Molnar int exit_signal; 8715eca1c10SIngo Molnar /* The signal sent when the parent dies: */ 8725eca1c10SIngo Molnar int pdeath_signal; 8735eca1c10SIngo Molnar /* JOBCTL_*, siglock protected: */ 8745eca1c10SIngo Molnar unsigned long jobctl; 8759b89f6baSAndrei Epure 8765eca1c10SIngo Molnar /* Used for emulating ABI behavior of previous Linux versions: */ 87797dc32cdSWilliam Cohen unsigned int personality; 8789b89f6baSAndrei Epure 8795eca1c10SIngo Molnar /* Scheduler bits, serialized by scheduler locks: */ 880ca94c442SLennart Poettering unsigned sched_reset_on_fork:1; 881a8e4f2eaSPeter Zijlstra unsigned sched_contributes_to_load:1; 882ff303e66SPeter Zijlstra unsigned sched_migrated:1; 883eb414681SJohannes Weiner #ifdef CONFIG_PSI 884eb414681SJohannes Weiner unsigned sched_psi_wake_requeue:1; 885eb414681SJohannes Weiner #endif 886eb414681SJohannes Weiner 8875eca1c10SIngo Molnar /* Force alignment to the next boundary: */ 8885eca1c10SIngo Molnar unsigned :0; 889be958bdcSPeter Zijlstra 8905eca1c10SIngo Molnar /* Unserialized, strictly 'current' */ 8915eca1c10SIngo Molnar 892f97bb527SPeter Zijlstra /* 893f97bb527SPeter Zijlstra * This field must not be in the scheduler word above due to wakelist 894f97bb527SPeter Zijlstra * queueing no longer being serialized by p->on_cpu. However: 895f97bb527SPeter Zijlstra * 896f97bb527SPeter Zijlstra * p->XXX = X; ttwu() 897f97bb527SPeter Zijlstra * schedule() if (p->on_rq && ..) // false 898f97bb527SPeter Zijlstra * smp_mb__after_spinlock(); if (smp_load_acquire(&p->on_cpu) && //true 899f97bb527SPeter Zijlstra * deactivate_task() ttwu_queue_wakelist()) 900f97bb527SPeter Zijlstra * p->on_rq = 0; p->sched_remote_wakeup = Y; 901f97bb527SPeter Zijlstra * 902f97bb527SPeter Zijlstra * guarantees all stores of 'current' are visible before 903f97bb527SPeter Zijlstra * ->sched_remote_wakeup gets used, so it can be in this word. 904f97bb527SPeter Zijlstra */ 905f97bb527SPeter Zijlstra unsigned sched_remote_wakeup:1; 906f97bb527SPeter Zijlstra 9075eca1c10SIngo Molnar /* Bit to tell LSMs we're in execve(): */ 9085eca1c10SIngo Molnar unsigned in_execve:1; 909be958bdcSPeter Zijlstra unsigned in_iowait:1; 9105eca1c10SIngo Molnar #ifndef TIF_RESTORE_SIGMASK 9117e781418SAndy Lutomirski unsigned restore_sigmask:1; 9127e781418SAndy Lutomirski #endif 913626ebc41STejun Heo #ifdef CONFIG_MEMCG 91429ef680aSMichal Hocko unsigned in_user_fault:1; 915127424c8SJohannes Weiner #endif 916ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK 917ff303e66SPeter Zijlstra unsigned brk_randomized:1; 918ff303e66SPeter Zijlstra #endif 91977f88796STejun Heo #ifdef CONFIG_CGROUPS 92077f88796STejun Heo /* disallow userland-initiated cgroup migration */ 92177f88796STejun Heo unsigned no_cgroup_migration:1; 92276f969e8SRoman Gushchin /* task is frozen/stopped (used by the cgroup freezer) */ 92376f969e8SRoman Gushchin unsigned frozen:1; 92477f88796STejun Heo #endif 925d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP 926d09d8df3SJosef Bacik unsigned use_memdelay:1; 927d09d8df3SJosef Bacik #endif 9281066d1b6SYafang Shao #ifdef CONFIG_PSI 9291066d1b6SYafang Shao /* Stalled due to lack of memory */ 9301066d1b6SYafang Shao unsigned in_memstall:1; 9311066d1b6SYafang Shao #endif 9328e9b16c4SSergei Trofimovich #ifdef CONFIG_PAGE_OWNER 9338e9b16c4SSergei Trofimovich /* Used by page_owner=on to detect recursion in page tracking. */ 9348e9b16c4SSergei Trofimovich unsigned in_page_owner:1; 9358e9b16c4SSergei Trofimovich #endif 936b542e383SThomas Gleixner #ifdef CONFIG_EVENTFD 937b542e383SThomas Gleixner /* Recursion prevention for eventfd_signal() */ 938b542e383SThomas Gleixner unsigned in_eventfd_signal:1; 939b542e383SThomas Gleixner #endif 9406f185c29SVladimir Davydov 9415eca1c10SIngo Molnar unsigned long atomic_flags; /* Flags requiring atomic access. */ 9421d4457f9SKees Cook 943f56141e3SAndy Lutomirski struct restart_block restart_block; 944f56141e3SAndy Lutomirski 9451da177e4SLinus Torvalds pid_t pid; 9461da177e4SLinus Torvalds pid_t tgid; 9470a425405SArjan van de Ven 948050e9baaSLinus Torvalds #ifdef CONFIG_STACKPROTECTOR 9495eca1c10SIngo Molnar /* Canary value for the -fstack-protector GCC feature: */ 9500a425405SArjan van de Ven unsigned long stack_canary; 9511314562aSHiroshi Shimamoto #endif 9521da177e4SLinus Torvalds /* 9535eca1c10SIngo Molnar * Pointers to the (original) parent process, youngest child, younger sibling, 9541da177e4SLinus Torvalds * older sibling, respectively. (p->father can be replaced with 955f470021aSRoland McGrath * p->real_parent->pid) 9561da177e4SLinus Torvalds */ 9575eca1c10SIngo Molnar 9585eca1c10SIngo Molnar /* Real parent process: */ 9595eca1c10SIngo Molnar struct task_struct __rcu *real_parent; 9605eca1c10SIngo Molnar 9615eca1c10SIngo Molnar /* Recipient of SIGCHLD, wait4() reports: */ 9625eca1c10SIngo Molnar struct task_struct __rcu *parent; 9631da177e4SLinus Torvalds 964f470021aSRoland McGrath /* 9655eca1c10SIngo Molnar * Children/sibling form the list of natural children: 9665eca1c10SIngo Molnar */ 9675eca1c10SIngo Molnar struct list_head children; 9685eca1c10SIngo Molnar struct list_head sibling; 9695eca1c10SIngo Molnar struct task_struct *group_leader; 9705eca1c10SIngo Molnar 9715eca1c10SIngo Molnar /* 9725eca1c10SIngo Molnar * 'ptraced' is the list of tasks this task is using ptrace() on. 9735eca1c10SIngo Molnar * 974f470021aSRoland McGrath * This includes both natural children and PTRACE_ATTACH targets. 9755eca1c10SIngo Molnar * 'ptrace_entry' is this task's link on the p->parent->ptraced list. 976f470021aSRoland McGrath */ 977f470021aSRoland McGrath struct list_head ptraced; 978f470021aSRoland McGrath struct list_head ptrace_entry; 979f470021aSRoland McGrath 9801da177e4SLinus Torvalds /* PID/PID hash table linkage. */ 9812c470475SEric W. Biederman struct pid *thread_pid; 9822c470475SEric W. Biederman struct hlist_node pid_links[PIDTYPE_MAX]; 98347e65328SOleg Nesterov struct list_head thread_group; 9840c740d0aSOleg Nesterov struct list_head thread_node; 9851da177e4SLinus Torvalds 9865eca1c10SIngo Molnar struct completion *vfork_done; 9871da177e4SLinus Torvalds 9885eca1c10SIngo Molnar /* CLONE_CHILD_SETTID: */ 9895eca1c10SIngo Molnar int __user *set_child_tid; 9905eca1c10SIngo Molnar 9915eca1c10SIngo Molnar /* CLONE_CHILD_CLEARTID: */ 9925eca1c10SIngo Molnar int __user *clear_child_tid; 9935eca1c10SIngo Molnar 9943bfe6106SJens Axboe /* PF_IO_WORKER */ 9953bfe6106SJens Axboe void *pf_io_worker; 9963bfe6106SJens Axboe 9975eca1c10SIngo Molnar u64 utime; 9985eca1c10SIngo Molnar u64 stime; 99940565b5aSStanislaw Gruszka #ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME 10005eca1c10SIngo Molnar u64 utimescaled; 10015eca1c10SIngo Molnar u64 stimescaled; 100240565b5aSStanislaw Gruszka #endif 100316a6d9beSFrederic Weisbecker u64 gtime; 10049d7fb042SPeter Zijlstra struct prev_cputime prev_cputime; 10056a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN 1006bac5b6b6SFrederic Weisbecker struct vtime vtime; 10076a61671bSFrederic Weisbecker #endif 1008d027d45dSFrederic Weisbecker 1009d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL 1010f009a7a7SFrederic Weisbecker atomic_t tick_dep_mask; 1011d027d45dSFrederic Weisbecker #endif 10125eca1c10SIngo Molnar /* Context switch counts: */ 10135eca1c10SIngo Molnar unsigned long nvcsw; 10145eca1c10SIngo Molnar unsigned long nivcsw; 10155eca1c10SIngo Molnar 10165eca1c10SIngo Molnar /* Monotonic time in nsecs: */ 10175eca1c10SIngo Molnar u64 start_time; 10185eca1c10SIngo Molnar 10195eca1c10SIngo Molnar /* Boot based time in nsecs: */ 1020cf25e24dSPeter Zijlstra u64 start_boottime; 10215eca1c10SIngo Molnar 10225eca1c10SIngo Molnar /* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */ 10235eca1c10SIngo Molnar unsigned long min_flt; 10245eca1c10SIngo Molnar unsigned long maj_flt; 10251da177e4SLinus Torvalds 10262b69942fSThomas Gleixner /* Empty if CONFIG_POSIX_CPUTIMERS=n */ 10272b69942fSThomas Gleixner struct posix_cputimers posix_cputimers; 10281da177e4SLinus Torvalds 10291fb497ddSThomas Gleixner #ifdef CONFIG_POSIX_CPU_TIMERS_TASK_WORK 10301fb497ddSThomas Gleixner struct posix_cputimers_work posix_cputimers_work; 10311fb497ddSThomas Gleixner #endif 10321fb497ddSThomas Gleixner 10335eca1c10SIngo Molnar /* Process credentials: */ 10345eca1c10SIngo Molnar 10355eca1c10SIngo Molnar /* Tracer's credentials at attach: */ 10365eca1c10SIngo Molnar const struct cred __rcu *ptracer_cred; 10375eca1c10SIngo Molnar 10385eca1c10SIngo Molnar /* Objective and real subjective task credentials (COW): */ 10395eca1c10SIngo Molnar const struct cred __rcu *real_cred; 10405eca1c10SIngo Molnar 10415eca1c10SIngo Molnar /* Effective (overridable) subjective task credentials (COW): */ 10425eca1c10SIngo Molnar const struct cred __rcu *cred; 10435eca1c10SIngo Molnar 10447743c48eSDavid Howells #ifdef CONFIG_KEYS 10457743c48eSDavid Howells /* Cached requested key. */ 10467743c48eSDavid Howells struct key *cached_requested_key; 10477743c48eSDavid Howells #endif 10487743c48eSDavid Howells 10495eca1c10SIngo Molnar /* 10505eca1c10SIngo Molnar * executable name, excluding path. 10515eca1c10SIngo Molnar * 10525eca1c10SIngo Molnar * - normally initialized setup_new_exec() 10535eca1c10SIngo Molnar * - access it with [gs]et_task_comm() 10545eca1c10SIngo Molnar * - lock it with task_lock() 10555eca1c10SIngo Molnar */ 10565eca1c10SIngo Molnar char comm[TASK_COMM_LEN]; 10575eca1c10SIngo Molnar 1058756daf26SNeilBrown struct nameidata *nameidata; 10595eca1c10SIngo Molnar 10603d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC 10611da177e4SLinus Torvalds struct sysv_sem sysvsem; 1062ab602f79SJack Miller struct sysv_shm sysvshm; 10633d5b6fccSAlexey Dobriyan #endif 1064e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK 106582a1fcb9SIngo Molnar unsigned long last_switch_count; 1066a2e51445SDmitry Vyukov unsigned long last_switch_time; 106782a1fcb9SIngo Molnar #endif 10685eca1c10SIngo Molnar /* Filesystem information: */ 10691da177e4SLinus Torvalds struct fs_struct *fs; 10705eca1c10SIngo Molnar 10715eca1c10SIngo Molnar /* Open file information: */ 10721da177e4SLinus Torvalds struct files_struct *files; 10735eca1c10SIngo Molnar 10740f212204SJens Axboe #ifdef CONFIG_IO_URING 10750f212204SJens Axboe struct io_uring_task *io_uring; 10760f212204SJens Axboe #endif 10770f212204SJens Axboe 10785eca1c10SIngo Molnar /* Namespaces: */ 1079ab516013SSerge E. Hallyn struct nsproxy *nsproxy; 10805eca1c10SIngo Molnar 10815eca1c10SIngo Molnar /* Signal handlers: */ 10821da177e4SLinus Torvalds struct signal_struct *signal; 1083913292c9SMadhuparna Bhowmik struct sighand_struct __rcu *sighand; 10845eca1c10SIngo Molnar sigset_t blocked; 10855eca1c10SIngo Molnar sigset_t real_blocked; 10865eca1c10SIngo Molnar /* Restored if set_restore_sigmask() was used: */ 10875eca1c10SIngo Molnar sigset_t saved_sigmask; 10881da177e4SLinus Torvalds struct sigpending pending; 10891da177e4SLinus Torvalds unsigned long sas_ss_sp; 10901da177e4SLinus Torvalds size_t sas_ss_size; 10915eca1c10SIngo Molnar unsigned int sas_ss_flags; 10922e01fabeSOleg Nesterov 109367d12145SAl Viro struct callback_head *task_works; 1094e73f8959SOleg Nesterov 10954b7d248bSRichard Guy Briggs #ifdef CONFIG_AUDIT 1096bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL 10975f3d544fSRichard Guy Briggs struct audit_context *audit_context; 10985f3d544fSRichard Guy Briggs #endif 1099e1760bd5SEric W. Biederman kuid_t loginuid; 11004746ec5bSEric Paris unsigned int sessionid; 1101bfef93a5SAl Viro #endif 1102932ecebbSWill Drewry struct seccomp seccomp; 11031446e1dfSGabriel Krisman Bertazi struct syscall_user_dispatch syscall_dispatch; 11041da177e4SLinus Torvalds 11055eca1c10SIngo Molnar /* Thread group tracking: */ 1106d1e7fd64SEric W. Biederman u64 parent_exec_id; 1107d1e7fd64SEric W. Biederman u64 self_exec_id; 11085eca1c10SIngo Molnar 11095eca1c10SIngo Molnar /* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */ 11101da177e4SLinus Torvalds spinlock_t alloc_lock; 11111da177e4SLinus Torvalds 1112b29739f9SIngo Molnar /* Protection of the PI data structures: */ 11131d615482SThomas Gleixner raw_spinlock_t pi_lock; 1114b29739f9SIngo Molnar 111576751049SPeter Zijlstra struct wake_q_node wake_q; 111676751049SPeter Zijlstra 111723f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES 11185eca1c10SIngo Molnar /* PI waiters blocked on a rt_mutex held by this task: */ 1119a23ba907SDavidlohr Bueso struct rb_root_cached pi_waiters; 1120e96a7705SXunlei Pang /* Updated under owner's pi_lock and rq lock */ 1121e96a7705SXunlei Pang struct task_struct *pi_top_task; 11225eca1c10SIngo Molnar /* Deadlock detection and priority inheritance handling: */ 112323f78d4aSIngo Molnar struct rt_mutex_waiter *pi_blocked_on; 112423f78d4aSIngo Molnar #endif 112523f78d4aSIngo Molnar 1126408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES 11275eca1c10SIngo Molnar /* Mutex deadlock detection: */ 1128408894eeSIngo Molnar struct mutex_waiter *blocked_on; 1129408894eeSIngo Molnar #endif 11305eca1c10SIngo Molnar 1131312364f3SDaniel Vetter #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 1132312364f3SDaniel Vetter int non_block_count; 1133312364f3SDaniel Vetter #endif 1134312364f3SDaniel Vetter 1135de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS 11360584df9cSMarco Elver struct irqtrace_events irqtrace; 1137de8f5e4fSPeter Zijlstra unsigned int hardirq_threaded; 1138c86e9b98SPeter Zijlstra u64 hardirq_chain_key; 1139fa1452e8SHiroshi Shimamoto int softirqs_enabled; 1140de30a2b3SIngo Molnar int softirq_context; 114140db1739SSebastian Andrzej Siewior int irq_config; 1142de30a2b3SIngo Molnar #endif 1143728b478dSThomas Gleixner #ifdef CONFIG_PREEMPT_RT 1144728b478dSThomas Gleixner int softirq_disable_cnt; 1145728b478dSThomas Gleixner #endif 11465eca1c10SIngo Molnar 1147fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP 1148bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH 48UL 1149fbb9ce95SIngo Molnar u64 curr_chain_key; 1150fbb9ce95SIngo Molnar int lockdep_depth; 1151fbb9ce95SIngo Molnar unsigned int lockdep_recursion; 1152c7aceabaSRichard Kennedy struct held_lock held_locks[MAX_LOCK_DEPTH]; 1153fbb9ce95SIngo Molnar #endif 11545eca1c10SIngo Molnar 11555cf53f3cSElena Petrova #if defined(CONFIG_UBSAN) && !defined(CONFIG_UBSAN_TRAP) 1156c6d30853SAndrey Ryabinin unsigned int in_ubsan; 1157c6d30853SAndrey Ryabinin #endif 1158408894eeSIngo Molnar 11595eca1c10SIngo Molnar /* Journalling filesystem info: */ 11601da177e4SLinus Torvalds void *journal_info; 11611da177e4SLinus Torvalds 11625eca1c10SIngo Molnar /* Stacked block device info: */ 1163bddd87c7SAkinobu Mita struct bio_list *bio_list; 1164d89d8796SNeil Brown 116573c10101SJens Axboe #ifdef CONFIG_BLOCK 11665eca1c10SIngo Molnar /* Stack plugging: */ 116773c10101SJens Axboe struct blk_plug *plug; 116873c10101SJens Axboe #endif 116973c10101SJens Axboe 11705eca1c10SIngo Molnar /* VM state: */ 11711da177e4SLinus Torvalds struct reclaim_state *reclaim_state; 11721da177e4SLinus Torvalds 11731da177e4SLinus Torvalds struct backing_dev_info *backing_dev_info; 11741da177e4SLinus Torvalds 11751da177e4SLinus Torvalds struct io_context *io_context; 11761da177e4SLinus Torvalds 11775e1f0f09SMel Gorman #ifdef CONFIG_COMPACTION 11785e1f0f09SMel Gorman struct capture_control *capture_control; 11795e1f0f09SMel Gorman #endif 11805eca1c10SIngo Molnar /* Ptrace state: */ 11811da177e4SLinus Torvalds unsigned long ptrace_message; 1182ae7795bcSEric W. Biederman kernel_siginfo_t *last_siginfo; 11835eca1c10SIngo Molnar 11847c3ab738SAndrew Morton struct task_io_accounting ioac; 1185eb414681SJohannes Weiner #ifdef CONFIG_PSI 1186eb414681SJohannes Weiner /* Pressure stall state */ 1187eb414681SJohannes Weiner unsigned int psi_flags; 1188eb414681SJohannes Weiner #endif 11895eca1c10SIngo Molnar #ifdef CONFIG_TASK_XACCT 11905eca1c10SIngo Molnar /* Accumulated RSS usage: */ 11915eca1c10SIngo Molnar u64 acct_rss_mem1; 11925eca1c10SIngo Molnar /* Accumulated virtual memory usage: */ 11935eca1c10SIngo Molnar u64 acct_vm_mem1; 11945eca1c10SIngo Molnar /* stime + utime since last update: */ 11955eca1c10SIngo Molnar u64 acct_timexpd; 11961da177e4SLinus Torvalds #endif 11971da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS 11985eca1c10SIngo Molnar /* Protected by ->alloc_lock: */ 11995eca1c10SIngo Molnar nodemask_t mems_allowed; 12003b03706fSIngo Molnar /* Sequence number to catch updates: */ 1201b7505861SAhmed S. Darwish seqcount_spinlock_t mems_allowed_seq; 1202825a46afSPaul Jackson int cpuset_mem_spread_rotor; 12036adef3ebSJack Steiner int cpuset_slab_spread_rotor; 12041da177e4SLinus Torvalds #endif 1205ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS 12065eca1c10SIngo Molnar /* Control Group info protected by css_set_lock: */ 12072c392b8cSArnd Bergmann struct css_set __rcu *cgroups; 12085eca1c10SIngo Molnar /* cg_list protected by css_set_lock and tsk->alloc_lock: */ 1209817929ecSPaul Menage struct list_head cg_list; 1210ddbcc7e8SPaul Menage #endif 1211e6d42931SJohannes Weiner #ifdef CONFIG_X86_CPU_RESCTRL 12120734ded1SVikas Shivappa u32 closid; 1213d6aaba61SVikas Shivappa u32 rmid; 1214e02737d5SFenghua Yu #endif 121542b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX 12160771dfefSIngo Molnar struct robust_list_head __user *robust_list; 121734f192c6SIngo Molnar #ifdef CONFIG_COMPAT 121834f192c6SIngo Molnar struct compat_robust_list_head __user *compat_robust_list; 121934f192c6SIngo Molnar #endif 1220c87e2837SIngo Molnar struct list_head pi_state_list; 1221c87e2837SIngo Molnar struct futex_pi_state *pi_state_cache; 12223f186d97SThomas Gleixner struct mutex futex_exit_mutex; 12233d4775dfSThomas Gleixner unsigned int futex_state; 122442b2dd0aSAlexey Dobriyan #endif 1225cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS 12268dc85d54SPeter Zijlstra struct perf_event_context *perf_event_ctxp[perf_nr_task_contexts]; 1227cdd6c482SIngo Molnar struct mutex perf_event_mutex; 1228cdd6c482SIngo Molnar struct list_head perf_event_list; 1229a63eaf34SPaul Mackerras #endif 12308f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT 12318f47b187SThomas Gleixner unsigned long preempt_disable_ip; 12328f47b187SThomas Gleixner #endif 1233c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA 12345eca1c10SIngo Molnar /* Protected by alloc_lock: */ 12355eca1c10SIngo Molnar struct mempolicy *mempolicy; 123645816682SVlastimil Babka short il_prev; 1237207205a2SEric Dumazet short pref_node_fork; 1238c7aceabaSRichard Kennedy #endif 1239cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING 1240cbee9f88SPeter Zijlstra int numa_scan_seq; 1241cbee9f88SPeter Zijlstra unsigned int numa_scan_period; 1242598f0ec0SMel Gorman unsigned int numa_scan_period_max; 1243de1c9ce6SRik van Riel int numa_preferred_nid; 12446b9a7460SMel Gorman unsigned long numa_migrate_retry; 12455eca1c10SIngo Molnar /* Migration stamp: */ 12465eca1c10SIngo Molnar u64 node_stamp; 12477e2703e6SRik van Riel u64 last_task_numa_placement; 12487e2703e6SRik van Riel u64 last_sum_exec_runtime; 1249cbee9f88SPeter Zijlstra struct callback_head numa_work; 1250f809ca9aSMel Gorman 1251cb361d8cSJann Horn /* 1252cb361d8cSJann Horn * This pointer is only modified for current in syscall and 1253cb361d8cSJann Horn * pagefault context (and for tasks being destroyed), so it can be read 1254cb361d8cSJann Horn * from any of the following contexts: 1255cb361d8cSJann Horn * - RCU read-side critical section 1256cb361d8cSJann Horn * - current->numa_group from everywhere 1257cb361d8cSJann Horn * - task's runqueue locked, task not running 1258cb361d8cSJann Horn */ 1259cb361d8cSJann Horn struct numa_group __rcu *numa_group; 12608c8a743cSPeter Zijlstra 1261745d6147SMel Gorman /* 126244dba3d5SIulia Manda * numa_faults is an array split into four regions: 126344dba3d5SIulia Manda * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer 126444dba3d5SIulia Manda * in this precise order. 126544dba3d5SIulia Manda * 126644dba3d5SIulia Manda * faults_memory: Exponential decaying average of faults on a per-node 126744dba3d5SIulia Manda * basis. Scheduling placement decisions are made based on these 126844dba3d5SIulia Manda * counts. The values remain static for the duration of a PTE scan. 126944dba3d5SIulia Manda * faults_cpu: Track the nodes the process was running on when a NUMA 127044dba3d5SIulia Manda * hinting fault was incurred. 127144dba3d5SIulia Manda * faults_memory_buffer and faults_cpu_buffer: Record faults per node 127244dba3d5SIulia Manda * during the current scan window. When the scan completes, the counts 127344dba3d5SIulia Manda * in faults_memory and faults_cpu decay and these values are copied. 1274745d6147SMel Gorman */ 127544dba3d5SIulia Manda unsigned long *numa_faults; 127683e1d2cdSMel Gorman unsigned long total_numa_faults; 1277745d6147SMel Gorman 1278745d6147SMel Gorman /* 127904bb2f94SRik van Riel * numa_faults_locality tracks if faults recorded during the last 1280074c2381SMel Gorman * scan window were remote/local or failed to migrate. The task scan 1281074c2381SMel Gorman * period is adapted based on the locality of the faults with different 1282074c2381SMel Gorman * weights depending on whether they were shared or private faults 128304bb2f94SRik van Riel */ 1284074c2381SMel Gorman unsigned long numa_faults_locality[3]; 128504bb2f94SRik van Riel 1286b32e86b4SIngo Molnar unsigned long numa_pages_migrated; 1287cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */ 1288cbee9f88SPeter Zijlstra 1289d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ 1290d7822b1eSMathieu Desnoyers struct rseq __user *rseq; 1291d7822b1eSMathieu Desnoyers u32 rseq_sig; 1292d7822b1eSMathieu Desnoyers /* 1293d7822b1eSMathieu Desnoyers * RmW on rseq_event_mask must be performed atomically 1294d7822b1eSMathieu Desnoyers * with respect to preemption. 1295d7822b1eSMathieu Desnoyers */ 1296d7822b1eSMathieu Desnoyers unsigned long rseq_event_mask; 1297d7822b1eSMathieu Desnoyers #endif 1298d7822b1eSMathieu Desnoyers 129972b252aeSMel Gorman struct tlbflush_unmap_batch tlb_ubc; 130072b252aeSMel Gorman 13013fbd7ee2SEric W. Biederman union { 13023fbd7ee2SEric W. Biederman refcount_t rcu_users; 1303e56d0903SIngo Molnar struct rcu_head rcu; 13043fbd7ee2SEric W. Biederman }; 1305b92ce558SJens Axboe 13065eca1c10SIngo Molnar /* Cache last used pipe for splice(): */ 1307b92ce558SJens Axboe struct pipe_inode_info *splice_pipe; 13085640f768SEric Dumazet 13095640f768SEric Dumazet struct page_frag task_frag; 13105640f768SEric Dumazet 1311ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT 1312ca74e92bSShailabh Nagar struct task_delay_info *delays; 1313ca74e92bSShailabh Nagar #endif 131447913d4eSIngo Molnar 1315f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION 1316f4f154fdSAkinobu Mita int make_it_fail; 13179049f2f6SAkinobu Mita unsigned int fail_nth; 1318f4f154fdSAkinobu Mita #endif 13199d823e8fSWu Fengguang /* 13205eca1c10SIngo Molnar * When (nr_dirtied >= nr_dirtied_pause), it's time to call 13215eca1c10SIngo Molnar * balance_dirty_pages() for a dirty throttling pause: 13229d823e8fSWu Fengguang */ 13239d823e8fSWu Fengguang int nr_dirtied; 13249d823e8fSWu Fengguang int nr_dirtied_pause; 13255eca1c10SIngo Molnar /* Start of a write-and-pause period: */ 13265eca1c10SIngo Molnar unsigned long dirty_paused_when; 13279d823e8fSWu Fengguang 13289745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP 13299745512cSArjan van de Ven int latency_record_count; 13309745512cSArjan van de Ven struct latency_record latency_record[LT_SAVECOUNT]; 13319745512cSArjan van de Ven #endif 13326976675dSArjan van de Ven /* 13335eca1c10SIngo Molnar * Time slack values; these are used to round up poll() and 13346976675dSArjan van de Ven * select() etc timeout values. These are in nanoseconds. 13356976675dSArjan van de Ven */ 1336da8b44d5SJohn Stultz u64 timer_slack_ns; 1337da8b44d5SJohn Stultz u64 default_timer_slack_ns; 1338f8d570a4SDavid Miller 1339d73b4936SAndrey Konovalov #if defined(CONFIG_KASAN_GENERIC) || defined(CONFIG_KASAN_SW_TAGS) 13400b24beccSAndrey Ryabinin unsigned int kasan_depth; 13410b24beccSAndrey Ryabinin #endif 134292c209acSMarco Elver 1343dfd402a4SMarco Elver #ifdef CONFIG_KCSAN 1344dfd402a4SMarco Elver struct kcsan_ctx kcsan_ctx; 134592c209acSMarco Elver #ifdef CONFIG_TRACE_IRQFLAGS 134692c209acSMarco Elver struct irqtrace_events kcsan_save_irqtrace; 134792c209acSMarco Elver #endif 1348dfd402a4SMarco Elver #endif 13495eca1c10SIngo Molnar 1350393824f6SPatricia Alfonso #if IS_ENABLED(CONFIG_KUNIT) 1351393824f6SPatricia Alfonso struct kunit *kunit_test; 1352393824f6SPatricia Alfonso #endif 1353393824f6SPatricia Alfonso 1354fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER 13555eca1c10SIngo Molnar /* Index of current stored address in ret_stack: */ 1356f201ae23SFrederic Weisbecker int curr_ret_stack; 135739eb456dSSteven Rostedt (VMware) int curr_ret_depth; 13585eca1c10SIngo Molnar 13595eca1c10SIngo Molnar /* Stack of return addresses for return function tracing: */ 1360f201ae23SFrederic Weisbecker struct ftrace_ret_stack *ret_stack; 13615eca1c10SIngo Molnar 13625eca1c10SIngo Molnar /* Timestamp for last schedule: */ 13638aef2d28SSteven Rostedt unsigned long long ftrace_timestamp; 13645eca1c10SIngo Molnar 1365f201ae23SFrederic Weisbecker /* 1366f201ae23SFrederic Weisbecker * Number of functions that haven't been traced 13675eca1c10SIngo Molnar * because of depth overrun: 1368f201ae23SFrederic Weisbecker */ 1369f201ae23SFrederic Weisbecker atomic_t trace_overrun; 13705eca1c10SIngo Molnar 13715eca1c10SIngo Molnar /* Pause tracing: */ 1372380c4b14SFrederic Weisbecker atomic_t tracing_graph_pause; 1373f201ae23SFrederic Weisbecker #endif 13745eca1c10SIngo Molnar 1375ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING 13765eca1c10SIngo Molnar /* State flags for use by tracers: */ 1377ea4e2bc4SSteven Rostedt unsigned long trace; 13785eca1c10SIngo Molnar 13795eca1c10SIngo Molnar /* Bitmask and counter of trace recursion: */ 1380261842b7SSteven Rostedt unsigned long trace_recursion; 1381261842b7SSteven Rostedt #endif /* CONFIG_TRACING */ 13825eca1c10SIngo Molnar 13835c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV 1384eec028c9SAndrey Konovalov /* See kernel/kcov.c for more details. */ 1385eec028c9SAndrey Konovalov 13865eca1c10SIngo Molnar /* Coverage collection mode enabled for this task (0 if disabled): */ 13870ed557aaSMark Rutland unsigned int kcov_mode; 13885eca1c10SIngo Molnar 13895eca1c10SIngo Molnar /* Size of the kcov_area: */ 13905eca1c10SIngo Molnar unsigned int kcov_size; 13915eca1c10SIngo Molnar 13925eca1c10SIngo Molnar /* Buffer for coverage collection: */ 13935c9a8750SDmitry Vyukov void *kcov_area; 13945eca1c10SIngo Molnar 13955eca1c10SIngo Molnar /* KCOV descriptor wired with this task or NULL: */ 13965c9a8750SDmitry Vyukov struct kcov *kcov; 1397eec028c9SAndrey Konovalov 1398eec028c9SAndrey Konovalov /* KCOV common handle for remote coverage collection: */ 1399eec028c9SAndrey Konovalov u64 kcov_handle; 1400eec028c9SAndrey Konovalov 1401eec028c9SAndrey Konovalov /* KCOV sequence number: */ 1402eec028c9SAndrey Konovalov int kcov_sequence; 14035ff3b30aSAndrey Konovalov 14045ff3b30aSAndrey Konovalov /* Collect coverage from softirq context: */ 14055ff3b30aSAndrey Konovalov unsigned int kcov_softirq; 14065c9a8750SDmitry Vyukov #endif 14075eca1c10SIngo Molnar 14086f185c29SVladimir Davydov #ifdef CONFIG_MEMCG 1409626ebc41STejun Heo struct mem_cgroup *memcg_in_oom; 1410626ebc41STejun Heo gfp_t memcg_oom_gfp_mask; 1411626ebc41STejun Heo int memcg_oom_order; 1412b23afb93STejun Heo 14135eca1c10SIngo Molnar /* Number of pages to reclaim on returning to userland: */ 1414b23afb93STejun Heo unsigned int memcg_nr_pages_over_high; 1415d46eb14bSShakeel Butt 1416d46eb14bSShakeel Butt /* Used by memcontrol for targeted memcg charge: */ 1417d46eb14bSShakeel Butt struct mem_cgroup *active_memcg; 1418569b846dSKAMEZAWA Hiroyuki #endif 14195eca1c10SIngo Molnar 1420d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP 1421d09d8df3SJosef Bacik struct request_queue *throttle_queue; 1422d09d8df3SJosef Bacik #endif 1423d09d8df3SJosef Bacik 14240326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES 14250326f5a9SSrikar Dronamraju struct uprobe_task *utask; 14260326f5a9SSrikar Dronamraju #endif 1427cafe5635SKent Overstreet #if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE) 1428cafe5635SKent Overstreet unsigned int sequential_io; 1429cafe5635SKent Overstreet unsigned int sequential_io_avg; 1430cafe5635SKent Overstreet #endif 14315fbda3ecSThomas Gleixner struct kmap_ctrl kmap_ctrl; 14328eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 14338eb23b9fSPeter Zijlstra unsigned long task_state_change; 14345f220be2SThomas Gleixner # ifdef CONFIG_PREEMPT_RT 14355f220be2SThomas Gleixner unsigned long saved_state_change; 14365f220be2SThomas Gleixner # endif 14378eb23b9fSPeter Zijlstra #endif 14388bcbde54SDavid Hildenbrand int pagefault_disabled; 143903049269SMichal Hocko #ifdef CONFIG_MMU 144029c696e1SVladimir Davydov struct task_struct *oom_reaper_list; 144103049269SMichal Hocko #endif 1442ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK 1443ba14a194SAndy Lutomirski struct vm_struct *stack_vm_area; 1444ba14a194SAndy Lutomirski #endif 144568f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 14465eca1c10SIngo Molnar /* A live task holds one reference: */ 1447f0b89d39SElena Reshetova refcount_t stack_refcount; 144868f24b08SAndy Lutomirski #endif 1449d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH 1450d83a7cb3SJosh Poimboeuf int patch_state; 1451d83a7cb3SJosh Poimboeuf #endif 1452e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY 1453e4e55b47STetsuo Handa /* Used by LSM modules for access restriction: */ 1454e4e55b47STetsuo Handa void *security; 1455e4e55b47STetsuo Handa #endif 1456a10787e6SSong Liu #ifdef CONFIG_BPF_SYSCALL 1457a10787e6SSong Liu /* Used by BPF task local storage */ 1458a10787e6SSong Liu struct bpf_local_storage __rcu *bpf_storage; 1459c7603cfaSAndrii Nakryiko /* Used for BPF run context */ 1460c7603cfaSAndrii Nakryiko struct bpf_run_ctx *bpf_ctx; 1461a10787e6SSong Liu #endif 146229e48ce8SKees Cook 1463afaef01cSAlexander Popov #ifdef CONFIG_GCC_PLUGIN_STACKLEAK 1464afaef01cSAlexander Popov unsigned long lowest_stack; 1465c8d12627SAlexander Popov unsigned long prev_lowest_stack; 1466afaef01cSAlexander Popov #endif 1467afaef01cSAlexander Popov 14685567d11cSPeter Zijlstra #ifdef CONFIG_X86_MCE 1469c0ab7ffcSTony Luck void __user *mce_vaddr; 1470c0ab7ffcSTony Luck __u64 mce_kflags; 14715567d11cSPeter Zijlstra u64 mce_addr; 147217fae129STony Luck __u64 mce_ripv : 1, 147317fae129STony Luck mce_whole_page : 1, 147417fae129STony Luck __mce_reserved : 62; 14755567d11cSPeter Zijlstra struct callback_head mce_kill_me; 147681065b35STony Luck int mce_count; 14775567d11cSPeter Zijlstra #endif 14785567d11cSPeter Zijlstra 1479d741bf41SPeter Zijlstra #ifdef CONFIG_KRETPROBES 1480d741bf41SPeter Zijlstra struct llist_head kretprobe_instances; 1481d741bf41SPeter Zijlstra #endif 1482d741bf41SPeter Zijlstra 148358e106e7SBalbir Singh #ifdef CONFIG_ARCH_HAS_PARANOID_L1D_FLUSH 148458e106e7SBalbir Singh /* 148558e106e7SBalbir Singh * If L1D flush is supported on mm context switch 148658e106e7SBalbir Singh * then we use this callback head to queue kill work 148758e106e7SBalbir Singh * to kill tasks that are not running on SMT disabled 148858e106e7SBalbir Singh * cores 148958e106e7SBalbir Singh */ 149058e106e7SBalbir Singh struct callback_head l1d_flush_kill; 149158e106e7SBalbir Singh #endif 149258e106e7SBalbir Singh 149329e48ce8SKees Cook /* 149429e48ce8SKees Cook * New fields for task_struct should be added above here, so that 149529e48ce8SKees Cook * they are included in the randomized portion of task_struct. 149629e48ce8SKees Cook */ 149729e48ce8SKees Cook randomized_struct_fields_end 149829e48ce8SKees Cook 14995eca1c10SIngo Molnar /* CPU-specific state of this task: */ 15000c8c0f03SDave Hansen struct thread_struct thread; 15015eca1c10SIngo Molnar 15020c8c0f03SDave Hansen /* 15030c8c0f03SDave Hansen * WARNING: on x86, 'thread_struct' contains a variable-sized 15040c8c0f03SDave Hansen * structure. It *MUST* be at the end of 'task_struct'. 15050c8c0f03SDave Hansen * 15060c8c0f03SDave Hansen * Do not put anything below here! 15070c8c0f03SDave Hansen */ 15081da177e4SLinus Torvalds }; 15091da177e4SLinus Torvalds 1510e868171aSAlexey Dobriyan static inline struct pid *task_pid(struct task_struct *task) 151122c935f4SEric W. Biederman { 15122c470475SEric W. Biederman return task->thread_pid; 151322c935f4SEric W. Biederman } 151422c935f4SEric W. Biederman 15157af57294SPavel Emelyanov /* 15167af57294SPavel Emelyanov * the helpers to get the task's different pids as they are seen 15177af57294SPavel Emelyanov * from various namespaces 15187af57294SPavel Emelyanov * 15197af57294SPavel Emelyanov * task_xid_nr() : global id, i.e. the id seen from the init namespace; 152044c4e1b2SEric W. Biederman * task_xid_vnr() : virtual id, i.e. the id seen from the pid namespace of 152144c4e1b2SEric W. Biederman * current. 15227af57294SPavel Emelyanov * task_xid_nr_ns() : id seen from the ns specified; 15237af57294SPavel Emelyanov * 15247af57294SPavel Emelyanov * see also pid_nr() etc in include/linux/pid.h 15257af57294SPavel Emelyanov */ 15265eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns); 15277af57294SPavel Emelyanov 1528e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk) 15297af57294SPavel Emelyanov { 15307af57294SPavel Emelyanov return tsk->pid; 15317af57294SPavel Emelyanov } 15327af57294SPavel Emelyanov 15335eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 153452ee2dfdSOleg Nesterov { 153552ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns); 153652ee2dfdSOleg Nesterov } 15377af57294SPavel Emelyanov 15387af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk) 15397af57294SPavel Emelyanov { 154052ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL); 15417af57294SPavel Emelyanov } 15427af57294SPavel Emelyanov 15437af57294SPavel Emelyanov 1544e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk) 15457af57294SPavel Emelyanov { 15467af57294SPavel Emelyanov return tsk->tgid; 15477af57294SPavel Emelyanov } 15487af57294SPavel Emelyanov 15495eca1c10SIngo Molnar /** 15505eca1c10SIngo Molnar * pid_alive - check that a task structure is not stale 15515eca1c10SIngo Molnar * @p: Task structure to be checked. 15525eca1c10SIngo Molnar * 15535eca1c10SIngo Molnar * Test if a process is not yet dead (at most zombie state) 15545eca1c10SIngo Molnar * If pid_alive fails, then pointers within the task structure 15555eca1c10SIngo Molnar * can be stale and must not be dereferenced. 15565eca1c10SIngo Molnar * 15575eca1c10SIngo Molnar * Return: 1 if the process is alive. 0 otherwise. 15585eca1c10SIngo Molnar */ 15595eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p) 15605eca1c10SIngo Molnar { 15612c470475SEric W. Biederman return p->thread_pid != NULL; 15625eca1c10SIngo Molnar } 15637af57294SPavel Emelyanov 15645eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 15657af57294SPavel Emelyanov { 156652ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns); 15677af57294SPavel Emelyanov } 15687af57294SPavel Emelyanov 15697af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk) 15707af57294SPavel Emelyanov { 157152ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL); 15727af57294SPavel Emelyanov } 15737af57294SPavel Emelyanov 15747af57294SPavel Emelyanov 15755eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 15767af57294SPavel Emelyanov { 157752ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns); 15787af57294SPavel Emelyanov } 15797af57294SPavel Emelyanov 15807af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk) 15817af57294SPavel Emelyanov { 158252ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL); 15837af57294SPavel Emelyanov } 15847af57294SPavel Emelyanov 1585dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 1586dd1c1f2fSOleg Nesterov { 15876883f81aSEric W. Biederman return __task_pid_nr_ns(tsk, PIDTYPE_TGID, ns); 1588dd1c1f2fSOleg Nesterov } 1589dd1c1f2fSOleg Nesterov 1590dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk) 1591dd1c1f2fSOleg Nesterov { 15926883f81aSEric W. Biederman return __task_pid_nr_ns(tsk, PIDTYPE_TGID, NULL); 1593dd1c1f2fSOleg Nesterov } 1594dd1c1f2fSOleg Nesterov 1595dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns) 1596dd1c1f2fSOleg Nesterov { 1597dd1c1f2fSOleg Nesterov pid_t pid = 0; 1598dd1c1f2fSOleg Nesterov 1599dd1c1f2fSOleg Nesterov rcu_read_lock(); 1600dd1c1f2fSOleg Nesterov if (pid_alive(tsk)) 1601dd1c1f2fSOleg Nesterov pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns); 1602dd1c1f2fSOleg Nesterov rcu_read_unlock(); 1603dd1c1f2fSOleg Nesterov 1604dd1c1f2fSOleg Nesterov return pid; 1605dd1c1f2fSOleg Nesterov } 1606dd1c1f2fSOleg Nesterov 1607dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk) 1608dd1c1f2fSOleg Nesterov { 1609dd1c1f2fSOleg Nesterov return task_ppid_nr_ns(tsk, &init_pid_ns); 1610dd1c1f2fSOleg Nesterov } 1611dd1c1f2fSOleg Nesterov 16125eca1c10SIngo Molnar /* Obsolete, do not use: */ 16131b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk) 16141b0f7ffdSOleg Nesterov { 16151b0f7ffdSOleg Nesterov return task_pgrp_nr_ns(tsk, &init_pid_ns); 16161b0f7ffdSOleg Nesterov } 16177af57294SPavel Emelyanov 161806eb6184SPeter Zijlstra #define TASK_REPORT_IDLE (TASK_REPORT + 1) 161906eb6184SPeter Zijlstra #define TASK_REPORT_MAX (TASK_REPORT_IDLE << 1) 162006eb6184SPeter Zijlstra 16211d48b080SPeter Zijlstra static inline unsigned int task_state_index(struct task_struct *tsk) 162220435d84SXie XiuQi { 16232f064a59SPeter Zijlstra unsigned int tsk_state = READ_ONCE(tsk->__state); 16241593baabSPeter Zijlstra unsigned int state = (tsk_state | tsk->exit_state) & TASK_REPORT; 162520435d84SXie XiuQi 162606eb6184SPeter Zijlstra BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX); 162706eb6184SPeter Zijlstra 162806eb6184SPeter Zijlstra if (tsk_state == TASK_IDLE) 162906eb6184SPeter Zijlstra state = TASK_REPORT_IDLE; 163006eb6184SPeter Zijlstra 16311593baabSPeter Zijlstra return fls(state); 16321593baabSPeter Zijlstra } 163320435d84SXie XiuQi 16341d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state) 16351593baabSPeter Zijlstra { 16368ef9925bSPeter Zijlstra static const char state_char[] = "RSDTtXZPI"; 16371593baabSPeter Zijlstra 163806eb6184SPeter Zijlstra BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1); 16391593baabSPeter Zijlstra 16401593baabSPeter Zijlstra return state_char[state]; 16411593baabSPeter Zijlstra } 16421593baabSPeter Zijlstra 16431593baabSPeter Zijlstra static inline char task_state_to_char(struct task_struct *tsk) 16441593baabSPeter Zijlstra { 16451d48b080SPeter Zijlstra return task_index_to_char(task_state_index(tsk)); 164620435d84SXie XiuQi } 164720435d84SXie XiuQi 16481da177e4SLinus Torvalds /** 1649570f5241SSergey Senozhatsky * is_global_init - check if a task structure is init. Since init 1650570f5241SSergey Senozhatsky * is free to have sub-threads we need to check tgid. 16513260259fSHenne * @tsk: Task structure to be checked. 16523260259fSHenne * 16533260259fSHenne * Check if a task structure is the first user space task the kernel created. 1654e69f6186SYacine Belkadi * 1655e69f6186SYacine Belkadi * Return: 1 if the task structure is init. 0 otherwise. 1656f400e198SSukadev Bhattiprolu */ 1657e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk) 1658b461cc03SPavel Emelyanov { 1659570f5241SSergey Senozhatsky return task_tgid_nr(tsk) == 1; 1660b461cc03SPavel Emelyanov } 1661b460cbc5SSerge E. Hallyn 16629ec52099SCedric Le Goater extern struct pid *cad_pid; 16639ec52099SCedric Le Goater 16641da177e4SLinus Torvalds /* 16651da177e4SLinus Torvalds * Per process flags 16661da177e4SLinus Torvalds */ 166701ccf592SSebastian Andrzej Siewior #define PF_VCPU 0x00000001 /* I'm a virtual CPU */ 1668c1de45caSPeter Zijlstra #define PF_IDLE 0x00000002 /* I am an IDLE thread */ 16695eca1c10SIngo Molnar #define PF_EXITING 0x00000004 /* Getting shut down */ 167001ccf592SSebastian Andrzej Siewior #define PF_IO_WORKER 0x00000010 /* Task is an IO worker */ 167121aa9af0STejun Heo #define PF_WQ_WORKER 0x00000020 /* I'm a workqueue worker */ 16725eca1c10SIngo Molnar #define PF_FORKNOEXEC 0x00000040 /* Forked but didn't exec */ 16735eca1c10SIngo Molnar #define PF_MCE_PROCESS 0x00000080 /* Process policy on mce errors */ 16745eca1c10SIngo Molnar #define PF_SUPERPRIV 0x00000100 /* Used super-user privileges */ 16755eca1c10SIngo Molnar #define PF_DUMPCORE 0x00000200 /* Dumped core */ 16765eca1c10SIngo Molnar #define PF_SIGNALED 0x00000400 /* Killed by a signal */ 16771da177e4SLinus Torvalds #define PF_MEMALLOC 0x00000800 /* Allocating memory */ 16785eca1c10SIngo Molnar #define PF_NPROC_EXCEEDED 0x00001000 /* set_user() noticed that RLIMIT_NPROC was exceeded */ 16795eca1c10SIngo Molnar #define PF_USED_MATH 0x00002000 /* If unset the fpu must be initialized before use */ 16805eca1c10SIngo Molnar #define PF_USED_ASYNC 0x00004000 /* Used async_schedule*(), used by module init */ 16815eca1c10SIngo Molnar #define PF_NOFREEZE 0x00008000 /* This thread should not be frozen */ 16825eca1c10SIngo Molnar #define PF_FROZEN 0x00010000 /* Frozen for system suspend */ 16837dea19f9SMichal Hocko #define PF_KSWAPD 0x00020000 /* I am kswapd */ 16847dea19f9SMichal Hocko #define PF_MEMALLOC_NOFS 0x00040000 /* All allocation requests will inherit GFP_NOFS */ 16857dea19f9SMichal Hocko #define PF_MEMALLOC_NOIO 0x00080000 /* All allocation requests will inherit GFP_NOIO */ 1686a37b0715SNeilBrown #define PF_LOCAL_THROTTLE 0x00100000 /* Throttle writes only against the bdi I write to, 1687a37b0715SNeilBrown * I am cleaning dirty pages from some other bdi. */ 1688246bb0b1SOleg Nesterov #define PF_KTHREAD 0x00200000 /* I am a kernel thread */ 16895eca1c10SIngo Molnar #define PF_RANDOMIZE 0x00400000 /* Randomize virtual address space */ 1690b31dc66aSJens Axboe #define PF_SWAPWRITE 0x00800000 /* Allowed to write to swap */ 16913bd37062SSebastian Andrzej Siewior #define PF_NO_SETAFFINITY 0x04000000 /* Userland is not allowed to meddle with cpus_mask */ 16924db96cf0SAndi Kleen #define PF_MCE_EARLY 0x08000000 /* Early kill for mce process policy */ 16931a08ae36SPavel Tatashin #define PF_MEMALLOC_PIN 0x10000000 /* Allocation context constrained to zones which allow long term pinning. */ 169458a69cb4STejun Heo #define PF_FREEZER_SKIP 0x40000000 /* Freezer should not count it as freezable */ 16955eca1c10SIngo Molnar #define PF_SUSPEND_TASK 0x80000000 /* This thread called freeze_processes() and should not be frozen */ 16961da177e4SLinus Torvalds 16971da177e4SLinus Torvalds /* 16981da177e4SLinus Torvalds * Only the _current_ task can read/write to tsk->flags, but other 16991da177e4SLinus Torvalds * tasks can access tsk->flags in readonly mode for example 17001da177e4SLinus Torvalds * with tsk_used_math (like during threaded core dumping). 17011da177e4SLinus Torvalds * There is however an exception to this rule during ptrace 17021da177e4SLinus Torvalds * or during fork: the ptracer task is allowed to write to the 17031da177e4SLinus Torvalds * child->flags of its traced child (same goes for fork, the parent 17041da177e4SLinus Torvalds * can write to the child->flags), because we're guaranteed the 17051da177e4SLinus Torvalds * child is not running and in turn not changing child->flags 17061da177e4SLinus Torvalds * at the same time the parent does it. 17071da177e4SLinus Torvalds */ 17081da177e4SLinus Torvalds #define clear_stopped_child_used_math(child) do { (child)->flags &= ~PF_USED_MATH; } while (0) 17091da177e4SLinus Torvalds #define set_stopped_child_used_math(child) do { (child)->flags |= PF_USED_MATH; } while (0) 17101da177e4SLinus Torvalds #define clear_used_math() clear_stopped_child_used_math(current) 17111da177e4SLinus Torvalds #define set_used_math() set_stopped_child_used_math(current) 17125eca1c10SIngo Molnar 17131da177e4SLinus Torvalds #define conditional_stopped_child_used_math(condition, child) \ 17141da177e4SLinus Torvalds do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= (condition) ? PF_USED_MATH : 0; } while (0) 17155eca1c10SIngo Molnar 17165eca1c10SIngo Molnar #define conditional_used_math(condition) conditional_stopped_child_used_math(condition, current) 17175eca1c10SIngo Molnar 17181da177e4SLinus Torvalds #define copy_to_stopped_child_used_math(child) \ 17191da177e4SLinus Torvalds do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= current->flags & PF_USED_MATH; } while (0) 17205eca1c10SIngo Molnar 17211da177e4SLinus Torvalds /* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */ 17221da177e4SLinus Torvalds #define tsk_used_math(p) ((p)->flags & PF_USED_MATH) 17231da177e4SLinus Torvalds #define used_math() tsk_used_math(current) 17241da177e4SLinus Torvalds 172583d40a61SPeter Zijlstra static __always_inline bool is_percpu_thread(void) 172662ec05ddSThomas Gleixner { 172762ec05ddSThomas Gleixner #ifdef CONFIG_SMP 172862ec05ddSThomas Gleixner return (current->flags & PF_NO_SETAFFINITY) && 172962ec05ddSThomas Gleixner (current->nr_cpus_allowed == 1); 173062ec05ddSThomas Gleixner #else 173162ec05ddSThomas Gleixner return true; 173262ec05ddSThomas Gleixner #endif 173362ec05ddSThomas Gleixner } 173462ec05ddSThomas Gleixner 17351d4457f9SKees Cook /* Per-process atomic flags. */ 1736a2b86f77SZefan Li #define PFA_NO_NEW_PRIVS 0 /* May not gain new privileges. */ 17372ad654bcSZefan Li #define PFA_SPREAD_PAGE 1 /* Spread page cache over cpuset */ 17382ad654bcSZefan Li #define PFA_SPREAD_SLAB 2 /* Spread some slab caches over cpuset */ 1739356e4bffSThomas Gleixner #define PFA_SPEC_SSB_DISABLE 3 /* Speculative Store Bypass disabled */ 1740356e4bffSThomas Gleixner #define PFA_SPEC_SSB_FORCE_DISABLE 4 /* Speculative Store Bypass force disabled*/ 17419137bb27SThomas Gleixner #define PFA_SPEC_IB_DISABLE 5 /* Indirect branch speculation restricted */ 17429137bb27SThomas Gleixner #define PFA_SPEC_IB_FORCE_DISABLE 6 /* Indirect branch speculation permanently restricted */ 174371368af9SWaiman Long #define PFA_SPEC_SSB_NOEXEC 7 /* Speculative Store Bypass clear on execve() */ 17441d4457f9SKees Cook 1745e0e5070bSZefan Li #define TASK_PFA_TEST(name, func) \ 1746e0e5070bSZefan Li static inline bool task_##func(struct task_struct *p) \ 1747e0e5070bSZefan Li { return test_bit(PFA_##name, &p->atomic_flags); } 17485eca1c10SIngo Molnar 1749e0e5070bSZefan Li #define TASK_PFA_SET(name, func) \ 1750e0e5070bSZefan Li static inline void task_set_##func(struct task_struct *p) \ 1751e0e5070bSZefan Li { set_bit(PFA_##name, &p->atomic_flags); } 17525eca1c10SIngo Molnar 1753e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func) \ 1754e0e5070bSZefan Li static inline void task_clear_##func(struct task_struct *p) \ 1755e0e5070bSZefan Li { clear_bit(PFA_##name, &p->atomic_flags); } 17561d4457f9SKees Cook 1757e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs) 1758e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs) 17591d4457f9SKees Cook 17602ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page) 17612ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page) 17622ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page) 17632ad654bcSZefan Li 17642ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab) 17652ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab) 17662ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab) 1767544b2c91STejun Heo 1768356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable) 1769356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable) 1770356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable) 1771356e4bffSThomas Gleixner 177271368af9SWaiman Long TASK_PFA_TEST(SPEC_SSB_NOEXEC, spec_ssb_noexec) 177371368af9SWaiman Long TASK_PFA_SET(SPEC_SSB_NOEXEC, spec_ssb_noexec) 177471368af9SWaiman Long TASK_PFA_CLEAR(SPEC_SSB_NOEXEC, spec_ssb_noexec) 177571368af9SWaiman Long 1776356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable) 1777356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable) 1778356e4bffSThomas Gleixner 17799137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_DISABLE, spec_ib_disable) 17809137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_DISABLE, spec_ib_disable) 17819137bb27SThomas Gleixner TASK_PFA_CLEAR(SPEC_IB_DISABLE, spec_ib_disable) 17829137bb27SThomas Gleixner 17839137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable) 17849137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable) 17859137bb27SThomas Gleixner 17865eca1c10SIngo Molnar static inline void 1787717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags) 1788907aed48SMel Gorman { 1789717a94b5SNeilBrown current->flags &= ~flags; 1790717a94b5SNeilBrown current->flags |= orig_flags & flags; 1791907aed48SMel Gorman } 1792907aed48SMel Gorman 17935eca1c10SIngo Molnar extern int cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial); 17945eca1c10SIngo Molnar extern int task_can_attach(struct task_struct *p, const struct cpumask *cs_cpus_allowed); 17951da177e4SLinus Torvalds #ifdef CONFIG_SMP 17965eca1c10SIngo Molnar extern void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask); 17975eca1c10SIngo Molnar extern int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask); 1798b90ca8baSWill Deacon extern int dup_user_cpus_ptr(struct task_struct *dst, struct task_struct *src, int node); 1799b90ca8baSWill Deacon extern void release_user_cpus_ptr(struct task_struct *p); 1800234b8ab6SWill Deacon extern int dl_task_check_affinity(struct task_struct *p, const struct cpumask *mask); 180107ec77a1SWill Deacon extern void force_compatible_cpus_allowed_ptr(struct task_struct *p); 180207ec77a1SWill Deacon extern void relax_compatible_cpus_allowed_ptr(struct task_struct *p); 18031da177e4SLinus Torvalds #else 18045eca1c10SIngo Molnar static inline void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask) 18051e1b6c51SKOSAKI Motohiro { 18061e1b6c51SKOSAKI Motohiro } 18075eca1c10SIngo Molnar static inline int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask) 18081da177e4SLinus Torvalds { 180996f874e2SRusty Russell if (!cpumask_test_cpu(0, new_mask)) 18101da177e4SLinus Torvalds return -EINVAL; 18111da177e4SLinus Torvalds return 0; 18121da177e4SLinus Torvalds } 1813b90ca8baSWill Deacon static inline int dup_user_cpus_ptr(struct task_struct *dst, struct task_struct *src, int node) 1814b90ca8baSWill Deacon { 1815b90ca8baSWill Deacon if (src->user_cpus_ptr) 1816b90ca8baSWill Deacon return -EINVAL; 1817b90ca8baSWill Deacon return 0; 1818b90ca8baSWill Deacon } 1819b90ca8baSWill Deacon static inline void release_user_cpus_ptr(struct task_struct *p) 1820b90ca8baSWill Deacon { 1821b90ca8baSWill Deacon WARN_ON(p->user_cpus_ptr); 1822b90ca8baSWill Deacon } 1823234b8ab6SWill Deacon 1824234b8ab6SWill Deacon static inline int dl_task_check_affinity(struct task_struct *p, const struct cpumask *mask) 1825234b8ab6SWill Deacon { 1826234b8ab6SWill Deacon return 0; 1827234b8ab6SWill Deacon } 18281da177e4SLinus Torvalds #endif 1829e0ad9556SRusty Russell 1830fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt); 183136c8b586SIngo Molnar extern void set_user_nice(struct task_struct *p, long nice); 183236c8b586SIngo Molnar extern int task_prio(const struct task_struct *p); 18335eca1c10SIngo Molnar 1834d0ea0268SDongsheng Yang /** 1835d0ea0268SDongsheng Yang * task_nice - return the nice value of a given task. 1836d0ea0268SDongsheng Yang * @p: the task in question. 1837d0ea0268SDongsheng Yang * 1838d0ea0268SDongsheng Yang * Return: The nice value [ -20 ... 0 ... 19 ]. 1839d0ea0268SDongsheng Yang */ 1840d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p) 1841d0ea0268SDongsheng Yang { 1842d0ea0268SDongsheng Yang return PRIO_TO_NICE((p)->static_prio); 1843d0ea0268SDongsheng Yang } 18445eca1c10SIngo Molnar 184536c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice); 184636c8b586SIngo Molnar extern int task_curr(const struct task_struct *p); 18471da177e4SLinus Torvalds extern int idle_cpu(int cpu); 1848943d355dSRohit Jain extern int available_idle_cpu(int cpu); 18495eca1c10SIngo Molnar extern int sched_setscheduler(struct task_struct *, int, const struct sched_param *); 18505eca1c10SIngo Molnar extern int sched_setscheduler_nocheck(struct task_struct *, int, const struct sched_param *); 18518b700983SPeter Zijlstra extern void sched_set_fifo(struct task_struct *p); 18528b700983SPeter Zijlstra extern void sched_set_fifo_low(struct task_struct *p); 18538b700983SPeter Zijlstra extern void sched_set_normal(struct task_struct *p, int nice); 18545eca1c10SIngo Molnar extern int sched_setattr(struct task_struct *, const struct sched_attr *); 1855794a56ebSJuri Lelli extern int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *); 185636c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu); 18575eca1c10SIngo Molnar 1858c4f30608SPaul E. McKenney /** 1859c4f30608SPaul E. McKenney * is_idle_task - is the specified task an idle task? 1860fa757281SRandy Dunlap * @p: the task in question. 1861e69f6186SYacine Belkadi * 1862e69f6186SYacine Belkadi * Return: 1 if @p is an idle task. 0 otherwise. 1863c4f30608SPaul E. McKenney */ 1864c94a88f3SMarco Elver static __always_inline bool is_idle_task(const struct task_struct *p) 1865c4f30608SPaul E. McKenney { 1866c1de45caSPeter Zijlstra return !!(p->flags & PF_IDLE); 1867c4f30608SPaul E. McKenney } 18685eca1c10SIngo Molnar 186936c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu); 1870a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p); 18711da177e4SLinus Torvalds 18721da177e4SLinus Torvalds void yield(void); 18731da177e4SLinus Torvalds 18741da177e4SLinus Torvalds union thread_union { 18750500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK 18760500871fSDavid Howells struct task_struct task; 18770500871fSDavid Howells #endif 1878c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK 18791da177e4SLinus Torvalds struct thread_info thread_info; 1880c65eacbeSAndy Lutomirski #endif 18811da177e4SLinus Torvalds unsigned long stack[THREAD_SIZE/sizeof(long)]; 18821da177e4SLinus Torvalds }; 18831da177e4SLinus Torvalds 18840500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK 18850500871fSDavid Howells extern struct thread_info init_thread_info; 18860500871fSDavid Howells #endif 18870500871fSDavid Howells 18880500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)]; 18890500871fSDavid Howells 1890f3ac6067SIngo Molnar #ifdef CONFIG_THREAD_INFO_IN_TASK 1891f3ac6067SIngo Molnar static inline struct thread_info *task_thread_info(struct task_struct *task) 1892f3ac6067SIngo Molnar { 1893f3ac6067SIngo Molnar return &task->thread_info; 1894f3ac6067SIngo Molnar } 1895f3ac6067SIngo Molnar #elif !defined(__HAVE_THREAD_FUNCTIONS) 1896f3ac6067SIngo Molnar # define task_thread_info(task) ((struct thread_info *)(task)->stack) 1897f3ac6067SIngo Molnar #endif 1898f3ac6067SIngo Molnar 1899198fe21bSPavel Emelyanov /* 1900198fe21bSPavel Emelyanov * find a task by one of its numerical ids 1901198fe21bSPavel Emelyanov * 1902198fe21bSPavel Emelyanov * find_task_by_pid_ns(): 1903198fe21bSPavel Emelyanov * finds a task by its pid in the specified namespace 1904228ebcbeSPavel Emelyanov * find_task_by_vpid(): 1905228ebcbeSPavel Emelyanov * finds a task by its virtual pid 1906198fe21bSPavel Emelyanov * 1907e49859e7SPavel Emelyanov * see also find_vpid() etc in include/linux/pid.h 1908198fe21bSPavel Emelyanov */ 1909198fe21bSPavel Emelyanov 1910228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr); 19115eca1c10SIngo Molnar extern struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns); 1912198fe21bSPavel Emelyanov 19132ee08260SMike Rapoport /* 19142ee08260SMike Rapoport * find a task by its virtual pid and get the task struct 19152ee08260SMike Rapoport */ 19162ee08260SMike Rapoport extern struct task_struct *find_get_task_by_vpid(pid_t nr); 19172ee08260SMike Rapoport 1918b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state); 1919b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk); 19203e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk); 19215eca1c10SIngo Molnar 19221da177e4SLinus Torvalds #ifdef CONFIG_SMP 19231da177e4SLinus Torvalds extern void kick_process(struct task_struct *tsk); 19241da177e4SLinus Torvalds #else 19251da177e4SLinus Torvalds static inline void kick_process(struct task_struct *tsk) { } 19261da177e4SLinus Torvalds #endif 19271da177e4SLinus Torvalds 192882b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec); 19295eca1c10SIngo Molnar 193082b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from) 193182b89778SAdrian Hunter { 193282b89778SAdrian Hunter __set_task_comm(tsk, from, false); 193382b89778SAdrian Hunter } 19345eca1c10SIngo Molnar 19353756f640SArnd Bergmann extern char *__get_task_comm(char *to, size_t len, struct task_struct *tsk); 19363756f640SArnd Bergmann #define get_task_comm(buf, tsk) ({ \ 19373756f640SArnd Bergmann BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN); \ 19383756f640SArnd Bergmann __get_task_comm(buf, sizeof(buf), tsk); \ 19393756f640SArnd Bergmann }) 19401da177e4SLinus Torvalds 19411da177e4SLinus Torvalds #ifdef CONFIG_SMP 19422a0a24ebSThomas Gleixner static __always_inline void scheduler_ipi(void) 19432a0a24ebSThomas Gleixner { 19442a0a24ebSThomas Gleixner /* 19452a0a24ebSThomas Gleixner * Fold TIF_NEED_RESCHED into the preempt_count; anybody setting 19462a0a24ebSThomas Gleixner * TIF_NEED_RESCHED remotely (for the first time) will also send 19472a0a24ebSThomas Gleixner * this IPI. 19482a0a24ebSThomas Gleixner */ 19492a0a24ebSThomas Gleixner preempt_fold_need_resched(); 19502a0a24ebSThomas Gleixner } 19512f064a59SPeter Zijlstra extern unsigned long wait_task_inactive(struct task_struct *, unsigned int match_state); 19521da177e4SLinus Torvalds #else 1953184748ccSPeter Zijlstra static inline void scheduler_ipi(void) { } 19542f064a59SPeter Zijlstra static inline unsigned long wait_task_inactive(struct task_struct *p, unsigned int match_state) 195585ba2d86SRoland McGrath { 195685ba2d86SRoland McGrath return 1; 195785ba2d86SRoland McGrath } 19581da177e4SLinus Torvalds #endif 19591da177e4SLinus Torvalds 19605eca1c10SIngo Molnar /* 19615eca1c10SIngo Molnar * Set thread flags in other task's structures. 19625eca1c10SIngo Molnar * See asm/thread_info.h for TIF_xxxx flags available: 19631da177e4SLinus Torvalds */ 19641da177e4SLinus Torvalds static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag) 19651da177e4SLinus Torvalds { 1966a1261f54SAl Viro set_ti_thread_flag(task_thread_info(tsk), flag); 19671da177e4SLinus Torvalds } 19681da177e4SLinus Torvalds 19691da177e4SLinus Torvalds static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag) 19701da177e4SLinus Torvalds { 1971a1261f54SAl Viro clear_ti_thread_flag(task_thread_info(tsk), flag); 19721da177e4SLinus Torvalds } 19731da177e4SLinus Torvalds 197493ee37c2SDave Martin static inline void update_tsk_thread_flag(struct task_struct *tsk, int flag, 197593ee37c2SDave Martin bool value) 197693ee37c2SDave Martin { 197793ee37c2SDave Martin update_ti_thread_flag(task_thread_info(tsk), flag, value); 197893ee37c2SDave Martin } 197993ee37c2SDave Martin 19801da177e4SLinus Torvalds static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag) 19811da177e4SLinus Torvalds { 1982a1261f54SAl Viro return test_and_set_ti_thread_flag(task_thread_info(tsk), flag); 19831da177e4SLinus Torvalds } 19841da177e4SLinus Torvalds 19851da177e4SLinus Torvalds static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag) 19861da177e4SLinus Torvalds { 1987a1261f54SAl Viro return test_and_clear_ti_thread_flag(task_thread_info(tsk), flag); 19881da177e4SLinus Torvalds } 19891da177e4SLinus Torvalds 19901da177e4SLinus Torvalds static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag) 19911da177e4SLinus Torvalds { 1992a1261f54SAl Viro return test_ti_thread_flag(task_thread_info(tsk), flag); 19931da177e4SLinus Torvalds } 19941da177e4SLinus Torvalds 19951da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk) 19961da177e4SLinus Torvalds { 19971da177e4SLinus Torvalds set_tsk_thread_flag(tsk,TIF_NEED_RESCHED); 19981da177e4SLinus Torvalds } 19991da177e4SLinus Torvalds 20001da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk) 20011da177e4SLinus Torvalds { 20021da177e4SLinus Torvalds clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED); 20031da177e4SLinus Torvalds } 20041da177e4SLinus Torvalds 20058ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk) 20068ae121acSGregory Haskins { 20078ae121acSGregory Haskins return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED)); 20088ae121acSGregory Haskins } 20098ae121acSGregory Haskins 20101da177e4SLinus Torvalds /* 20111da177e4SLinus Torvalds * cond_resched() and cond_resched_lock(): latency reduction via 20121da177e4SLinus Torvalds * explicit rescheduling in places that are safe. The return 20131da177e4SLinus Torvalds * value indicates whether a reschedule was done in fact. 20141da177e4SLinus Torvalds * cond_resched_lock() will drop the spinlock before scheduling, 20151da177e4SLinus Torvalds */ 2016b965f1ddSPeter Zijlstra (Intel) #if !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC) 2017b965f1ddSPeter Zijlstra (Intel) extern int __cond_resched(void); 2018b965f1ddSPeter Zijlstra (Intel) 2019b965f1ddSPeter Zijlstra (Intel) #ifdef CONFIG_PREEMPT_DYNAMIC 2020b965f1ddSPeter Zijlstra (Intel) 2021b965f1ddSPeter Zijlstra (Intel) DECLARE_STATIC_CALL(cond_resched, __cond_resched); 2022b965f1ddSPeter Zijlstra (Intel) 2023b965f1ddSPeter Zijlstra (Intel) static __always_inline int _cond_resched(void) 2024b965f1ddSPeter Zijlstra (Intel) { 2025ef72661eSPeter Zijlstra return static_call_mod(cond_resched)(); 2026b965f1ddSPeter Zijlstra (Intel) } 2027b965f1ddSPeter Zijlstra (Intel) 202835a773a0SPeter Zijlstra #else 2029b965f1ddSPeter Zijlstra (Intel) 2030b965f1ddSPeter Zijlstra (Intel) static inline int _cond_resched(void) 2031b965f1ddSPeter Zijlstra (Intel) { 2032b965f1ddSPeter Zijlstra (Intel) return __cond_resched(); 2033b965f1ddSPeter Zijlstra (Intel) } 2034b965f1ddSPeter Zijlstra (Intel) 2035b965f1ddSPeter Zijlstra (Intel) #endif /* CONFIG_PREEMPT_DYNAMIC */ 2036b965f1ddSPeter Zijlstra (Intel) 2037b965f1ddSPeter Zijlstra (Intel) #else 2038b965f1ddSPeter Zijlstra (Intel) 203935a773a0SPeter Zijlstra static inline int _cond_resched(void) { return 0; } 2040b965f1ddSPeter Zijlstra (Intel) 2041b965f1ddSPeter Zijlstra (Intel) #endif /* !defined(CONFIG_PREEMPTION) || defined(CONFIG_PREEMPT_DYNAMIC) */ 20426f80bd98SFrederic Weisbecker 2043613afbf8SFrederic Weisbecker #define cond_resched() ({ \ 20443427445aSPeter Zijlstra ___might_sleep(__FILE__, __LINE__, 0); \ 2045613afbf8SFrederic Weisbecker _cond_resched(); \ 2046613afbf8SFrederic Weisbecker }) 20476f80bd98SFrederic Weisbecker 2048613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock); 2049f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_read(rwlock_t *lock); 2050f3d4b4b1SBen Gardon extern int __cond_resched_rwlock_write(rwlock_t *lock); 2051613afbf8SFrederic Weisbecker 2052613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({ \ 20533427445aSPeter Zijlstra ___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\ 2054613afbf8SFrederic Weisbecker __cond_resched_lock(lock); \ 2055613afbf8SFrederic Weisbecker }) 2056613afbf8SFrederic Weisbecker 2057f3d4b4b1SBen Gardon #define cond_resched_rwlock_read(lock) ({ \ 2058f3d4b4b1SBen Gardon __might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET); \ 2059f3d4b4b1SBen Gardon __cond_resched_rwlock_read(lock); \ 2060f3d4b4b1SBen Gardon }) 2061f3d4b4b1SBen Gardon 2062f3d4b4b1SBen Gardon #define cond_resched_rwlock_write(lock) ({ \ 2063f3d4b4b1SBen Gardon __might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET); \ 2064f3d4b4b1SBen Gardon __cond_resched_rwlock_write(lock); \ 2065f3d4b4b1SBen Gardon }) 2066f3d4b4b1SBen Gardon 2067f6f3c437SSimon Horman static inline void cond_resched_rcu(void) 2068f6f3c437SSimon Horman { 2069f6f3c437SSimon Horman #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU) 2070f6f3c437SSimon Horman rcu_read_unlock(); 2071f6f3c437SSimon Horman cond_resched(); 2072f6f3c437SSimon Horman rcu_read_lock(); 2073f6f3c437SSimon Horman #endif 2074f6f3c437SSimon Horman } 2075f6f3c437SSimon Horman 20761da177e4SLinus Torvalds /* 20771da177e4SLinus Torvalds * Does a critical section need to be broken due to another 2078c1a280b6SThomas Gleixner * task waiting?: (technically does not depend on CONFIG_PREEMPTION, 207995c354feSNick Piggin * but a general need for low latency) 20801da177e4SLinus Torvalds */ 208195c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock) 20821da177e4SLinus Torvalds { 2083c1a280b6SThomas Gleixner #ifdef CONFIG_PREEMPTION 208495c354feSNick Piggin return spin_is_contended(lock); 208595c354feSNick Piggin #else 20861da177e4SLinus Torvalds return 0; 208795c354feSNick Piggin #endif 20881da177e4SLinus Torvalds } 20891da177e4SLinus Torvalds 2090a09a689aSBen Gardon /* 2091a09a689aSBen Gardon * Check if a rwlock is contended. 2092a09a689aSBen Gardon * Returns non-zero if there is another task waiting on the rwlock. 2093a09a689aSBen Gardon * Returns zero if the lock is not contended or the system / underlying 2094a09a689aSBen Gardon * rwlock implementation does not support contention detection. 2095a09a689aSBen Gardon * Technically does not depend on CONFIG_PREEMPTION, but a general need 2096a09a689aSBen Gardon * for low latency. 2097a09a689aSBen Gardon */ 2098a09a689aSBen Gardon static inline int rwlock_needbreak(rwlock_t *lock) 2099a09a689aSBen Gardon { 2100a09a689aSBen Gardon #ifdef CONFIG_PREEMPTION 2101a09a689aSBen Gardon return rwlock_is_contended(lock); 2102a09a689aSBen Gardon #else 2103a09a689aSBen Gardon return 0; 2104a09a689aSBen Gardon #endif 2105a09a689aSBen Gardon } 2106a09a689aSBen Gardon 210775f93fedSPeter Zijlstra static __always_inline bool need_resched(void) 210875f93fedSPeter Zijlstra { 210975f93fedSPeter Zijlstra return unlikely(tif_need_resched()); 211075f93fedSPeter Zijlstra } 211175f93fedSPeter Zijlstra 2112ee761f62SThomas Gleixner /* 21131da177e4SLinus Torvalds * Wrappers for p->thread_info->cpu access. No-op on UP. 21141da177e4SLinus Torvalds */ 21151da177e4SLinus Torvalds #ifdef CONFIG_SMP 21161da177e4SLinus Torvalds 21171da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p) 21181da177e4SLinus Torvalds { 2119c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 2120c546951dSAndrea Parri return READ_ONCE(p->cpu); 2121c65eacbeSAndy Lutomirski #else 2122c546951dSAndrea Parri return READ_ONCE(task_thread_info(p)->cpu); 2123c65eacbeSAndy Lutomirski #endif 21241da177e4SLinus Torvalds } 21251da177e4SLinus Torvalds 2126c65cc870SIngo Molnar extern void set_task_cpu(struct task_struct *p, unsigned int cpu); 21271da177e4SLinus Torvalds 21281da177e4SLinus Torvalds #else 21291da177e4SLinus Torvalds 21301da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p) 21311da177e4SLinus Torvalds { 21321da177e4SLinus Torvalds return 0; 21331da177e4SLinus Torvalds } 21341da177e4SLinus Torvalds 21351da177e4SLinus Torvalds static inline void set_task_cpu(struct task_struct *p, unsigned int cpu) 21361da177e4SLinus Torvalds { 21371da177e4SLinus Torvalds } 21381da177e4SLinus Torvalds 21391da177e4SLinus Torvalds #endif /* CONFIG_SMP */ 21401da177e4SLinus Torvalds 2141a1dfb631SMarcelo Tosatti extern bool sched_task_on_rq(struct task_struct *p); 2142a1dfb631SMarcelo Tosatti 2143d9345c65SPan Xinhui /* 2144d9345c65SPan Xinhui * In order to reduce various lock holder preemption latencies provide an 2145d9345c65SPan Xinhui * interface to see if a vCPU is currently running or not. 2146d9345c65SPan Xinhui * 2147d9345c65SPan Xinhui * This allows us to terminate optimistic spin loops and block, analogous to 2148d9345c65SPan Xinhui * the native optimistic spin heuristic of testing if the lock owner task is 2149d9345c65SPan Xinhui * running or not. 2150d9345c65SPan Xinhui */ 2151d9345c65SPan Xinhui #ifndef vcpu_is_preempted 215242fd8baaSQian Cai static inline bool vcpu_is_preempted(int cpu) 215342fd8baaSQian Cai { 215442fd8baaSQian Cai return false; 215542fd8baaSQian Cai } 2156d9345c65SPan Xinhui #endif 2157d9345c65SPan Xinhui 215896f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask); 215996f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask); 21605c45bf27SSiddha, Suresh B 216182455257SDave Hansen #ifndef TASK_SIZE_OF 216282455257SDave Hansen #define TASK_SIZE_OF(tsk) TASK_SIZE 216382455257SDave Hansen #endif 216482455257SDave Hansen 2165a5418be9SViresh Kumar #ifdef CONFIG_SMP 2166a5418be9SViresh Kumar /* Returns effective CPU energy utilization, as seen by the scheduler */ 2167a5418be9SViresh Kumar unsigned long sched_cpu_util(int cpu, unsigned long max); 2168a5418be9SViresh Kumar #endif /* CONFIG_SMP */ 2169a5418be9SViresh Kumar 2170d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ 2171d7822b1eSMathieu Desnoyers 2172d7822b1eSMathieu Desnoyers /* 2173d7822b1eSMathieu Desnoyers * Map the event mask on the user-space ABI enum rseq_cs_flags 2174d7822b1eSMathieu Desnoyers * for direct mask checks. 2175d7822b1eSMathieu Desnoyers */ 2176d7822b1eSMathieu Desnoyers enum rseq_event_mask_bits { 2177d7822b1eSMathieu Desnoyers RSEQ_EVENT_PREEMPT_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_PREEMPT_BIT, 2178d7822b1eSMathieu Desnoyers RSEQ_EVENT_SIGNAL_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_SIGNAL_BIT, 2179d7822b1eSMathieu Desnoyers RSEQ_EVENT_MIGRATE_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_MIGRATE_BIT, 2180d7822b1eSMathieu Desnoyers }; 2181d7822b1eSMathieu Desnoyers 2182d7822b1eSMathieu Desnoyers enum rseq_event_mask { 2183d7822b1eSMathieu Desnoyers RSEQ_EVENT_PREEMPT = (1U << RSEQ_EVENT_PREEMPT_BIT), 2184d7822b1eSMathieu Desnoyers RSEQ_EVENT_SIGNAL = (1U << RSEQ_EVENT_SIGNAL_BIT), 2185d7822b1eSMathieu Desnoyers RSEQ_EVENT_MIGRATE = (1U << RSEQ_EVENT_MIGRATE_BIT), 2186d7822b1eSMathieu Desnoyers }; 2187d7822b1eSMathieu Desnoyers 2188d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t) 2189d7822b1eSMathieu Desnoyers { 2190d7822b1eSMathieu Desnoyers if (t->rseq) 2191d7822b1eSMathieu Desnoyers set_tsk_thread_flag(t, TIF_NOTIFY_RESUME); 2192d7822b1eSMathieu Desnoyers } 2193d7822b1eSMathieu Desnoyers 2194784e0300SWill Deacon void __rseq_handle_notify_resume(struct ksignal *sig, struct pt_regs *regs); 2195d7822b1eSMathieu Desnoyers 2196784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig, 2197784e0300SWill Deacon struct pt_regs *regs) 2198d7822b1eSMathieu Desnoyers { 2199d7822b1eSMathieu Desnoyers if (current->rseq) 2200784e0300SWill Deacon __rseq_handle_notify_resume(ksig, regs); 2201d7822b1eSMathieu Desnoyers } 2202d7822b1eSMathieu Desnoyers 2203784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig, 2204784e0300SWill Deacon struct pt_regs *regs) 2205d7822b1eSMathieu Desnoyers { 2206d7822b1eSMathieu Desnoyers preempt_disable(); 2207d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_SIGNAL_BIT, ¤t->rseq_event_mask); 2208d7822b1eSMathieu Desnoyers preempt_enable(); 2209784e0300SWill Deacon rseq_handle_notify_resume(ksig, regs); 2210d7822b1eSMathieu Desnoyers } 2211d7822b1eSMathieu Desnoyers 2212d7822b1eSMathieu Desnoyers /* rseq_preempt() requires preemption to be disabled. */ 2213d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t) 2214d7822b1eSMathieu Desnoyers { 2215d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_PREEMPT_BIT, &t->rseq_event_mask); 2216d7822b1eSMathieu Desnoyers rseq_set_notify_resume(t); 2217d7822b1eSMathieu Desnoyers } 2218d7822b1eSMathieu Desnoyers 2219d7822b1eSMathieu Desnoyers /* rseq_migrate() requires preemption to be disabled. */ 2220d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t) 2221d7822b1eSMathieu Desnoyers { 2222d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_MIGRATE_BIT, &t->rseq_event_mask); 2223d7822b1eSMathieu Desnoyers rseq_set_notify_resume(t); 2224d7822b1eSMathieu Desnoyers } 2225d7822b1eSMathieu Desnoyers 2226d7822b1eSMathieu Desnoyers /* 2227d7822b1eSMathieu Desnoyers * If parent process has a registered restartable sequences area, the 2228463f550fSMathieu Desnoyers * child inherits. Unregister rseq for a clone with CLONE_VM set. 2229d7822b1eSMathieu Desnoyers */ 2230d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) 2231d7822b1eSMathieu Desnoyers { 2232463f550fSMathieu Desnoyers if (clone_flags & CLONE_VM) { 2233d7822b1eSMathieu Desnoyers t->rseq = NULL; 2234d7822b1eSMathieu Desnoyers t->rseq_sig = 0; 2235d7822b1eSMathieu Desnoyers t->rseq_event_mask = 0; 2236d7822b1eSMathieu Desnoyers } else { 2237d7822b1eSMathieu Desnoyers t->rseq = current->rseq; 2238d7822b1eSMathieu Desnoyers t->rseq_sig = current->rseq_sig; 2239d7822b1eSMathieu Desnoyers t->rseq_event_mask = current->rseq_event_mask; 2240d7822b1eSMathieu Desnoyers } 2241d7822b1eSMathieu Desnoyers } 2242d7822b1eSMathieu Desnoyers 2243d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t) 2244d7822b1eSMathieu Desnoyers { 2245d7822b1eSMathieu Desnoyers t->rseq = NULL; 2246d7822b1eSMathieu Desnoyers t->rseq_sig = 0; 2247d7822b1eSMathieu Desnoyers t->rseq_event_mask = 0; 2248d7822b1eSMathieu Desnoyers } 2249d7822b1eSMathieu Desnoyers 2250d7822b1eSMathieu Desnoyers #else 2251d7822b1eSMathieu Desnoyers 2252d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t) 2253d7822b1eSMathieu Desnoyers { 2254d7822b1eSMathieu Desnoyers } 2255784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig, 2256784e0300SWill Deacon struct pt_regs *regs) 2257d7822b1eSMathieu Desnoyers { 2258d7822b1eSMathieu Desnoyers } 2259784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig, 2260784e0300SWill Deacon struct pt_regs *regs) 2261d7822b1eSMathieu Desnoyers { 2262d7822b1eSMathieu Desnoyers } 2263d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t) 2264d7822b1eSMathieu Desnoyers { 2265d7822b1eSMathieu Desnoyers } 2266d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t) 2267d7822b1eSMathieu Desnoyers { 2268d7822b1eSMathieu Desnoyers } 2269d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) 2270d7822b1eSMathieu Desnoyers { 2271d7822b1eSMathieu Desnoyers } 2272d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t) 2273d7822b1eSMathieu Desnoyers { 2274d7822b1eSMathieu Desnoyers } 2275d7822b1eSMathieu Desnoyers 2276d7822b1eSMathieu Desnoyers #endif 2277d7822b1eSMathieu Desnoyers 2278d7822b1eSMathieu Desnoyers #ifdef CONFIG_DEBUG_RSEQ 2279d7822b1eSMathieu Desnoyers 2280d7822b1eSMathieu Desnoyers void rseq_syscall(struct pt_regs *regs); 2281d7822b1eSMathieu Desnoyers 2282d7822b1eSMathieu Desnoyers #else 2283d7822b1eSMathieu Desnoyers 2284d7822b1eSMathieu Desnoyers static inline void rseq_syscall(struct pt_regs *regs) 2285d7822b1eSMathieu Desnoyers { 2286d7822b1eSMathieu Desnoyers } 2287d7822b1eSMathieu Desnoyers 2288d7822b1eSMathieu Desnoyers #endif 2289d7822b1eSMathieu Desnoyers 22903c93a0c0SQais Yousef const struct sched_avg *sched_trace_cfs_rq_avg(struct cfs_rq *cfs_rq); 22913c93a0c0SQais Yousef char *sched_trace_cfs_rq_path(struct cfs_rq *cfs_rq, char *str, int len); 22923c93a0c0SQais Yousef int sched_trace_cfs_rq_cpu(struct cfs_rq *cfs_rq); 22933c93a0c0SQais Yousef 22943c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_rt(struct rq *rq); 22953c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_dl(struct rq *rq); 22963c93a0c0SQais Yousef const struct sched_avg *sched_trace_rq_avg_irq(struct rq *rq); 22973c93a0c0SQais Yousef 22983c93a0c0SQais Yousef int sched_trace_rq_cpu(struct rq *rq); 229951cf18c9SVincent Donnefort int sched_trace_rq_cpu_capacity(struct rq *rq); 23009d246053SPhil Auld int sched_trace_rq_nr_running(struct rq *rq); 23013c93a0c0SQais Yousef 23023c93a0c0SQais Yousef const struct cpumask *sched_trace_rd_span(struct root_domain *rd); 23033c93a0c0SQais Yousef 23046e33cad0SPeter Zijlstra #ifdef CONFIG_SCHED_CORE 23056e33cad0SPeter Zijlstra extern void sched_core_free(struct task_struct *tsk); 230685dd3f61SPeter Zijlstra extern void sched_core_fork(struct task_struct *p); 23077ac592aaSChris Hyser extern int sched_core_share_pid(unsigned int cmd, pid_t pid, enum pid_type type, 23087ac592aaSChris Hyser unsigned long uaddr); 23096e33cad0SPeter Zijlstra #else 23106e33cad0SPeter Zijlstra static inline void sched_core_free(struct task_struct *tsk) { } 231185dd3f61SPeter Zijlstra static inline void sched_core_fork(struct task_struct *p) { } 23126e33cad0SPeter Zijlstra #endif 23136e33cad0SPeter Zijlstra 23141da177e4SLinus Torvalds #endif 2315