1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */ 21da177e4SLinus Torvalds #ifndef _LINUX_SCHED_H 31da177e4SLinus Torvalds #define _LINUX_SCHED_H 41da177e4SLinus Torvalds 55eca1c10SIngo Molnar /* 65eca1c10SIngo Molnar * Define 'struct task_struct' and provide the main scheduler 75eca1c10SIngo Molnar * APIs (schedule(), wakeup variants, etc.) 85eca1c10SIngo Molnar */ 95eca1c10SIngo Molnar 10607ca46eSDavid Howells #include <uapi/linux/sched.h> 11b7b3c76aSDavid Woodhouse 1270b8157eSIngo Molnar #include <asm/current.h> 1370b8157eSIngo Molnar 145eca1c10SIngo Molnar #include <linux/pid.h> 155eca1c10SIngo Molnar #include <linux/sem.h> 165eca1c10SIngo Molnar #include <linux/shm.h> 175eca1c10SIngo Molnar #include <linux/kcov.h> 185eca1c10SIngo Molnar #include <linux/mutex.h> 195eca1c10SIngo Molnar #include <linux/plist.h> 205eca1c10SIngo Molnar #include <linux/hrtimer.h> 215eca1c10SIngo Molnar #include <linux/seccomp.h> 225eca1c10SIngo Molnar #include <linux/nodemask.h> 235eca1c10SIngo Molnar #include <linux/rcupdate.h> 245eca1c10SIngo Molnar #include <linux/resource.h> 255eca1c10SIngo Molnar #include <linux/latencytop.h> 265eca1c10SIngo Molnar #include <linux/sched/prio.h> 275eca1c10SIngo Molnar #include <linux/signal_types.h> 28eb414681SJohannes Weiner #include <linux/psi_types.h> 295eca1c10SIngo Molnar #include <linux/mm_types_task.h> 305eca1c10SIngo Molnar #include <linux/task_io_accounting.h> 31d7822b1eSMathieu Desnoyers #include <linux/rseq.h> 325eca1c10SIngo Molnar 335eca1c10SIngo Molnar /* task_struct member predeclarations (sorted alphabetically): */ 34c7af7877SIngo Molnar struct audit_context; 35c7af7877SIngo Molnar struct backing_dev_info; 36c7af7877SIngo Molnar struct bio_list; 37c7af7877SIngo Molnar struct blk_plug; 38c7af7877SIngo Molnar struct cfs_rq; 39c7af7877SIngo Molnar struct fs_struct; 40c7af7877SIngo Molnar struct futex_pi_state; 41c7af7877SIngo Molnar struct io_context; 42c7af7877SIngo Molnar struct mempolicy; 43c7af7877SIngo Molnar 
struct nameidata; 44c7af7877SIngo Molnar struct nsproxy; 45c7af7877SIngo Molnar struct perf_event_context; 46c7af7877SIngo Molnar struct pid_namespace; 47c7af7877SIngo Molnar struct pipe_inode_info; 48c7af7877SIngo Molnar struct rcu_node; 49c7af7877SIngo Molnar struct reclaim_state; 50c7af7877SIngo Molnar struct robust_list_head; 51e2d1e2aeSIngo Molnar struct sched_attr; 52e2d1e2aeSIngo Molnar struct sched_param; 5343ae34cbSIngo Molnar struct seq_file; 54c7af7877SIngo Molnar struct sighand_struct; 55c7af7877SIngo Molnar struct signal_struct; 56c7af7877SIngo Molnar struct task_delay_info; 574cf86d77SIngo Molnar struct task_group; 581da177e4SLinus Torvalds 594a8342d2SLinus Torvalds /* 604a8342d2SLinus Torvalds * Task state bitmask. NOTE! These bits are also 614a8342d2SLinus Torvalds * encoded in fs/proc/array.c: get_task_state(). 624a8342d2SLinus Torvalds * 634a8342d2SLinus Torvalds * We have two separate sets of flags: task->state 644a8342d2SLinus Torvalds * is about runnability, while task->exit_state are 654a8342d2SLinus Torvalds * about the task exiting. Confusing, but this way 664a8342d2SLinus Torvalds * modifying one set can't modify the other one by 674a8342d2SLinus Torvalds * mistake. 
684a8342d2SLinus Torvalds */ 695eca1c10SIngo Molnar 705eca1c10SIngo Molnar /* Used in tsk->state: */ 7192c4bc9fSPeter Zijlstra #define TASK_RUNNING 0x0000 7292c4bc9fSPeter Zijlstra #define TASK_INTERRUPTIBLE 0x0001 7392c4bc9fSPeter Zijlstra #define TASK_UNINTERRUPTIBLE 0x0002 7492c4bc9fSPeter Zijlstra #define __TASK_STOPPED 0x0004 7592c4bc9fSPeter Zijlstra #define __TASK_TRACED 0x0008 765eca1c10SIngo Molnar /* Used in tsk->exit_state: */ 7792c4bc9fSPeter Zijlstra #define EXIT_DEAD 0x0010 7892c4bc9fSPeter Zijlstra #define EXIT_ZOMBIE 0x0020 79abd50b39SOleg Nesterov #define EXIT_TRACE (EXIT_ZOMBIE | EXIT_DEAD) 805eca1c10SIngo Molnar /* Used in tsk->state again: */ 818ef9925bSPeter Zijlstra #define TASK_PARKED 0x0040 828ef9925bSPeter Zijlstra #define TASK_DEAD 0x0080 838ef9925bSPeter Zijlstra #define TASK_WAKEKILL 0x0100 848ef9925bSPeter Zijlstra #define TASK_WAKING 0x0200 8592c4bc9fSPeter Zijlstra #define TASK_NOLOAD 0x0400 8692c4bc9fSPeter Zijlstra #define TASK_NEW 0x0800 8792c4bc9fSPeter Zijlstra #define TASK_STATE_MAX 0x1000 88f021a3c2SMatthew Wilcox 895eca1c10SIngo Molnar /* Convenience macros for the sake of set_current_state: */ 90f021a3c2SMatthew Wilcox #define TASK_KILLABLE (TASK_WAKEKILL | TASK_UNINTERRUPTIBLE) 91f021a3c2SMatthew Wilcox #define TASK_STOPPED (TASK_WAKEKILL | __TASK_STOPPED) 92f021a3c2SMatthew Wilcox #define TASK_TRACED (TASK_WAKEKILL | __TASK_TRACED) 931da177e4SLinus Torvalds 9480ed87c8SPeter Zijlstra #define TASK_IDLE (TASK_UNINTERRUPTIBLE | TASK_NOLOAD) 9580ed87c8SPeter Zijlstra 965eca1c10SIngo Molnar /* Convenience macros for the sake of wake_up(): */ 9792a1f4bcSMatthew Wilcox #define TASK_NORMAL (TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE) 9892a1f4bcSMatthew Wilcox 995eca1c10SIngo Molnar /* get_task_state(): */ 10092a1f4bcSMatthew Wilcox #define TASK_REPORT (TASK_RUNNING | TASK_INTERRUPTIBLE | \ 101f021a3c2SMatthew Wilcox TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \ 1028ef9925bSPeter Zijlstra __TASK_TRACED | EXIT_DEAD | EXIT_ZOMBIE | \ 
1038ef9925bSPeter Zijlstra TASK_PARKED) 10492a1f4bcSMatthew Wilcox 105f021a3c2SMatthew Wilcox #define task_is_traced(task) ((task->state & __TASK_TRACED) != 0) 1065eca1c10SIngo Molnar 107f021a3c2SMatthew Wilcox #define task_is_stopped(task) ((task->state & __TASK_STOPPED) != 0) 1085eca1c10SIngo Molnar 1095eca1c10SIngo Molnar #define task_is_stopped_or_traced(task) ((task->state & (__TASK_STOPPED | __TASK_TRACED)) != 0) 1105eca1c10SIngo Molnar 1115eca1c10SIngo Molnar #define task_contributes_to_load(task) ((task->state & TASK_UNINTERRUPTIBLE) != 0 && \ 11280ed87c8SPeter Zijlstra (task->flags & PF_FROZEN) == 0 && \ 11380ed87c8SPeter Zijlstra (task->state & TASK_NOLOAD) == 0) 1141da177e4SLinus Torvalds 1158eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 1168eb23b9fSPeter Zijlstra 117b5bf9a90SPeter Zijlstra /* 118b5bf9a90SPeter Zijlstra * Special states are those that do not use the normal wait-loop pattern. See 119b5bf9a90SPeter Zijlstra * the comment with set_special_state(). 120b5bf9a90SPeter Zijlstra */ 121b5bf9a90SPeter Zijlstra #define is_special_task_state(state) \ 1221cef1150SPeter Zijlstra ((state) & (__TASK_STOPPED | __TASK_TRACED | TASK_PARKED | TASK_DEAD)) 123b5bf9a90SPeter Zijlstra 1248eb23b9fSPeter Zijlstra #define __set_current_state(state_value) \ 1258eb23b9fSPeter Zijlstra do { \ 126b5bf9a90SPeter Zijlstra WARN_ON_ONCE(is_special_task_state(state_value));\ 1278eb23b9fSPeter Zijlstra current->task_state_change = _THIS_IP_; \ 1288eb23b9fSPeter Zijlstra current->state = (state_value); \ 1298eb23b9fSPeter Zijlstra } while (0) 130b5bf9a90SPeter Zijlstra 1318eb23b9fSPeter Zijlstra #define set_current_state(state_value) \ 1328eb23b9fSPeter Zijlstra do { \ 133b5bf9a90SPeter Zijlstra WARN_ON_ONCE(is_special_task_state(state_value));\ 1348eb23b9fSPeter Zijlstra current->task_state_change = _THIS_IP_; \ 135b92b8b35SPeter Zijlstra smp_store_mb(current->state, (state_value)); \ 1368eb23b9fSPeter Zijlstra } while (0) 1378eb23b9fSPeter Zijlstra 
138b5bf9a90SPeter Zijlstra #define set_special_state(state_value) \ 139b5bf9a90SPeter Zijlstra do { \ 140b5bf9a90SPeter Zijlstra unsigned long flags; /* may shadow */ \ 141b5bf9a90SPeter Zijlstra WARN_ON_ONCE(!is_special_task_state(state_value)); \ 142b5bf9a90SPeter Zijlstra raw_spin_lock_irqsave(¤t->pi_lock, flags); \ 143b5bf9a90SPeter Zijlstra current->task_state_change = _THIS_IP_; \ 144b5bf9a90SPeter Zijlstra current->state = (state_value); \ 145b5bf9a90SPeter Zijlstra raw_spin_unlock_irqrestore(¤t->pi_lock, flags); \ 146b5bf9a90SPeter Zijlstra } while (0) 1478eb23b9fSPeter Zijlstra #else 148498d0c57SAndrew Morton /* 149498d0c57SAndrew Morton * set_current_state() includes a barrier so that the write of current->state 150498d0c57SAndrew Morton * is correctly serialised wrt the caller's subsequent test of whether to 151498d0c57SAndrew Morton * actually sleep: 152498d0c57SAndrew Morton * 153a2250238SPeter Zijlstra * for (;;) { 154498d0c57SAndrew Morton * set_current_state(TASK_UNINTERRUPTIBLE); 155a2250238SPeter Zijlstra * if (!need_sleep) 156a2250238SPeter Zijlstra * break; 157498d0c57SAndrew Morton * 158a2250238SPeter Zijlstra * schedule(); 159a2250238SPeter Zijlstra * } 160a2250238SPeter Zijlstra * __set_current_state(TASK_RUNNING); 161a2250238SPeter Zijlstra * 162a2250238SPeter Zijlstra * If the caller does not need such serialisation (because, for instance, the 163a2250238SPeter Zijlstra * condition test and condition change and wakeup are under the same lock) then 164a2250238SPeter Zijlstra * use __set_current_state(). 165a2250238SPeter Zijlstra * 166a2250238SPeter Zijlstra * The above is typically ordered against the wakeup, which does: 167a2250238SPeter Zijlstra * 168a2250238SPeter Zijlstra * need_sleep = false; 169a2250238SPeter Zijlstra * wake_up_state(p, TASK_UNINTERRUPTIBLE); 170a2250238SPeter Zijlstra * 1717696f991SAndrea Parri * where wake_up_state() executes a full memory barrier before accessing the 1727696f991SAndrea Parri * task state. 
173a2250238SPeter Zijlstra * 174a2250238SPeter Zijlstra * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is, 175a2250238SPeter Zijlstra * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a 176a2250238SPeter Zijlstra * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING). 177a2250238SPeter Zijlstra * 178b5bf9a90SPeter Zijlstra * However, with slightly different timing the wakeup TASK_RUNNING store can 179b5bf9a90SPeter Zijlstra * also collide with the TASK_UNINTERRUPTIBLE store. Loosing that store is not 180b5bf9a90SPeter Zijlstra * a problem either because that will result in one extra go around the loop 181b5bf9a90SPeter Zijlstra * and our @cond test will save the day. 182a2250238SPeter Zijlstra * 183a2250238SPeter Zijlstra * Also see the comments of try_to_wake_up(). 184498d0c57SAndrew Morton */ 185b5bf9a90SPeter Zijlstra #define __set_current_state(state_value) \ 186b5bf9a90SPeter Zijlstra current->state = (state_value) 187b5bf9a90SPeter Zijlstra 188b5bf9a90SPeter Zijlstra #define set_current_state(state_value) \ 189b5bf9a90SPeter Zijlstra smp_store_mb(current->state, (state_value)) 190b5bf9a90SPeter Zijlstra 191b5bf9a90SPeter Zijlstra /* 192b5bf9a90SPeter Zijlstra * set_special_state() should be used for those states when the blocking task 193b5bf9a90SPeter Zijlstra * can not use the regular condition based wait-loop. In that case we must 194b5bf9a90SPeter Zijlstra * serialize against wakeups such that any possible in-flight TASK_RUNNING stores 195b5bf9a90SPeter Zijlstra * will not collide with our state change. 
196b5bf9a90SPeter Zijlstra */ 197b5bf9a90SPeter Zijlstra #define set_special_state(state_value) \ 198b5bf9a90SPeter Zijlstra do { \ 199b5bf9a90SPeter Zijlstra unsigned long flags; /* may shadow */ \ 200b5bf9a90SPeter Zijlstra raw_spin_lock_irqsave(¤t->pi_lock, flags); \ 201b5bf9a90SPeter Zijlstra current->state = (state_value); \ 202b5bf9a90SPeter Zijlstra raw_spin_unlock_irqrestore(¤t->pi_lock, flags); \ 203b5bf9a90SPeter Zijlstra } while (0) 204b5bf9a90SPeter Zijlstra 2058eb23b9fSPeter Zijlstra #endif 2068eb23b9fSPeter Zijlstra 2075eca1c10SIngo Molnar /* Task command name length: */ 2081da177e4SLinus Torvalds #define TASK_COMM_LEN 16 2091da177e4SLinus Torvalds 2101da177e4SLinus Torvalds extern void scheduler_tick(void); 2111da177e4SLinus Torvalds 2121da177e4SLinus Torvalds #define MAX_SCHEDULE_TIMEOUT LONG_MAX 2135eca1c10SIngo Molnar 2145eca1c10SIngo Molnar extern long schedule_timeout(long timeout); 2155eca1c10SIngo Molnar extern long schedule_timeout_interruptible(long timeout); 2165eca1c10SIngo Molnar extern long schedule_timeout_killable(long timeout); 2175eca1c10SIngo Molnar extern long schedule_timeout_uninterruptible(long timeout); 2185eca1c10SIngo Molnar extern long schedule_timeout_idle(long timeout); 2191da177e4SLinus Torvalds asmlinkage void schedule(void); 220c5491ea7SThomas Gleixner extern void schedule_preempt_disabled(void); 2211da177e4SLinus Torvalds 22210ab5643STejun Heo extern int __must_check io_schedule_prepare(void); 22310ab5643STejun Heo extern void io_schedule_finish(int token); 2249cff8adeSNeilBrown extern long io_schedule_timeout(long timeout); 22510ab5643STejun Heo extern void io_schedule(void); 2269cff8adeSNeilBrown 227f06febc9SFrank Mayhar /** 2280ba42a59SMasanari Iida * struct prev_cputime - snapshot of system and user cputime 229d37f761dSFrederic Weisbecker * @utime: time spent in user mode 230d37f761dSFrederic Weisbecker * @stime: time spent in system mode 2319d7fb042SPeter Zijlstra * @lock: protects the above two fields 
232d37f761dSFrederic Weisbecker * 2339d7fb042SPeter Zijlstra * Stores previous user/system time values such that we can guarantee 2349d7fb042SPeter Zijlstra * monotonicity. 235d37f761dSFrederic Weisbecker */ 2369d7fb042SPeter Zijlstra struct prev_cputime { 2379d7fb042SPeter Zijlstra #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE 2385613fda9SFrederic Weisbecker u64 utime; 2395613fda9SFrederic Weisbecker u64 stime; 2409d7fb042SPeter Zijlstra raw_spinlock_t lock; 2419d7fb042SPeter Zijlstra #endif 242d37f761dSFrederic Weisbecker }; 243d37f761dSFrederic Weisbecker 244d37f761dSFrederic Weisbecker /** 245f06febc9SFrank Mayhar * struct task_cputime - collected CPU time counts 2465613fda9SFrederic Weisbecker * @utime: time spent in user mode, in nanoseconds 2475613fda9SFrederic Weisbecker * @stime: time spent in kernel mode, in nanoseconds 248f06febc9SFrank Mayhar * @sum_exec_runtime: total time spent on the CPU, in nanoseconds 249f06febc9SFrank Mayhar * 2509d7fb042SPeter Zijlstra * This structure groups together three kinds of CPU time that are tracked for 2519d7fb042SPeter Zijlstra * threads and thread groups. Most things considering CPU time want to group 2529d7fb042SPeter Zijlstra * these counts together and treat all three of them in parallel. 
253f06febc9SFrank Mayhar */ 254f06febc9SFrank Mayhar struct task_cputime { 2555613fda9SFrederic Weisbecker u64 utime; 2565613fda9SFrederic Weisbecker u64 stime; 257f06febc9SFrank Mayhar unsigned long long sum_exec_runtime; 258f06febc9SFrank Mayhar }; 2599d7fb042SPeter Zijlstra 2605eca1c10SIngo Molnar /* Alternate field names when used on cache expirations: */ 261f06febc9SFrank Mayhar #define virt_exp utime 2629d7fb042SPeter Zijlstra #define prof_exp stime 263f06febc9SFrank Mayhar #define sched_exp sum_exec_runtime 264f06febc9SFrank Mayhar 265bac5b6b6SFrederic Weisbecker enum vtime_state { 266bac5b6b6SFrederic Weisbecker /* Task is sleeping or running in a CPU with VTIME inactive: */ 267bac5b6b6SFrederic Weisbecker VTIME_INACTIVE = 0, 268bac5b6b6SFrederic Weisbecker /* Task runs in userspace in a CPU with VTIME active: */ 269bac5b6b6SFrederic Weisbecker VTIME_USER, 270bac5b6b6SFrederic Weisbecker /* Task runs in kernelspace in a CPU with VTIME active: */ 271bac5b6b6SFrederic Weisbecker VTIME_SYS, 272bac5b6b6SFrederic Weisbecker }; 273bac5b6b6SFrederic Weisbecker 274bac5b6b6SFrederic Weisbecker struct vtime { 275bac5b6b6SFrederic Weisbecker seqcount_t seqcount; 276bac5b6b6SFrederic Weisbecker unsigned long long starttime; 277bac5b6b6SFrederic Weisbecker enum vtime_state state; 2782a42eb95SWanpeng Li u64 utime; 2792a42eb95SWanpeng Li u64 stime; 2802a42eb95SWanpeng Li u64 gtime; 281bac5b6b6SFrederic Weisbecker }; 282bac5b6b6SFrederic Weisbecker 2831da177e4SLinus Torvalds struct sched_info { 2847f5f8e8dSIngo Molnar #ifdef CONFIG_SCHED_INFO 2855eca1c10SIngo Molnar /* Cumulative counters: */ 2861da177e4SLinus Torvalds 2875eca1c10SIngo Molnar /* # of times we have run on this CPU: */ 2885eca1c10SIngo Molnar unsigned long pcount; 2895eca1c10SIngo Molnar 2905eca1c10SIngo Molnar /* Time spent waiting on a runqueue: */ 2915eca1c10SIngo Molnar unsigned long long run_delay; 2925eca1c10SIngo Molnar 2935eca1c10SIngo Molnar /* Timestamps: */ 2945eca1c10SIngo Molnar 2955eca1c10SIngo 
Molnar /* When did we last run on a CPU? */ 2965eca1c10SIngo Molnar unsigned long long last_arrival; 2975eca1c10SIngo Molnar 2985eca1c10SIngo Molnar /* When were we last queued to run? */ 2995eca1c10SIngo Molnar unsigned long long last_queued; 3005eca1c10SIngo Molnar 301f6db8347SNaveen N. Rao #endif /* CONFIG_SCHED_INFO */ 3027f5f8e8dSIngo Molnar }; 3031da177e4SLinus Torvalds 3041da177e4SLinus Torvalds /* 3056ecdd749SYuyang Du * Integer metrics need fixed point arithmetic, e.g., sched/fair 3066ecdd749SYuyang Du * has a few: load, load_avg, util_avg, freq, and capacity. 3076ecdd749SYuyang Du * 3086ecdd749SYuyang Du * We define a basic fixed point arithmetic range, and then formalize 3096ecdd749SYuyang Du * all these metrics based on that basic range. 3106ecdd749SYuyang Du */ 3116ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SHIFT 10 3126ecdd749SYuyang Du # define SCHED_FIXEDPOINT_SCALE (1L << SCHED_FIXEDPOINT_SHIFT) 3136ecdd749SYuyang Du 31420b8a59fSIngo Molnar struct load_weight { 3159dbdb155SPeter Zijlstra unsigned long weight; 3169dbdb155SPeter Zijlstra u32 inv_weight; 31720b8a59fSIngo Molnar }; 31820b8a59fSIngo Molnar 3197f65ea42SPatrick Bellasi /** 3207f65ea42SPatrick Bellasi * struct util_est - Estimation utilization of FAIR tasks 3217f65ea42SPatrick Bellasi * @enqueued: instantaneous estimated utilization of a task/cpu 3227f65ea42SPatrick Bellasi * @ewma: the Exponential Weighted Moving Average (EWMA) 3237f65ea42SPatrick Bellasi * utilization of a task 3247f65ea42SPatrick Bellasi * 3257f65ea42SPatrick Bellasi * Support data structure to track an Exponential Weighted Moving Average 3267f65ea42SPatrick Bellasi * (EWMA) of a FAIR task's utilization. New samples are added to the moving 3277f65ea42SPatrick Bellasi * average each time a task completes an activation. Sample's weight is chosen 3287f65ea42SPatrick Bellasi * so that the EWMA will be relatively insensitive to transient changes to the 3297f65ea42SPatrick Bellasi * task's workload. 
3307f65ea42SPatrick Bellasi * 3317f65ea42SPatrick Bellasi * The enqueued attribute has a slightly different meaning for tasks and cpus: 3327f65ea42SPatrick Bellasi * - task: the task's util_avg at last task dequeue time 3337f65ea42SPatrick Bellasi * - cfs_rq: the sum of util_est.enqueued for each RUNNABLE task on that CPU 3347f65ea42SPatrick Bellasi * Thus, the util_est.enqueued of a task represents the contribution on the 3357f65ea42SPatrick Bellasi * estimated utilization of the CPU where that task is currently enqueued. 3367f65ea42SPatrick Bellasi * 3377f65ea42SPatrick Bellasi * Only for tasks we track a moving average of the past instantaneous 3387f65ea42SPatrick Bellasi * estimated utilization. This allows to absorb sporadic drops in utilization 3397f65ea42SPatrick Bellasi * of an otherwise almost periodic task. 3407f65ea42SPatrick Bellasi */ 3417f65ea42SPatrick Bellasi struct util_est { 3427f65ea42SPatrick Bellasi unsigned int enqueued; 3437f65ea42SPatrick Bellasi unsigned int ewma; 3447f65ea42SPatrick Bellasi #define UTIL_EST_WEIGHT_SHIFT 2 345317d359dSPeter Zijlstra } __attribute__((__aligned__(sizeof(u64)))); 3467f65ea42SPatrick Bellasi 3479d89c257SYuyang Du /* 3487b595334SYuyang Du * The load_avg/util_avg accumulates an infinite geometric series 3497b595334SYuyang Du * (see __update_load_avg() in kernel/sched/fair.c). 3507b595334SYuyang Du * 3517b595334SYuyang Du * [load_avg definition] 3527b595334SYuyang Du * 3537b595334SYuyang Du * load_avg = runnable% * scale_load_down(load) 3547b595334SYuyang Du * 3557b595334SYuyang Du * where runnable% is the time ratio that a sched_entity is runnable. 3567b595334SYuyang Du * For cfs_rq, it is the aggregated load_avg of all runnable and 3579d89c257SYuyang Du * blocked sched_entities. 
3587b595334SYuyang Du * 3597b595334SYuyang Du * load_avg may also take frequency scaling into account: 3607b595334SYuyang Du * 3617b595334SYuyang Du * load_avg = runnable% * scale_load_down(load) * freq% 3627b595334SYuyang Du * 3637b595334SYuyang Du * where freq% is the CPU frequency normalized to the highest frequency. 3647b595334SYuyang Du * 3657b595334SYuyang Du * [util_avg definition] 3667b595334SYuyang Du * 3677b595334SYuyang Du * util_avg = running% * SCHED_CAPACITY_SCALE 3687b595334SYuyang Du * 3697b595334SYuyang Du * where running% is the time ratio that a sched_entity is running on 3707b595334SYuyang Du * a CPU. For cfs_rq, it is the aggregated util_avg of all runnable 3717b595334SYuyang Du * and blocked sched_entities. 3727b595334SYuyang Du * 3737b595334SYuyang Du * util_avg may also factor frequency scaling and CPU capacity scaling: 3747b595334SYuyang Du * 3757b595334SYuyang Du * util_avg = running% * SCHED_CAPACITY_SCALE * freq% * capacity% 3767b595334SYuyang Du * 3777b595334SYuyang Du * where freq% is the same as above, and capacity% is the CPU capacity 3787b595334SYuyang Du * normalized to the greatest capacity (due to uarch differences, etc). 3797b595334SYuyang Du * 3807b595334SYuyang Du * N.B., the above ratios (runnable%, running%, freq%, and capacity%) 3817b595334SYuyang Du * themselves are in the range of [0, 1]. To do fixed point arithmetics, 3827b595334SYuyang Du * we therefore scale them to as large a range as necessary. This is for 3837b595334SYuyang Du * example reflected by util_avg's SCHED_CAPACITY_SCALE. 3847b595334SYuyang Du * 3857b595334SYuyang Du * [Overflow issue] 3867b595334SYuyang Du * 3877b595334SYuyang Du * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities 3887b595334SYuyang Du * with the highest load (=88761), always runnable on a single cfs_rq, 3897b595334SYuyang Du * and should not overflow as the number already hits PID_MAX_LIMIT. 
3907b595334SYuyang Du * 3917b595334SYuyang Du * For all other cases (including 32-bit kernels), struct load_weight's 3927b595334SYuyang Du * weight will overflow first before we do, because: 3937b595334SYuyang Du * 3947b595334SYuyang Du * Max(load_avg) <= Max(load.weight) 3957b595334SYuyang Du * 3967b595334SYuyang Du * Then it is the load_weight's responsibility to consider overflow 3977b595334SYuyang Du * issues. 3989d89c257SYuyang Du */ 3999d85f21cSPaul Turner struct sched_avg { 4005eca1c10SIngo Molnar u64 last_update_time; 4015eca1c10SIngo Molnar u64 load_sum; 4021ea6c46aSPeter Zijlstra u64 runnable_load_sum; 4035eca1c10SIngo Molnar u32 util_sum; 4045eca1c10SIngo Molnar u32 period_contrib; 4055eca1c10SIngo Molnar unsigned long load_avg; 4061ea6c46aSPeter Zijlstra unsigned long runnable_load_avg; 4075eca1c10SIngo Molnar unsigned long util_avg; 4087f65ea42SPatrick Bellasi struct util_est util_est; 409317d359dSPeter Zijlstra } ____cacheline_aligned; 4109d85f21cSPaul Turner 41141acab88SLucas De Marchi struct sched_statistics { 4127f5f8e8dSIngo Molnar #ifdef CONFIG_SCHEDSTATS 41394c18227SIngo Molnar u64 wait_start; 41494c18227SIngo Molnar u64 wait_max; 4156d082592SArjan van de Ven u64 wait_count; 4166d082592SArjan van de Ven u64 wait_sum; 4178f0dfc34SArjan van de Ven u64 iowait_count; 4188f0dfc34SArjan van de Ven u64 iowait_sum; 41994c18227SIngo Molnar 42094c18227SIngo Molnar u64 sleep_start; 42120b8a59fSIngo Molnar u64 sleep_max; 42294c18227SIngo Molnar s64 sum_sleep_runtime; 42394c18227SIngo Molnar 42494c18227SIngo Molnar u64 block_start; 42520b8a59fSIngo Molnar u64 block_max; 42620b8a59fSIngo Molnar u64 exec_max; 427eba1ed4bSIngo Molnar u64 slice_max; 428cc367732SIngo Molnar 429cc367732SIngo Molnar u64 nr_migrations_cold; 430cc367732SIngo Molnar u64 nr_failed_migrations_affine; 431cc367732SIngo Molnar u64 nr_failed_migrations_running; 432cc367732SIngo Molnar u64 nr_failed_migrations_hot; 433cc367732SIngo Molnar u64 nr_forced_migrations; 434cc367732SIngo Molnar 
435cc367732SIngo Molnar u64 nr_wakeups; 436cc367732SIngo Molnar u64 nr_wakeups_sync; 437cc367732SIngo Molnar u64 nr_wakeups_migrate; 438cc367732SIngo Molnar u64 nr_wakeups_local; 439cc367732SIngo Molnar u64 nr_wakeups_remote; 440cc367732SIngo Molnar u64 nr_wakeups_affine; 441cc367732SIngo Molnar u64 nr_wakeups_affine_attempts; 442cc367732SIngo Molnar u64 nr_wakeups_passive; 443cc367732SIngo Molnar u64 nr_wakeups_idle; 44441acab88SLucas De Marchi #endif 4457f5f8e8dSIngo Molnar }; 44641acab88SLucas De Marchi 44741acab88SLucas De Marchi struct sched_entity { 4485eca1c10SIngo Molnar /* For load-balancing: */ 4495eca1c10SIngo Molnar struct load_weight load; 4501ea6c46aSPeter Zijlstra unsigned long runnable_weight; 45141acab88SLucas De Marchi struct rb_node run_node; 45241acab88SLucas De Marchi struct list_head group_node; 45341acab88SLucas De Marchi unsigned int on_rq; 45441acab88SLucas De Marchi 45541acab88SLucas De Marchi u64 exec_start; 45641acab88SLucas De Marchi u64 sum_exec_runtime; 45741acab88SLucas De Marchi u64 vruntime; 45841acab88SLucas De Marchi u64 prev_sum_exec_runtime; 45941acab88SLucas De Marchi 46041acab88SLucas De Marchi u64 nr_migrations; 46141acab88SLucas De Marchi 46241acab88SLucas De Marchi struct sched_statistics statistics; 46394c18227SIngo Molnar 46420b8a59fSIngo Molnar #ifdef CONFIG_FAIR_GROUP_SCHED 465fed14d45SPeter Zijlstra int depth; 46620b8a59fSIngo Molnar struct sched_entity *parent; 46720b8a59fSIngo Molnar /* rq on which this entity is (to be) queued: */ 46820b8a59fSIngo Molnar struct cfs_rq *cfs_rq; 46920b8a59fSIngo Molnar /* rq "owned" by this entity/group: */ 47020b8a59fSIngo Molnar struct cfs_rq *my_q; 47120b8a59fSIngo Molnar #endif 4728bd75c77SClark Williams 473141965c7SAlex Shi #ifdef CONFIG_SMP 4745a107804SJiri Olsa /* 4755a107804SJiri Olsa * Per entity load average tracking. 4765a107804SJiri Olsa * 4775a107804SJiri Olsa * Put into separate cache line so it does not 4785a107804SJiri Olsa * collide with read-mostly values above. 
4795a107804SJiri Olsa */ 480317d359dSPeter Zijlstra struct sched_avg avg; 4819d85f21cSPaul Turner #endif 48220b8a59fSIngo Molnar }; 48370b97a7fSIngo Molnar 484fa717060SPeter Zijlstra struct sched_rt_entity { 485fa717060SPeter Zijlstra struct list_head run_list; 48678f2c7dbSPeter Zijlstra unsigned long timeout; 48757d2aa00SYing Xue unsigned long watchdog_stamp; 488bee367edSRichard Kennedy unsigned int time_slice; 489ff77e468SPeter Zijlstra unsigned short on_rq; 490ff77e468SPeter Zijlstra unsigned short on_list; 4916f505b16SPeter Zijlstra 49258d6c2d7SPeter Zijlstra struct sched_rt_entity *back; 493052f1dc7SPeter Zijlstra #ifdef CONFIG_RT_GROUP_SCHED 4946f505b16SPeter Zijlstra struct sched_rt_entity *parent; 4956f505b16SPeter Zijlstra /* rq on which this entity is (to be) queued: */ 4966f505b16SPeter Zijlstra struct rt_rq *rt_rq; 4976f505b16SPeter Zijlstra /* rq "owned" by this entity/group: */ 4986f505b16SPeter Zijlstra struct rt_rq *my_q; 4996f505b16SPeter Zijlstra #endif 5003859a271SKees Cook } __randomize_layout; 501fa717060SPeter Zijlstra 502aab03e05SDario Faggioli struct sched_dl_entity { 503aab03e05SDario Faggioli struct rb_node rb_node; 504aab03e05SDario Faggioli 505aab03e05SDario Faggioli /* 506aab03e05SDario Faggioli * Original scheduling parameters. Copied here from sched_attr 5074027d080Sxiaofeng.yan * during sched_setattr(), they will remain the same until 5084027d080Sxiaofeng.yan * the next sched_setattr(). 509aab03e05SDario Faggioli */ 5105eca1c10SIngo Molnar u64 dl_runtime; /* Maximum runtime for each instance */ 5115eca1c10SIngo Molnar u64 dl_deadline; /* Relative deadline of each instance */ 5125eca1c10SIngo Molnar u64 dl_period; /* Separation of two instances (period) */ 51354d6d303SDaniel Bristot de Oliveira u64 dl_bw; /* dl_runtime / dl_period */ 5143effcb42SDaniel Bristot de Oliveira u64 dl_density; /* dl_runtime / dl_deadline */ 515aab03e05SDario Faggioli 516aab03e05SDario Faggioli /* 517aab03e05SDario Faggioli * Actual scheduling parameters. 
Initialized with the values above, 518aab03e05SDario Faggioli * they are continously updated during task execution. Note that 519aab03e05SDario Faggioli * the remaining runtime could be < 0 in case we are in overrun. 520aab03e05SDario Faggioli */ 5215eca1c10SIngo Molnar s64 runtime; /* Remaining runtime for this instance */ 5225eca1c10SIngo Molnar u64 deadline; /* Absolute deadline for this instance */ 5235eca1c10SIngo Molnar unsigned int flags; /* Specifying the scheduler behaviour */ 524aab03e05SDario Faggioli 525aab03e05SDario Faggioli /* 526aab03e05SDario Faggioli * Some bool flags: 527aab03e05SDario Faggioli * 528aab03e05SDario Faggioli * @dl_throttled tells if we exhausted the runtime. If so, the 529aab03e05SDario Faggioli * task has to wait for a replenishment to be performed at the 530aab03e05SDario Faggioli * next firing of dl_timer. 531aab03e05SDario Faggioli * 5322d3d891dSDario Faggioli * @dl_boosted tells if we are boosted due to DI. If so we are 5332d3d891dSDario Faggioli * outside bandwidth enforcement mechanism (but only until we 5345bfd126eSJuri Lelli * exit the critical section); 5355bfd126eSJuri Lelli * 5365eca1c10SIngo Molnar * @dl_yielded tells if task gave up the CPU before consuming 5375bfd126eSJuri Lelli * all its available runtime during the last job. 538209a0cbdSLuca Abeni * 539209a0cbdSLuca Abeni * @dl_non_contending tells if the task is inactive while still 540209a0cbdSLuca Abeni * contributing to the active utilization. In other words, it 541209a0cbdSLuca Abeni * indicates if the inactive timer has been armed and its handler 542209a0cbdSLuca Abeni * has not been executed yet. This flag is useful to avoid race 543209a0cbdSLuca Abeni * conditions between the inactive timer handler and the wakeup 544209a0cbdSLuca Abeni * code. 54534be3930SJuri Lelli * 54634be3930SJuri Lelli * @dl_overrun tells if the task asked to be informed about runtime 54734be3930SJuri Lelli * overruns. 
548aab03e05SDario Faggioli */ 549aa5222e9SDan Carpenter unsigned int dl_throttled : 1; 550aa5222e9SDan Carpenter unsigned int dl_boosted : 1; 551aa5222e9SDan Carpenter unsigned int dl_yielded : 1; 552aa5222e9SDan Carpenter unsigned int dl_non_contending : 1; 55334be3930SJuri Lelli unsigned int dl_overrun : 1; 554aab03e05SDario Faggioli 555aab03e05SDario Faggioli /* 556aab03e05SDario Faggioli * Bandwidth enforcement timer. Each -deadline task has its 557aab03e05SDario Faggioli * own bandwidth to be enforced, thus we need one timer per task. 558aab03e05SDario Faggioli */ 559aab03e05SDario Faggioli struct hrtimer dl_timer; 560209a0cbdSLuca Abeni 561209a0cbdSLuca Abeni /* 562209a0cbdSLuca Abeni * Inactive timer, responsible for decreasing the active utilization 563209a0cbdSLuca Abeni * at the "0-lag time". When a -deadline task blocks, it contributes 564209a0cbdSLuca Abeni * to GRUB's active utilization until the "0-lag time", hence a 565209a0cbdSLuca Abeni * timer is needed to decrease the active utilization at the correct 566209a0cbdSLuca Abeni * time. 567209a0cbdSLuca Abeni */ 568209a0cbdSLuca Abeni struct hrtimer inactive_timer; 569aab03e05SDario Faggioli }; 5708bd75c77SClark Williams 5711d082fd0SPaul E. McKenney union rcu_special { 5721d082fd0SPaul E. McKenney struct { 5738203d6d0SPaul E. McKenney u8 blocked; 5748203d6d0SPaul E. McKenney u8 need_qs; 5758203d6d0SPaul E. McKenney } b; /* Bits. */ 576fcc878e4SPaul E. McKenney u16 s; /* Set of bits. */ 5771d082fd0SPaul E. McKenney }; 57886848966SPaul E. 
McKenney 5798dc85d54SPeter Zijlstra /* Per-task perf context slots; perf_nr_task_contexts counts the valid slots and sizes task_struct::perf_event_ctxp[]. */ enum perf_event_task_context { 5808dc85d54SPeter Zijlstra perf_invalid_context = -1, 5818dc85d54SPeter Zijlstra perf_hw_context = 0, 58289a1e187SPeter Zijlstra perf_sw_context, 5838dc85d54SPeter Zijlstra perf_nr_task_contexts, 5848dc85d54SPeter Zijlstra }; 5858dc85d54SPeter Zijlstra 586eb61baf6SIngo Molnar /* Singly linked node; task_struct embeds one as 'wake_q'. */ struct wake_q_node { 587eb61baf6SIngo Molnar struct wake_q_node *next; 588eb61baf6SIngo Molnar }; 589eb61baf6SIngo Molnar 5901da177e4SLinus Torvalds /* Per-task descriptor. Placement rules are stated inline: thread_info (if present) must be first, 'thread' must be last, and new fields belong inside the randomized section. */ struct task_struct { 591c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 592c65eacbeSAndy Lutomirski /* 593c65eacbeSAndy Lutomirski * For reasons of header soup (see current_thread_info()), this 594c65eacbeSAndy Lutomirski * must be the first element of task_struct. 595c65eacbeSAndy Lutomirski */ 596c65eacbeSAndy Lutomirski struct thread_info thread_info; 597c65eacbeSAndy Lutomirski #endif 5985eca1c10SIngo Molnar /* -1 unrunnable, 0 runnable, >0 stopped: */ 5995eca1c10SIngo Molnar volatile long state; 60029e48ce8SKees Cook 60129e48ce8SKees Cook /* 60229e48ce8SKees Cook * This begins the randomizable portion of task_struct. Only 60329e48ce8SKees Cook * scheduling-critical items should be added above here. 
60429e48ce8SKees Cook */ 60529e48ce8SKees Cook randomized_struct_fields_start 60629e48ce8SKees Cook 607f7e4217bSRoman Zippel void *stack; 6081da177e4SLinus Torvalds atomic_t usage; 6095eca1c10SIngo Molnar /* Per task flags (PF_*), defined further below: */ 6105eca1c10SIngo Molnar unsigned int flags; 61197dc32cdSWilliam Cohen unsigned int ptrace; 6121da177e4SLinus Torvalds 6132dd73a4fSPeter Williams #ifdef CONFIG_SMP 614fa14ff4aSPeter Zijlstra struct llist_node wake_entry; 6153ca7a440SPeter Zijlstra int on_cpu; 616c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 6175eca1c10SIngo Molnar /* Current CPU: */ 6185eca1c10SIngo Molnar unsigned int cpu; 619c65eacbeSAndy Lutomirski #endif 62063b0e9edSMike Galbraith unsigned int wakee_flips; 62162470419SMichael Wang unsigned long wakee_flip_decay_ts; 62263b0e9edSMike Galbraith struct task_struct *last_wakee; 623ac66f547SPeter Zijlstra 62432e839ddSMel Gorman /* 62532e839ddSMel Gorman * recent_used_cpu is initially set as the last CPU used by a task 62632e839ddSMel Gorman * that wakes affine another task. Waker/wakee relationships can 62732e839ddSMel Gorman * push tasks around a CPU where each wakeup moves to the next one. 62832e839ddSMel Gorman * Tracking a recently used CPU allows a quick search for a recently 62932e839ddSMel Gorman * used CPU that may be idle. 
63032e839ddSMel Gorman */ 63132e839ddSMel Gorman int recent_used_cpu; 632ac66f547SPeter Zijlstra int wake_cpu; 6334866cde0SNick Piggin #endif 634fd2f4419SPeter Zijlstra int on_rq; 63550e645a8SIngo Molnar 6365eca1c10SIngo Molnar int prio; 6375eca1c10SIngo Molnar int static_prio; 6385eca1c10SIngo Molnar int normal_prio; 639c7aceabaSRichard Kennedy unsigned int rt_priority; 6405eca1c10SIngo Molnar 6415522d5d5SIngo Molnar const struct sched_class *sched_class; 64220b8a59fSIngo Molnar struct sched_entity se; 643fa717060SPeter Zijlstra struct sched_rt_entity rt; 6448323f26cSPeter Zijlstra #ifdef CONFIG_CGROUP_SCHED 6458323f26cSPeter Zijlstra struct task_group *sched_task_group; 6468323f26cSPeter Zijlstra #endif 647aab03e05SDario Faggioli struct sched_dl_entity dl; 6481da177e4SLinus Torvalds 649e107be36SAvi Kivity #ifdef CONFIG_PREEMPT_NOTIFIERS 6505eca1c10SIngo Molnar /* List of struct preempt_notifier: */ 651e107be36SAvi Kivity struct hlist_head preempt_notifiers; 652e107be36SAvi Kivity #endif 653e107be36SAvi Kivity 6546c5c9341SAlexey Dobriyan #ifdef CONFIG_BLK_DEV_IO_TRACE 6552056a782SJens Axboe unsigned int btrace_seq; 6566c5c9341SAlexey Dobriyan #endif 6571da177e4SLinus Torvalds 65897dc32cdSWilliam Cohen unsigned int policy; 65929baa747SPeter Zijlstra int nr_cpus_allowed; 6601da177e4SLinus Torvalds cpumask_t cpus_allowed; 6611da177e4SLinus Torvalds 662a57eb940SPaul E. McKenney #ifdef CONFIG_PREEMPT_RCU 663e260be67SPaul E. McKenney int rcu_read_lock_nesting; 6641d082fd0SPaul E. McKenney union rcu_special rcu_read_unlock_special; 665f41d911fSPaul E. McKenney struct list_head rcu_node_entry; 666a57eb940SPaul E. McKenney struct rcu_node *rcu_blocked_node; 66728f6569aSPranith Kumar #endif /* #ifdef CONFIG_PREEMPT_RCU */ 6685eca1c10SIngo Molnar 6698315f422SPaul E. McKenney #ifdef CONFIG_TASKS_RCU 6708315f422SPaul E. McKenney unsigned long rcu_tasks_nvcsw; 671ccdd29ffSPaul E. McKenney u8 rcu_tasks_holdout; 672ccdd29ffSPaul E. McKenney u8 rcu_tasks_idx; 673176f8f7aSPaul E. 
McKenney int rcu_tasks_idle_cpu; 674ccdd29ffSPaul E. McKenney struct list_head rcu_tasks_holdout_list; 6758315f422SPaul E. McKenney #endif /* #ifdef CONFIG_TASKS_RCU */ 676e260be67SPaul E. McKenney 6771da177e4SLinus Torvalds struct sched_info sched_info; 6781da177e4SLinus Torvalds 6791da177e4SLinus Torvalds struct list_head tasks; 680806c09a7SDario Faggioli #ifdef CONFIG_SMP 681917b627dSGregory Haskins struct plist_node pushable_tasks; 6821baca4ceSJuri Lelli struct rb_node pushable_dl_tasks; 683806c09a7SDario Faggioli #endif 6841da177e4SLinus Torvalds 6855eca1c10SIngo Molnar struct mm_struct *mm; 6865eca1c10SIngo Molnar struct mm_struct *active_mm; 687314ff785SIngo Molnar 688314ff785SIngo Molnar /* Per-thread vma caching: */ 689314ff785SIngo Molnar struct vmacache vmacache; 690314ff785SIngo Molnar 6915eca1c10SIngo Molnar #ifdef SPLIT_RSS_COUNTING 69234e55232SKAMEZAWA Hiroyuki struct task_rss_stat rss_stat; 69334e55232SKAMEZAWA Hiroyuki #endif 69497dc32cdSWilliam Cohen int exit_state; 6955eca1c10SIngo Molnar int exit_code; 6965eca1c10SIngo Molnar int exit_signal; 6975eca1c10SIngo Molnar /* The signal sent when the parent dies: */ 6985eca1c10SIngo Molnar int pdeath_signal; 6995eca1c10SIngo Molnar /* JOBCTL_*, siglock protected: */ 7005eca1c10SIngo Molnar unsigned long jobctl; 7019b89f6baSAndrei Epure 7025eca1c10SIngo Molnar /* Used for emulating ABI behavior of previous Linux versions: */ 70397dc32cdSWilliam Cohen unsigned int personality; 7049b89f6baSAndrei Epure 7055eca1c10SIngo Molnar /* Scheduler bits, serialized by scheduler locks: */ 706ca94c442SLennart Poettering unsigned sched_reset_on_fork:1; 707a8e4f2eaSPeter Zijlstra unsigned sched_contributes_to_load:1; 708ff303e66SPeter Zijlstra unsigned sched_migrated:1; 709b7e7ade3SPeter Zijlstra unsigned sched_remote_wakeup:1; 710eb414681SJohannes Weiner #ifdef CONFIG_PSI 711eb414681SJohannes Weiner unsigned sched_psi_wake_requeue:1; 712eb414681SJohannes Weiner #endif 713eb414681SJohannes Weiner 7145eca1c10SIngo 
Molnar /* Force alignment to the next boundary: */ 7155eca1c10SIngo Molnar unsigned :0; 716be958bdcSPeter Zijlstra 7175eca1c10SIngo Molnar /* Unserialized, strictly 'current' */ 7185eca1c10SIngo Molnar 7195eca1c10SIngo Molnar /* Bit to tell LSMs we're in execve(): */ 7205eca1c10SIngo Molnar unsigned in_execve:1; 721be958bdcSPeter Zijlstra unsigned in_iowait:1; 7225eca1c10SIngo Molnar #ifndef TIF_RESTORE_SIGMASK 7237e781418SAndy Lutomirski unsigned restore_sigmask:1; 7247e781418SAndy Lutomirski #endif 725626ebc41STejun Heo #ifdef CONFIG_MEMCG 72629ef680aSMichal Hocko unsigned in_user_fault:1; 727127424c8SJohannes Weiner #endif 728ff303e66SPeter Zijlstra #ifdef CONFIG_COMPAT_BRK 729ff303e66SPeter Zijlstra unsigned brk_randomized:1; 730ff303e66SPeter Zijlstra #endif 73177f88796STejun Heo #ifdef CONFIG_CGROUPS 73277f88796STejun Heo /* disallow userland-initiated cgroup migration */ 73377f88796STejun Heo unsigned no_cgroup_migration:1; 73477f88796STejun Heo #endif 735d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP 736d09d8df3SJosef Bacik /* to be used once the psi infrastructure lands upstream. */ 737d09d8df3SJosef Bacik unsigned use_memdelay:1; 738d09d8df3SJosef Bacik #endif 7396f185c29SVladimir Davydov 7409da3f2b7SJann Horn /* 7419da3f2b7SJann Horn * May usercopy functions fault on kernel addresses? 7429da3f2b7SJann Horn * This is not just a single bit because this can potentially nest. 7439da3f2b7SJann Horn */ 7449da3f2b7SJann Horn unsigned int kernel_uaccess_faults_ok; 7459da3f2b7SJann Horn 7465eca1c10SIngo Molnar unsigned long atomic_flags; /* Flags requiring atomic access. 
*/ 7471d4457f9SKees Cook 748f56141e3SAndy Lutomirski struct restart_block restart_block; 749f56141e3SAndy Lutomirski 7501da177e4SLinus Torvalds pid_t pid; 7511da177e4SLinus Torvalds pid_t tgid; 7520a425405SArjan van de Ven 753050e9baaSLinus Torvalds #ifdef CONFIG_STACKPROTECTOR 7545eca1c10SIngo Molnar /* Canary value for the -fstack-protector GCC feature: */ 7550a425405SArjan van de Ven unsigned long stack_canary; 7561314562aSHiroshi Shimamoto #endif 7571da177e4SLinus Torvalds /* 7585eca1c10SIngo Molnar * Pointers to the (original) parent process, youngest child, younger sibling, 7591da177e4SLinus Torvalds * older sibling, respectively. (p->father can be replaced with 760f470021aSRoland McGrath * p->real_parent->pid) 7611da177e4SLinus Torvalds */ 7625eca1c10SIngo Molnar 7635eca1c10SIngo Molnar /* Real parent process: */ 7645eca1c10SIngo Molnar struct task_struct __rcu *real_parent; 7655eca1c10SIngo Molnar 7665eca1c10SIngo Molnar /* Recipient of SIGCHLD, wait4() reports: */ 7675eca1c10SIngo Molnar struct task_struct __rcu *parent; 7681da177e4SLinus Torvalds 769f470021aSRoland McGrath /* 7705eca1c10SIngo Molnar * Children/sibling form the list of natural children: 7715eca1c10SIngo Molnar */ 7725eca1c10SIngo Molnar struct list_head children; 7735eca1c10SIngo Molnar struct list_head sibling; 7745eca1c10SIngo Molnar struct task_struct *group_leader; 7755eca1c10SIngo Molnar 7765eca1c10SIngo Molnar /* 7775eca1c10SIngo Molnar * 'ptraced' is the list of tasks this task is using ptrace() on. 7785eca1c10SIngo Molnar * 779f470021aSRoland McGrath * This includes both natural children and PTRACE_ATTACH targets. 7805eca1c10SIngo Molnar * 'ptrace_entry' is this task's link on the p->parent->ptraced list. 781f470021aSRoland McGrath */ 782f470021aSRoland McGrath struct list_head ptraced; 783f470021aSRoland McGrath struct list_head ptrace_entry; 784f470021aSRoland McGrath 7851da177e4SLinus Torvalds /* PID/PID hash table linkage. */ 7862c470475SEric W. 
Biederman struct pid *thread_pid; 7872c470475SEric W. Biederman struct hlist_node pid_links[PIDTYPE_MAX]; 78847e65328SOleg Nesterov struct list_head thread_group; 7890c740d0aSOleg Nesterov struct list_head thread_node; 7901da177e4SLinus Torvalds 7915eca1c10SIngo Molnar struct completion *vfork_done; 7921da177e4SLinus Torvalds 7935eca1c10SIngo Molnar /* CLONE_CHILD_SETTID: */ 7945eca1c10SIngo Molnar int __user *set_child_tid; 7955eca1c10SIngo Molnar 7965eca1c10SIngo Molnar /* CLONE_CHILD_CLEARTID: */ 7975eca1c10SIngo Molnar int __user *clear_child_tid; 7985eca1c10SIngo Molnar 7995eca1c10SIngo Molnar u64 utime; 8005eca1c10SIngo Molnar u64 stime; 80140565b5aSStanislaw Gruszka #ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME 8025eca1c10SIngo Molnar u64 utimescaled; 8035eca1c10SIngo Molnar u64 stimescaled; 80440565b5aSStanislaw Gruszka #endif 80516a6d9beSFrederic Weisbecker u64 gtime; 8069d7fb042SPeter Zijlstra struct prev_cputime prev_cputime; 8076a61671bSFrederic Weisbecker #ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN 808bac5b6b6SFrederic Weisbecker struct vtime vtime; 8096a61671bSFrederic Weisbecker #endif 810d027d45dSFrederic Weisbecker 811d027d45dSFrederic Weisbecker #ifdef CONFIG_NO_HZ_FULL 812f009a7a7SFrederic Weisbecker atomic_t tick_dep_mask; 813d027d45dSFrederic Weisbecker #endif 8145eca1c10SIngo Molnar /* Context switch counts: */ 8155eca1c10SIngo Molnar unsigned long nvcsw; 8165eca1c10SIngo Molnar unsigned long nivcsw; 8175eca1c10SIngo Molnar 8185eca1c10SIngo Molnar /* Monotonic time in nsecs: */ 8195eca1c10SIngo Molnar u64 start_time; 8205eca1c10SIngo Molnar 8215eca1c10SIngo Molnar /* Boot based time in nsecs: */ 8225eca1c10SIngo Molnar u64 real_start_time; 8235eca1c10SIngo Molnar 8245eca1c10SIngo Molnar /* MM fault and swap info: this can arguably be seen as either mm-specific or thread-specific: */ 8255eca1c10SIngo Molnar unsigned long min_flt; 8265eca1c10SIngo Molnar unsigned long maj_flt; 8271da177e4SLinus Torvalds 828b18b6a9cSNicolas Pitre #ifdef CONFIG_POSIX_TIMERS 
829f06febc9SFrank Mayhar struct task_cputime cputime_expires; 8301da177e4SLinus Torvalds struct list_head cpu_timers[3]; 831b18b6a9cSNicolas Pitre #endif 8321da177e4SLinus Torvalds 8335eca1c10SIngo Molnar /* Process credentials: */ 8345eca1c10SIngo Molnar 8355eca1c10SIngo Molnar /* Tracer's credentials at attach: */ 8365eca1c10SIngo Molnar const struct cred __rcu *ptracer_cred; 8375eca1c10SIngo Molnar 8385eca1c10SIngo Molnar /* Objective and real subjective task credentials (COW): */ 8395eca1c10SIngo Molnar const struct cred __rcu *real_cred; 8405eca1c10SIngo Molnar 8415eca1c10SIngo Molnar /* Effective (overridable) subjective task credentials (COW): */ 8425eca1c10SIngo Molnar const struct cred __rcu *cred; 8435eca1c10SIngo Molnar 8445eca1c10SIngo Molnar /* 8455eca1c10SIngo Molnar * executable name, excluding path. 8465eca1c10SIngo Molnar * 8475eca1c10SIngo Molnar * - normally initialized by setup_new_exec() 8485eca1c10SIngo Molnar * - access it with [gs]et_task_comm() 8495eca1c10SIngo Molnar * - lock it with task_lock() 8505eca1c10SIngo Molnar */ 8515eca1c10SIngo Molnar char comm[TASK_COMM_LEN]; 8525eca1c10SIngo Molnar 853756daf26SNeilBrown struct nameidata *nameidata; 8545eca1c10SIngo Molnar 8553d5b6fccSAlexey Dobriyan #ifdef CONFIG_SYSVIPC 8561da177e4SLinus Torvalds struct sysv_sem sysvsem; 857ab602f79SJack Miller struct sysv_shm sysvshm; 8583d5b6fccSAlexey Dobriyan #endif 859e162b39aSMandeep Singh Baines #ifdef CONFIG_DETECT_HUNG_TASK 86082a1fcb9SIngo Molnar unsigned long last_switch_count; 861a2e51445SDmitry Vyukov unsigned long last_switch_time; 86282a1fcb9SIngo Molnar #endif 8635eca1c10SIngo Molnar /* Filesystem information: */ 8641da177e4SLinus Torvalds struct fs_struct *fs; 8655eca1c10SIngo Molnar 8665eca1c10SIngo Molnar /* Open file information: */ 8671da177e4SLinus Torvalds struct files_struct *files; 8685eca1c10SIngo Molnar 8695eca1c10SIngo Molnar /* Namespaces: */ 870ab516013SSerge E. 
Hallyn struct nsproxy *nsproxy; 8715eca1c10SIngo Molnar 8725eca1c10SIngo Molnar /* Signal handlers: */ 8731da177e4SLinus Torvalds struct signal_struct *signal; 8741da177e4SLinus Torvalds struct sighand_struct *sighand; 8755eca1c10SIngo Molnar sigset_t blocked; 8765eca1c10SIngo Molnar sigset_t real_blocked; 8775eca1c10SIngo Molnar /* Restored if set_restore_sigmask() was used: */ 8785eca1c10SIngo Molnar sigset_t saved_sigmask; 8791da177e4SLinus Torvalds struct sigpending pending; 8801da177e4SLinus Torvalds unsigned long sas_ss_sp; 8811da177e4SLinus Torvalds size_t sas_ss_size; 8825eca1c10SIngo Molnar unsigned int sas_ss_flags; 8832e01fabeSOleg Nesterov 88467d12145SAl Viro struct callback_head *task_works; 885e73f8959SOleg Nesterov 8861da177e4SLinus Torvalds struct audit_context *audit_context; 887bfef93a5SAl Viro #ifdef CONFIG_AUDITSYSCALL 888e1760bd5SEric W. Biederman kuid_t loginuid; 8894746ec5bSEric Paris unsigned int sessionid; 890bfef93a5SAl Viro #endif 891932ecebbSWill Drewry struct seccomp seccomp; 8921da177e4SLinus Torvalds 8935eca1c10SIngo Molnar /* Thread group tracking: */ 8941da177e4SLinus Torvalds u32 parent_exec_id; 8951da177e4SLinus Torvalds u32 self_exec_id; 8965eca1c10SIngo Molnar 8975eca1c10SIngo Molnar /* Protection against (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed, mempolicy: */ 8981da177e4SLinus Torvalds spinlock_t alloc_lock; 8991da177e4SLinus Torvalds 900b29739f9SIngo Molnar /* Protection of the PI data structures: */ 9011d615482SThomas Gleixner raw_spinlock_t pi_lock; 902b29739f9SIngo Molnar 90376751049SPeter Zijlstra struct wake_q_node wake_q; 90476751049SPeter Zijlstra 90523f78d4aSIngo Molnar #ifdef CONFIG_RT_MUTEXES 9065eca1c10SIngo Molnar /* PI waiters blocked on a rt_mutex held by this task: */ 907a23ba907SDavidlohr Bueso struct rb_root_cached pi_waiters; 908e96a7705SXunlei Pang /* Updated under owner's pi_lock and rq lock */ 909e96a7705SXunlei Pang struct task_struct *pi_top_task; 9105eca1c10SIngo Molnar /* Deadlock 
detection and priority inheritance handling: */ 91123f78d4aSIngo Molnar struct rt_mutex_waiter *pi_blocked_on; 91223f78d4aSIngo Molnar #endif 91323f78d4aSIngo Molnar 914408894eeSIngo Molnar #ifdef CONFIG_DEBUG_MUTEXES 9155eca1c10SIngo Molnar /* Mutex deadlock detection: */ 916408894eeSIngo Molnar struct mutex_waiter *blocked_on; 917408894eeSIngo Molnar #endif 9185eca1c10SIngo Molnar 919de30a2b3SIngo Molnar #ifdef CONFIG_TRACE_IRQFLAGS 920de30a2b3SIngo Molnar unsigned int irq_events; 921de30a2b3SIngo Molnar unsigned long hardirq_enable_ip; 922de30a2b3SIngo Molnar unsigned long hardirq_disable_ip; 923fa1452e8SHiroshi Shimamoto unsigned int hardirq_enable_event; 924de30a2b3SIngo Molnar unsigned int hardirq_disable_event; 925fa1452e8SHiroshi Shimamoto int hardirqs_enabled; 926de30a2b3SIngo Molnar int hardirq_context; 927fa1452e8SHiroshi Shimamoto unsigned long softirq_disable_ip; 928fa1452e8SHiroshi Shimamoto unsigned long softirq_enable_ip; 929fa1452e8SHiroshi Shimamoto unsigned int softirq_disable_event; 930fa1452e8SHiroshi Shimamoto unsigned int softirq_enable_event; 931fa1452e8SHiroshi Shimamoto int softirqs_enabled; 932de30a2b3SIngo Molnar int softirq_context; 933de30a2b3SIngo Molnar #endif 9345eca1c10SIngo Molnar 935fbb9ce95SIngo Molnar #ifdef CONFIG_LOCKDEP 936bdb9441eSPeter Zijlstra # define MAX_LOCK_DEPTH 48UL 937fbb9ce95SIngo Molnar u64 curr_chain_key; 938fbb9ce95SIngo Molnar int lockdep_depth; 939fbb9ce95SIngo Molnar unsigned int lockdep_recursion; 940c7aceabaSRichard Kennedy struct held_lock held_locks[MAX_LOCK_DEPTH]; 941fbb9ce95SIngo Molnar #endif 9425eca1c10SIngo Molnar 943c6d30853SAndrey Ryabinin #ifdef CONFIG_UBSAN 944c6d30853SAndrey Ryabinin unsigned int in_ubsan; 945c6d30853SAndrey Ryabinin #endif 946408894eeSIngo Molnar 9475eca1c10SIngo Molnar /* Journalling filesystem info: */ 9481da177e4SLinus Torvalds void *journal_info; 9491da177e4SLinus Torvalds 9505eca1c10SIngo Molnar /* Stacked block device info: */ 951bddd87c7SAkinobu Mita struct bio_list 
*bio_list; 952d89d8796SNeil Brown 95373c10101SJens Axboe #ifdef CONFIG_BLOCK 9545eca1c10SIngo Molnar /* Stack plugging: */ 95573c10101SJens Axboe struct blk_plug *plug; 95673c10101SJens Axboe #endif 95773c10101SJens Axboe 9585eca1c10SIngo Molnar /* VM state: */ 9591da177e4SLinus Torvalds struct reclaim_state *reclaim_state; 9601da177e4SLinus Torvalds 9611da177e4SLinus Torvalds struct backing_dev_info *backing_dev_info; 9621da177e4SLinus Torvalds 9631da177e4SLinus Torvalds struct io_context *io_context; 9641da177e4SLinus Torvalds 9655eca1c10SIngo Molnar /* Ptrace state: */ 9661da177e4SLinus Torvalds unsigned long ptrace_message; 967ae7795bcSEric W. Biederman kernel_siginfo_t *last_siginfo; 9685eca1c10SIngo Molnar 9697c3ab738SAndrew Morton struct task_io_accounting ioac; 970eb414681SJohannes Weiner #ifdef CONFIG_PSI 971eb414681SJohannes Weiner /* Pressure stall state */ 972eb414681SJohannes Weiner unsigned int psi_flags; 973eb414681SJohannes Weiner #endif 9745eca1c10SIngo Molnar #ifdef CONFIG_TASK_XACCT 9755eca1c10SIngo Molnar /* Accumulated RSS usage: */ 9765eca1c10SIngo Molnar u64 acct_rss_mem1; 9775eca1c10SIngo Molnar /* Accumulated virtual memory usage: */ 9785eca1c10SIngo Molnar u64 acct_vm_mem1; 9795eca1c10SIngo Molnar /* stime + utime since last update: */ 9805eca1c10SIngo Molnar u64 acct_timexpd; 9811da177e4SLinus Torvalds #endif 9821da177e4SLinus Torvalds #ifdef CONFIG_CPUSETS 9835eca1c10SIngo Molnar /* Protected by ->alloc_lock: */ 9845eca1c10SIngo Molnar nodemask_t mems_allowed; 9855eca1c10SIngo Molnar /* Sequence number to catch updates: */ 9865eca1c10SIngo Molnar seqcount_t mems_allowed_seq; 987825a46afSPaul Jackson int cpuset_mem_spread_rotor; 9886adef3ebSJack Steiner int cpuset_slab_spread_rotor; 9891da177e4SLinus Torvalds #endif 990ddbcc7e8SPaul Menage #ifdef CONFIG_CGROUPS 9915eca1c10SIngo Molnar /* Control Group info protected by css_set_lock: */ 9922c392b8cSArnd Bergmann struct css_set __rcu *cgroups; 9935eca1c10SIngo Molnar /* cg_list protected by 
css_set_lock and tsk->alloc_lock: */ 994817929ecSPaul Menage struct list_head cg_list; 995ddbcc7e8SPaul Menage #endif 996f01d7d51SVikas Shivappa #ifdef CONFIG_INTEL_RDT 9970734ded1SVikas Shivappa u32 closid; 998d6aaba61SVikas Shivappa u32 rmid; 999e02737d5SFenghua Yu #endif 100042b2dd0aSAlexey Dobriyan #ifdef CONFIG_FUTEX 10010771dfefSIngo Molnar struct robust_list_head __user *robust_list; 100234f192c6SIngo Molnar #ifdef CONFIG_COMPAT 100334f192c6SIngo Molnar struct compat_robust_list_head __user *compat_robust_list; 100434f192c6SIngo Molnar #endif 1005c87e2837SIngo Molnar struct list_head pi_state_list; 1006c87e2837SIngo Molnar struct futex_pi_state *pi_state_cache; 100742b2dd0aSAlexey Dobriyan #endif 1008cdd6c482SIngo Molnar #ifdef CONFIG_PERF_EVENTS 10098dc85d54SPeter Zijlstra struct perf_event_context *perf_event_ctxp[perf_nr_task_contexts]; 1010cdd6c482SIngo Molnar struct mutex perf_event_mutex; 1011cdd6c482SIngo Molnar struct list_head perf_event_list; 1012a63eaf34SPaul Mackerras #endif 10138f47b187SThomas Gleixner #ifdef CONFIG_DEBUG_PREEMPT 10148f47b187SThomas Gleixner unsigned long preempt_disable_ip; 10158f47b187SThomas Gleixner #endif 1016c7aceabaSRichard Kennedy #ifdef CONFIG_NUMA 10175eca1c10SIngo Molnar /* Protected by alloc_lock: */ 10185eca1c10SIngo Molnar struct mempolicy *mempolicy; 101945816682SVlastimil Babka short il_prev; 1020207205a2SEric Dumazet short pref_node_fork; 1021c7aceabaSRichard Kennedy #endif 1022cbee9f88SPeter Zijlstra #ifdef CONFIG_NUMA_BALANCING 1023cbee9f88SPeter Zijlstra int numa_scan_seq; 1024cbee9f88SPeter Zijlstra unsigned int numa_scan_period; 1025598f0ec0SMel Gorman unsigned int numa_scan_period_max; 1026de1c9ce6SRik van Riel int numa_preferred_nid; 10276b9a7460SMel Gorman unsigned long numa_migrate_retry; 10285eca1c10SIngo Molnar /* Migration stamp: */ 10295eca1c10SIngo Molnar u64 node_stamp; 10307e2703e6SRik van Riel u64 last_task_numa_placement; 10317e2703e6SRik van Riel u64 last_sum_exec_runtime; 1032cbee9f88SPeter 
Zijlstra struct callback_head numa_work; 1033f809ca9aSMel Gorman 10348c8a743cSPeter Zijlstra struct numa_group *numa_group; 10358c8a743cSPeter Zijlstra 1036745d6147SMel Gorman /* 103744dba3d5SIulia Manda * numa_faults is an array split into four regions: 103844dba3d5SIulia Manda * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer 103944dba3d5SIulia Manda * in this precise order. 104044dba3d5SIulia Manda * 104144dba3d5SIulia Manda * faults_memory: Exponential decaying average of faults on a per-node 104244dba3d5SIulia Manda * basis. Scheduling placement decisions are made based on these 104344dba3d5SIulia Manda * counts. The values remain static for the duration of a PTE scan. 104444dba3d5SIulia Manda * faults_cpu: Track the nodes the process was running on when a NUMA 104544dba3d5SIulia Manda * hinting fault was incurred. 104644dba3d5SIulia Manda * faults_memory_buffer and faults_cpu_buffer: Record faults per node 104744dba3d5SIulia Manda * during the current scan window. When the scan completes, the counts 104844dba3d5SIulia Manda * in faults_memory and faults_cpu decay and these values are copied. 1049745d6147SMel Gorman */ 105044dba3d5SIulia Manda unsigned long *numa_faults; 105183e1d2cdSMel Gorman unsigned long total_numa_faults; 1052745d6147SMel Gorman 1053745d6147SMel Gorman /* 105404bb2f94SRik van Riel * numa_faults_locality tracks if faults recorded during the last 1055074c2381SMel Gorman * scan window were remote/local or failed to migrate. 
The task scan 1056074c2381SMel Gorman * period is adapted based on the locality of the faults with different 1057074c2381SMel Gorman * weights depending on whether they were shared or private faults 105804bb2f94SRik van Riel */ 1059074c2381SMel Gorman unsigned long numa_faults_locality[3]; 106004bb2f94SRik van Riel 1061b32e86b4SIngo Molnar unsigned long numa_pages_migrated; 1062cbee9f88SPeter Zijlstra #endif /* CONFIG_NUMA_BALANCING */ 1063cbee9f88SPeter Zijlstra 1064d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ 1065d7822b1eSMathieu Desnoyers struct rseq __user *rseq; 1066d7822b1eSMathieu Desnoyers u32 rseq_len; 1067d7822b1eSMathieu Desnoyers u32 rseq_sig; 1068d7822b1eSMathieu Desnoyers /* 1069d7822b1eSMathieu Desnoyers * RmW on rseq_event_mask must be performed atomically 1070d7822b1eSMathieu Desnoyers * with respect to preemption. 1071d7822b1eSMathieu Desnoyers */ 1072d7822b1eSMathieu Desnoyers unsigned long rseq_event_mask; 1073d7822b1eSMathieu Desnoyers #endif 1074d7822b1eSMathieu Desnoyers 107572b252aeSMel Gorman struct tlbflush_unmap_batch tlb_ubc; 107672b252aeSMel Gorman 1077e56d0903SIngo Molnar struct rcu_head rcu; 1078b92ce558SJens Axboe 10795eca1c10SIngo Molnar /* Cache last used pipe for splice(): */ 1080b92ce558SJens Axboe struct pipe_inode_info *splice_pipe; 10815640f768SEric Dumazet 10825640f768SEric Dumazet struct page_frag task_frag; 10835640f768SEric Dumazet 1084ca74e92bSShailabh Nagar #ifdef CONFIG_TASK_DELAY_ACCT 1085ca74e92bSShailabh Nagar struct task_delay_info *delays; 1086ca74e92bSShailabh Nagar #endif 108747913d4eSIngo Molnar 1088f4f154fdSAkinobu Mita #ifdef CONFIG_FAULT_INJECTION 1089f4f154fdSAkinobu Mita int make_it_fail; 10909049f2f6SAkinobu Mita unsigned int fail_nth; 1091f4f154fdSAkinobu Mita #endif 10929d823e8fSWu Fengguang /* 10935eca1c10SIngo Molnar * When (nr_dirtied >= nr_dirtied_pause), it's time to call 10945eca1c10SIngo Molnar * balance_dirty_pages() for a dirty throttling pause: 10959d823e8fSWu Fengguang */ 10969d823e8fSWu 
Fengguang int nr_dirtied; 10979d823e8fSWu Fengguang int nr_dirtied_pause; 10985eca1c10SIngo Molnar /* Start of a write-and-pause period: */ 10995eca1c10SIngo Molnar unsigned long dirty_paused_when; 11009d823e8fSWu Fengguang 11019745512cSArjan van de Ven #ifdef CONFIG_LATENCYTOP 11029745512cSArjan van de Ven int latency_record_count; 11039745512cSArjan van de Ven struct latency_record latency_record[LT_SAVECOUNT]; 11049745512cSArjan van de Ven #endif 11056976675dSArjan van de Ven /* 11065eca1c10SIngo Molnar * Time slack values; these are used to round up poll() and 11076976675dSArjan van de Ven * select() etc timeout values. These are in nanoseconds. 11086976675dSArjan van de Ven */ 1109da8b44d5SJohn Stultz u64 timer_slack_ns; 1110da8b44d5SJohn Stultz u64 default_timer_slack_ns; 1111f8d570a4SDavid Miller 11120b24beccSAndrey Ryabinin #ifdef CONFIG_KASAN 11130b24beccSAndrey Ryabinin unsigned int kasan_depth; 11140b24beccSAndrey Ryabinin #endif 11155eca1c10SIngo Molnar 1116fb52607aSFrederic Weisbecker #ifdef CONFIG_FUNCTION_GRAPH_TRACER 11175eca1c10SIngo Molnar /* Index of current stored address in ret_stack: */ 1118f201ae23SFrederic Weisbecker int curr_ret_stack; 11195eca1c10SIngo Molnar 11205eca1c10SIngo Molnar /* Stack of return addresses for return function tracing: */ 1121f201ae23SFrederic Weisbecker struct ftrace_ret_stack *ret_stack; 11225eca1c10SIngo Molnar 11235eca1c10SIngo Molnar /* Timestamp for last schedule: */ 11248aef2d28SSteven Rostedt unsigned long long ftrace_timestamp; 11255eca1c10SIngo Molnar 1126f201ae23SFrederic Weisbecker /* 1127f201ae23SFrederic Weisbecker * Number of functions that haven't been traced 11285eca1c10SIngo Molnar * because of depth overrun: 1129f201ae23SFrederic Weisbecker */ 1130f201ae23SFrederic Weisbecker atomic_t trace_overrun; 11315eca1c10SIngo Molnar 11325eca1c10SIngo Molnar /* Pause tracing: */ 1133380c4b14SFrederic Weisbecker atomic_t tracing_graph_pause; 1134f201ae23SFrederic Weisbecker #endif 11355eca1c10SIngo Molnar 
1136ea4e2bc4SSteven Rostedt #ifdef CONFIG_TRACING 11375eca1c10SIngo Molnar /* State flags for use by tracers: */ 1138ea4e2bc4SSteven Rostedt unsigned long trace; 11395eca1c10SIngo Molnar 11405eca1c10SIngo Molnar /* Bitmask and counter of trace recursion: */ 1141261842b7SSteven Rostedt unsigned long trace_recursion; 1142261842b7SSteven Rostedt #endif /* CONFIG_TRACING */ 11435eca1c10SIngo Molnar 11445c9a8750SDmitry Vyukov #ifdef CONFIG_KCOV 11455eca1c10SIngo Molnar /* Coverage collection mode enabled for this task (0 if disabled): */ 11460ed557aaSMark Rutland unsigned int kcov_mode; 11475eca1c10SIngo Molnar 11485eca1c10SIngo Molnar /* Size of the kcov_area: */ 11495eca1c10SIngo Molnar unsigned int kcov_size; 11505eca1c10SIngo Molnar 11515eca1c10SIngo Molnar /* Buffer for coverage collection: */ 11525c9a8750SDmitry Vyukov void *kcov_area; 11535eca1c10SIngo Molnar 11545eca1c10SIngo Molnar /* KCOV descriptor wired with this task or NULL: */ 11555c9a8750SDmitry Vyukov struct kcov *kcov; 11565c9a8750SDmitry Vyukov #endif 11575eca1c10SIngo Molnar 11586f185c29SVladimir Davydov #ifdef CONFIG_MEMCG 1159626ebc41STejun Heo struct mem_cgroup *memcg_in_oom; 1160626ebc41STejun Heo gfp_t memcg_oom_gfp_mask; 1161626ebc41STejun Heo int memcg_oom_order; 1162b23afb93STejun Heo 11635eca1c10SIngo Molnar /* Number of pages to reclaim on returning to userland: */ 1164b23afb93STejun Heo unsigned int memcg_nr_pages_over_high; 1165d46eb14bSShakeel Butt 1166d46eb14bSShakeel Butt /* Used by memcontrol for targeted memcg charge: */ 1167d46eb14bSShakeel Butt struct mem_cgroup *active_memcg; 1168569b846dSKAMEZAWA Hiroyuki #endif 11695eca1c10SIngo Molnar 1170d09d8df3SJosef Bacik #ifdef CONFIG_BLK_CGROUP 1171d09d8df3SJosef Bacik struct request_queue *throttle_queue; 1172d09d8df3SJosef Bacik #endif 1173d09d8df3SJosef Bacik 11740326f5a9SSrikar Dronamraju #ifdef CONFIG_UPROBES 11750326f5a9SSrikar Dronamraju struct uprobe_task *utask; 11760326f5a9SSrikar Dronamraju #endif 1177cafe5635SKent Overstreet 
#if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE) 1178cafe5635SKent Overstreet unsigned int sequential_io; 1179cafe5635SKent Overstreet unsigned int sequential_io_avg; 1180cafe5635SKent Overstreet #endif 11818eb23b9fSPeter Zijlstra #ifdef CONFIG_DEBUG_ATOMIC_SLEEP 11828eb23b9fSPeter Zijlstra unsigned long task_state_change; 11838eb23b9fSPeter Zijlstra #endif 11848bcbde54SDavid Hildenbrand int pagefault_disabled; 118503049269SMichal Hocko #ifdef CONFIG_MMU 118629c696e1SVladimir Davydov struct task_struct *oom_reaper_list; 118703049269SMichal Hocko #endif 1188ba14a194SAndy Lutomirski #ifdef CONFIG_VMAP_STACK 1189ba14a194SAndy Lutomirski struct vm_struct *stack_vm_area; 1190ba14a194SAndy Lutomirski #endif 119168f24b08SAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 11925eca1c10SIngo Molnar /* A live task holds one reference: */ 119368f24b08SAndy Lutomirski atomic_t stack_refcount; 119468f24b08SAndy Lutomirski #endif 1195d83a7cb3SJosh Poimboeuf #ifdef CONFIG_LIVEPATCH 1196d83a7cb3SJosh Poimboeuf int patch_state; 1197d83a7cb3SJosh Poimboeuf #endif 1198e4e55b47STetsuo Handa #ifdef CONFIG_SECURITY 1199e4e55b47STetsuo Handa /* Used by LSM modules for access restriction: */ 1200e4e55b47STetsuo Handa void *security; 1201e4e55b47STetsuo Handa #endif 120229e48ce8SKees Cook 1203afaef01cSAlexander Popov #ifdef CONFIG_GCC_PLUGIN_STACKLEAK 1204afaef01cSAlexander Popov unsigned long lowest_stack; 1205c8d12627SAlexander Popov unsigned long prev_lowest_stack; 1206afaef01cSAlexander Popov #endif 1207afaef01cSAlexander Popov 120829e48ce8SKees Cook /* 120929e48ce8SKees Cook * New fields for task_struct should be added above here, so that 121029e48ce8SKees Cook * they are included in the randomized portion of task_struct. 
121129e48ce8SKees Cook */ 121229e48ce8SKees Cook randomized_struct_fields_end 121329e48ce8SKees Cook 12145eca1c10SIngo Molnar /* CPU-specific state of this task: */ 12150c8c0f03SDave Hansen struct thread_struct thread; 12165eca1c10SIngo Molnar 12170c8c0f03SDave Hansen /* 12180c8c0f03SDave Hansen * WARNING: on x86, 'thread_struct' contains a variable-sized 12190c8c0f03SDave Hansen * structure. It *MUST* be at the end of 'task_struct'. 12200c8c0f03SDave Hansen * 12210c8c0f03SDave Hansen * Do not put anything below here! 12220c8c0f03SDave Hansen */ 12231da177e4SLinus Torvalds }; 12241da177e4SLinus Torvalds 1225e868171aSAlexey Dobriyan /* Return task->thread_pid unchanged; nothing is locked or reference-counted here. */ static inline struct pid *task_pid(struct task_struct *task) 122622c935f4SEric W. Biederman { 12272c470475SEric W. Biederman return task->thread_pid; 122822c935f4SEric W. Biederman } 122922c935f4SEric W. Biederman 12307af57294SPavel Emelyanov /* 12317af57294SPavel Emelyanov * the helpers to get the task's different pids as they are seen 12327af57294SPavel Emelyanov * from various namespaces 12337af57294SPavel Emelyanov * 12347af57294SPavel Emelyanov * task_xid_nr() : global id, i.e. the id seen from the init namespace; 123544c4e1b2SEric W. Biederman * task_xid_vnr() : virtual id, i.e. the id seen from the pid namespace of 123644c4e1b2SEric W. Biederman * current. 
12377af57294SPavel Emelyanov * task_xid_nr_ns() : id seen from the ns specified; 12387af57294SPavel Emelyanov * 12397af57294SPavel Emelyanov * see also pid_nr() etc in include/linux/pid.h 12407af57294SPavel Emelyanov */ 12415eca1c10SIngo Molnar pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type, struct pid_namespace *ns); 12427af57294SPavel Emelyanov 1243e868171aSAlexey Dobriyan static inline pid_t task_pid_nr(struct task_struct *tsk) 12447af57294SPavel Emelyanov { 12457af57294SPavel Emelyanov return tsk->pid; 12467af57294SPavel Emelyanov } 12477af57294SPavel Emelyanov 12485eca1c10SIngo Molnar static inline pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 124952ee2dfdSOleg Nesterov { 125052ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns); 125152ee2dfdSOleg Nesterov } 12527af57294SPavel Emelyanov 12537af57294SPavel Emelyanov static inline pid_t task_pid_vnr(struct task_struct *tsk) 12547af57294SPavel Emelyanov { 125552ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL); 12567af57294SPavel Emelyanov } 12577af57294SPavel Emelyanov 12587af57294SPavel Emelyanov 1259e868171aSAlexey Dobriyan static inline pid_t task_tgid_nr(struct task_struct *tsk) 12607af57294SPavel Emelyanov { 12617af57294SPavel Emelyanov return tsk->tgid; 12627af57294SPavel Emelyanov } 12637af57294SPavel Emelyanov 12645eca1c10SIngo Molnar /** 12655eca1c10SIngo Molnar * pid_alive - check that a task structure is not stale 12665eca1c10SIngo Molnar * @p: Task structure to be checked. 12675eca1c10SIngo Molnar * 12685eca1c10SIngo Molnar * Test if a process is not yet dead (at most zombie state) 12695eca1c10SIngo Molnar * If pid_alive fails, then pointers within the task structure 12705eca1c10SIngo Molnar * can be stale and must not be dereferenced. 12715eca1c10SIngo Molnar * 12725eca1c10SIngo Molnar * Return: 1 if the process is alive. 0 otherwise. 
12735eca1c10SIngo Molnar */ 12745eca1c10SIngo Molnar static inline int pid_alive(const struct task_struct *p) 12755eca1c10SIngo Molnar { 12762c470475SEric W. Biederman return p->thread_pid != NULL; 12775eca1c10SIngo Molnar } 12787af57294SPavel Emelyanov 12795eca1c10SIngo Molnar static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 12807af57294SPavel Emelyanov { 128152ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns); 12827af57294SPavel Emelyanov } 12837af57294SPavel Emelyanov 12847af57294SPavel Emelyanov static inline pid_t task_pgrp_vnr(struct task_struct *tsk) 12857af57294SPavel Emelyanov { 128652ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL); 12877af57294SPavel Emelyanov } 12887af57294SPavel Emelyanov 12897af57294SPavel Emelyanov 12905eca1c10SIngo Molnar static inline pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 12917af57294SPavel Emelyanov { 129252ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns); 12937af57294SPavel Emelyanov } 12947af57294SPavel Emelyanov 12957af57294SPavel Emelyanov static inline pid_t task_session_vnr(struct task_struct *tsk) 12967af57294SPavel Emelyanov { 129752ee2dfdSOleg Nesterov return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL); 12987af57294SPavel Emelyanov } 12997af57294SPavel Emelyanov 1300dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns) 1301dd1c1f2fSOleg Nesterov { 13026883f81aSEric W. Biederman return __task_pid_nr_ns(tsk, PIDTYPE_TGID, ns); 1303dd1c1f2fSOleg Nesterov } 1304dd1c1f2fSOleg Nesterov 1305dd1c1f2fSOleg Nesterov static inline pid_t task_tgid_vnr(struct task_struct *tsk) 1306dd1c1f2fSOleg Nesterov { 13076883f81aSEric W. 
Biederman return __task_pid_nr_ns(tsk, PIDTYPE_TGID, NULL); 1308dd1c1f2fSOleg Nesterov } 1309dd1c1f2fSOleg Nesterov 1310dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns) 1311dd1c1f2fSOleg Nesterov { 1312dd1c1f2fSOleg Nesterov pid_t pid = 0; 1313dd1c1f2fSOleg Nesterov 1314dd1c1f2fSOleg Nesterov rcu_read_lock(); 1315dd1c1f2fSOleg Nesterov if (pid_alive(tsk)) 1316dd1c1f2fSOleg Nesterov pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns); 1317dd1c1f2fSOleg Nesterov rcu_read_unlock(); 1318dd1c1f2fSOleg Nesterov 1319dd1c1f2fSOleg Nesterov return pid; 1320dd1c1f2fSOleg Nesterov } 1321dd1c1f2fSOleg Nesterov 1322dd1c1f2fSOleg Nesterov static inline pid_t task_ppid_nr(const struct task_struct *tsk) 1323dd1c1f2fSOleg Nesterov { 1324dd1c1f2fSOleg Nesterov return task_ppid_nr_ns(tsk, &init_pid_ns); 1325dd1c1f2fSOleg Nesterov } 1326dd1c1f2fSOleg Nesterov 13275eca1c10SIngo Molnar /* Obsolete, do not use: */ 13281b0f7ffdSOleg Nesterov static inline pid_t task_pgrp_nr(struct task_struct *tsk) 13291b0f7ffdSOleg Nesterov { 13301b0f7ffdSOleg Nesterov return task_pgrp_nr_ns(tsk, &init_pid_ns); 13311b0f7ffdSOleg Nesterov } 13327af57294SPavel Emelyanov 133306eb6184SPeter Zijlstra #define TASK_REPORT_IDLE (TASK_REPORT + 1) 133406eb6184SPeter Zijlstra #define TASK_REPORT_MAX (TASK_REPORT_IDLE << 1) 133506eb6184SPeter Zijlstra 13361d48b080SPeter Zijlstra static inline unsigned int task_state_index(struct task_struct *tsk) 133720435d84SXie XiuQi { 13381593baabSPeter Zijlstra unsigned int tsk_state = READ_ONCE(tsk->state); 13391593baabSPeter Zijlstra unsigned int state = (tsk_state | tsk->exit_state) & TASK_REPORT; 134020435d84SXie XiuQi 134106eb6184SPeter Zijlstra BUILD_BUG_ON_NOT_POWER_OF_2(TASK_REPORT_MAX); 134206eb6184SPeter Zijlstra 134306eb6184SPeter Zijlstra if (tsk_state == TASK_IDLE) 134406eb6184SPeter Zijlstra state = TASK_REPORT_IDLE; 134506eb6184SPeter Zijlstra 13461593baabSPeter Zijlstra return fls(state); 
13471593baabSPeter Zijlstra } 134820435d84SXie XiuQi 13491d48b080SPeter Zijlstra static inline char task_index_to_char(unsigned int state) 13501593baabSPeter Zijlstra { 13518ef9925bSPeter Zijlstra static const char state_char[] = "RSDTtXZPI"; 13521593baabSPeter Zijlstra 135306eb6184SPeter Zijlstra BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != sizeof(state_char) - 1); 13541593baabSPeter Zijlstra 13551593baabSPeter Zijlstra return state_char[state]; 13561593baabSPeter Zijlstra } 13571593baabSPeter Zijlstra 13581593baabSPeter Zijlstra static inline char task_state_to_char(struct task_struct *tsk) 13591593baabSPeter Zijlstra { 13601d48b080SPeter Zijlstra return task_index_to_char(task_state_index(tsk)); 136120435d84SXie XiuQi } 136220435d84SXie XiuQi 13631da177e4SLinus Torvalds /** 1364570f5241SSergey Senozhatsky * is_global_init - check if a task structure is init. Since init 1365570f5241SSergey Senozhatsky * is free to have sub-threads we need to check tgid. 13663260259fSHenne * @tsk: Task structure to be checked. 13673260259fSHenne * 13683260259fSHenne * Check if a task structure is the first user space task the kernel created. 1369e69f6186SYacine Belkadi * 1370e69f6186SYacine Belkadi * Return: 1 if the task structure is init. 0 otherwise. 1371f400e198SSukadev Bhattiprolu */ 1372e868171aSAlexey Dobriyan static inline int is_global_init(struct task_struct *tsk) 1373b461cc03SPavel Emelyanov { 1374570f5241SSergey Senozhatsky return task_tgid_nr(tsk) == 1; 1375b461cc03SPavel Emelyanov } 1376b460cbc5SSerge E. 
Hallyn 13779ec52099SCedric Le Goater extern struct pid *cad_pid; 13789ec52099SCedric Le Goater 13791da177e4SLinus Torvalds /* 13801da177e4SLinus Torvalds * Per process flags 13811da177e4SLinus Torvalds */ 1382c1de45caSPeter Zijlstra #define PF_IDLE 0x00000002 /* I am an IDLE thread */ 13835eca1c10SIngo Molnar #define PF_EXITING 0x00000004 /* Getting shut down */ 13845eca1c10SIngo Molnar #define PF_EXITPIDONE 0x00000008 /* PI exit done on shut down */ 138594886b84SLaurent Vivier #define PF_VCPU 0x00000010 /* I'm a virtual CPU */ 138621aa9af0STejun Heo #define PF_WQ_WORKER 0x00000020 /* I'm a workqueue worker */ 13875eca1c10SIngo Molnar #define PF_FORKNOEXEC 0x00000040 /* Forked but didn't exec */ 13885eca1c10SIngo Molnar #define PF_MCE_PROCESS 0x00000080 /* Process policy on mce errors */ 13895eca1c10SIngo Molnar #define PF_SUPERPRIV 0x00000100 /* Used super-user privileges */ 13905eca1c10SIngo Molnar #define PF_DUMPCORE 0x00000200 /* Dumped core */ 13915eca1c10SIngo Molnar #define PF_SIGNALED 0x00000400 /* Killed by a signal */ 13921da177e4SLinus Torvalds #define PF_MEMALLOC 0x00000800 /* Allocating memory */ 13935eca1c10SIngo Molnar #define PF_NPROC_EXCEEDED 0x00001000 /* set_user() noticed that RLIMIT_NPROC was exceeded */ 13945eca1c10SIngo Molnar #define PF_USED_MATH 0x00002000 /* If unset the fpu must be initialized before use */ 13955eca1c10SIngo Molnar #define PF_USED_ASYNC 0x00004000 /* Used async_schedule*(), used by module init */ 13965eca1c10SIngo Molnar #define PF_NOFREEZE 0x00008000 /* This thread should not be frozen */ 13975eca1c10SIngo Molnar #define PF_FROZEN 0x00010000 /* Frozen for system suspend */ 13987dea19f9SMichal Hocko #define PF_KSWAPD 0x00020000 /* I am kswapd */ 13997dea19f9SMichal Hocko #define PF_MEMALLOC_NOFS 0x00040000 /* All allocation requests will inherit GFP_NOFS */ 14007dea19f9SMichal Hocko #define PF_MEMALLOC_NOIO 0x00080000 /* All allocation requests will inherit GFP_NOIO */ 14011da177e4SLinus Torvalds #define PF_LESS_THROTTLE 
0x00100000 /* Throttle me less: I clean memory */ 1402246bb0b1SOleg Nesterov #define PF_KTHREAD 0x00200000 /* I am a kernel thread */ 14035eca1c10SIngo Molnar #define PF_RANDOMIZE 0x00400000 /* Randomize virtual address space */ 1404b31dc66aSJens Axboe #define PF_SWAPWRITE 0x00800000 /* Allowed to write to swap */ 1405eb414681SJohannes Weiner #define PF_MEMSTALL 0x01000000 /* Stalled due to lack of memory */ 140614a40ffcSTejun Heo #define PF_NO_SETAFFINITY 0x04000000 /* Userland is not allowed to meddle with cpus_allowed */ 14074db96cf0SAndi Kleen #define PF_MCE_EARLY 0x08000000 /* Early kill for mce process policy */ 140861a87122SThomas Gleixner #define PF_MUTEX_TESTER 0x20000000 /* Thread belongs to the rt mutex tester */ 140958a69cb4STejun Heo #define PF_FREEZER_SKIP 0x40000000 /* Freezer should not count it as freezable */ 14105eca1c10SIngo Molnar #define PF_SUSPEND_TASK 0x80000000 /* This thread called freeze_processes() and should not be frozen */ 14111da177e4SLinus Torvalds 14121da177e4SLinus Torvalds /* 14131da177e4SLinus Torvalds * Only the _current_ task can read/write to tsk->flags, but other 14141da177e4SLinus Torvalds * tasks can access tsk->flags in readonly mode for example 14151da177e4SLinus Torvalds * with tsk_used_math (like during threaded core dumping). 14161da177e4SLinus Torvalds * There is however an exception to this rule during ptrace 14171da177e4SLinus Torvalds * or during fork: the ptracer task is allowed to write to the 14181da177e4SLinus Torvalds * child->flags of its traced child (same goes for fork, the parent 14191da177e4SLinus Torvalds * can write to the child->flags), because we're guaranteed the 14201da177e4SLinus Torvalds * child is not running and in turn not changing child->flags 14211da177e4SLinus Torvalds * at the same time the parent does it. 
14221da177e4SLinus Torvalds */ 14231da177e4SLinus Torvalds #define clear_stopped_child_used_math(child) do { (child)->flags &= ~PF_USED_MATH; } while (0) 14241da177e4SLinus Torvalds #define set_stopped_child_used_math(child) do { (child)->flags |= PF_USED_MATH; } while (0) 14251da177e4SLinus Torvalds #define clear_used_math() clear_stopped_child_used_math(current) 14261da177e4SLinus Torvalds #define set_used_math() set_stopped_child_used_math(current) 14275eca1c10SIngo Molnar 14281da177e4SLinus Torvalds #define conditional_stopped_child_used_math(condition, child) \ 14291da177e4SLinus Torvalds do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= (condition) ? PF_USED_MATH : 0; } while (0) 14305eca1c10SIngo Molnar 14315eca1c10SIngo Molnar #define conditional_used_math(condition) conditional_stopped_child_used_math(condition, current) 14325eca1c10SIngo Molnar 14331da177e4SLinus Torvalds #define copy_to_stopped_child_used_math(child) \ 14341da177e4SLinus Torvalds do { (child)->flags &= ~PF_USED_MATH, (child)->flags |= current->flags & PF_USED_MATH; } while (0) 14355eca1c10SIngo Molnar 14361da177e4SLinus Torvalds /* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */ 14371da177e4SLinus Torvalds #define tsk_used_math(p) ((p)->flags & PF_USED_MATH) 14381da177e4SLinus Torvalds #define used_math() tsk_used_math(current) 14391da177e4SLinus Torvalds 144062ec05ddSThomas Gleixner static inline bool is_percpu_thread(void) 144162ec05ddSThomas Gleixner { 144262ec05ddSThomas Gleixner #ifdef CONFIG_SMP 144362ec05ddSThomas Gleixner return (current->flags & PF_NO_SETAFFINITY) && 144462ec05ddSThomas Gleixner (current->nr_cpus_allowed == 1); 144562ec05ddSThomas Gleixner #else 144662ec05ddSThomas Gleixner return true; 144762ec05ddSThomas Gleixner #endif 144862ec05ddSThomas Gleixner } 144962ec05ddSThomas Gleixner 14501d4457f9SKees Cook /* Per-process atomic flags. */ 1451a2b86f77SZefan Li #define PFA_NO_NEW_PRIVS 0 /* May not gain new privileges. 
*/ 14522ad654bcSZefan Li #define PFA_SPREAD_PAGE 1 /* Spread page cache over cpuset */ 14532ad654bcSZefan Li #define PFA_SPREAD_SLAB 2 /* Spread some slab caches over cpuset */ 1454356e4bffSThomas Gleixner #define PFA_SPEC_SSB_DISABLE 3 /* Speculative Store Bypass disabled */ 1455356e4bffSThomas Gleixner #define PFA_SPEC_SSB_FORCE_DISABLE 4 /* Speculative Store Bypass force disabled*/ 1456*9137bb27SThomas Gleixner #define PFA_SPEC_IB_DISABLE 5 /* Indirect branch speculation restricted */ 1457*9137bb27SThomas Gleixner #define PFA_SPEC_IB_FORCE_DISABLE 6 /* Indirect branch speculation permanently restricted */ 14581d4457f9SKees Cook 1459e0e5070bSZefan Li #define TASK_PFA_TEST(name, func) \ 1460e0e5070bSZefan Li static inline bool task_##func(struct task_struct *p) \ 1461e0e5070bSZefan Li { return test_bit(PFA_##name, &p->atomic_flags); } 14625eca1c10SIngo Molnar 1463e0e5070bSZefan Li #define TASK_PFA_SET(name, func) \ 1464e0e5070bSZefan Li static inline void task_set_##func(struct task_struct *p) \ 1465e0e5070bSZefan Li { set_bit(PFA_##name, &p->atomic_flags); } 14665eca1c10SIngo Molnar 1467e0e5070bSZefan Li #define TASK_PFA_CLEAR(name, func) \ 1468e0e5070bSZefan Li static inline void task_clear_##func(struct task_struct *p) \ 1469e0e5070bSZefan Li { clear_bit(PFA_##name, &p->atomic_flags); } 14701d4457f9SKees Cook 1471e0e5070bSZefan Li TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs) 1472e0e5070bSZefan Li TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs) 14731d4457f9SKees Cook 14742ad654bcSZefan Li TASK_PFA_TEST(SPREAD_PAGE, spread_page) 14752ad654bcSZefan Li TASK_PFA_SET(SPREAD_PAGE, spread_page) 14762ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_PAGE, spread_page) 14772ad654bcSZefan Li 14782ad654bcSZefan Li TASK_PFA_TEST(SPREAD_SLAB, spread_slab) 14792ad654bcSZefan Li TASK_PFA_SET(SPREAD_SLAB, spread_slab) 14802ad654bcSZefan Li TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab) 1481544b2c91STejun Heo 1482356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_DISABLE, spec_ssb_disable) 
1483356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_DISABLE, spec_ssb_disable) 1484356e4bffSThomas Gleixner TASK_PFA_CLEAR(SPEC_SSB_DISABLE, spec_ssb_disable) 1485356e4bffSThomas Gleixner 1486356e4bffSThomas Gleixner TASK_PFA_TEST(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable) 1487356e4bffSThomas Gleixner TASK_PFA_SET(SPEC_SSB_FORCE_DISABLE, spec_ssb_force_disable) 1488356e4bffSThomas Gleixner 1489*9137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_DISABLE, spec_ib_disable) 1490*9137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_DISABLE, spec_ib_disable) 1491*9137bb27SThomas Gleixner TASK_PFA_CLEAR(SPEC_IB_DISABLE, spec_ib_disable) 1492*9137bb27SThomas Gleixner 1493*9137bb27SThomas Gleixner TASK_PFA_TEST(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable) 1494*9137bb27SThomas Gleixner TASK_PFA_SET(SPEC_IB_FORCE_DISABLE, spec_ib_force_disable) 1495*9137bb27SThomas Gleixner 14965eca1c10SIngo Molnar static inline void 1497717a94b5SNeilBrown current_restore_flags(unsigned long orig_flags, unsigned long flags) 1498907aed48SMel Gorman { 1499717a94b5SNeilBrown current->flags &= ~flags; 1500717a94b5SNeilBrown current->flags |= orig_flags & flags; 1501907aed48SMel Gorman } 1502907aed48SMel Gorman 15035eca1c10SIngo Molnar extern int cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial); 15045eca1c10SIngo Molnar extern int task_can_attach(struct task_struct *p, const struct cpumask *cs_cpus_allowed); 15051da177e4SLinus Torvalds #ifdef CONFIG_SMP 15065eca1c10SIngo Molnar extern void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask); 15075eca1c10SIngo Molnar extern int set_cpus_allowed_ptr(struct task_struct *p, const struct cpumask *new_mask); 15081da177e4SLinus Torvalds #else 15095eca1c10SIngo Molnar static inline void do_set_cpus_allowed(struct task_struct *p, const struct cpumask *new_mask) 15101e1b6c51SKOSAKI Motohiro { 15111e1b6c51SKOSAKI Motohiro } 15125eca1c10SIngo Molnar static inline int set_cpus_allowed_ptr(struct task_struct *p, 
const struct cpumask *new_mask) 15131da177e4SLinus Torvalds { 151496f874e2SRusty Russell if (!cpumask_test_cpu(0, new_mask)) 15151da177e4SLinus Torvalds return -EINVAL; 15161da177e4SLinus Torvalds return 0; 15171da177e4SLinus Torvalds } 15181da177e4SLinus Torvalds #endif 1519e0ad9556SRusty Russell 15206d0d2878SChristian Borntraeger #ifndef cpu_relax_yield 15216d0d2878SChristian Borntraeger #define cpu_relax_yield() cpu_relax() 15226d0d2878SChristian Borntraeger #endif 15236d0d2878SChristian Borntraeger 1524fa93384fSDan Carpenter extern int yield_to(struct task_struct *p, bool preempt); 152536c8b586SIngo Molnar extern void set_user_nice(struct task_struct *p, long nice); 152636c8b586SIngo Molnar extern int task_prio(const struct task_struct *p); 15275eca1c10SIngo Molnar 1528d0ea0268SDongsheng Yang /** 1529d0ea0268SDongsheng Yang * task_nice - return the nice value of a given task. 1530d0ea0268SDongsheng Yang * @p: the task in question. 1531d0ea0268SDongsheng Yang * 1532d0ea0268SDongsheng Yang * Return: The nice value [ -20 ... 0 ... 19 ]. 
1533d0ea0268SDongsheng Yang */ 1534d0ea0268SDongsheng Yang static inline int task_nice(const struct task_struct *p) 1535d0ea0268SDongsheng Yang { 1536d0ea0268SDongsheng Yang return PRIO_TO_NICE((p)->static_prio); 1537d0ea0268SDongsheng Yang } 15385eca1c10SIngo Molnar 153936c8b586SIngo Molnar extern int can_nice(const struct task_struct *p, const int nice); 154036c8b586SIngo Molnar extern int task_curr(const struct task_struct *p); 15411da177e4SLinus Torvalds extern int idle_cpu(int cpu); 1542943d355dSRohit Jain extern int available_idle_cpu(int cpu); 15435eca1c10SIngo Molnar extern int sched_setscheduler(struct task_struct *, int, const struct sched_param *); 15445eca1c10SIngo Molnar extern int sched_setscheduler_nocheck(struct task_struct *, int, const struct sched_param *); 15455eca1c10SIngo Molnar extern int sched_setattr(struct task_struct *, const struct sched_attr *); 1546794a56ebSJuri Lelli extern int sched_setattr_nocheck(struct task_struct *, const struct sched_attr *); 154736c8b586SIngo Molnar extern struct task_struct *idle_task(int cpu); 15485eca1c10SIngo Molnar 1549c4f30608SPaul E. McKenney /** 1550c4f30608SPaul E. McKenney * is_idle_task - is the specified task an idle task? 1551fa757281SRandy Dunlap * @p: the task in question. 1552e69f6186SYacine Belkadi * 1553e69f6186SYacine Belkadi * Return: 1 if @p is an idle task. 0 otherwise. 1554c4f30608SPaul E. McKenney */ 15557061ca3bSPaul E. McKenney static inline bool is_idle_task(const struct task_struct *p) 1556c4f30608SPaul E. McKenney { 1557c1de45caSPeter Zijlstra return !!(p->flags & PF_IDLE); 1558c4f30608SPaul E. 
McKenney } 15595eca1c10SIngo Molnar 156036c8b586SIngo Molnar extern struct task_struct *curr_task(int cpu); 1561a458ae2eSPeter Zijlstra extern void ia64_set_curr_task(int cpu, struct task_struct *p); 15621da177e4SLinus Torvalds 15631da177e4SLinus Torvalds void yield(void); 15641da177e4SLinus Torvalds 15651da177e4SLinus Torvalds union thread_union { 15660500871fSDavid Howells #ifndef CONFIG_ARCH_TASK_STRUCT_ON_STACK 15670500871fSDavid Howells struct task_struct task; 15680500871fSDavid Howells #endif 1569c65eacbeSAndy Lutomirski #ifndef CONFIG_THREAD_INFO_IN_TASK 15701da177e4SLinus Torvalds struct thread_info thread_info; 1571c65eacbeSAndy Lutomirski #endif 15721da177e4SLinus Torvalds unsigned long stack[THREAD_SIZE/sizeof(long)]; 15731da177e4SLinus Torvalds }; 15741da177e4SLinus Torvalds 15750500871fSDavid Howells #ifndef CONFIG_THREAD_INFO_IN_TASK 15760500871fSDavid Howells extern struct thread_info init_thread_info; 15770500871fSDavid Howells #endif 15780500871fSDavid Howells 15790500871fSDavid Howells extern unsigned long init_stack[THREAD_SIZE / sizeof(unsigned long)]; 15800500871fSDavid Howells 1581f3ac6067SIngo Molnar #ifdef CONFIG_THREAD_INFO_IN_TASK 1582f3ac6067SIngo Molnar static inline struct thread_info *task_thread_info(struct task_struct *task) 1583f3ac6067SIngo Molnar { 1584f3ac6067SIngo Molnar return &task->thread_info; 1585f3ac6067SIngo Molnar } 1586f3ac6067SIngo Molnar #elif !defined(__HAVE_THREAD_FUNCTIONS) 1587f3ac6067SIngo Molnar # define task_thread_info(task) ((struct thread_info *)(task)->stack) 1588f3ac6067SIngo Molnar #endif 1589f3ac6067SIngo Molnar 1590198fe21bSPavel Emelyanov /* 1591198fe21bSPavel Emelyanov * find a task by one of its numerical ids 1592198fe21bSPavel Emelyanov * 1593198fe21bSPavel Emelyanov * find_task_by_pid_ns(): 1594198fe21bSPavel Emelyanov * finds a task by its pid in the specified namespace 1595228ebcbeSPavel Emelyanov * find_task_by_vpid(): 1596228ebcbeSPavel Emelyanov * finds a task by its virtual pid 
1597198fe21bSPavel Emelyanov * 1598e49859e7SPavel Emelyanov * see also find_vpid() etc in include/linux/pid.h 1599198fe21bSPavel Emelyanov */ 1600198fe21bSPavel Emelyanov 1601228ebcbeSPavel Emelyanov extern struct task_struct *find_task_by_vpid(pid_t nr); 16025eca1c10SIngo Molnar extern struct task_struct *find_task_by_pid_ns(pid_t nr, struct pid_namespace *ns); 1603198fe21bSPavel Emelyanov 16042ee08260SMike Rapoport /* 16052ee08260SMike Rapoport * find a task by its virtual pid and get the task struct 16062ee08260SMike Rapoport */ 16072ee08260SMike Rapoport extern struct task_struct *find_get_task_by_vpid(pid_t nr); 16082ee08260SMike Rapoport 1609b3c97528SHarvey Harrison extern int wake_up_state(struct task_struct *tsk, unsigned int state); 1610b3c97528SHarvey Harrison extern int wake_up_process(struct task_struct *tsk); 16113e51e3edSSamir Bellabes extern void wake_up_new_task(struct task_struct *tsk); 16125eca1c10SIngo Molnar 16131da177e4SLinus Torvalds #ifdef CONFIG_SMP 16141da177e4SLinus Torvalds extern void kick_process(struct task_struct *tsk); 16151da177e4SLinus Torvalds #else 16161da177e4SLinus Torvalds static inline void kick_process(struct task_struct *tsk) { } 16171da177e4SLinus Torvalds #endif 16181da177e4SLinus Torvalds 161982b89778SAdrian Hunter extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec); 16205eca1c10SIngo Molnar 162182b89778SAdrian Hunter static inline void set_task_comm(struct task_struct *tsk, const char *from) 162282b89778SAdrian Hunter { 162382b89778SAdrian Hunter __set_task_comm(tsk, from, false); 162482b89778SAdrian Hunter } 16255eca1c10SIngo Molnar 16263756f640SArnd Bergmann extern char *__get_task_comm(char *to, size_t len, struct task_struct *tsk); 16273756f640SArnd Bergmann #define get_task_comm(buf, tsk) ({ \ 16283756f640SArnd Bergmann BUILD_BUG_ON(sizeof(buf) != TASK_COMM_LEN); \ 16293756f640SArnd Bergmann __get_task_comm(buf, sizeof(buf), tsk); \ 16303756f640SArnd Bergmann }) 16311da177e4SLinus 
Torvalds 16321da177e4SLinus Torvalds #ifdef CONFIG_SMP 1633317f3941SPeter Zijlstra void scheduler_ipi(void); 163485ba2d86SRoland McGrath extern unsigned long wait_task_inactive(struct task_struct *, long match_state); 16351da177e4SLinus Torvalds #else 1636184748ccSPeter Zijlstra static inline void scheduler_ipi(void) { } 16375eca1c10SIngo Molnar static inline unsigned long wait_task_inactive(struct task_struct *p, long match_state) 163885ba2d86SRoland McGrath { 163985ba2d86SRoland McGrath return 1; 164085ba2d86SRoland McGrath } 16411da177e4SLinus Torvalds #endif 16421da177e4SLinus Torvalds 16435eca1c10SIngo Molnar /* 16445eca1c10SIngo Molnar * Set thread flags in other task's structures. 16455eca1c10SIngo Molnar * See asm/thread_info.h for TIF_xxxx flags available: 16461da177e4SLinus Torvalds */ 16471da177e4SLinus Torvalds static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag) 16481da177e4SLinus Torvalds { 1649a1261f54SAl Viro set_ti_thread_flag(task_thread_info(tsk), flag); 16501da177e4SLinus Torvalds } 16511da177e4SLinus Torvalds 16521da177e4SLinus Torvalds static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag) 16531da177e4SLinus Torvalds { 1654a1261f54SAl Viro clear_ti_thread_flag(task_thread_info(tsk), flag); 16551da177e4SLinus Torvalds } 16561da177e4SLinus Torvalds 165793ee37c2SDave Martin static inline void update_tsk_thread_flag(struct task_struct *tsk, int flag, 165893ee37c2SDave Martin bool value) 165993ee37c2SDave Martin { 166093ee37c2SDave Martin update_ti_thread_flag(task_thread_info(tsk), flag, value); 166193ee37c2SDave Martin } 166293ee37c2SDave Martin 16631da177e4SLinus Torvalds static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag) 16641da177e4SLinus Torvalds { 1665a1261f54SAl Viro return test_and_set_ti_thread_flag(task_thread_info(tsk), flag); 16661da177e4SLinus Torvalds } 16671da177e4SLinus Torvalds 16681da177e4SLinus Torvalds static inline int 
test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag) 16691da177e4SLinus Torvalds { 1670a1261f54SAl Viro return test_and_clear_ti_thread_flag(task_thread_info(tsk), flag); 16711da177e4SLinus Torvalds } 16721da177e4SLinus Torvalds 16731da177e4SLinus Torvalds static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag) 16741da177e4SLinus Torvalds { 1675a1261f54SAl Viro return test_ti_thread_flag(task_thread_info(tsk), flag); 16761da177e4SLinus Torvalds } 16771da177e4SLinus Torvalds 16781da177e4SLinus Torvalds static inline void set_tsk_need_resched(struct task_struct *tsk) 16791da177e4SLinus Torvalds { 16801da177e4SLinus Torvalds set_tsk_thread_flag(tsk,TIF_NEED_RESCHED); 16811da177e4SLinus Torvalds } 16821da177e4SLinus Torvalds 16831da177e4SLinus Torvalds static inline void clear_tsk_need_resched(struct task_struct *tsk) 16841da177e4SLinus Torvalds { 16851da177e4SLinus Torvalds clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED); 16861da177e4SLinus Torvalds } 16871da177e4SLinus Torvalds 16888ae121acSGregory Haskins static inline int test_tsk_need_resched(struct task_struct *tsk) 16898ae121acSGregory Haskins { 16908ae121acSGregory Haskins return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED)); 16918ae121acSGregory Haskins } 16928ae121acSGregory Haskins 16931da177e4SLinus Torvalds /* 16941da177e4SLinus Torvalds * cond_resched() and cond_resched_lock(): latency reduction via 16951da177e4SLinus Torvalds * explicit rescheduling in places that are safe. The return 16961da177e4SLinus Torvalds * value indicates whether a reschedule was done in fact. 
16971da177e4SLinus Torvalds * cond_resched_lock() will drop the spinlock before scheduling, 16981da177e4SLinus Torvalds */ 169935a773a0SPeter Zijlstra #ifndef CONFIG_PREEMPT 1700c3921ab7SLinus Torvalds extern int _cond_resched(void); 170135a773a0SPeter Zijlstra #else 170235a773a0SPeter Zijlstra static inline int _cond_resched(void) { return 0; } 170335a773a0SPeter Zijlstra #endif 17046f80bd98SFrederic Weisbecker 1705613afbf8SFrederic Weisbecker #define cond_resched() ({ \ 17063427445aSPeter Zijlstra ___might_sleep(__FILE__, __LINE__, 0); \ 1707613afbf8SFrederic Weisbecker _cond_resched(); \ 1708613afbf8SFrederic Weisbecker }) 17096f80bd98SFrederic Weisbecker 1710613afbf8SFrederic Weisbecker extern int __cond_resched_lock(spinlock_t *lock); 1711613afbf8SFrederic Weisbecker 1712613afbf8SFrederic Weisbecker #define cond_resched_lock(lock) ({ \ 17133427445aSPeter Zijlstra ___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\ 1714613afbf8SFrederic Weisbecker __cond_resched_lock(lock); \ 1715613afbf8SFrederic Weisbecker }) 1716613afbf8SFrederic Weisbecker 1717f6f3c437SSimon Horman static inline void cond_resched_rcu(void) 1718f6f3c437SSimon Horman { 1719f6f3c437SSimon Horman #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU) 1720f6f3c437SSimon Horman rcu_read_unlock(); 1721f6f3c437SSimon Horman cond_resched(); 1722f6f3c437SSimon Horman rcu_read_lock(); 1723f6f3c437SSimon Horman #endif 1724f6f3c437SSimon Horman } 1725f6f3c437SSimon Horman 17261da177e4SLinus Torvalds /* 17271da177e4SLinus Torvalds * Does a critical section need to be broken due to another 172895c354feSNick Piggin * task waiting?: (technically does not depend on CONFIG_PREEMPT, 172995c354feSNick Piggin * but a general need for low latency) 17301da177e4SLinus Torvalds */ 173195c354feSNick Piggin static inline int spin_needbreak(spinlock_t *lock) 17321da177e4SLinus Torvalds { 173395c354feSNick Piggin #ifdef CONFIG_PREEMPT 173495c354feSNick Piggin return spin_is_contended(lock); 
173595c354feSNick Piggin #else 17361da177e4SLinus Torvalds return 0; 173795c354feSNick Piggin #endif 17381da177e4SLinus Torvalds } 17391da177e4SLinus Torvalds 174075f93fedSPeter Zijlstra static __always_inline bool need_resched(void) 174175f93fedSPeter Zijlstra { 174275f93fedSPeter Zijlstra return unlikely(tif_need_resched()); 174375f93fedSPeter Zijlstra } 174475f93fedSPeter Zijlstra 1745ee761f62SThomas Gleixner /* 17461da177e4SLinus Torvalds * Wrappers for p->thread_info->cpu access. No-op on UP. 17471da177e4SLinus Torvalds */ 17481da177e4SLinus Torvalds #ifdef CONFIG_SMP 17491da177e4SLinus Torvalds 17501da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p) 17511da177e4SLinus Torvalds { 1752c65eacbeSAndy Lutomirski #ifdef CONFIG_THREAD_INFO_IN_TASK 1753c65eacbeSAndy Lutomirski return p->cpu; 1754c65eacbeSAndy Lutomirski #else 1755a1261f54SAl Viro return task_thread_info(p)->cpu; 1756c65eacbeSAndy Lutomirski #endif 17571da177e4SLinus Torvalds } 17581da177e4SLinus Torvalds 1759c65cc870SIngo Molnar extern void set_task_cpu(struct task_struct *p, unsigned int cpu); 17601da177e4SLinus Torvalds 17611da177e4SLinus Torvalds #else 17621da177e4SLinus Torvalds 17631da177e4SLinus Torvalds static inline unsigned int task_cpu(const struct task_struct *p) 17641da177e4SLinus Torvalds { 17651da177e4SLinus Torvalds return 0; 17661da177e4SLinus Torvalds } 17671da177e4SLinus Torvalds 17681da177e4SLinus Torvalds static inline void set_task_cpu(struct task_struct *p, unsigned int cpu) 17691da177e4SLinus Torvalds { 17701da177e4SLinus Torvalds } 17711da177e4SLinus Torvalds 17721da177e4SLinus Torvalds #endif /* CONFIG_SMP */ 17731da177e4SLinus Torvalds 1774d9345c65SPan Xinhui /* 1775d9345c65SPan Xinhui * In order to reduce various lock holder preemption latencies provide an 1776d9345c65SPan Xinhui * interface to see if a vCPU is currently running or not. 
1777d9345c65SPan Xinhui * 1778d9345c65SPan Xinhui * This allows us to terminate optimistic spin loops and block, analogous to 1779d9345c65SPan Xinhui * the native optimistic spin heuristic of testing if the lock owner task is 1780d9345c65SPan Xinhui * running or not. 1781d9345c65SPan Xinhui */ 1782d9345c65SPan Xinhui #ifndef vcpu_is_preempted 1783d9345c65SPan Xinhui # define vcpu_is_preempted(cpu) false 1784d9345c65SPan Xinhui #endif 1785d9345c65SPan Xinhui 178696f874e2SRusty Russell extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask); 178796f874e2SRusty Russell extern long sched_getaffinity(pid_t pid, struct cpumask *mask); 17885c45bf27SSiddha, Suresh B 178982455257SDave Hansen #ifndef TASK_SIZE_OF 179082455257SDave Hansen #define TASK_SIZE_OF(tsk) TASK_SIZE 179182455257SDave Hansen #endif 179282455257SDave Hansen 1793d7822b1eSMathieu Desnoyers #ifdef CONFIG_RSEQ 1794d7822b1eSMathieu Desnoyers 1795d7822b1eSMathieu Desnoyers /* 1796d7822b1eSMathieu Desnoyers * Map the event mask on the user-space ABI enum rseq_cs_flags 1797d7822b1eSMathieu Desnoyers * for direct mask checks. 
1798d7822b1eSMathieu Desnoyers */ 1799d7822b1eSMathieu Desnoyers enum rseq_event_mask_bits { 1800d7822b1eSMathieu Desnoyers RSEQ_EVENT_PREEMPT_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_PREEMPT_BIT, 1801d7822b1eSMathieu Desnoyers RSEQ_EVENT_SIGNAL_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_SIGNAL_BIT, 1802d7822b1eSMathieu Desnoyers RSEQ_EVENT_MIGRATE_BIT = RSEQ_CS_FLAG_NO_RESTART_ON_MIGRATE_BIT, 1803d7822b1eSMathieu Desnoyers }; 1804d7822b1eSMathieu Desnoyers 1805d7822b1eSMathieu Desnoyers enum rseq_event_mask { 1806d7822b1eSMathieu Desnoyers RSEQ_EVENT_PREEMPT = (1U << RSEQ_EVENT_PREEMPT_BIT), 1807d7822b1eSMathieu Desnoyers RSEQ_EVENT_SIGNAL = (1U << RSEQ_EVENT_SIGNAL_BIT), 1808d7822b1eSMathieu Desnoyers RSEQ_EVENT_MIGRATE = (1U << RSEQ_EVENT_MIGRATE_BIT), 1809d7822b1eSMathieu Desnoyers }; 1810d7822b1eSMathieu Desnoyers 1811d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t) 1812d7822b1eSMathieu Desnoyers { 1813d7822b1eSMathieu Desnoyers if (t->rseq) 1814d7822b1eSMathieu Desnoyers set_tsk_thread_flag(t, TIF_NOTIFY_RESUME); 1815d7822b1eSMathieu Desnoyers } 1816d7822b1eSMathieu Desnoyers 1817784e0300SWill Deacon void __rseq_handle_notify_resume(struct ksignal *sig, struct pt_regs *regs); 1818d7822b1eSMathieu Desnoyers 1819784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig, 1820784e0300SWill Deacon struct pt_regs *regs) 1821d7822b1eSMathieu Desnoyers { 1822d7822b1eSMathieu Desnoyers if (current->rseq) 1823784e0300SWill Deacon __rseq_handle_notify_resume(ksig, regs); 1824d7822b1eSMathieu Desnoyers } 1825d7822b1eSMathieu Desnoyers 1826784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig, 1827784e0300SWill Deacon struct pt_regs *regs) 1828d7822b1eSMathieu Desnoyers { 1829d7822b1eSMathieu Desnoyers preempt_disable(); 1830d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_SIGNAL_BIT, ¤t->rseq_event_mask); 1831d7822b1eSMathieu Desnoyers preempt_enable(); 1832784e0300SWill Deacon 
rseq_handle_notify_resume(ksig, regs); 1833d7822b1eSMathieu Desnoyers } 1834d7822b1eSMathieu Desnoyers 1835d7822b1eSMathieu Desnoyers /* rseq_preempt() requires preemption to be disabled. */ 1836d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t) 1837d7822b1eSMathieu Desnoyers { 1838d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_PREEMPT_BIT, &t->rseq_event_mask); 1839d7822b1eSMathieu Desnoyers rseq_set_notify_resume(t); 1840d7822b1eSMathieu Desnoyers } 1841d7822b1eSMathieu Desnoyers 1842d7822b1eSMathieu Desnoyers /* rseq_migrate() requires preemption to be disabled. */ 1843d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t) 1844d7822b1eSMathieu Desnoyers { 1845d7822b1eSMathieu Desnoyers __set_bit(RSEQ_EVENT_MIGRATE_BIT, &t->rseq_event_mask); 1846d7822b1eSMathieu Desnoyers rseq_set_notify_resume(t); 1847d7822b1eSMathieu Desnoyers } 1848d7822b1eSMathieu Desnoyers 1849d7822b1eSMathieu Desnoyers /* 1850d7822b1eSMathieu Desnoyers * If parent process has a registered restartable sequences area, the 18519a789fcfSMathieu Desnoyers * child inherits. Only applies when forking a process, not a thread. 
1852d7822b1eSMathieu Desnoyers */ 1853d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) 1854d7822b1eSMathieu Desnoyers { 1855d7822b1eSMathieu Desnoyers if (clone_flags & CLONE_THREAD) { 1856d7822b1eSMathieu Desnoyers t->rseq = NULL; 1857d7822b1eSMathieu Desnoyers t->rseq_len = 0; 1858d7822b1eSMathieu Desnoyers t->rseq_sig = 0; 1859d7822b1eSMathieu Desnoyers t->rseq_event_mask = 0; 1860d7822b1eSMathieu Desnoyers } else { 1861d7822b1eSMathieu Desnoyers t->rseq = current->rseq; 1862d7822b1eSMathieu Desnoyers t->rseq_len = current->rseq_len; 1863d7822b1eSMathieu Desnoyers t->rseq_sig = current->rseq_sig; 1864d7822b1eSMathieu Desnoyers t->rseq_event_mask = current->rseq_event_mask; 1865d7822b1eSMathieu Desnoyers } 1866d7822b1eSMathieu Desnoyers } 1867d7822b1eSMathieu Desnoyers 1868d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t) 1869d7822b1eSMathieu Desnoyers { 1870d7822b1eSMathieu Desnoyers t->rseq = NULL; 1871d7822b1eSMathieu Desnoyers t->rseq_len = 0; 1872d7822b1eSMathieu Desnoyers t->rseq_sig = 0; 1873d7822b1eSMathieu Desnoyers t->rseq_event_mask = 0; 1874d7822b1eSMathieu Desnoyers } 1875d7822b1eSMathieu Desnoyers 1876d7822b1eSMathieu Desnoyers #else 1877d7822b1eSMathieu Desnoyers 1878d7822b1eSMathieu Desnoyers static inline void rseq_set_notify_resume(struct task_struct *t) 1879d7822b1eSMathieu Desnoyers { 1880d7822b1eSMathieu Desnoyers } 1881784e0300SWill Deacon static inline void rseq_handle_notify_resume(struct ksignal *ksig, 1882784e0300SWill Deacon struct pt_regs *regs) 1883d7822b1eSMathieu Desnoyers { 1884d7822b1eSMathieu Desnoyers } 1885784e0300SWill Deacon static inline void rseq_signal_deliver(struct ksignal *ksig, 1886784e0300SWill Deacon struct pt_regs *regs) 1887d7822b1eSMathieu Desnoyers { 1888d7822b1eSMathieu Desnoyers } 1889d7822b1eSMathieu Desnoyers static inline void rseq_preempt(struct task_struct *t) 1890d7822b1eSMathieu Desnoyers { 1891d7822b1eSMathieu 
Desnoyers } 1892d7822b1eSMathieu Desnoyers static inline void rseq_migrate(struct task_struct *t) 1893d7822b1eSMathieu Desnoyers { 1894d7822b1eSMathieu Desnoyers } 1895d7822b1eSMathieu Desnoyers static inline void rseq_fork(struct task_struct *t, unsigned long clone_flags) 1896d7822b1eSMathieu Desnoyers { 1897d7822b1eSMathieu Desnoyers } 1898d7822b1eSMathieu Desnoyers static inline void rseq_execve(struct task_struct *t) 1899d7822b1eSMathieu Desnoyers { 1900d7822b1eSMathieu Desnoyers } 1901d7822b1eSMathieu Desnoyers 1902d7822b1eSMathieu Desnoyers #endif 1903d7822b1eSMathieu Desnoyers 1904d7822b1eSMathieu Desnoyers #ifdef CONFIG_DEBUG_RSEQ 1905d7822b1eSMathieu Desnoyers 1906d7822b1eSMathieu Desnoyers void rseq_syscall(struct pt_regs *regs); 1907d7822b1eSMathieu Desnoyers 1908d7822b1eSMathieu Desnoyers #else 1909d7822b1eSMathieu Desnoyers 1910d7822b1eSMathieu Desnoyers static inline void rseq_syscall(struct pt_regs *regs) 1911d7822b1eSMathieu Desnoyers { 1912d7822b1eSMathieu Desnoyers } 1913d7822b1eSMathieu Desnoyers 1914d7822b1eSMathieu Desnoyers #endif 1915d7822b1eSMathieu Desnoyers 19161da177e4SLinus Torvalds #endif 1917