blob: af9590c8bfb0f39718f16c4fc2d4f3f9275e54f2 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#ifndef _LINUX_SCHED_H
2#define _LINUX_SCHED_H
3
David Howells607ca462012-10-13 10:46:48 +01004#include <uapi/linux/sched.h>
David Woodhouseb7b3c762006-04-27 00:12:56 +01005
Dongsheng Yang5c228072014-01-27 17:15:37 -05006#include <linux/sched/prio.h>
7
Linus Torvalds1da177e2005-04-16 15:20:36 -07008#include <linux/capability.h>
Ingo Molnarb69339ba2017-02-05 16:15:03 +01009#include <linux/mutex.h>
Peter Zijlstrafb00aca2013-11-07 14:43:43 +010010#include <linux/plist.h>
Martin Schwidefskyc92ff1b2007-10-16 01:24:43 -070011#include <linux/mm_types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <asm/ptrace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013
Linus Torvalds1da177e2005-04-16 15:20:36 -070014#include <linux/sem.h>
Jack Millerab602f72014-08-08 14:23:19 -070015#include <linux/shm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/signal.h>
Ingo Molnarf361bf42017-02-03 23:47:37 +010017#include <linux/signal_types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/pid.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <linux/seccomp.h>
Jiri Pirko05725f72009-04-14 20:17:16 +020020#include <linux/rculist.h>
Ingo Molnar23f78d4a2006-06-27 02:54:53 -070021#include <linux/rtmutex.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022
David Woodhousea3b67142006-04-25 14:54:40 +010023#include <linux/resource.h>
David Woodhousea3b67142006-04-25 14:54:40 +010024#include <linux/hrtimer.h>
Dmitry Vyukov5c9a8752016-03-22 14:27:30 -070025#include <linux/kcov.h>
Andrew Morton7c3ab7382006-12-10 02:19:19 -080026#include <linux/task_io_accounting.h>
Arjan van de Ven97455122008-01-25 21:08:34 +010027#include <linux/latencytop.h>
David Howells9e2b2dc2008-08-13 16:20:04 +010028#include <linux/cred.h>
Ming Lei21caf2f2013-02-22 16:34:08 -080029#include <linux/gfp.h>
Ingo Molnarfd771232017-02-02 20:56:33 +010030#include <linux/topology.h>
Aaron Tomlind4311ff2014-09-12 14:16:17 +010031#include <linux/magic.h>
Tejun Heo7d7efec2015-05-13 16:35:16 -040032#include <linux/cgroup-defs.h>
David Woodhousea3b67142006-04-25 14:54:40 +010033
Ingo Molnar70b81572017-02-03 12:11:00 +010034#include <asm/current.h>
35
Ingo Molnarc7af7872017-02-03 22:01:58 +010036/* task_struct member predeclarations: */
37struct audit_context;
38struct autogroup;
39struct backing_dev_info;
40struct bio_list;
41struct blk_plug;
42struct cfs_rq;
43struct filename;
44struct fs_struct;
45struct futex_pi_state;
46struct io_context;
47struct mempolicy;
48struct nameidata;
49struct nsproxy;
50struct perf_event_context;
51struct pid_namespace;
52struct pipe_inode_info;
53struct rcu_node;
54struct reclaim_state;
55struct robust_list_head;
Ingo Molnare2d1e2a2017-02-01 18:07:51 +010056struct sched_attr;
57struct sched_param;
Ingo Molnar43ae34c2007-07-09 18:52:00 +020058struct seq_file;
Ingo Molnarc7af7872017-02-03 22:01:58 +010059struct sighand_struct;
60struct signal_struct;
61struct task_delay_info;
Ingo Molnar4cf86d72007-10-15 17:00:14 +020062struct task_group;
Ingo Molnarc7af7872017-02-03 22:01:58 +010063struct task_struct;
64struct uts_namespace;
Linus Torvalds1da177e2005-04-16 15:20:36 -070065
/*
 * Task state bitmask. NOTE! These bits are also
 * encoded in fs/proc/array.c: get_task_state().
 *
 * There are two separate sets of flags: task->state describes
 * runnability, while task->exit_state describes a task that is exiting.
 * Keeping them apart is confusing, but it means that modifying one set
 * cannot modify the other one by mistake.
 */

/* Used in tsk->state: */
#define TASK_RUNNING			0x0000
#define TASK_INTERRUPTIBLE		0x0001
#define TASK_UNINTERRUPTIBLE		0x0002
#define __TASK_STOPPED			0x0004
#define __TASK_TRACED			0x0008
/* Used in tsk->exit_state: */
#define EXIT_DEAD			0x0010
#define EXIT_ZOMBIE			0x0020
#define EXIT_TRACE			(EXIT_ZOMBIE | EXIT_DEAD)
/* Used in tsk->state again: */
#define TASK_DEAD			0x0040
#define TASK_WAKEKILL			0x0080
#define TASK_WAKING			0x0100
#define TASK_PARKED			0x0200
#define TASK_NOLOAD			0x0400
#define TASK_NEW			0x0800
#define TASK_STATE_MAX			0x1000

/* 13 characters: apparently one per state above, TASK_RUNNING first. */
#define TASK_STATE_TO_CHAR_STR		"RSDTtXZxKWPNn"

/* Convenience macros for the sake of set_current_state: */
#define TASK_KILLABLE			(TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
#define TASK_STOPPED			(TASK_WAKEKILL | __TASK_STOPPED)
#define TASK_TRACED			(TASK_WAKEKILL | __TASK_TRACED)

#define TASK_IDLE			(TASK_UNINTERRUPTIBLE | TASK_NOLOAD)

/* Convenience macros for the sake of wake_up(): */
#define TASK_NORMAL			(TASK_INTERRUPTIBLE | TASK_UNINTERRUPTIBLE)
#define TASK_ALL			(TASK_NORMAL | __TASK_STOPPED | __TASK_TRACED)

/* get_task_state(): */
#define TASK_REPORT			(TASK_RUNNING | TASK_INTERRUPTIBLE | \
					 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
					 __TASK_TRACED | EXIT_ZOMBIE | EXIT_DEAD)
Matthew Wilcox92a1f4b2007-12-06 10:55:25 -0500111
/*
 * Task state predicates.
 *
 * @task: pointer expression designating a structure with a ->state member
 *        (and a ->flags member for task_contributes_to_load()).
 *
 * Each macro evaluates to a non-zero int when the condition holds and to 0
 * otherwise.  The argument is parenthesized in the expansion so that any
 * pointer expression (e.g. "&t" or "p + 1") binds correctly to "->".
 * Note that @task is evaluated more than once by
 * task_contributes_to_load(), so it must not have side effects.
 */
#define task_is_traced(task)		(((task)->state & __TASK_TRACED) != 0)
#define task_is_stopped(task)		(((task)->state & __TASK_STOPPED) != 0)
#define task_is_stopped_or_traced(task)	\
			(((task)->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)
/*
 * A task contributes to load when it is TASK_UNINTERRUPTIBLE, is not
 * flagged PF_FROZEN and does not have TASK_NOLOAD set.
 */
#define task_contributes_to_load(task)	\
			(((task)->state & TASK_UNINTERRUPTIBLE) != 0 && \
			 ((task)->flags & PF_FROZEN) == 0 && \
			 ((task)->state & TASK_NOLOAD) == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
#ifndef CONFIG_DEBUG_ATOMIC_SLEEP

/*
 * set_current_state() includes a barrier so that the write of current->state
 * is correctly serialised wrt the caller's subsequent test of whether to
 * actually sleep:
 *
 *   for (;;) {
 *	set_current_state(TASK_UNINTERRUPTIBLE);
 *	if (!need_sleep)
 *		break;
 *
 *	schedule();
 *   }
 *   __set_current_state(TASK_RUNNING);
 *
 * If the caller does not need such serialisation (because, for instance, the
 * condition test and condition change and wakeup are under the same lock) then
 * use __set_current_state().
 *
 * The above is typically ordered against the wakeup, which does:
 *
 *	need_sleep = false;
 *	wake_up_state(p, TASK_UNINTERRUPTIBLE);
 *
 * Where wake_up_state() (and all other wakeup primitives) imply enough
 * barriers to order the store of the variable against wakeup.
 *
 * Wakeup will do: if (@state & p->state) p->state = TASK_RUNNING, that is,
 * once it observes the TASK_UNINTERRUPTIBLE store the waking CPU can issue a
 * TASK_RUNNING store which can collide with __set_current_state(TASK_RUNNING).
 *
 * This is obviously fine, since they both store the exact same value.
 *
 * Also see the comments of try_to_wake_up().
 */
#define __set_current_state(state_value)			\
	do { current->state = (state_value); } while (0)
#define set_current_state(state_value)				\
	smp_store_mb(current->state, (state_value))

#else /* CONFIG_DEBUG_ATOMIC_SLEEP */

/*
 * Debug variants: same stores as the plain versions, but _THIS_IP_ is first
 * written to current->task_state_change, before the state itself is updated.
 */
#define __set_current_state(state_value)			\
	do {							\
		current->task_state_change = _THIS_IP_;		\
		current->state = (state_value);			\
	} while (0)
#define set_current_state(state_value)				\
	do {							\
		current->task_state_change = _THIS_IP_;		\
		smp_store_mb(current->state, (state_value));	\
	} while (0)

#endif /* CONFIG_DEBUG_ATOMIC_SLEEP */
175
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176/* Task command name length */
177#define TASK_COMM_LEN 16
178
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179extern void sched_init(void);
180extern void sched_init_smp(void);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181
Rik van Riel3fa08182015-03-09 12:12:07 -0400182extern cpumask_var_t cpu_isolated_map;
183
Andrew Morton89f19f02009-09-19 11:55:44 -0700184extern int runqueue_is_locked(int cpu);
Ingo Molnar017730c2008-05-12 21:20:52 +0200185
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186extern void cpu_init (void);
187extern void trap_init(void);
188extern void update_process_times(int user);
189extern void scheduler_tick(void);
190
Linus Torvalds1da177e2005-04-16 15:20:36 -0700191#define MAX_SCHEDULE_TIMEOUT LONG_MAX
Harvey Harrisonb3c97522008-02-13 15:03:15 -0800192extern signed long schedule_timeout(signed long timeout);
Nishanth Aravamudan64ed93a2005-09-10 00:27:21 -0700193extern signed long schedule_timeout_interruptible(signed long timeout);
Matthew Wilcox294d5cc2007-12-06 11:59:46 -0500194extern signed long schedule_timeout_killable(signed long timeout);
Nishanth Aravamudan64ed93a2005-09-10 00:27:21 -0700195extern signed long schedule_timeout_uninterruptible(signed long timeout);
Andrew Morton69b27ba2016-03-25 14:20:21 -0700196extern signed long schedule_timeout_idle(signed long timeout);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197asmlinkage void schedule(void);
Thomas Gleixnerc5491ea2011-03-21 12:09:35 +0100198extern void schedule_preempt_disabled(void);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199
Tejun Heo10ab5642016-10-28 12:58:10 -0400200extern int __must_check io_schedule_prepare(void);
201extern void io_schedule_finish(int token);
NeilBrown9cff8ad2015-02-13 15:49:17 +1100202extern long io_schedule_timeout(long timeout);
Tejun Heo10ab5642016-10-28 12:58:10 -0400203extern void io_schedule(void);
NeilBrown9cff8ad2015-02-13 15:49:17 +1100204
Frank Mayharf06febc2008-09-12 09:54:39 -0700205/**
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200206 * struct prev_cputime - snaphsot of system and user cputime
Frederic Weisbeckerd37f761d2012-11-22 00:58:35 +0100207 * @utime: time spent in user mode
208 * @stime: time spent in system mode
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200209 * @lock: protects the above two fields
Frederic Weisbeckerd37f761d2012-11-22 00:58:35 +0100210 *
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200211 * Stores previous user/system time values such that we can guarantee
212 * monotonicity.
Frederic Weisbeckerd37f761d2012-11-22 00:58:35 +0100213 */
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200214struct prev_cputime {
215#ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
Frederic Weisbecker5613fda2017-01-31 04:09:23 +0100216 u64 utime;
217 u64 stime;
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200218 raw_spinlock_t lock;
219#endif
Frederic Weisbeckerd37f761d2012-11-22 00:58:35 +0100220};
221
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200222static inline void prev_cputime_init(struct prev_cputime *prev)
223{
224#ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
225 prev->utime = prev->stime = 0;
226 raw_spin_lock_init(&prev->lock);
227#endif
228}
229
Frederic Weisbeckerd37f761d2012-11-22 00:58:35 +0100230/**
Frank Mayharf06febc2008-09-12 09:54:39 -0700231 * struct task_cputime - collected CPU time counts
Frederic Weisbecker5613fda2017-01-31 04:09:23 +0100232 * @utime: time spent in user mode, in nanoseconds
233 * @stime: time spent in kernel mode, in nanoseconds
Frank Mayharf06febc2008-09-12 09:54:39 -0700234 * @sum_exec_runtime: total time spent on the CPU, in nanoseconds
Ingo Molnar5ce73a42008-09-14 17:11:46 +0200235 *
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200236 * This structure groups together three kinds of CPU time that are tracked for
237 * threads and thread groups. Most things considering CPU time want to group
238 * these counts together and treat all three of them in parallel.
Frank Mayharf06febc2008-09-12 09:54:39 -0700239 */
240struct task_cputime {
Frederic Weisbecker5613fda2017-01-31 04:09:23 +0100241 u64 utime;
242 u64 stime;
Frank Mayharf06febc2008-09-12 09:54:39 -0700243 unsigned long long sum_exec_runtime;
244};
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200245
Frank Mayharf06febc2008-09-12 09:54:39 -0700246/* Alternate field names when used to cache expirations. */
Frank Mayharf06febc2008-09-12 09:54:39 -0700247#define virt_exp utime
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200248#define prof_exp stime
Frank Mayharf06febc2008-09-12 09:54:39 -0700249#define sched_exp sum_exec_runtime
250
Jason Low971e8a982015-04-28 13:00:23 -0700251/*
252 * This is the atomic variant of task_cputime, which can be used for
253 * storing and updating task_cputime statistics without locking.
254 */
255struct task_cputime_atomic {
256 atomic64_t utime;
257 atomic64_t stime;
258 atomic64_t sum_exec_runtime;
259};
260
261#define INIT_CPUTIME_ATOMIC \
262 (struct task_cputime_atomic) { \
263 .utime = ATOMIC64_INIT(0), \
264 .stime = ATOMIC64_INIT(0), \
265 .sum_exec_runtime = ATOMIC64_INIT(0), \
266 }
267
Frank Mayharf06febc2008-09-12 09:54:39 -0700268/**
Peter Zijlstra4cd4c1b2009-02-05 12:24:16 +0100269 * struct thread_group_cputimer - thread group interval timer counts
Jason Low920ce392015-05-08 14:31:50 -0700270 * @cputime_atomic: atomic thread group interval timers.
Jason Lowd5c373e2015-10-14 12:07:55 -0700271 * @running: true when there are timers running and
272 * @cputime_atomic receives updates.
Jason Lowc8d75aa2015-10-14 12:07:56 -0700273 * @checking_timer: true when a thread in the group is in the
274 * process of checking for thread group timers.
Frank Mayharf06febc2008-09-12 09:54:39 -0700275 *
276 * This structure contains the version of task_cputime, above, that is
Peter Zijlstra4cd4c1b2009-02-05 12:24:16 +0100277 * used for thread group CPU timer calculations.
Frank Mayharf06febc2008-09-12 09:54:39 -0700278 */
Peter Zijlstra4cd4c1b2009-02-05 12:24:16 +0100279struct thread_group_cputimer {
Jason Low71107442015-04-28 13:00:24 -0700280 struct task_cputime_atomic cputime_atomic;
Jason Lowd5c373e2015-10-14 12:07:55 -0700281 bool running;
Jason Lowc8d75aa2015-10-14 12:07:56 -0700282 bool checking_timer;
Frank Mayharf06febc2008-09-12 09:54:39 -0700283};
Frank Mayharf06febc2008-09-12 09:54:39 -0700284
Ben Blum4714d1d2011-05-26 16:25:18 -0700285#include <linux/rwsem.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286
#ifdef CONFIG_SCHED_INFO
/* Per-task scheduling bookkeeping; only defined with CONFIG_SCHED_INFO. */
struct sched_info {
	/* Cumulative counters: */

	/* # of times run on this cpu: */
	unsigned long			pcount;

	/* Time spent waiting on a runqueue: */
	unsigned long long		run_delay;

	/* Timestamps: */

	/* When we last ran on a cpu: */
	unsigned long long		last_arrival;

	/* When we were last queued to run: */
	unsigned long long		last_queued;
};
#endif /* CONFIG_SCHED_INFO */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298
/*
 * sched_info_on - report whether sched_info accounting is active
 *
 * Returns 1 when CONFIG_SCHEDSTATS is set; otherwise, with
 * CONFIG_TASK_DELAY_ACCT, the current value of delayacct_on; otherwise 0.
 */
static inline int sched_info_on(void)
{
#if defined(CONFIG_SCHEDSTATS)
	return 1;
#elif defined(CONFIG_TASK_DELAY_ACCT)
	extern int delayacct_on;

	return delayacct_on;
#else
	return 0;
#endif
}
Shailabh Nagarca74e922006-07-14 00:24:36 -0700310
#if defined(CONFIG_SCHEDSTATS)
/* Only declared when CONFIG_SCHEDSTATS is set. */
void force_schedstat_enabled(void);
#endif /* CONFIG_SCHEDSTATS */
314
/*
 * Integer metrics need fixed point arithmetic, e.g., sched/fair
 * has a few: load, load_avg, util_avg, freq, and capacity.
 *
 * A basic fixed point range is defined here (a shift of 10, i.e. a scale
 * of 1024 as a long); all those metrics are then formalized on top of it.
 */
#define SCHED_FIXEDPOINT_SHIFT		10
#define SCHED_FIXEDPOINT_SCALE		(1L << SCHED_FIXEDPOINT_SHIFT)
324
/*
 * prefetch_stack() is an empty inline stub unless the architecture defines
 * ARCH_HAS_PREFETCH_SWITCH_STACK, in which case only the prototype is
 * given here.
 */
#ifndef ARCH_HAS_PREFETCH_SWITCH_STACK
static inline void prefetch_stack(struct task_struct *t) { }
#else
extern void prefetch_stack(struct task_struct *t);
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330
Ingo Molnar20b8a592007-07-09 18:51:58 +0200331struct load_weight {
Peter Zijlstra9dbdb152013-11-18 18:27:06 +0100332 unsigned long weight;
333 u32 inv_weight;
Ingo Molnar20b8a592007-07-09 18:51:58 +0200334};
335
Yuyang Du9d89c252015-07-15 08:04:37 +0800336/*
Yuyang Du7b595332016-04-05 12:12:28 +0800337 * The load_avg/util_avg accumulates an infinite geometric series
338 * (see __update_load_avg() in kernel/sched/fair.c).
339 *
340 * [load_avg definition]
341 *
342 * load_avg = runnable% * scale_load_down(load)
343 *
344 * where runnable% is the time ratio that a sched_entity is runnable.
345 * For cfs_rq, it is the aggregated load_avg of all runnable and
Yuyang Du9d89c252015-07-15 08:04:37 +0800346 * blocked sched_entities.
Yuyang Du7b595332016-04-05 12:12:28 +0800347 *
348 * load_avg may also take frequency scaling into account:
349 *
350 * load_avg = runnable% * scale_load_down(load) * freq%
351 *
352 * where freq% is the CPU frequency normalized to the highest frequency.
353 *
354 * [util_avg definition]
355 *
356 * util_avg = running% * SCHED_CAPACITY_SCALE
357 *
358 * where running% is the time ratio that a sched_entity is running on
359 * a CPU. For cfs_rq, it is the aggregated util_avg of all runnable
360 * and blocked sched_entities.
361 *
362 * util_avg may also factor frequency scaling and CPU capacity scaling:
363 *
364 * util_avg = running% * SCHED_CAPACITY_SCALE * freq% * capacity%
365 *
366 * where freq% is the same as above, and capacity% is the CPU capacity
367 * normalized to the greatest capacity (due to uarch differences, etc).
368 *
369 * N.B., the above ratios (runnable%, running%, freq%, and capacity%)
370 * themselves are in the range of [0, 1]. To do fixed point arithmetics,
371 * we therefore scale them to as large a range as necessary. This is for
372 * example reflected by util_avg's SCHED_CAPACITY_SCALE.
373 *
374 * [Overflow issue]
375 *
376 * The 64-bit load_sum can have 4353082796 (=2^64/47742/88761) entities
377 * with the highest load (=88761), always runnable on a single cfs_rq,
378 * and should not overflow as the number already hits PID_MAX_LIMIT.
379 *
380 * For all other cases (including 32-bit kernels), struct load_weight's
381 * weight will overflow first before we do, because:
382 *
383 * Max(load_avg) <= Max(load.weight)
384 *
385 * Then it is the load_weight's responsibility to consider overflow
386 * issues.
Yuyang Du9d89c252015-07-15 08:04:37 +0800387 */
Paul Turner9d85f212012-10-04 13:18:29 +0200388struct sched_avg {
Yuyang Du9d89c252015-07-15 08:04:37 +0800389 u64 last_update_time, load_sum;
390 u32 util_sum, period_contrib;
391 unsigned long load_avg, util_avg;
Paul Turner9d85f212012-10-04 13:18:29 +0200392};
393
#ifdef CONFIG_SCHEDSTATS
/*
 * Scheduler statistics counters; the structure only exists with
 * CONFIG_SCHEDSTATS.  Members are grouped below by name prefix.
 */
struct sched_statistics {
	/* wait_* and iowait_*: */
	u64				wait_start, wait_max, wait_count, wait_sum;
	u64				iowait_count, iowait_sum;

	/* sleep_* (note that sum_sleep_runtime is signed): */
	u64				sleep_start, sleep_max;
	s64				sum_sleep_runtime;

	/* block_*, exec_max and slice_max: */
	u64				block_start, block_max;
	u64				exec_max;
	u64				slice_max;

	/* Migration counters: */
	u64				nr_migrations_cold;
	u64				nr_failed_migrations_affine;
	u64				nr_failed_migrations_running;
	u64				nr_failed_migrations_hot;
	u64				nr_forced_migrations;

	/* Wakeup counters: */
	u64				nr_wakeups;
	u64				nr_wakeups_sync;
	u64				nr_wakeups_migrate;
	u64				nr_wakeups_local;
	u64				nr_wakeups_remote;
	u64				nr_wakeups_affine;
	u64				nr_wakeups_affine_attempts;
	u64				nr_wakeups_passive;
	u64				nr_wakeups_idle;
};
#endif /* CONFIG_SCHEDSTATS */
429
430struct sched_entity {
431 struct load_weight load; /* for load-balancing */
432 struct rb_node run_node;
433 struct list_head group_node;
434 unsigned int on_rq;
435
436 u64 exec_start;
437 u64 sum_exec_runtime;
438 u64 vruntime;
439 u64 prev_sum_exec_runtime;
440
Lucas De Marchi41acab82010-03-10 23:37:45 -0300441 u64 nr_migrations;
442
Lucas De Marchi41acab82010-03-10 23:37:45 -0300443#ifdef CONFIG_SCHEDSTATS
444 struct sched_statistics statistics;
Ingo Molnar94c18222007-08-02 17:41:40 +0200445#endif
446
Ingo Molnar20b8a592007-07-09 18:51:58 +0200447#ifdef CONFIG_FAIR_GROUP_SCHED
Peter Zijlstrafed14d42012-02-11 06:05:00 +0100448 int depth;
Ingo Molnar20b8a592007-07-09 18:51:58 +0200449 struct sched_entity *parent;
450 /* rq on which this entity is (to be) queued: */
451 struct cfs_rq *cfs_rq;
452 /* rq "owned" by this entity/group: */
453 struct cfs_rq *my_q;
454#endif
Clark Williams8bd75c72013-02-07 09:47:07 -0600455
Alex Shi141965c2013-06-26 13:05:39 +0800456#ifdef CONFIG_SMP
Jiri Olsa5a107802015-12-08 21:23:59 +0100457 /*
458 * Per entity load average tracking.
459 *
460 * Put into separate cache line so it does not
461 * collide with read-mostly values above.
462 */
463 struct sched_avg avg ____cacheline_aligned_in_smp;
Paul Turner9d85f212012-10-04 13:18:29 +0200464#endif
Ingo Molnar20b8a592007-07-09 18:51:58 +0200465};
Ingo Molnar70b97a72006-07-03 00:25:42 -0700466
Peter Zijlstrafa717062008-01-25 21:08:27 +0100467struct sched_rt_entity {
468 struct list_head run_list;
Peter Zijlstra78f2c7d2008-01-25 21:08:27 +0100469 unsigned long timeout;
Ying Xue57d2aa02012-07-17 15:03:43 +0800470 unsigned long watchdog_stamp;
Richard Kennedybee367e2008-08-01 13:24:08 +0100471 unsigned int time_slice;
Peter Zijlstraff77e462016-01-18 15:27:07 +0100472 unsigned short on_rq;
473 unsigned short on_list;
Peter Zijlstra6f505b12008-01-25 21:08:30 +0100474
Peter Zijlstra58d6c2d2008-04-19 19:45:00 +0200475 struct sched_rt_entity *back;
Peter Zijlstra052f1dc2008-02-13 15:45:40 +0100476#ifdef CONFIG_RT_GROUP_SCHED
Peter Zijlstra6f505b12008-01-25 21:08:30 +0100477 struct sched_rt_entity *parent;
478 /* rq on which this entity is (to be) queued: */
479 struct rt_rq *rt_rq;
480 /* rq "owned" by this entity/group: */
481 struct rt_rq *my_q;
482#endif
Peter Zijlstrafa717062008-01-25 21:08:27 +0100483};
484
Dario Faggioliaab03e02013-11-28 11:14:43 +0100485struct sched_dl_entity {
486 struct rb_node rb_node;
487
488 /*
489 * Original scheduling parameters. Copied here from sched_attr
xiaofeng.yan4027d082014-05-09 03:21:27 +0000490 * during sched_setattr(), they will remain the same until
491 * the next sched_setattr().
Dario Faggioliaab03e02013-11-28 11:14:43 +0100492 */
493 u64 dl_runtime; /* maximum runtime for each instance */
494 u64 dl_deadline; /* relative deadline of each instance */
Harald Gustafsson755378a2013-11-07 14:43:40 +0100495 u64 dl_period; /* separation of two instances (period) */
Dario Faggioli332ac172013-11-07 14:43:45 +0100496 u64 dl_bw; /* dl_runtime / dl_deadline */
Dario Faggioliaab03e02013-11-28 11:14:43 +0100497
498 /*
499 * Actual scheduling parameters. Initialized with the values above,
500 * they are continously updated during task execution. Note that
501 * the remaining runtime could be < 0 in case we are in overrun.
502 */
503 s64 runtime; /* remaining runtime for this instance */
504 u64 deadline; /* absolute deadline for this instance */
505 unsigned int flags; /* specifying the scheduler behaviour */
506
507 /*
508 * Some bool flags:
509 *
510 * @dl_throttled tells if we exhausted the runtime. If so, the
511 * task has to wait for a replenishment to be performed at the
512 * next firing of dl_timer.
513 *
Dario Faggioli2d3d8912013-11-07 14:43:44 +0100514 * @dl_boosted tells if we are boosted due to DI. If so we are
515 * outside bandwidth enforcement mechanism (but only until we
Juri Lelli5bfd1262014-04-15 13:49:04 +0200516 * exit the critical section);
517 *
518 * @dl_yielded tells if task gave up the cpu before consuming
519 * all its available runtime during the last job.
Dario Faggioliaab03e02013-11-28 11:14:43 +0100520 */
Luca Abeni72f9f3f2016-03-07 12:27:04 +0100521 int dl_throttled, dl_boosted, dl_yielded;
Dario Faggioliaab03e02013-11-28 11:14:43 +0100522
523 /*
524 * Bandwidth enforcement timer. Each -deadline task has its
525 * own bandwidth to be enforced, thus we need one timer per task.
526 */
527 struct hrtimer dl_timer;
528};
Clark Williams8bd75c72013-02-07 09:47:07 -0600529
Paul E. McKenney1d082fd2014-08-14 16:01:53 -0700530union rcu_special {
531 struct {
Paul E. McKenney8203d6d2015-08-02 13:53:17 -0700532 u8 blocked;
533 u8 need_qs;
534 u8 exp_need_qs;
535 u8 pad; /* Otherwise the compiler can store garbage here. */
536 } b; /* Bits. */
537 u32 s; /* Set of bits. */
Paul E. McKenney1d082fd2014-08-14 16:01:53 -0700538};
Paul E. McKenney86848962009-08-27 15:00:12 -0700539
/*
 * perf_invalid_context is the only negative value; the valid contexts
 * count up from 0 and perf_nr_task_contexts ends up as their number.
 */
enum perf_event_task_context {
	perf_invalid_context	= -1,
	perf_hw_context		= 0,
	perf_sw_context,
	perf_nr_task_contexts,
};
546
/* Link for a singly linked chain: holds only a pointer to the next node. */
struct wake_q_node {
	struct wake_q_node		*next;
};
550
Mel Gorman72b252a2015-09-04 15:47:32 -0700551/* Track pages that require TLB flushes */
552struct tlbflush_unmap_batch {
553 /*
554 * Each bit set is a CPU that potentially has a TLB entry for one of
555 * the PFNs being flushed. See set_tlb_ubc_flush_pending().
556 */
557 struct cpumask cpumask;
558
559 /* True if any bit in cpumask is set */
560 bool flush_required;
Mel Gormand950c942015-09-04 15:47:35 -0700561
562 /*
563 * If true then the PTE was dirty when unmapped. The entry must be
564 * flushed before IO is initiated or a stale TLB entry potentially
565 * allows an update without redirtying the page.
566 */
567 bool writable;
Mel Gorman72b252a2015-09-04 15:47:32 -0700568};
569
Linus Torvalds1da177e2005-04-16 15:20:36 -0700570struct task_struct {
Andy Lutomirskic65eacb2016-09-13 14:29:24 -0700571#ifdef CONFIG_THREAD_INFO_IN_TASK
572 /*
573 * For reasons of header soup (see current_thread_info()), this
574 * must be the first element of task_struct.
575 */
576 struct thread_info thread_info;
577#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700578 volatile long state; /* -1 unrunnable, 0 runnable, >0 stopped */
Roman Zippelf7e42172007-05-09 02:35:17 -0700579 void *stack;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580 atomic_t usage;
William Cohen97dc32c2007-05-08 00:23:41 -0700581 unsigned int flags; /* per process flags, defined below */
582 unsigned int ptrace;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700583
Peter Williams2dd73a42006-06-27 02:54:34 -0700584#ifdef CONFIG_SMP
Peter Zijlstrafa14ff42011-09-12 13:06:17 +0200585 struct llist_node wake_entry;
Peter Zijlstra3ca7a442011-04-05 17:23:40 +0200586 int on_cpu;
Andy Lutomirskic65eacb2016-09-13 14:29:24 -0700587#ifdef CONFIG_THREAD_INFO_IN_TASK
588 unsigned int cpu; /* current CPU */
589#endif
Mike Galbraith63b0e9e2015-07-14 17:39:50 +0200590 unsigned int wakee_flips;
Michael Wang62470412013-07-04 12:55:51 +0800591 unsigned long wakee_flip_decay_ts;
Mike Galbraith63b0e9e2015-07-14 17:39:50 +0200592 struct task_struct *last_wakee;
Peter Zijlstraac66f542013-10-07 11:29:16 +0100593
594 int wake_cpu;
Nick Piggin4866cde2005-06-25 14:57:23 -0700595#endif
Peter Zijlstrafd2f4412011-04-05 17:23:44 +0200596 int on_rq;
Ingo Molnar50e645a2007-07-09 18:52:00 +0200597
Ingo Molnarb29739f2006-06-27 02:54:51 -0700598 int prio, static_prio, normal_prio;
Richard Kennedyc7aceab2008-05-15 12:09:15 +0100599 unsigned int rt_priority;
Ingo Molnar5522d5d2007-10-15 17:00:12 +0200600 const struct sched_class *sched_class;
Ingo Molnar20b8a592007-07-09 18:51:58 +0200601 struct sched_entity se;
Peter Zijlstrafa717062008-01-25 21:08:27 +0100602 struct sched_rt_entity rt;
Peter Zijlstra8323f262012-06-22 13:36:05 +0200603#ifdef CONFIG_CGROUP_SCHED
604 struct task_group *sched_task_group;
605#endif
Dario Faggioliaab03e02013-11-28 11:14:43 +0100606 struct sched_dl_entity dl;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700607
Avi Kivitye107be32007-07-26 13:40:43 +0200608#ifdef CONFIG_PREEMPT_NOTIFIERS
609 /* list of struct preempt_notifier: */
610 struct hlist_head preempt_notifiers;
611#endif
612
Alexey Dobriyan6c5c9342006-09-29 01:59:40 -0700613#ifdef CONFIG_BLK_DEV_IO_TRACE
Jens Axboe2056a782006-03-23 20:00:26 +0100614 unsigned int btrace_seq;
Alexey Dobriyan6c5c9342006-09-29 01:59:40 -0700615#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700616
William Cohen97dc32c2007-05-08 00:23:41 -0700617 unsigned int policy;
Peter Zijlstra29baa742012-04-23 12:11:21 +0200618 int nr_cpus_allowed;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619 cpumask_t cpus_allowed;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700620
Paul E. McKenneya57eb942010-06-29 16:49:16 -0700621#ifdef CONFIG_PREEMPT_RCU
Paul E. McKenneye260be62008-01-25 21:08:24 +0100622 int rcu_read_lock_nesting;
Paul E. McKenney1d082fd2014-08-14 16:01:53 -0700623 union rcu_special rcu_read_unlock_special;
Paul E. McKenneyf41d9112009-08-22 13:56:52 -0700624 struct list_head rcu_node_entry;
Paul E. McKenneya57eb942010-06-29 16:49:16 -0700625 struct rcu_node *rcu_blocked_node;
Pranith Kumar28f65692014-09-22 14:00:48 -0400626#endif /* #ifdef CONFIG_PREEMPT_RCU */
Paul E. McKenney8315f422014-06-27 13:42:20 -0700627#ifdef CONFIG_TASKS_RCU
628 unsigned long rcu_tasks_nvcsw;
629 bool rcu_tasks_holdout;
630 struct list_head rcu_tasks_holdout_list;
Paul E. McKenney176f8f72014-08-04 17:43:50 -0700631 int rcu_tasks_idle_cpu;
Paul E. McKenney8315f422014-06-27 13:42:20 -0700632#endif /* #ifdef CONFIG_TASKS_RCU */
Paul E. McKenneye260be62008-01-25 21:08:24 +0100633
Naveen N. Raof6db83472015-06-25 23:53:37 +0530634#ifdef CONFIG_SCHED_INFO
Linus Torvalds1da177e2005-04-16 15:20:36 -0700635 struct sched_info sched_info;
636#endif
637
638 struct list_head tasks;
Dario Faggioli806c09a2010-11-30 19:51:33 +0100639#ifdef CONFIG_SMP
Gregory Haskins917b6272008-12-29 09:39:53 -0500640 struct plist_node pushable_tasks;
Juri Lelli1baca4c2013-11-07 14:43:38 +0100641 struct rb_node pushable_dl_tasks;
Dario Faggioli806c09a2010-11-30 19:51:33 +0100642#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643
644 struct mm_struct *mm, *active_mm;
Ingo Molnar314ff782017-02-03 11:03:31 +0100645
646 /* Per-thread vma caching: */
647 struct vmacache vmacache;
648
KAMEZAWA Hiroyuki34e55232010-03-05 13:41:40 -0800649#if defined(SPLIT_RSS_COUNTING)
650 struct task_rss_stat rss_stat;
651#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652/* task state */
William Cohen97dc32c2007-05-08 00:23:41 -0700653 int exit_state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700654 int exit_code, exit_signal;
655 int pdeath_signal; /* The signal sent when the parent dies */
Palmer Dabbelte7cc4172015-04-30 21:19:55 -0700656 unsigned long jobctl; /* JOBCTL_*, siglock protected */
Andrei Epure9b89f6b2013-04-11 20:30:29 +0300657
658 /* Used for emulating ABI behavior of previous Linux versions */
William Cohen97dc32c2007-05-08 00:23:41 -0700659 unsigned int personality;
Andrei Epure9b89f6b2013-04-11 20:30:29 +0300660
Peter Zijlstrabe958bd2015-11-25 16:02:07 +0100661 /* scheduler bits, serialized by scheduler locks */
Lennart Poetteringca94c442009-06-15 17:17:47 +0200662 unsigned sched_reset_on_fork:1;
Peter Zijlstraa8e4f2e2011-04-05 17:23:49 +0200663 unsigned sched_contributes_to_load:1;
Peter Zijlstraff303e62015-04-17 20:05:30 +0200664 unsigned sched_migrated:1;
Peter Zijlstrab7e7ade2016-05-23 11:19:07 +0200665 unsigned sched_remote_wakeup:1;
Peter Zijlstrabe958bd2015-11-25 16:02:07 +0100666 unsigned :0; /* force alignment to the next boundary */
667
668 /* unserialized, strictly 'current' */
669 unsigned in_execve:1; /* bit to tell LSMs we're in execve */
670 unsigned in_iowait:1;
Andy Lutomirski7e781412016-08-02 14:05:36 -0700671#if !defined(TIF_RESTORE_SIGMASK)
672 unsigned restore_sigmask:1;
673#endif
Tejun Heo626ebc42015-11-05 18:46:09 -0800674#ifdef CONFIG_MEMCG
675 unsigned memcg_may_oom:1;
Johannes Weiner127424c2016-01-20 15:02:32 -0800676#ifndef CONFIG_SLOB
Vladimir Davydov6f185c22014-12-12 16:55:15 -0800677 unsigned memcg_kmem_skip_account:1;
678#endif
Johannes Weiner127424c2016-01-20 15:02:32 -0800679#endif
Peter Zijlstraff303e62015-04-17 20:05:30 +0200680#ifdef CONFIG_COMPAT_BRK
681 unsigned brk_randomized:1;
682#endif
Vladimir Davydov6f185c22014-12-12 16:55:15 -0800683
Kees Cook1d4457f2014-05-21 15:23:46 -0700684 unsigned long atomic_flags; /* Flags needing atomic access. */
685
Andy Lutomirskif56141e2015-02-12 15:01:14 -0800686 struct restart_block restart_block;
687
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688 pid_t pid;
689 pid_t tgid;
Arjan van de Ven0a4254052006-09-26 10:52:38 +0200690
Hiroshi Shimamoto13145622009-08-18 15:06:02 +0900691#ifdef CONFIG_CC_STACKPROTECTOR
Arjan van de Ven0a4254052006-09-26 10:52:38 +0200692 /* Canary value for the -fstack-protector gcc feature */
693 unsigned long stack_canary;
Hiroshi Shimamoto13145622009-08-18 15:06:02 +0900694#endif
Oleg Nesterov4d1d61a2012-05-11 10:59:08 +1000695 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696 * pointers to (original) parent process, youngest child, younger sibling,
Oleg Nesterov4d1d61a2012-05-11 10:59:08 +1000697 * older sibling, respectively. (p->father can be replaced with
Roland McGrathf4700212008-03-24 18:36:23 -0700698 * p->real_parent->pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700699 */
Kees Cookabd63bc2011-12-14 14:39:26 -0800700 struct task_struct __rcu *real_parent; /* real parent process */
701 struct task_struct __rcu *parent; /* recipient of SIGCHLD, wait4() reports */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700702 /*
Roland McGrathf4700212008-03-24 18:36:23 -0700703 * children/sibling forms the list of my natural children
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 */
705 struct list_head children; /* list of my children */
706 struct list_head sibling; /* linkage in my parent's children list */
707 struct task_struct *group_leader; /* threadgroup leader */
708
Roland McGrathf4700212008-03-24 18:36:23 -0700709 /*
710 * ptraced is the list of tasks this task is using ptrace on.
711 * This includes both natural children and PTRACE_ATTACH targets.
712 * p->ptrace_entry is p's link on the p->parent->ptraced list.
713 */
714 struct list_head ptraced;
715 struct list_head ptrace_entry;
716
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717 /* PID/PID hash table linkage. */
Eric W. Biederman92476d72006-03-31 02:31:42 -0800718 struct pid_link pids[PIDTYPE_MAX];
Oleg Nesterov47e65322006-03-28 16:11:25 -0800719 struct list_head thread_group;
Oleg Nesterov0c740d02014-01-21 15:49:56 -0800720 struct list_head thread_node;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721
722 struct completion *vfork_done; /* for vfork() */
723 int __user *set_child_tid; /* CLONE_CHILD_SETTID */
724 int __user *clear_child_tid; /* CLONE_CHILD_CLEARTID */
725
Frederic Weisbecker5613fda2017-01-31 04:09:23 +0100726 u64 utime, stime;
Stanislaw Gruszka40565b52016-11-15 03:06:51 +0100727#ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME
Frederic Weisbecker5613fda2017-01-31 04:09:23 +0100728 u64 utimescaled, stimescaled;
Stanislaw Gruszka40565b52016-11-15 03:06:51 +0100729#endif
Frederic Weisbecker16a6d9b2017-01-31 04:09:21 +0100730 u64 gtime;
Peter Zijlstra9d7fb042015-06-30 11:30:54 +0200731 struct prev_cputime prev_cputime;
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100732#ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
Frederic Weisbeckerb7ce2272015-11-19 16:47:34 +0100733 seqcount_t vtime_seqcount;
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100734 unsigned long long vtime_snap;
735 enum {
Frederic Weisbecker7098c1e2015-11-19 16:47:30 +0100736 /* Task is sleeping or running in a CPU with VTIME inactive */
737 VTIME_INACTIVE = 0,
738 /* Task runs in userspace in a CPU with VTIME active */
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100739 VTIME_USER,
Frederic Weisbecker7098c1e2015-11-19 16:47:30 +0100740 /* Task runs in kernelspace in a CPU with VTIME active */
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100741 VTIME_SYS,
742 } vtime_snap_whence;
743#endif
Frederic Weisbeckerd027d452015-06-07 15:54:30 +0200744
745#ifdef CONFIG_NO_HZ_FULL
Frederic Weisbeckerf009a7a2016-03-24 15:38:00 +0100746 atomic_t tick_dep_mask;
Frederic Weisbeckerd027d452015-06-07 15:54:30 +0200747#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748 unsigned long nvcsw, nivcsw; /* context switch counts */
Thomas Gleixnerccbf62d2014-07-16 21:04:34 +0000749 u64 start_time; /* monotonic time in nsec */
Thomas Gleixner57e0be02014-07-16 21:04:32 +0000750 u64 real_start_time; /* boot based time in nsec */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751/* mm fault and swap info: this can arguably be seen as either mm-specific or thread-specific */
752 unsigned long min_flt, maj_flt;
753
Nicolas Pitreb18b6a92017-01-21 00:09:08 -0500754#ifdef CONFIG_POSIX_TIMERS
Frank Mayharf06febc2008-09-12 09:54:39 -0700755 struct task_cputime cputime_expires;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700756 struct list_head cpu_timers[3];
Nicolas Pitreb18b6a92017-01-21 00:09:08 -0500757#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758
759/* process credentials */
Eric W. Biederman64b875f2016-11-14 18:48:07 -0600760 const struct cred __rcu *ptracer_cred; /* Tracer's credentials at attach */
Arnd Bergmann1b0ba1c2010-02-24 19:45:09 +0100761 const struct cred __rcu *real_cred; /* objective and real subjective task
David Howells3b11a1d2008-11-14 10:39:26 +1100762 * credentials (COW) */
Arnd Bergmann1b0ba1c2010-02-24 19:45:09 +0100763 const struct cred __rcu *cred; /* effective (overridable) subjective task
David Howells3b11a1d2008-11-14 10:39:26 +1100764 * credentials (COW) */
Paolo 'Blaisorblade' Giarrusso36772092005-05-05 16:16:12 -0700765 char comm[TASK_COMM_LEN]; /* executable name excluding path
766 - access with [gs]et_task_comm (which lock
767 it with task_lock())
Linus Torvalds221af7f2010-01-28 22:14:42 -0800768 - initialized normally by setup_new_exec */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700769/* file system info */
NeilBrown756daf22015-03-23 13:37:38 +1100770 struct nameidata *nameidata;
Alexey Dobriyan3d5b6fc2006-09-29 01:59:40 -0700771#ifdef CONFIG_SYSVIPC
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772/* ipc stuff */
773 struct sysv_sem sysvsem;
Jack Millerab602f72014-08-08 14:23:19 -0700774 struct sysv_shm sysvshm;
Alexey Dobriyan3d5b6fc2006-09-29 01:59:40 -0700775#endif
Mandeep Singh Bainese162b392009-01-15 11:08:40 -0800776#ifdef CONFIG_DETECT_HUNG_TASK
Ingo Molnar82a1fcb2008-01-25 21:08:02 +0100777/* hung task detection */
Ingo Molnar82a1fcb2008-01-25 21:08:02 +0100778 unsigned long last_switch_count;
779#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780/* filesystem information */
781 struct fs_struct *fs;
782/* open file information */
783 struct files_struct *files;
Serge E. Hallyn1651e142006-10-02 02:18:08 -0700784/* namespaces */
Serge E. Hallynab516012006-10-02 02:18:06 -0700785 struct nsproxy *nsproxy;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786/* signal handlers */
787 struct signal_struct *signal;
788 struct sighand_struct *sighand;
789
790 sigset_t blocked, real_blocked;
Roland McGrathf3de2722008-04-30 00:53:09 -0700791 sigset_t saved_sigmask; /* restored if set_restore_sigmask() was used */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792 struct sigpending pending;
793
794 unsigned long sas_ss_sp;
795 size_t sas_ss_size;
Stas Sergeev2a742132016-04-14 23:20:04 +0300796 unsigned sas_ss_flags;
Oleg Nesterov2e01fab2015-11-06 16:32:19 -0800797
Al Viro67d12142012-06-27 11:07:19 +0400798 struct callback_head *task_works;
Oleg Nesterove73f8952012-05-11 10:59:07 +1000799
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800 struct audit_context *audit_context;
Al Virobfef93a2008-01-10 04:53:18 -0500801#ifdef CONFIG_AUDITSYSCALL
Eric W. Biedermane1760bd2012-09-10 22:39:43 -0700802 kuid_t loginuid;
Eric Paris4746ec52008-01-08 10:06:53 -0500803 unsigned int sessionid;
Al Virobfef93a2008-01-10 04:53:18 -0500804#endif
Will Drewry932eceb2012-04-12 16:47:54 -0500805 struct seccomp seccomp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700806
807/* Thread group tracking */
808 u32 parent_exec_id;
809 u32 self_exec_id;
Miao Xie58568d22009-06-16 15:31:49 -0700810/* Protection of (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed,
811 * mempolicy */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700812 spinlock_t alloc_lock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700813
Ingo Molnarb29739f2006-06-27 02:54:51 -0700814 /* Protection of the PI data structures: */
Thomas Gleixner1d615482009-11-17 14:54:03 +0100815 raw_spinlock_t pi_lock;
Ingo Molnarb29739f2006-06-27 02:54:51 -0700816
Peter Zijlstra76751042015-05-01 08:27:50 -0700817 struct wake_q_node wake_q;
818
Ingo Molnar23f78d4a2006-06-27 02:54:53 -0700819#ifdef CONFIG_RT_MUTEXES
820 /* PI waiters blocked on a rt_mutex held by this task */
Peter Zijlstrafb00aca2013-11-07 14:43:43 +0100821 struct rb_root pi_waiters;
822 struct rb_node *pi_waiters_leftmost;
Ingo Molnar23f78d4a2006-06-27 02:54:53 -0700823 /* Deadlock detection and priority inheritance handling */
824 struct rt_mutex_waiter *pi_blocked_on;
Ingo Molnar23f78d4a2006-06-27 02:54:53 -0700825#endif
826
Ingo Molnar408894e2006-01-09 15:59:20 -0800827#ifdef CONFIG_DEBUG_MUTEXES
828 /* mutex deadlock detection */
829 struct mutex_waiter *blocked_on;
830#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700831#ifdef CONFIG_TRACE_IRQFLAGS
832 unsigned int irq_events;
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700833 unsigned long hardirq_enable_ip;
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700834 unsigned long hardirq_disable_ip;
Hiroshi Shimamotofa1452e2009-11-30 14:59:44 +0900835 unsigned int hardirq_enable_event;
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700836 unsigned int hardirq_disable_event;
Hiroshi Shimamotofa1452e2009-11-30 14:59:44 +0900837 int hardirqs_enabled;
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700838 int hardirq_context;
Hiroshi Shimamotofa1452e2009-11-30 14:59:44 +0900839 unsigned long softirq_disable_ip;
840 unsigned long softirq_enable_ip;
841 unsigned int softirq_disable_event;
842 unsigned int softirq_enable_event;
843 int softirqs_enabled;
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700844 int softirq_context;
845#endif
Ingo Molnarfbb9ce952006-07-03 00:24:50 -0700846#ifdef CONFIG_LOCKDEP
Peter Zijlstrabdb94412008-02-25 23:02:48 +0100847# define MAX_LOCK_DEPTH 48UL
Ingo Molnarfbb9ce952006-07-03 00:24:50 -0700848 u64 curr_chain_key;
849 int lockdep_depth;
Ingo Molnarfbb9ce952006-07-03 00:24:50 -0700850 unsigned int lockdep_recursion;
Richard Kennedyc7aceab2008-05-15 12:09:15 +0100851 struct held_lock held_locks[MAX_LOCK_DEPTH];
Nick Piggincf40bd12009-01-21 08:12:39 +0100852 gfp_t lockdep_reclaim_gfp;
Ingo Molnarfbb9ce952006-07-03 00:24:50 -0700853#endif
Andrey Ryabininc6d30852016-01-20 15:00:55 -0800854#ifdef CONFIG_UBSAN
855 unsigned int in_ubsan;
856#endif
Ingo Molnar408894e2006-01-09 15:59:20 -0800857
Linus Torvalds1da177e2005-04-16 15:20:36 -0700858/* journalling filesystem info */
859 void *journal_info;
860
Neil Brownd89d8792007-05-01 09:53:42 +0200861/* stacked block device info */
Akinobu Mitabddd87c2010-02-23 08:55:42 +0100862 struct bio_list *bio_list;
Neil Brownd89d8792007-05-01 09:53:42 +0200863
Jens Axboe73c10102011-03-08 13:19:51 +0100864#ifdef CONFIG_BLOCK
865/* stack plugging */
866 struct blk_plug *plug;
867#endif
868
Linus Torvalds1da177e2005-04-16 15:20:36 -0700869/* VM state */
870 struct reclaim_state *reclaim_state;
871
Linus Torvalds1da177e2005-04-16 15:20:36 -0700872 struct backing_dev_info *backing_dev_info;
873
874 struct io_context *io_context;
875
876 unsigned long ptrace_message;
877 siginfo_t *last_siginfo; /* For ptrace use. */
Andrew Morton7c3ab7382006-12-10 02:19:19 -0800878 struct task_io_accounting ioac;
Jay Lan8f0ab512006-09-30 23:28:59 -0700879#if defined(CONFIG_TASK_XACCT)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880 u64 acct_rss_mem1; /* accumulated rss usage */
881 u64 acct_vm_mem1; /* accumulated virtual memory usage */
Frederic Weisbecker605dc2b2017-01-31 04:09:30 +0100882 u64 acct_timexpd; /* stime + utime since last update */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700883#endif
884#ifdef CONFIG_CPUSETS
Miao Xie58568d22009-06-16 15:31:49 -0700885 nodemask_t mems_allowed; /* Protected by alloc_lock */
Mel Gormancc9a6c82012-03-21 16:34:11 -0700886 seqcount_t mems_allowed_seq; /* Seqence no to catch updates */
Paul Jackson825a46a2006-03-24 03:16:03 -0800887 int cpuset_mem_spread_rotor;
Jack Steiner6adef3e2010-05-26 14:42:49 -0700888 int cpuset_slab_spread_rotor;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700889#endif
Paul Menageddbcc7e2007-10-18 23:39:30 -0700890#ifdef CONFIG_CGROUPS
Paul Menage817929e2007-10-18 23:39:36 -0700891 /* Control Group info protected by css_set_lock */
Arnd Bergmann2c392b82010-02-24 19:41:39 +0100892 struct css_set __rcu *cgroups;
Paul Menage817929e2007-10-18 23:39:36 -0700893 /* cg_list protected by css_set_lock and tsk->alloc_lock */
894 struct list_head cg_list;
Paul Menageddbcc7e2007-10-18 23:39:30 -0700895#endif
Fenghua Yue02737d2016-10-28 15:04:46 -0700896#ifdef CONFIG_INTEL_RDT_A
897 int closid;
898#endif
Alexey Dobriyan42b2dd02007-10-16 23:27:30 -0700899#ifdef CONFIG_FUTEX
Ingo Molnar0771dfe2006-03-27 01:16:22 -0800900 struct robust_list_head __user *robust_list;
Ingo Molnar34f192c2006-03-27 01:16:24 -0800901#ifdef CONFIG_COMPAT
902 struct compat_robust_list_head __user *compat_robust_list;
903#endif
Ingo Molnarc87e2832006-06-27 02:54:58 -0700904 struct list_head pi_state_list;
905 struct futex_pi_state *pi_state_cache;
Alexey Dobriyan42b2dd02007-10-16 23:27:30 -0700906#endif
Ingo Molnarcdd6c482009-09-21 12:02:48 +0200907#ifdef CONFIG_PERF_EVENTS
Peter Zijlstra8dc85d5472010-09-02 16:50:03 +0200908 struct perf_event_context *perf_event_ctxp[perf_nr_task_contexts];
Ingo Molnarcdd6c482009-09-21 12:02:48 +0200909 struct mutex perf_event_mutex;
910 struct list_head perf_event_list;
Paul Mackerrasa63eaf32009-05-22 14:17:31 +1000911#endif
Thomas Gleixner8f47b182014-02-07 20:58:39 +0100912#ifdef CONFIG_DEBUG_PREEMPT
913 unsigned long preempt_disable_ip;
914#endif
Richard Kennedyc7aceab2008-05-15 12:09:15 +0100915#ifdef CONFIG_NUMA
Miao Xie58568d22009-06-16 15:31:49 -0700916 struct mempolicy *mempolicy; /* Protected by alloc_lock */
Richard Kennedyc7aceab2008-05-15 12:09:15 +0100917 short il_next;
Eric Dumazet207205a2011-03-22 16:30:44 -0700918 short pref_node_fork;
Richard Kennedyc7aceab2008-05-15 12:09:15 +0100919#endif
Peter Zijlstracbee9f82012-10-25 14:16:43 +0200920#ifdef CONFIG_NUMA_BALANCING
921 int numa_scan_seq;
Peter Zijlstracbee9f82012-10-25 14:16:43 +0200922 unsigned int numa_scan_period;
Mel Gorman598f0ec2013-10-07 11:28:55 +0100923 unsigned int numa_scan_period_max;
Rik van Rielde1c9ce62013-10-07 11:29:39 +0100924 int numa_preferred_nid;
Mel Gorman6b9a7462013-10-07 11:29:11 +0100925 unsigned long numa_migrate_retry;
Peter Zijlstracbee9f82012-10-25 14:16:43 +0200926 u64 node_stamp; /* migration stamp */
Rik van Riel7e2703e2014-01-27 17:03:45 -0500927 u64 last_task_numa_placement;
928 u64 last_sum_exec_runtime;
Peter Zijlstracbee9f82012-10-25 14:16:43 +0200929 struct callback_head numa_work;
Mel Gormanf809ca92013-10-07 11:28:57 +0100930
Peter Zijlstra8c8a7432013-10-07 11:29:21 +0100931 struct list_head numa_entry;
932 struct numa_group *numa_group;
933
Mel Gorman745d6142013-10-07 11:28:59 +0100934 /*
Iulia Manda44dba3d2014-10-31 02:13:31 +0200935 * numa_faults is an array split into four regions:
936 * faults_memory, faults_cpu, faults_memory_buffer, faults_cpu_buffer
937 * in this precise order.
938 *
939 * faults_memory: Exponential decaying average of faults on a per-node
940 * basis. Scheduling placement decisions are made based on these
941 * counts. The values remain static for the duration of a PTE scan.
942 * faults_cpu: Track the nodes the process was running on when a NUMA
943 * hinting fault was incurred.
944 * faults_memory_buffer and faults_cpu_buffer: Record faults per node
945 * during the current scan window. When the scan completes, the counts
946 * in faults_memory and faults_cpu decay and these values are copied.
Mel Gorman745d6142013-10-07 11:28:59 +0100947 */
Iulia Manda44dba3d2014-10-31 02:13:31 +0200948 unsigned long *numa_faults;
Mel Gorman83e1d2c2013-10-07 11:29:27 +0100949 unsigned long total_numa_faults;
Mel Gorman745d6142013-10-07 11:28:59 +0100950
951 /*
Rik van Riel04bb2f92013-10-07 11:29:36 +0100952 * numa_faults_locality tracks if faults recorded during the last
Mel Gorman074c2382015-03-25 15:55:42 -0700953 * scan window were remote/local or failed to migrate. The task scan
954 * period is adapted based on the locality of the faults with different
955 * weights depending on whether they were shared or private faults
Rik van Riel04bb2f92013-10-07 11:29:36 +0100956 */
Mel Gorman074c2382015-03-25 15:55:42 -0700957 unsigned long numa_faults_locality[3];
Rik van Riel04bb2f92013-10-07 11:29:36 +0100958
Ingo Molnarb32e86b2013-10-07 11:29:30 +0100959 unsigned long numa_pages_migrated;
Peter Zijlstracbee9f82012-10-25 14:16:43 +0200960#endif /* CONFIG_NUMA_BALANCING */
961
Mel Gorman72b252a2015-09-04 15:47:32 -0700962#ifdef CONFIG_ARCH_WANT_BATCHED_UNMAP_TLB_FLUSH
963 struct tlbflush_unmap_batch tlb_ubc;
964#endif
965
Ingo Molnare56d0902006-01-08 01:01:37 -0800966 struct rcu_head rcu;
Jens Axboeb92ce552006-04-11 13:52:07 +0200967
968 /*
969 * cache last used pipe for splice
970 */
971 struct pipe_inode_info *splice_pipe;
Eric Dumazet5640f762012-09-23 23:04:42 +0000972
973 struct page_frag task_frag;
974
Ingo Molnar47913d42017-02-01 18:00:26 +0100975#ifdef CONFIG_TASK_DELAY_ACCT
976 struct task_delay_info *delays;
Shailabh Nagarca74e922006-07-14 00:24:36 -0700977#endif
Ingo Molnar47913d42017-02-01 18:00:26 +0100978
Akinobu Mitaf4f154f2006-12-08 02:39:47 -0800979#ifdef CONFIG_FAULT_INJECTION
980 int make_it_fail;
981#endif
Wu Fengguang9d823e82011-06-11 18:10:12 -0600982 /*
983 * when (nr_dirtied >= nr_dirtied_pause), it's time to call
984 * balance_dirty_pages() for some dirty throttling pause
985 */
986 int nr_dirtied;
987 int nr_dirtied_pause;
Wu Fengguang83712352011-06-11 19:25:42 -0600988 unsigned long dirty_paused_when; /* start of a write-and-pause period */
Wu Fengguang9d823e82011-06-11 18:10:12 -0600989
Arjan van de Ven97455122008-01-25 21:08:34 +0100990#ifdef CONFIG_LATENCYTOP
991 int latency_record_count;
992 struct latency_record latency_record[LT_SAVECOUNT];
993#endif
Arjan van de Ven69766752008-09-01 15:52:40 -0700994 /*
995 * time slack values; these are used to round up poll() and
996 * select() etc timeout values. These are in nanoseconds.
997 */
John Stultzda8b44d2016-03-17 14:20:51 -0700998 u64 timer_slack_ns;
999 u64 default_timer_slack_ns;
David Millerf8d570a2008-11-06 00:37:40 -08001000
Andrey Ryabinin0b24bec2015-02-13 14:39:17 -08001001#ifdef CONFIG_KASAN
1002 unsigned int kasan_depth;
1003#endif
Frederic Weisbeckerfb526072008-11-25 21:07:04 +01001004#ifdef CONFIG_FUNCTION_GRAPH_TRACER
Daniel Mack3ad2f3fb2010-02-03 08:01:28 +08001005 /* Index of current stored address in ret_stack */
Frederic Weisbeckerf201ae22008-11-23 06:22:56 +01001006 int curr_ret_stack;
1007 /* Stack of return addresses for return function tracing */
1008 struct ftrace_ret_stack *ret_stack;
Steven Rostedt8aef2d22009-03-24 01:10:15 -04001009 /* time stamp for last schedule */
1010 unsigned long long ftrace_timestamp;
Frederic Weisbeckerf201ae22008-11-23 06:22:56 +01001011 /*
1012 * Number of functions that haven't been traced
1013 * because of depth overrun.
1014 */
1015 atomic_t trace_overrun;
Frederic Weisbecker380c4b12008-12-06 03:43:41 +01001016 /* Pause for the tracing */
1017 atomic_t tracing_graph_pause;
Frederic Weisbeckerf201ae22008-11-23 06:22:56 +01001018#endif
Steven Rostedtea4e2bc2008-12-03 15:36:57 -05001019#ifdef CONFIG_TRACING
1020 /* state flags for use by tracers */
1021 unsigned long trace;
Steven Rostedtb1cff0a2011-05-25 14:27:43 -04001022 /* bitmask and counter of trace recursion */
Steven Rostedt261842b2009-04-16 21:41:52 -04001023 unsigned long trace_recursion;
1024#endif /* CONFIG_TRACING */
Dmitry Vyukov5c9a8752016-03-22 14:27:30 -07001025#ifdef CONFIG_KCOV
1026 /* Coverage collection mode enabled for this task (0 if disabled). */
1027 enum kcov_mode kcov_mode;
1028 /* Size of the kcov_area. */
1029 unsigned kcov_size;
1030 /* Buffer for coverage collection. */
1031 void *kcov_area;
1032 /* kcov descriptor wired with this task or NULL. */
1033 struct kcov *kcov;
1034#endif
Vladimir Davydov6f185c22014-12-12 16:55:15 -08001035#ifdef CONFIG_MEMCG
Tejun Heo626ebc42015-11-05 18:46:09 -08001036 struct mem_cgroup *memcg_in_oom;
1037 gfp_t memcg_oom_gfp_mask;
1038 int memcg_oom_order;
Tejun Heob23afb92015-11-05 18:46:11 -08001039
1040 /* number of pages to reclaim on returning to userland */
1041 unsigned int memcg_nr_pages_over_high;
KAMEZAWA Hiroyuki569b8462009-12-15 16:47:03 -08001042#endif
Srikar Dronamraju0326f5a2012-03-13 23:30:11 +05301043#ifdef CONFIG_UPROBES
1044 struct uprobe_task *utask;
Srikar Dronamraju0326f5a2012-03-13 23:30:11 +05301045#endif
Kent Overstreetcafe5632013-03-23 16:11:31 -07001046#if defined(CONFIG_BCACHE) || defined(CONFIG_BCACHE_MODULE)
1047 unsigned int sequential_io;
1048 unsigned int sequential_io_avg;
1049#endif
Peter Zijlstra8eb23b92014-09-24 10:18:55 +02001050#ifdef CONFIG_DEBUG_ATOMIC_SLEEP
1051 unsigned long task_state_change;
1052#endif
David Hildenbrand8bcbde52015-05-11 17:52:06 +02001053 int pagefault_disabled;
Michal Hocko03049262016-03-25 14:20:33 -07001054#ifdef CONFIG_MMU
Vladimir Davydov29c696e2016-03-25 14:20:39 -07001055 struct task_struct *oom_reaper_list;
Michal Hocko03049262016-03-25 14:20:33 -07001056#endif
Andy Lutomirskiba14a192016-08-11 02:35:21 -07001057#ifdef CONFIG_VMAP_STACK
1058 struct vm_struct *stack_vm_area;
1059#endif
Andy Lutomirski68f24b082016-09-15 22:45:48 -07001060#ifdef CONFIG_THREAD_INFO_IN_TASK
1061 /* A live task holds one reference. */
1062 atomic_t stack_refcount;
1063#endif
Dave Hansen0c8c0f02015-07-17 12:28:11 +02001064/* CPU-specific state of this task */
1065 struct thread_struct thread;
1066/*
1067 * WARNING: on x86, 'thread_struct' contains a variable-sized
1068 * structure. It *MUST* be at the end of 'task_struct'.
1069 *
1070 * Do not put anything below here!
1071 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072};
1073
Alexey Dobriyane8681712007-10-26 12:17:22 +04001074static inline struct pid *task_pid(struct task_struct *task)
Eric W. Biederman22c935f2006-10-02 02:17:09 -07001075{
1076 return task->pids[PIDTYPE_PID].pid;
1077}
1078
Alexey Dobriyane8681712007-10-26 12:17:22 +04001079static inline struct pid *task_tgid(struct task_struct *task)
Eric W. Biederman22c935f2006-10-02 02:17:09 -07001080{
1081 return task->group_leader->pids[PIDTYPE_PID].pid;
1082}
1083
Oleg Nesterov6dda81f2009-04-02 16:58:35 -07001084/*
1085 * Without tasklist or rcu lock it is not safe to dereference
1086 * the result of task_pgrp/task_session even if task == current,
1087 * we can race with another thread doing sys_setsid/sys_setpgid.
1088 */
Alexey Dobriyane8681712007-10-26 12:17:22 +04001089static inline struct pid *task_pgrp(struct task_struct *task)
Eric W. Biederman22c935f2006-10-02 02:17:09 -07001090{
1091 return task->group_leader->pids[PIDTYPE_PGID].pid;
1092}
1093
Alexey Dobriyane8681712007-10-26 12:17:22 +04001094static inline struct pid *task_session(struct task_struct *task)
Eric W. Biederman22c935f2006-10-02 02:17:09 -07001095{
1096 return task->group_leader->pids[PIDTYPE_SID].pid;
1097}
1098
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001099/*
1100 * the helpers to get the task's different pids as they are seen
1101 * from various namespaces
1102 *
1103 * task_xid_nr() : global id, i.e. the id seen from the init namespace;
Eric W. Biederman44c4e1b2008-02-08 04:19:15 -08001104 * task_xid_vnr() : virtual id, i.e. the id seen from the pid namespace of
1105 * current.
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001106 * task_xid_nr_ns() : id seen from the ns specified;
1107 *
1108 * set_task_vxid() : assigns a virtual id to a task;
1109 *
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001110 * see also pid_nr() etc in include/linux/pid.h
1111 */
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001112pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type,
1113 struct pid_namespace *ns);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001114
Alexey Dobriyane8681712007-10-26 12:17:22 +04001115static inline pid_t task_pid_nr(struct task_struct *tsk)
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001116{
1117 return tsk->pid;
1118}
1119
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001120static inline pid_t task_pid_nr_ns(struct task_struct *tsk,
1121 struct pid_namespace *ns)
1122{
1123 return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
1124}
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001125
1126static inline pid_t task_pid_vnr(struct task_struct *tsk)
1127{
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001128 return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001129}
1130
1131
Alexey Dobriyane8681712007-10-26 12:17:22 +04001132static inline pid_t task_tgid_nr(struct task_struct *tsk)
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001133{
1134 return tsk->tgid;
1135}
1136
Pavel Emelyanov2f2a3a42007-10-18 23:40:19 -07001137pid_t task_tgid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001138
1139static inline pid_t task_tgid_vnr(struct task_struct *tsk)
1140{
1141 return pid_vnr(task_tgid(tsk));
1142}
1143
1144
Richard Guy Briggs80e0b6e2014-03-16 14:00:19 -04001145static inline int pid_alive(const struct task_struct *p);
Richard Guy Briggsad36d282013-08-15 18:05:12 -04001146static inline pid_t task_ppid_nr_ns(const struct task_struct *tsk, struct pid_namespace *ns)
1147{
1148 pid_t pid = 0;
1149
1150 rcu_read_lock();
1151 if (pid_alive(tsk))
1152 pid = task_tgid_nr_ns(rcu_dereference(tsk->real_parent), ns);
1153 rcu_read_unlock();
1154
1155 return pid;
1156}
1157
1158static inline pid_t task_ppid_nr(const struct task_struct *tsk)
1159{
1160 return task_ppid_nr_ns(tsk, &init_pid_ns);
1161}
1162
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001163static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk,
1164 struct pid_namespace *ns)
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001165{
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001166 return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001167}
1168
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001169static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
1170{
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001171 return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001172}
1173
1174
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001175static inline pid_t task_session_nr_ns(struct task_struct *tsk,
1176 struct pid_namespace *ns)
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001177{
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001178 return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001179}
1180
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001181static inline pid_t task_session_vnr(struct task_struct *tsk)
1182{
Oleg Nesterov52ee2df2009-04-02 16:58:38 -07001183 return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001184}
1185
Oleg Nesterov1b0f7ff2009-04-02 16:58:39 -07001186/* obsolete, do not use */
1187static inline pid_t task_pgrp_nr(struct task_struct *tsk)
1188{
1189 return task_pgrp_nr_ns(tsk, &init_pid_ns);
1190}
Pavel Emelyanov7af57292007-10-18 23:40:06 -07001191
Linus Torvalds1da177e2005-04-16 15:20:36 -07001192/**
1193 * pid_alive - check that a task structure is not stale
1194 * @p: Task structure to be checked.
1195 *
1196 * Test if a process is not yet dead (at most zombie state)
1197 * If pid_alive fails, then pointers within the task structure
1198 * can be stale and must not be dereferenced.
Yacine Belkadie69f6182013-07-12 20:45:47 +02001199 *
1200 * Return: 1 if the process is alive. 0 otherwise.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201 */
Richard Guy Briggsad36d282013-08-15 18:05:12 -04001202static inline int pid_alive(const struct task_struct *p)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001203{
Eric W. Biederman92476d72006-03-31 02:31:42 -08001204 return p->pids[PIDTYPE_PID].pid != NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001205}
1206
Sukadev Bhattiproluf400e192006-09-29 02:00:07 -07001207/**
Sergey Senozhatsky570f5242016-01-01 23:03:01 +09001208 * is_global_init - check if a task structure is init. Since init
1209 * is free to have sub-threads we need to check tgid.
Henne32602592006-10-06 00:44:01 -07001210 * @tsk: Task structure to be checked.
1211 *
1212 * Check if a task structure is the first user space task the kernel created.
Yacine Belkadie69f6182013-07-12 20:45:47 +02001213 *
1214 * Return: 1 if the task structure is init. 0 otherwise.
Sukadev Bhattiproluf400e192006-09-29 02:00:07 -07001215 */
Alexey Dobriyane8681712007-10-26 12:17:22 +04001216static inline int is_global_init(struct task_struct *tsk)
Pavel Emelyanovb461cc02007-10-18 23:40:09 -07001217{
Sergey Senozhatsky570f5242016-01-01 23:03:01 +09001218 return task_tgid_nr(tsk) == 1;
Pavel Emelyanovb461cc02007-10-18 23:40:09 -07001219}
Serge E. Hallynb460cbc2007-10-18 23:39:52 -07001220
Cedric Le Goater9ec52092006-10-02 02:19:00 -07001221extern struct pid *cad_pid;
1222
Linus Torvalds1da177e2005-04-16 15:20:36 -07001223extern void free_task(struct task_struct *tsk);
/*
 * get_task_struct - take a reference on @tsk by atomically incrementing
 * its ->usage counter. Wrapped in do { } while (0) so the macro behaves
 * as a single statement; @tsk is evaluated exactly once.
 */
#define get_task_struct(tsk)			\
	do {					\
		atomic_inc(&(tsk)->usage);	\
	} while (0)
Ingo Molnare56d0902006-01-08 01:01:37 -08001225
Andrew Morton158d9eb2006-03-31 02:31:34 -08001226extern void __put_task_struct(struct task_struct *t);
Ingo Molnare56d0902006-01-08 01:01:37 -08001227
1228static inline void put_task_struct(struct task_struct *t)
1229{
1230 if (atomic_dec_and_test(&t->usage))
Eric W. Biederman8c7904a2006-03-31 02:31:37 -08001231 __put_task_struct(t);
Ingo Molnare56d0902006-01-08 01:01:37 -08001232}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001233
Oleg Nesterov150593b2016-05-18 19:02:18 +02001234struct task_struct *task_rcu_dereference(struct task_struct **ptask);
1235struct task_struct *try_get_task_struct(struct task_struct **ptask);
1236
Frederic Weisbecker6a616712012-12-16 20:00:34 +01001237#ifdef CONFIG_VIRT_CPU_ACCOUNTING_GEN
1238extern void task_cputime(struct task_struct *t,
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001239 u64 *utime, u64 *stime);
Frederic Weisbecker16a6d9b2017-01-31 04:09:21 +01001240extern u64 task_gtime(struct task_struct *t);
Frederic Weisbecker6a616712012-12-16 20:00:34 +01001241#else
Frederic Weisbecker6fac4822012-11-13 14:20:55 +01001242static inline void task_cputime(struct task_struct *t,
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001243 u64 *utime, u64 *stime)
Frederic Weisbecker6fac4822012-11-13 14:20:55 +01001244{
Stanislaw Gruszka353c50e2016-11-15 03:06:52 +01001245 *utime = t->utime;
1246 *stime = t->stime;
Frederic Weisbecker6fac4822012-11-13 14:20:55 +01001247}
Frederic Weisbecker6a616712012-12-16 20:00:34 +01001248
Frederic Weisbecker16a6d9b2017-01-31 04:09:21 +01001249static inline u64 task_gtime(struct task_struct *t)
Frederic Weisbecker6a616712012-12-16 20:00:34 +01001250{
1251 return t->gtime;
1252}
1253#endif
Stanislaw Gruszka40565b52016-11-15 03:06:51 +01001254
1255#ifdef CONFIG_ARCH_HAS_SCALED_CPUTIME
Jens Axboeb31dc662006-06-13 08:26:10 +02001256static inline void task_cputime_scaled(struct task_struct *t,
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001257 u64 *utimescaled,
1258 u64 *stimescaled)
Jens Axboeb31dc662006-06-13 08:26:10 +02001259{
Stanislaw Gruszka353c50e2016-11-15 03:06:52 +01001260 *utimescaled = t->utimescaled;
1261 *stimescaled = t->stimescaled;
Tejun Heo58a69cb2011-02-16 09:25:31 +01001262}
Stanislaw Gruszka40565b52016-11-15 03:06:51 +01001263#else
1264static inline void task_cputime_scaled(struct task_struct *t,
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001265 u64 *utimescaled,
1266 u64 *stimescaled)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267{
Stanislaw Gruszka40565b52016-11-15 03:06:51 +01001268 task_cputime(t, utimescaled, stimescaled);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001269}
1270#endif
Stanislaw Gruszka40565b52016-11-15 03:06:51 +01001271
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001272extern void task_cputime_adjusted(struct task_struct *p, u64 *ut, u64 *st);
1273extern void thread_group_cputime_adjusted(struct task_struct *p, u64 *ut, u64 *st);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001274
/*
 * Per process flags
 *
 * One bit per flag. Bits 0x00000001, 0x01000000, 0x02000000 and
 * 0x10000000 are not assigned in this list.
 */
#define PF_IDLE			0x00000002	/* I am an IDLE thread */
#define PF_EXITING		0x00000004	/* Getting shut down */
#define PF_EXITPIDONE		0x00000008	/* PI exit done on shut down */
#define PF_VCPU			0x00000010	/* I'm a virtual CPU */
#define PF_WQ_WORKER		0x00000020	/* I'm a workqueue worker */
#define PF_FORKNOEXEC		0x00000040	/* Forked but didn't exec */
#define PF_MCE_PROCESS		0x00000080	/* Process policy on mce errors */
#define PF_SUPERPRIV		0x00000100	/* Used super-user privileges */
#define PF_DUMPCORE		0x00000200	/* Dumped core */
#define PF_SIGNALED		0x00000400	/* Killed by a signal */
#define PF_MEMALLOC		0x00000800	/* Allocating memory */
#define PF_NPROC_EXCEEDED	0x00001000	/* set_user() noticed that RLIMIT_NPROC was exceeded */
#define PF_USED_MATH		0x00002000	/* If unset the fpu must be initialized before use */
#define PF_USED_ASYNC		0x00004000	/* Used async_schedule*(), used by module init */
#define PF_NOFREEZE		0x00008000	/* This thread should not be frozen */
#define PF_FROZEN		0x00010000	/* Frozen for system suspend */
#define PF_FSTRANS		0x00020000	/* Inside a filesystem transaction */
#define PF_KSWAPD		0x00040000	/* I am kswapd */
#define PF_MEMALLOC_NOIO	0x00080000	/* Allocating memory without IO involved */
#define PF_LESS_THROTTLE	0x00100000	/* Throttle me less: I clean memory */
#define PF_KTHREAD		0x00200000	/* I am a kernel thread */
#define PF_RANDOMIZE		0x00400000	/* Randomize virtual address space */
#define PF_SWAPWRITE		0x00800000	/* Allowed to write to swap */
#define PF_NO_SETAFFINITY	0x04000000	/* Userland is not allowed to meddle with cpus_allowed */
#define PF_MCE_EARLY		0x08000000	/* Early kill for mce process policy */
#define PF_MUTEX_TESTER		0x20000000	/* Thread belongs to the rt mutex tester */
#define PF_FREEZER_SKIP		0x40000000	/* Freezer should not count it as freezable */
#define PF_SUSPEND_TASK		0x80000000	/* This thread called freeze_processes() and should not be frozen */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001306
/*
 * Only the _current_ task can read/write to tsk->flags, but other
 * tasks can access tsk->flags in readonly mode, for example with
 * tsk_used_math (like during threaded core dumping).
 *
 * There is however an exception to this rule during ptrace or during
 * fork: the ptracer task is allowed to write to the child->flags of its
 * traced child (same goes for fork, the parent can write to the
 * child->flags), because we're guaranteed the child is not running and
 * in turn not changing child->flags at the same time the parent does it.
 *
 * Note that the conditional/copy helpers below evaluate @child twice.
 */
#define clear_stopped_child_used_math(child)		\
	do {						\
		(child)->flags &= ~PF_USED_MATH;	\
	} while (0)
#define set_stopped_child_used_math(child)		\
	do {						\
		(child)->flags |= PF_USED_MATH;		\
	} while (0)
#define clear_used_math()	clear_stopped_child_used_math(current)
#define set_used_math()		set_stopped_child_used_math(current)
#define conditional_stopped_child_used_math(condition, child)		\
	do {								\
		(child)->flags &= ~PF_USED_MATH;			\
		(child)->flags |= (condition) ? PF_USED_MATH : 0;	\
	} while (0)
#define conditional_used_math(condition)				\
	conditional_stopped_child_used_math(condition, current)
#define copy_to_stopped_child_used_math(child)				\
	do {								\
		(child)->flags &= ~PF_USED_MATH;			\
		(child)->flags |= current->flags & PF_USED_MATH;	\
	} while (0)
/* NOTE: this will return 0 or PF_USED_MATH, it will never return 1 */
#define tsk_used_math(p)	((p)->flags & PF_USED_MATH)
#define used_math()		tsk_used_math(current)
1331
/*
 * Per-process atomic flags.
 *
 * These are bit numbers (not masks); the accessors generated by the
 * TASK_PFA_*() macros pass them to test_bit()/set_bit()/clear_bit().
 */
#define PFA_NO_NEW_PRIVS	0	/* May not gain new privileges. */
#define PFA_SPREAD_PAGE		1	/* Spread page cache over cpuset */
#define PFA_SPREAD_SLAB		2	/* Spread some slab caches over cpuset */
#define PFA_LMK_WAITING		3	/* Lowmemorykiller is waiting */
Kees Cook1d4457f2014-05-21 15:23:46 -07001337
Kees Cook1d4457f2014-05-21 15:23:46 -07001338
Zefan Lie0e50702014-09-25 09:40:40 +08001339#define TASK_PFA_TEST(name, func) \
1340 static inline bool task_##func(struct task_struct *p) \
1341 { return test_bit(PFA_##name, &p->atomic_flags); }
1342#define TASK_PFA_SET(name, func) \
1343 static inline void task_set_##func(struct task_struct *p) \
1344 { set_bit(PFA_##name, &p->atomic_flags); }
1345#define TASK_PFA_CLEAR(name, func) \
1346 static inline void task_clear_##func(struct task_struct *p) \
1347 { clear_bit(PFA_##name, &p->atomic_flags); }
Kees Cook1d4457f2014-05-21 15:23:46 -07001348
Zefan Lie0e50702014-09-25 09:40:40 +08001349TASK_PFA_TEST(NO_NEW_PRIVS, no_new_privs)
1350TASK_PFA_SET(NO_NEW_PRIVS, no_new_privs)
Kees Cook1d4457f2014-05-21 15:23:46 -07001351
Zefan Li2ad654b2014-09-25 09:41:02 +08001352TASK_PFA_TEST(SPREAD_PAGE, spread_page)
1353TASK_PFA_SET(SPREAD_PAGE, spread_page)
1354TASK_PFA_CLEAR(SPREAD_PAGE, spread_page)
1355
1356TASK_PFA_TEST(SPREAD_SLAB, spread_slab)
1357TASK_PFA_SET(SPREAD_SLAB, spread_slab)
1358TASK_PFA_CLEAR(SPREAD_SLAB, spread_slab)
Tejun Heo544b2c92011-06-14 11:20:18 +02001359
Tetsuo Handa77ed2c52016-03-08 20:01:32 +09001360TASK_PFA_TEST(LMK_WAITING, lmk_waiting)
1361TASK_PFA_SET(LMK_WAITING, lmk_waiting)
1362
Mel Gorman907aed42012-07-31 16:44:07 -07001363static inline void tsk_restore_flags(struct task_struct *task,
1364 unsigned long orig_flags, unsigned long flags)
1365{
1366 task->flags &= ~flags;
1367 task->flags |= orig_flags & flags;
1368}
1369
Juri Lellif82f8042014-10-07 09:52:11 +01001370extern int cpuset_cpumask_can_shrink(const struct cpumask *cur,
1371 const struct cpumask *trial);
Juri Lelli7f514122014-09-19 10:22:40 +01001372extern int task_can_attach(struct task_struct *p,
1373 const struct cpumask *cs_cpus_allowed);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001374#ifdef CONFIG_SMP
KOSAKI Motohiro1e1b6c512011-05-19 15:08:58 +09001375extern void do_set_cpus_allowed(struct task_struct *p,
1376 const struct cpumask *new_mask);
1377
Mike Traviscd8ba7c2008-03-26 14:23:49 -07001378extern int set_cpus_allowed_ptr(struct task_struct *p,
Rusty Russell96f874e22008-11-25 02:35:14 +10301379 const struct cpumask *new_mask);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001380#else
KOSAKI Motohiro1e1b6c512011-05-19 15:08:58 +09001381static inline void do_set_cpus_allowed(struct task_struct *p,
1382 const struct cpumask *new_mask)
1383{
1384}
Mike Traviscd8ba7c2008-03-26 14:23:49 -07001385static inline int set_cpus_allowed_ptr(struct task_struct *p,
Rusty Russell96f874e22008-11-25 02:35:14 +10301386 const struct cpumask *new_mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387{
Rusty Russell96f874e22008-11-25 02:35:14 +10301388 if (!cpumask_test_cpu(0, new_mask))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001389 return -EINVAL;
1390 return 0;
1391}
1392#endif
Rusty Russelle0ad9552009-09-24 09:34:38 -06001393
/* Fall back to cpu_relax() when no cpu_relax_yield() has been defined yet. */
#ifndef cpu_relax_yield
# define cpu_relax_yield()	cpu_relax()
#endif

extern unsigned long long task_sched_runtime(struct task_struct *task);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001400
/*
 * sched_exec is called by processes performing an exec.
 *
 * Without CONFIG_SMP it expands to an empty statement. The do/while (0)
 * form is used instead of a bare "{}" so that "sched_exec();" is exactly
 * one statement and stays valid as the unbraced body of an if/else.
 */
#ifdef CONFIG_SMP
extern void sched_exec(void);
#else
#define sched_exec()	do { } while (0)
#endif
1407
Dan Carpenterfa933842014-05-23 13:20:42 +03001408extern int yield_to(struct task_struct *p, bool preempt);
Ingo Molnar36c8b582006-07-03 00:25:41 -07001409extern void set_user_nice(struct task_struct *p, long nice);
1410extern int task_prio(const struct task_struct *p);
Dongsheng Yangd0ea0262014-01-27 22:00:45 -05001411/**
1412 * task_nice - return the nice value of a given task.
1413 * @p: the task in question.
1414 *
1415 * Return: The nice value [ -20 ... 0 ... 19 ].
1416 */
1417static inline int task_nice(const struct task_struct *p)
1418{
1419 return PRIO_TO_NICE((p)->static_prio);
1420}
Ingo Molnar36c8b582006-07-03 00:25:41 -07001421extern int can_nice(const struct task_struct *p, const int nice);
1422extern int task_curr(const struct task_struct *p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001423extern int idle_cpu(int cpu);
KOSAKI Motohirofe7de492010-10-20 16:01:12 -07001424extern int sched_setscheduler(struct task_struct *, int,
1425 const struct sched_param *);
Rusty Russell961ccdd2008-06-23 13:55:38 +10001426extern int sched_setscheduler_nocheck(struct task_struct *, int,
KOSAKI Motohirofe7de492010-10-20 16:01:12 -07001427 const struct sched_param *);
Dario Faggiolid50dde52013-11-07 14:43:36 +01001428extern int sched_setattr(struct task_struct *,
1429 const struct sched_attr *);
Ingo Molnar36c8b582006-07-03 00:25:41 -07001430extern struct task_struct *idle_task(int cpu);
Paul E. McKenneyc4f30602011-11-10 12:41:56 -08001431/**
1432 * is_idle_task - is the specified task an idle task?
Randy Dunlapfa757282012-01-21 11:03:13 -08001433 * @p: the task in question.
Yacine Belkadie69f6182013-07-12 20:45:47 +02001434 *
1435 * Return: 1 if @p is an idle task. 0 otherwise.
Paul E. McKenneyc4f30602011-11-10 12:41:56 -08001436 */
Paul E. McKenney7061ca32011-12-20 08:20:46 -08001437static inline bool is_idle_task(const struct task_struct *p)
Paul E. McKenneyc4f30602011-11-10 12:41:56 -08001438{
Peter Zijlstrac1de45c2016-11-28 23:03:05 -08001439 return !!(p->flags & PF_IDLE);
Paul E. McKenneyc4f30602011-11-10 12:41:56 -08001440}
Ingo Molnar36c8b582006-07-03 00:25:41 -07001441extern struct task_struct *curr_task(int cpu);
Peter Zijlstraa458ae22016-09-20 20:29:40 +02001442extern void ia64_set_curr_task(int cpu, struct task_struct *p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001443
1444void yield(void);
1445
Linus Torvalds1da177e2005-04-16 15:20:36 -07001446union thread_union {
Andy Lutomirskic65eacb2016-09-13 14:29:24 -07001447#ifndef CONFIG_THREAD_INFO_IN_TASK
Linus Torvalds1da177e2005-04-16 15:20:36 -07001448 struct thread_info thread_info;
Andy Lutomirskic65eacb2016-09-13 14:29:24 -07001449#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001450 unsigned long stack[THREAD_SIZE/sizeof(long)];
1451};
1452
#ifdef CONFIG_THREAD_INFO_IN_TASK
/* thread_info is a member of the task_struct: return its address. */
static inline struct thread_info *task_thread_info(struct task_struct *task)
{
	struct thread_info *ti = &task->thread_info;

	return ti;
}
#elif !defined(__HAVE_THREAD_FUNCTIONS)
/* Otherwise task->stack is reinterpreted as the thread_info pointer. */
# define task_thread_info(task)	((struct thread_info *)(task)->stack)
#endif
1461
Linus Torvalds1da177e2005-04-16 15:20:36 -07001462#ifndef __HAVE_ARCH_KSTACK_END
1463static inline int kstack_end(void *addr)
1464{
1465 /* Reliable end of stack detection:
1466 * Some APM bios versions misalign the stack
1467 */
1468 return !(((unsigned long)addr+sizeof(void*)-1) & (THREAD_SIZE-sizeof(void*)));
1469}
1470#endif
1471
1472extern union thread_union init_thread_union;
1473extern struct task_struct init_task;
1474
Pavel Emelyanov198fe212007-10-18 23:40:06 -07001475extern struct pid_namespace init_pid_ns;
1476
1477/*
1478 * find a task by one of its numerical ids
1479 *
Pavel Emelyanov198fe212007-10-18 23:40:06 -07001480 * find_task_by_pid_ns():
1481 * finds a task by its pid in the specified namespace
Pavel Emelyanov228ebcb2007-10-18 23:40:16 -07001482 * find_task_by_vpid():
1483 * finds a task by its virtual pid
Pavel Emelyanov198fe212007-10-18 23:40:06 -07001484 *
Pavel Emelyanove49859e2008-07-25 01:48:36 -07001485 * see also find_vpid() etc in include/linux/pid.h
Pavel Emelyanov198fe212007-10-18 23:40:06 -07001486 */
1487
Pavel Emelyanov228ebcb2007-10-18 23:40:16 -07001488extern struct task_struct *find_task_by_vpid(pid_t nr);
1489extern struct task_struct *find_task_by_pid_ns(pid_t nr,
1490 struct pid_namespace *ns);
Pavel Emelyanov198fe212007-10-18 23:40:06 -07001491
extern int wake_up_state(struct task_struct *tsk, unsigned int state);
extern int wake_up_process(struct task_struct *tsk);
extern void wake_up_new_task(struct task_struct *tsk);

#ifdef CONFIG_SMP
extern void kick_process(struct task_struct *tsk);
#else
/* Stub for !CONFIG_SMP builds: does nothing. */
static inline void kick_process(struct task_struct *tsk)
{
}
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001500
Linus Torvalds1da177e2005-04-16 15:20:36 -07001501extern void exit_files(struct task_struct *);
Oleg Nesterovcbaffba2008-05-26 20:55:42 +04001502
Linus Torvalds1da177e2005-04-16 15:20:36 -07001503extern void exit_itimers(struct signal_struct *);
1504
Linus Torvaldsc4ad8f92014-02-05 12:54:53 -08001505extern int do_execve(struct filename *,
David Howellsd7627462010-08-17 23:52:56 +01001506 const char __user * const __user *,
Al Viroda3d4c52012-10-20 21:49:33 -04001507 const char __user * const __user *);
David Drysdale51f39a12014-12-12 16:57:29 -08001508extern int do_execveat(int, struct filename *,
1509 const char __user * const __user *,
1510 const char __user * const __user *,
1511 int);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001512
Adrian Hunter82b89772014-05-28 11:45:04 +03001513extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);
1514static inline void set_task_comm(struct task_struct *tsk, const char *from)
1515{
1516 __set_task_comm(tsk, from, false);
1517}
Andrew Morton59714d62008-02-04 22:27:21 -08001518extern char *get_task_comm(char *to, struct task_struct *tsk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001519
#ifdef CONFIG_SMP
void scheduler_ipi(void);
extern unsigned long wait_task_inactive(struct task_struct *, long match_state);
#else /* !CONFIG_SMP */
/* Stub for !CONFIG_SMP builds: does nothing. */
static inline void scheduler_ipi(void)
{
}

/* Stub for !CONFIG_SMP builds: ignores both arguments and returns 1. */
static inline unsigned long wait_task_inactive(struct task_struct *p,
					       long match_state)
{
	return 1;
}
#endif /* CONFIG_SMP */
1531
Linus Torvalds1da177e2005-04-16 15:20:36 -07001532/*
Eric W. Biederman260ea102006-06-23 02:05:18 -07001533 * Protects ->fs, ->files, ->mm, ->group_info, ->comm, keyring
Jens Axboe22e2c502005-06-27 10:55:12 +02001534 * subscriptions and synchronises with wait4(). Also used in procfs. Also
Paul Menageddbcc7e2007-10-18 23:39:30 -07001535 * pins the final release of task.io_context. Also protects ->cpuset and
Oleg Nesterovd68b46f2012-03-05 14:59:13 -08001536 * ->cgroup.subsys[]. And ->vfork_done.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001537 *
1538 * Nests both inside and outside of read_lock(&tasklist_lock).
1539 * It must not be nested with write_lock_irq(&tasklist_lock),
1540 * neither inside nor outside.
1541 */
1542static inline void task_lock(struct task_struct *p)
1543{
1544 spin_lock(&p->alloc_lock);
1545}
1546
1547static inline void task_unlock(struct task_struct *p)
1548{
1549 spin_unlock(&p->alloc_lock);
1550}
1551
/*
 * Set thread flags in other task's structures
 * - see asm/thread_info.h for TIF_xxxx flags available
 */
static inline void set_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	set_ti_thread_flag(ti, flag);
}
1559
/* Clear @flag in the thread_info belonging to @tsk. */
static inline void clear_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	clear_ti_thread_flag(ti, flag);
}
1564
/* Forward to test_and_set_ti_thread_flag() on @tsk's thread_info. */
static inline int test_and_set_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	return test_and_set_ti_thread_flag(ti, flag);
}
1569
/* Forward to test_and_clear_ti_thread_flag() on @tsk's thread_info. */
static inline int test_and_clear_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	return test_and_clear_ti_thread_flag(ti, flag);
}
1574
/* Forward to test_ti_thread_flag() on @tsk's thread_info. */
static inline int test_tsk_thread_flag(struct task_struct *tsk, int flag)
{
	struct thread_info *ti = task_thread_info(tsk);

	return test_ti_thread_flag(ti, flag);
}
1579
1580static inline void set_tsk_need_resched(struct task_struct *tsk)
1581{
1582 set_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
1583}
1584
1585static inline void clear_tsk_need_resched(struct task_struct *tsk)
1586{
1587 clear_tsk_thread_flag(tsk,TIF_NEED_RESCHED);
1588}
1589
Gregory Haskins8ae121a2008-04-23 07:13:29 -04001590static inline int test_tsk_need_resched(struct task_struct *tsk)
1591{
1592 return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED));
1593}
1594
/*
 * cond_resched() and cond_resched_lock(): latency reduction via
 * explicit rescheduling in places that are safe. The return
 * value indicates whether a reschedule was done in fact.
 * cond_resched_lock() will drop the spinlock before scheduling,
 * cond_resched_softirq() will enable bhs before scheduling.
 */
#ifdef CONFIG_PREEMPT
/* With CONFIG_PREEMPT this is a stub that always returns 0. */
static inline int _cond_resched(void)
{
	return 0;
}
#else
extern int _cond_resched(void);
#endif

/* Runs the ___might_sleep() check, then evaluates to _cond_resched(). */
#define cond_resched() ({				\
	___might_sleep(__FILE__, __LINE__, 0);		\
	_cond_resched();				\
})
Frederic Weisbecker6f80bd92009-07-16 15:44:29 +02001612
Frederic Weisbecker613afbf2009-07-16 15:44:29 +02001613extern int __cond_resched_lock(spinlock_t *lock);
1614
1615#define cond_resched_lock(lock) ({ \
Peter Zijlstra34274452014-09-24 10:18:56 +02001616 ___might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET);\
Frederic Weisbecker613afbf2009-07-16 15:44:29 +02001617 __cond_resched_lock(lock); \
1618})
1619
extern int __cond_resched_softirq(void);

/*
 * Runs the ___might_sleep() check with SOFTIRQ_DISABLE_OFFSET, then
 * evaluates to __cond_resched_softirq().
 */
#define cond_resched_softirq() ({					\
	___might_sleep(__FILE__, __LINE__, SOFTIRQ_DISABLE_OFFSET);	\
	__cond_resched_softirq();					\
})
Linus Torvalds1da177e2005-04-16 15:20:36 -07001626
/*
 * Leave the RCU read-side section, call cond_resched(), and re-enter it.
 * Compiled to nothing when CONFIG_PREEMPT_RCU is set and
 * CONFIG_DEBUG_ATOMIC_SLEEP is not.
 */
static inline void cond_resched_rcu(void)
{
#if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU)
	rcu_read_unlock();
	cond_resched();
	rcu_read_lock();
#endif
}
1635
Linus Torvalds1da177e2005-04-16 15:20:36 -07001636/*
1637 * Does a critical section need to be broken due to another
Nick Piggin95c354f2008-01-30 13:31:20 +01001638 * task waiting?: (technically does not depend on CONFIG_PREEMPT,
1639 * but a general need for low latency)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001640 */
Nick Piggin95c354f2008-01-30 13:31:20 +01001641static inline int spin_needbreak(spinlock_t *lock)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001642{
Nick Piggin95c354f2008-01-30 13:31:20 +01001643#ifdef CONFIG_PREEMPT
1644 return spin_is_contended(lock);
1645#else
Linus Torvalds1da177e2005-04-16 15:20:36 -07001646 return 0;
Nick Piggin95c354f2008-01-30 13:31:20 +01001647#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001648}
1649
Peter Zijlstra75f93fe2013-09-27 17:30:03 +02001650static __always_inline bool need_resched(void)
1651{
1652 return unlikely(tif_need_resched());
1653}
1654
/*
 * Thread group CPU time accounting.
 */
void thread_group_cputime(struct task_struct *tsk,
			  struct task_cputime *times);
void thread_group_cputimer(struct task_struct *tsk,
			   struct task_cputime *times);
Frank Mayharf06febc2008-09-12 09:54:39 -07001660
/*
 * Wrappers for accessing the CPU number recorded for a task (p->cpu with
 * CONFIG_THREAD_INFO_IN_TASK, otherwise task_thread_info(p)->cpu).
 * No-op on UP.
 */
#ifdef CONFIG_SMP

static inline unsigned int task_cpu(const struct task_struct *p)
{
#ifndef CONFIG_THREAD_INFO_IN_TASK
	return task_thread_info(p)->cpu;
#else
	return p->cpu;
#endif
}

/* Map the task's CPU number to a node via cpu_to_node(). */
static inline int task_node(const struct task_struct *p)
{
	return cpu_to_node(task_cpu(p));
}

extern void set_task_cpu(struct task_struct *p, unsigned int cpu);

#else /* !CONFIG_SMP */

/* UP: the answer is always CPU 0. */
static inline unsigned int task_cpu(const struct task_struct *p)
{
	return 0;
}

/* UP: nothing to record. */
static inline void set_task_cpu(struct task_struct *p, unsigned int cpu)
{
}

#endif /* CONFIG_SMP */
1694
/*
 * In order to reduce various lock holder preemption latencies provide an
 * interface to see if a vCPU is currently running or not.
 *
 * This allows us to terminate optimistic spin loops and block, analogous to
 * the native optimistic spin heuristic of testing if the lock owner task is
 * running or not.
 *
 * The fallback below is used only when no vcpu_is_preempted() has been
 * defined before this point; it ignores @cpu and evaluates to false.
 */
#ifndef vcpu_is_preempted
# define vcpu_is_preempted(cpu)	false
#endif
1706
Rusty Russell96f874e22008-11-25 02:35:14 +10301707extern long sched_setaffinity(pid_t pid, const struct cpumask *new_mask);
1708extern long sched_getaffinity(pid_t pid, struct cpumask *mask);
Siddha, Suresh B5c45bf22006-06-27 02:54:42 -07001709
Dhaval Giani7c941432010-01-20 13:26:18 +01001710#ifdef CONFIG_CGROUP_SCHED
Yong Zhang07e06b02011-01-07 15:17:36 +08001711extern struct task_group root_task_group;
Peter Zijlstra8323f262012-06-22 13:36:05 +02001712#endif /* CONFIG_CGROUP_SCHED */
Srivatsa Vaddagiri9b5b7752007-10-15 17:00:09 +02001713
Dhaval Giani54e99122009-02-27 15:13:54 +05301714extern int task_can_switch_user(struct user_struct *up,
1715 struct task_struct *tsk);
1716
/* Fallback when no TASK_SIZE_OF() is defined yet: ignore @tsk, use TASK_SIZE. */
#ifndef TASK_SIZE_OF
# define TASK_SIZE_OF(tsk)	TASK_SIZE
#endif
1720
Linus Torvalds1da177e2005-04-16 15:20:36 -07001721#endif