Blame - kernel/sched/sched.h - linux

blob: 001fe047bd5d80b841776719b5fa73f4401288a4 [file] [log] [blame]

Greg Kroah-Hartman	b244131	2017-11-01 15:07:57 +0100	[diff] [blame]	1	/* SPDX-License-Identifier: GPL-2.0 */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2	/*
				3	* Scheduler internal types and methods:
				4	*/
Ingo Molnar	9545847	2022-02-22 14:50:43 +0100	[diff] [blame]	5	#ifndef _KERNEL_SCHED_SCHED_H
				6	#define _KERNEL_SCHED_SCHED_H
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	7
Ingo Molnar	801c141	2022-02-22 13:23:24 +0100	[diff] [blame]	8	#include <linux/sched/affinity.h>
Ingo Molnar	dfc3401	2017-02-03 23:15:21 +0100	[diff] [blame]	9	#include <linux/sched/autogroup.h>
Ingo Molnar	55687da	2017-02-08 18:51:31 +0100	[diff] [blame]	10	#include <linux/sched/cpufreq.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	11	#include <linux/sched/deadline.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	12	#include <linux/sched.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	13	#include <linux/sched/loadavg.h>
				14	#include <linux/sched/mm.h>
Ingo Molnar	801c141	2022-02-22 13:23:24 +0100	[diff] [blame]	15	#include <linux/sched/rseq_api.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	16	#include <linux/sched/signal.h>
Thomas Gleixner	321a874	2018-11-25 19:33:38 +0100	[diff] [blame]	17	#include <linux/sched/smt.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	18	#include <linux/sched/stat.h>
				19	#include <linux/sched/sysctl.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	20	#include <linux/sched/task_flags.h>
Ingo Molnar	2993002	2017-02-08 18:51:36 +0100	[diff] [blame]	21	#include <linux/sched/task.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	22	#include <linux/sched/topology.h>
Ingo Molnar	ef8bd77	2017-02-08 18:51:36 +0100	[diff] [blame]	23
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	24	#include <linux/atomic.h>
				25	#include <linux/bitmap.h>
				26	#include <linux/bug.h>
				27	#include <linux/capability.h>
				28	#include <linux/cgroup_api.h>
				29	#include <linux/cgroup.h>
Frederic Weisbecker	e67198c	2022-06-08 16:40:25 +0200	[diff] [blame]	30	#include <linux/context_tracking.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	31	#include <linux/cpufreq.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	32	#include <linux/cpumask_api.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	33	#include <linux/ctype.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	34	#include <linux/file.h>
				35	#include <linux/fs_api.h>
				36	#include <linux/hrtimer_api.h>
				37	#include <linux/interrupt.h>
				38	#include <linux/irq_work.h>
				39	#include <linux/jiffies.h>
				40	#include <linux/kref_api.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	41	#include <linux/kthread.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	42	#include <linux/ktime_api.h>
				43	#include <linux/lockdep_api.h>
				44	#include <linux/lockdep.h>
				45	#include <linux/minmax.h>
				46	#include <linux/mm.h>
				47	#include <linux/module.h>
				48	#include <linux/mutex_api.h>
				49	#include <linux/plist.h>
				50	#include <linux/poll.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	51	#include <linux/proc_fs.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	52	#include <linux/profile.h>
Johannes Weiner	eb41468	2018-10-26 15:06:27 -0700	[diff] [blame]	53	#include <linux/psi.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	54	#include <linux/rcupdate.h>
				55	#include <linux/seq_file.h>
				56	#include <linux/seqlock.h>
				57	#include <linux/softirq.h>
				58	#include <linux/spinlock_api.h>
				59	#include <linux/static_key.h>
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	60	#include <linux/stop_machine.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	61	#include <linux/syscalls_api.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	62	#include <linux/syscalls.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	63	#include <linux/tick.h>
				64	#include <linux/topology.h>
				65	#include <linux/types.h>
				66	#include <linux/u64_stats_sync_api.h>
				67	#include <linux/uaccess.h>
				68	#include <linux/wait_api.h>
				69	#include <linux/wait_bit.h>
				70	#include <linux/workqueue_api.h>
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	71
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	72	#include <trace/events/power.h>
Ingo Molnar	b9e9c6ca	2022-02-13 08:19:43 +0100	[diff] [blame]	73	#include <trace/events/sched.h>
				74
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	75	#include "../workqueue_internal.h"
				76
Ingo Molnar	7fce777	2017-02-02 14:47:27 +0100	[diff] [blame]	77	#ifdef CONFIG_PARAVIRT
Ingo Molnar	325ea10	2018-03-03 12:20:47 +0100	[diff] [blame]	78	# include <asm/paravirt.h>
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	79	# include <asm/paravirt_api_clock.h>
Ingo Molnar	7fce777	2017-02-02 14:47:27 +0100	[diff] [blame]	80	#endif
				81
Peter Zijlstra	391e43d	2011-11-15 17:14:39 +0100	[diff] [blame]	82	#include "cpupri.h"
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	83	#include "cpudeadline.h"
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	84
Peter Zijlstra	9148a3a	2016-09-20 22:34:51 +0200	[diff] [blame]	85	#ifdef CONFIG_SCHED_DEBUG
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	86	# define SCHED_WARN_ON(x) WARN_ONCE(x, #x)
Peter Zijlstra	9148a3a	2016-09-20 22:34:51 +0200	[diff] [blame]	87	#else
Ingo Molnar	4ff8f2c	2022-02-22 14:51:58 +0100	[diff] [blame]	88	# define SCHED_WARN_ON(x) ({ (void)(x), 0; })
Peter Zijlstra	9148a3a	2016-09-20 22:34:51 +0200	[diff] [blame]	89	#endif
				90
Paul Gortmaker	45ceebf	2013-04-19 15:10:49 -0400	[diff] [blame]	91	struct rq;
Daniel Lezcano	442bf3a	2014-09-04 11:32:09 -0400	[diff] [blame]	92	struct cpuidle_state;
Paul Gortmaker	45ceebf	2013-04-19 15:10:49 -0400	[diff] [blame]	93
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	94	/* task_struct::on_rq states: */
				95	#define TASK_ON_RQ_QUEUED 1
Kirill Tkhai	cca26e8	2014-08-20 13:47:42 +0400	[diff] [blame]	96	#define TASK_ON_RQ_MIGRATING 2
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	97
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	98	extern __read_mostly int scheduler_running;
				99
Paul Gortmaker	45ceebf	2013-04-19 15:10:49 -0400	[diff] [blame]	100	extern unsigned long calc_load_update;
				101	extern atomic_long_t calc_load_tasks;
				102
Peter Zijlstra	3289bdb	2015-04-14 13:19:42 +0200	[diff] [blame]	103	extern void calc_global_load_tick(struct rq *this_rq);
Thomas Gleixner	d60585c	2016-07-12 18:33:56 +0200	[diff] [blame]	104	extern long calc_load_fold_active(struct rq *this_rq, long adjust);
Peter Zijlstra	3289bdb	2015-04-14 13:19:42 +0200	[diff] [blame]	105
Phil Auld	9d24605	2020-06-29 15:23:03 -0400	[diff] [blame]	106	extern void call_trace_sched_update_nr_running(struct rq *rq, int count);
Zhen Ni	d9ab0e6	2022-02-15 19:45:59 +0800	[diff] [blame]	107
Yajun Deng	089768d	2023-10-08 10:15:38 +0800	[diff] [blame]	108	extern int sysctl_sched_rt_period;
Zhen Ni	d9ab0e6	2022-02-15 19:45:59 +0800	[diff] [blame]	109	extern int sysctl_sched_rt_runtime;
Zhen Ni	dafd7a9	2022-02-15 19:46:01 +0800	[diff] [blame]	110	extern int sched_rr_timeslice;
Zhen Ni	d9ab0e6	2022-02-15 19:45:59 +0800	[diff] [blame]	111
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	112	/*
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	113	* Helpers for converting nanosecond timing to jiffy resolution
				114	*/
				115	#define NS_TO_JIFFIES(TIME) ((unsigned long)(TIME) / (NSEC_PER_SEC / HZ))
				116
Li Zefan	cc1f4b1	2013-03-05 16:06:09 +0800	[diff] [blame]	117	/*
				118	* Increase resolution of nice-level calculations for 64-bit architectures.
				119	* The extra resolution improves shares distribution and load balancing of
				120	* low-weight task groups (eg. nice +19 on an autogroup), deeper taskgroup
				121	* hierarchies, especially on larger systems. This is not a user-visible change
				122	* and does not change the user-interface for setting shares/weights.
				123	*
				124	* We increase resolution only if we have enough bits to allow this increased
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	125	* resolution (i.e. 64-bit). The costs for increasing resolution when 32-bit
				126	* are pretty high and the returns do not justify the increased costs.
Peter Zijlstra	2159197	2016-04-28 12:49:38 +0200	[diff] [blame]	127	*
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	128	* Really only required when CONFIG_FAIR_GROUP_SCHED=y is also set, but to
				129	* increase coverage and consistency always enable it on 64-bit platforms.
Li Zefan	cc1f4b1	2013-03-05 16:06:09 +0800	[diff] [blame]	130	*/
Peter Zijlstra	2159197	2016-04-28 12:49:38 +0200	[diff] [blame]	131	#ifdef CONFIG_64BIT
Yuyang Du	172895e	2016-04-05 12:12:27 +0800	[diff] [blame]	132	# define NICE_0_LOAD_SHIFT (SCHED_FIXEDPOINT_SHIFT + SCHED_FIXEDPOINT_SHIFT)
Yuyang Du	6ecdd74	2016-04-05 12:12:26 +0800	[diff] [blame]	133	# define scale_load(w) ((w) << SCHED_FIXEDPOINT_SHIFT)
Michael Wang	26cf522	2020-03-18 10:15:15 +0800	[diff] [blame]	134	# define scale_load_down(w) \
				135	({ \
				136	unsigned long __w = (w); \
				137	if (__w) \
				138	__w = max(2UL, __w >> SCHED_FIXEDPOINT_SHIFT); \
				139	__w; \
				140	})
Li Zefan	cc1f4b1	2013-03-05 16:06:09 +0800	[diff] [blame]	141	#else
Yuyang Du	172895e	2016-04-05 12:12:27 +0800	[diff] [blame]	142	# define NICE_0_LOAD_SHIFT (SCHED_FIXEDPOINT_SHIFT)
Li Zefan	cc1f4b1	2013-03-05 16:06:09 +0800	[diff] [blame]	143	# define scale_load(w) (w)
				144	# define scale_load_down(w) (w)
				145	#endif
				146
Yuyang Du	6ecdd74	2016-04-05 12:12:26 +0800	[diff] [blame]	147	/*
Yuyang Du	172895e	2016-04-05 12:12:27 +0800	[diff] [blame]	148	* Task weight (visible to users) and its load (invisible to users) have
				149	* independent resolution, but they should be well calibrated. We use
				150	* scale_load() and scale_load_down(w) to convert between them. The
				151	* following must be true:
				152	*
Dietmar Eggemann	9d061ba6	2021-01-28 14:10:39 +0100	[diff] [blame]	153	* scale_load(sched_prio_to_weight[NICE_TO_PRIO(0)-MAX_RT_PRIO]) == NICE_0_LOAD
Yuyang Du	172895e	2016-04-05 12:12:27 +0800	[diff] [blame]	154	*
Yuyang Du	6ecdd74	2016-04-05 12:12:26 +0800	[diff] [blame]	155	*/
Yuyang Du	172895e	2016-04-05 12:12:27 +0800	[diff] [blame]	156	#define NICE_0_LOAD (1L << NICE_0_LOAD_SHIFT)
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	157
				158	/*
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	159	* Single value that decides SCHED_DEADLINE internal math precision.
				160	* 10 -> just above 1us
				161	* 9 -> just above 0.5us
				162	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	163	#define DL_SCALE 10
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	164
				165	/*
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	166	* Single value that denotes runtime == period, ie unlimited time.
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	167	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	168	#define RUNTIME_INF ((u64)~0ULL)
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	169
Henrik Austad	20f9cd2	2015-09-09 17:00:41 +0200	[diff] [blame]	170	static inline int idle_policy(int policy)
				171	{
				172	return policy == SCHED_IDLE;
				173	}
Dario Faggioli	d50dde5	2013-11-07 14:43:36 +0100	[diff] [blame]	174	static inline int fair_policy(int policy)
				175	{
				176	return policy == SCHED_NORMAL || policy == SCHED_BATCH;
				177	}
				178
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	179	static inline int rt_policy(int policy)
				180	{
Dario Faggioli	d50dde5	2013-11-07 14:43:36 +0100	[diff] [blame]	181	return policy == SCHED_FIFO || policy == SCHED_RR;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	182	}
				183
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	184	static inline int dl_policy(int policy)
				185	{
				186	return policy == SCHED_DEADLINE;
				187	}
Henrik Austad	20f9cd2	2015-09-09 17:00:41 +0200	[diff] [blame]	188	static inline bool valid_policy(int policy)
				189	{
				190	return idle_policy(policy) || fair_policy(policy) ||
				191	rt_policy(policy) || dl_policy(policy);
				192	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	193
Viresh Kumar	1da1843	2018-11-05 16:51:55 +0530	[diff] [blame]	194	static inline int task_has_idle_policy(struct task_struct *p)
				195	{
				196	return idle_policy(p->policy);
				197	}
				198
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	199	static inline int task_has_rt_policy(struct task_struct *p)
				200	{
				201	return rt_policy(p->policy);
				202	}
				203
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	204	static inline int task_has_dl_policy(struct task_struct *p)
				205	{
				206	return dl_policy(p->policy);
				207	}
				208
Juri Lelli	0788116	2017-12-04 11:23:25 +0100	[diff] [blame]	209	#define cap_scale(v, s) ((v)*(s) >> SCHED_CAPACITY_SHIFT)
				210
Valentin Schneider	d76343c	2020-03-30 10:01:27 +0100	[diff] [blame]	211	static inline void update_avg(u64 *avg, u64 sample)
				212	{
				213	s64 diff = sample - *avg;
				214	*avg += diff / 8;
				215	}
				216
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	217	/*
Valentin Schneider	39a2a6e	2021-02-25 17:56:56 +0000	[diff] [blame]	218	* Shifting a value by an exponent greater or equal to the size of said value
				219	* is UB; cap at size-1.
				220	*/
				221	#define shr_bound(val, shift) \
				222	(val >> min_t(typeof(shift), shift, BITS_PER_TYPE(typeof(val)) - 1))
				223
				224	/*
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	225	* !! For sched_setattr_nocheck() (kernel) only !!
				226	*
				227	* This is actually gross. :(
				228	*
				229	* It is used to make schedutil kworker(s) higher priority than SCHED_DEADLINE
				230	* tasks, but still be able to sleep. We need this on platforms that cannot
				231	* atomically change clock frequency. Remove once fast switching will be
				232	* available on such platforms.
				233	*
				234	* SUGOV stands for SchedUtil GOVernor.
				235	*/
				236	#define SCHED_FLAG_SUGOV 0x10000000
				237
Quentin Perret	f950915	2021-07-27 11:11:01 +0100	[diff] [blame]	238	#define SCHED_DL_FLAGS (SCHED_FLAG_RECLAIM | SCHED_FLAG_DL_OVERRUN | SCHED_FLAG_SUGOV)
				239
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	240	static inline bool dl_entity_is_special(const struct sched_dl_entity *dl_se)
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	241	{
				242	#ifdef CONFIG_CPU_FREQ_GOV_SCHEDUTIL
				243	return unlikely(dl_se->flags & SCHED_FLAG_SUGOV);
				244	#else
				245	return false;
				246	#endif
				247	}
				248
				249	/*
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	250	* Tells if entity @a should preempt entity @b.
				251	*/
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	252	static inline bool dl_entity_preempt(const struct sched_dl_entity *a,
				253	const struct sched_dl_entity *b)
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	254	{
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	255	return dl_entity_is_special(a) ||
				256	dl_time_before(a->deadline, b->deadline);
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	257	}
				258
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	259	/*
				260	* This is the priority-queue data structure of the RT scheduling class:
				261	*/
				262	struct rt_prio_array {
				263	DECLARE_BITMAP(bitmap, MAX_RT_PRIO+1); /* include 1 bit for delimiter */
				264	struct list_head queue[MAX_RT_PRIO];
				265	};
				266
				267	struct rt_bandwidth {
				268	/* nests inside the rq lock: */
				269	raw_spinlock_t rt_runtime_lock;
				270	ktime_t rt_period;
				271	u64 rt_runtime;
				272	struct hrtimer rt_period_timer;
Peter Zijlstra	4cfafd3	2015-05-14 12:23:11 +0200	[diff] [blame]	273	unsigned int rt_period_active;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	274	};
Juri Lelli	a5e7be3	2014-09-19 10:22:39 +0100	[diff] [blame]	275
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	276	static inline int dl_bandwidth_enabled(void)
				277	{
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	278	return sysctl_sched_rt_runtime >= 0;
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	279	}
				280
Peng Liu	a57415f	2020-10-08 23:49:42 +0800	[diff] [blame]	281	/*
				282	* To keep the bandwidth of -deadline tasks under control
				283	* we need some place where:
				284	* - store the maximum -deadline bandwidth of each cpu;
				285	* - cache the fraction of bandwidth that is currently allocated in
				286	* each root domain;
				287	*
				288	* This is all done in the data structure below. It is similar to the
				289	* one used for RT-throttling (rt_bandwidth), with the main difference
				290	* that, since here we are only interested in admission control, we
				291	* do not decrease any runtime while the group "executes", neither we
				292	* need a timer to replenish it.
				293	*
				294	* With respect to SMP, bandwidth is given on a per root domain basis,
				295	* meaning that:
				296	* - bw (< 100%) is the deadline bandwidth of each CPU;
				297	* - total_bw is the currently allocated bandwidth in each root domain;
				298	*/
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	299	struct dl_bw {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	300	raw_spinlock_t lock;
				301	u64 bw;
				302	u64 total_bw;
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	303	};
				304
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	305	extern void init_dl_bw(struct dl_bw *dl_b);
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	306	extern int sched_dl_global_validate(void);
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	307	extern void sched_dl_do_global(void);
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	308	extern int sched_dl_overflow(struct task_struct *p, int policy, const struct sched_attr *attr);
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	309	extern void __setparam_dl(struct task_struct *p, const struct sched_attr *attr);
				310	extern void __getparam_dl(struct task_struct *p, struct sched_attr *attr);
				311	extern bool __checkparam_dl(const struct sched_attr *attr);
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	312	extern bool dl_param_changed(struct task_struct *p, const struct sched_attr *attr);
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	313	extern int dl_cpuset_cpumask_can_shrink(const struct cpumask *cur, const struct cpumask *trial);
Dietmar Eggemann	8598910	2023-05-08 09:58:53 +0200	[diff] [blame]	314	extern int dl_bw_check_overflow(int cpu);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	315
Peter Zijlstra	63ba842	2023-11-04 11:59:21 +0100	[diff] [blame]	316	/*
				317	* SCHED_DEADLINE supports servers (nested scheduling) with the following
				318	* interface:
				319	*
				320	* dl_se::rq -- runqueue we belong to.
				321	*
				322	* dl_se::server_has_tasks() -- used on bandwidth enforcement; we 'stop' the
				323	* server when it runs out of tasks to run.
				324	*
				325	* dl_se::server_pick() -- nested pick_next_task(); we yield the period if this
				326	* returns NULL.
				327	*
				328	* dl_server_update() -- called from update_curr_common(), propagates runtime
				329	* to the server.
				330	*
				331	* dl_server_start()
				332	* dl_server_stop() -- start/stop the server when it has (no) tasks.
				333	*
				334	* dl_server_init() -- initializes the server.
				335	*/
				336	extern void dl_server_update(struct sched_dl_entity *dl_se, s64 delta_exec);
				337	extern void dl_server_start(struct sched_dl_entity *dl_se);
				338	extern void dl_server_stop(struct sched_dl_entity *dl_se);
				339	extern void dl_server_init(struct sched_dl_entity *dl_se, struct rq *rq,
				340	dl_server_has_tasks_f has_tasks,
				341	dl_server_pick_f pick);
				342
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	343	#ifdef CONFIG_CGROUP_SCHED
				344
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	345	struct cfs_rq;
				346	struct rt_rq;
				347
Mike Galbraith	35cf4e5	2012-08-07 05:00:13 +0200	[diff] [blame]	348	extern struct list_head task_groups;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	349
				350	struct cfs_bandwidth {
				351	#ifdef CONFIG_CFS_BANDWIDTH
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	352	raw_spinlock_t lock;
				353	ktime_t period;
				354	u64 quota;
				355	u64 runtime;
Huaixin Chang	f418371	2021-06-21 17:27:58 +0800	[diff] [blame]	356	u64 burst;
Huaixin Chang	bcb1704	2021-08-30 11:22:14 +0800	[diff] [blame]	357	u64 runtime_snap;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	358	s64 hierarchical_quota;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	359
bsegall@google.com	66567fc	2019-06-06 10:21:01 -0700	[diff] [blame]	360	u8 idle;
				361	u8 period_active;
bsegall@google.com	66567fc	2019-06-06 10:21:01 -0700	[diff] [blame]	362	u8 slack_started;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	363	struct hrtimer period_timer;
				364	struct hrtimer slack_timer;
				365	struct list_head throttled_cfs_rq;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	366
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	367	/* Statistics: */
				368	int nr_periods;
				369	int nr_throttled;
Huaixin Chang	bcb1704	2021-08-30 11:22:14 +0800	[diff] [blame]	370	int nr_burst;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	371	u64 throttled_time;
Huaixin Chang	bcb1704	2021-08-30 11:22:14 +0800	[diff] [blame]	372	u64 burst_time;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	373	#endif
				374	};
				375
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	376	/* Task group related information */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	377	struct task_group {
				378	struct cgroup_subsys_state css;
				379
				380	#ifdef CONFIG_FAIR_GROUP_SCHED
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	381	/* schedulable entities of this group on each CPU */
				382	struct sched_entity **se;
				383	/* runqueue "owned" by this group on each CPU */
				384	struct cfs_rq **cfs_rq;
				385	unsigned long shares;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	386
Josh Don	3040003	2021-07-29 19:00:18 -0700	[diff] [blame]	387	/* A positive value indicates that this is a SCHED_IDLE group. */
				388	int idle;
				389
Alex Shi	fa6bdde	2013-06-20 10:18:46 +0800	[diff] [blame]	390	#ifdef CONFIG_SMP
Waiman Long	b036762	2015-12-02 13:41:49 -0500	[diff] [blame]	391	/*
				392	* load_avg can be heavily contended at clock tick time, so put
				393	* it in its own cacheline separated from the fields above which
				394	* will also be accessed at each tick.
				395	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	396	atomic_long_t load_avg ____cacheline_aligned;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	397	#endif
Alex Shi	fa6bdde	2013-06-20 10:18:46 +0800	[diff] [blame]	398	#endif
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	399
				400	#ifdef CONFIG_RT_GROUP_SCHED
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	401	struct sched_rt_entity **rt_se;
				402	struct rt_rq **rt_rq;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	403
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	404	struct rt_bandwidth rt_bandwidth;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	405	#endif
				406
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	407	struct rcu_head rcu;
				408	struct list_head list;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	409
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	410	struct task_group *parent;
				411	struct list_head siblings;
				412	struct list_head children;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	413
				414	#ifdef CONFIG_SCHED_AUTOGROUP
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	415	struct autogroup *autogroup;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	416	#endif
				417
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	418	struct cfs_bandwidth cfs_bandwidth;
Patrick Bellasi	2480c09	2019-08-22 14:28:06 +0100	[diff] [blame]	419
				420	#ifdef CONFIG_UCLAMP_TASK_GROUP
				421	/* The two decimal precision [%] value requested from user-space */
				422	unsigned int uclamp_pct[UCLAMP_CNT];
				423	/* Clamp values requested for a task group */
				424	struct uclamp_se uclamp_req[UCLAMP_CNT];
Patrick Bellasi	0b60ba2	2019-08-22 14:28:07 +0100	[diff] [blame]	425	/* Effective clamp values used for a task group */
				426	struct uclamp_se uclamp[UCLAMP_CNT];
Patrick Bellasi	2480c09	2019-08-22 14:28:06 +0100	[diff] [blame]	427	#endif
				428
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	429	};
				430
				431	#ifdef CONFIG_FAIR_GROUP_SCHED
				432	#define ROOT_TASK_GROUP_LOAD NICE_0_LOAD
				433
				434	/*
				435	* A weight of 0 or 1 can cause arithmetics problems.
				436	* A weight of a cfs_rq is the sum of weights of which entities
				437	* are queued on this cfs_rq, so a weight of a entity should not be
				438	* too large, so as the shares value of a task group.
				439	* (The default weight is 1024 - so there's no practical
				440	* limitation from this.)
				441	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	442	#define MIN_SHARES (1UL << 1)
				443	#define MAX_SHARES (1UL << 18)
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	444	#endif
				445
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	446	typedef int (*tg_visitor)(struct task_group *, void *);
				447
				448	extern int walk_tg_tree_from(struct task_group *from,
				449	tg_visitor down, tg_visitor up, void *data);
				450
				451	/*
				452	* Iterate the full tree, calling @down when first entering a node and @up when
				453	* leaving it for the final time.
				454	*
				455	* Caller must hold rcu_lock or sufficient equivalent.
				456	*/
				457	static inline int walk_tg_tree(tg_visitor down, tg_visitor up, void *data)
				458	{
				459	return walk_tg_tree_from(&root_task_group, down, up, data);
				460	}
				461
				462	extern int tg_nop(struct task_group *tg, void *data);
				463
Arnd Bergmann	b1c3efe	2023-11-23 12:05:03 +0100	[diff] [blame]	464	#ifdef CONFIG_FAIR_GROUP_SCHED
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	465	extern void free_fair_sched_group(struct task_group *tg);
				466	extern int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent);
Peter Zijlstra	8663e24	2016-06-22 14:58:02 +0200	[diff] [blame]	467	extern void online_fair_sched_group(struct task_group *tg);
Peter Zijlstra	6fe1f34	2016-01-21 22:24:16 +0100	[diff] [blame]	468	extern void unregister_fair_sched_group(struct task_group *tg);
Arnd Bergmann	b1c3efe	2023-11-23 12:05:03 +0100	[diff] [blame]	469	#else
				470	static inline void free_fair_sched_group(struct task_group *tg) { }
				471	static inline int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent)
				472	{
				473	return 1;
				474	}
				475	static inline void online_fair_sched_group(struct task_group *tg) { }
				476	static inline void unregister_fair_sched_group(struct task_group *tg) { }
				477	#endif
				478
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	479	extern void init_tg_cfs_entry(struct task_group *tg, struct cfs_rq *cfs_rq,
				480	struct sched_entity *se, int cpu,
				481	struct sched_entity *parent);
Phil Auld	c98c18270	2023-07-14 08:57:46 -0400	[diff] [blame]	482	extern void init_cfs_bandwidth(struct cfs_bandwidth *cfs_b, struct cfs_bandwidth *parent);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	483
				484	extern void __refill_cfs_bandwidth_runtime(struct cfs_bandwidth *cfs_b);
Peter Zijlstra	77a4d1a	2015-04-15 11:41:57 +0200	[diff] [blame]	485	extern void start_cfs_bandwidth(struct cfs_bandwidth *cfs_b);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	486	extern void unthrottle_cfs_rq(struct cfs_rq *cfs_rq);
Phil Auld	88c56cf	2023-07-12 09:33:57 -0400	[diff] [blame]	487	extern bool cfs_task_bw_constrained(struct task_struct *p);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	488
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	489	extern void init_tg_rt_entry(struct task_group *tg, struct rt_rq *rt_rq,
				490	struct sched_rt_entity *rt_se, int cpu,
				491	struct sched_rt_entity *parent);
Nicolas Pitre	8887cd9	2017-06-21 14:22:02 -0400	[diff] [blame]	492	extern int sched_group_set_rt_runtime(struct task_group *tg, long rt_runtime_us);
				493	extern int sched_group_set_rt_period(struct task_group *tg, u64 rt_period_us);
				494	extern long sched_group_rt_runtime(struct task_group *tg);
				495	extern long sched_group_rt_period(struct task_group *tg);
				496	extern int sched_rt_can_attach(struct task_group *tg, struct task_struct *tsk);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	497
Li Zefan	25cc7da	2013-03-05 16:07:33 +0800	[diff] [blame]	498	extern struct task_group *sched_create_group(struct task_group *parent);
				499	extern void sched_online_group(struct task_group *tg,
				500	struct task_group *parent);
				501	extern void sched_destroy_group(struct task_group *tg);
Mathias Krause	b027789	2021-11-03 20:06:13 +0100	[diff] [blame]	502	extern void sched_release_group(struct task_group *tg);
Li Zefan	25cc7da	2013-03-05 16:07:33 +0800	[diff] [blame]	503
				504	extern void sched_move_task(struct task_struct *tsk);
				505
				506	#ifdef CONFIG_FAIR_GROUP_SCHED
				507	extern int sched_group_set_shares(struct task_group *tg, unsigned long shares);
Byungchul Park	ad936d8	2015-10-24 01:16:19 +0900	[diff] [blame]	508
Josh Don	3040003	2021-07-29 19:00:18 -0700	[diff] [blame]	509	extern int sched_group_set_idle(struct task_group *tg, long idle);
				510
Byungchul Park	ad936d8	2015-10-24 01:16:19 +0900	[diff] [blame]	511	#ifdef CONFIG_SMP
				512	extern void set_task_rq_fair(struct sched_entity *se,
				513	struct cfs_rq *prev, struct cfs_rq *next);
				514	#else /* !CONFIG_SMP */
				515	static inline void set_task_rq_fair(struct sched_entity *se,
				516	struct cfs_rq *prev, struct cfs_rq *next) { }
				517	#endif /* CONFIG_SMP */
				518	#endif /* CONFIG_FAIR_GROUP_SCHED */
Li Zefan	25cc7da	2013-03-05 16:07:33 +0800	[diff] [blame]	519
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	520	#else /* CONFIG_CGROUP_SCHED */
				521
				522	struct cfs_bandwidth { };
Phil Auld	88c56cf	2023-07-12 09:33:57 -0400	[diff] [blame]	523	static inline bool cfs_task_bw_constrained(struct task_struct *p) { return false; }
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	524
				525	#endif /* CONFIG_CGROUP_SCHED */
				526
Ben Dooks	87514b2	2022-07-21 15:51:55 +0100	[diff] [blame]	527	extern void unregister_rt_sched_group(struct task_group *tg);
				528	extern void free_rt_sched_group(struct task_group *tg);
				529	extern int alloc_rt_sched_group(struct task_group *tg, struct task_group *parent);
				530
Vincent Donnefort	d05b430	2022-06-21 10:04:08 +0100	[diff] [blame]	531	/*
				532	* u64_u32_load/u64_u32_store
				533	*
				534	* Use a copy of a u64 value to protect against data race. This is only
				535	* applicable for 32-bit architectures.
					*
					* With CONFIG_64BIT the helpers collapse to a plain read of @var and a
					* plain assignment to @var; @copy is not touched.
					*
					* Otherwise the store writes @var, issues smp_wmb(), then writes @copy,
					* while the load reads @copy, issues smp_rmb(), then reads @var and
					* retries until both reads return the same value.
					*
					* u64_u32_load()/u64_u32_store() derive the name of the copy by
					* appending "_copy" to @var.
				536	*/
				537	#ifdef CONFIG_64BIT
				538	# define u64_u32_load_copy(var, copy) var
				539	# define u64_u32_store_copy(var, copy, val) (var = val)
				540	#else
				541	# define u64_u32_load_copy(var, copy) \
				542	({ \
				543	u64 __val, __val_copy; \
				544	do { \
				545	__val_copy = copy; \
				546	/* \
				547	* paired with u64_u32_store_copy(), ordering access \
				548	* to var and copy. \
				549	*/ \
				550	smp_rmb(); \
				551	__val = var; \
				552	} while (__val != __val_copy); \
				553	__val; \
				554	})
				555	# define u64_u32_store_copy(var, copy, val) \
				556	do { \
				557	typeof(val) __val = (val); \
				558	var = __val; \
				559	/* \
				560	* paired with u64_u32_load_copy(), ordering access to var and \
				561	* copy. \
				562	*/ \
				563	smp_wmb(); \
				564	copy = __val; \
				565	} while (0)
				566	#endif
				567	# define u64_u32_load(var) u64_u32_load_copy(var, var##_copy)
				568	# define u64_u32_store(var, val) u64_u32_store_copy(var, var##_copy, val)
				569
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	570	/* CFS-related fields in a runqueue */
				571	struct cfs_rq {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	572	struct load_weight load;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	573	unsigned int nr_running;
Viresh Kumar	43e9f7f	2019-06-26 10:36:29 +0530	[diff] [blame]	574	unsigned int h_nr_running; /* SCHED_{NORMAL,BATCH,IDLE} */
Josh Don	a480add	2021-08-19 18:04:01 -0700	[diff] [blame]	575	unsigned int idle_nr_running; /* SCHED_IDLE */
Viresh Kumar	43e9f7f	2019-06-26 10:36:29 +0530	[diff] [blame]	576	unsigned int idle_h_nr_running; /* SCHED_IDLE */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	577
Peter Zijlstra	af4cf40	2023-05-31 13:58:40 +0200	[diff] [blame]	578	s64 avg_vruntime;
				579	u64 avg_load;
				580
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	581	u64 exec_clock;
				582	u64 min_vruntime;
Joel Fernandes (Google)	c6047c2	2020-11-17 18:19:39 -0500	[diff] [blame]	583	#ifdef CONFIG_SCHED_CORE
				584	unsigned int forceidle_seq;
				585	u64 min_vruntime_fi;
				586	#endif
				587
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	588	#ifndef CONFIG_64BIT
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	589	u64 min_vruntime_copy;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	590	#endif
				591
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	592	struct rb_root_cached tasks_timeline;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	593
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	594	/*
				595	* 'curr' points to currently running entity on this cfs_rq.
				596	* It is set to NULL otherwise (i.e when none are currently running).
				597	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	598	struct sched_entity *curr;
				599	struct sched_entity *next;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	600
				601	#ifdef CONFIG_SCHED_DEBUG
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	602	unsigned int nr_spread_over;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	603	#endif
				604
Paul Turner	2dac754	2012-10-04 13:18:30 +0200	[diff] [blame]	605	#ifdef CONFIG_SMP
				606	/*
Yuyang Du	9d89c25	2015-07-15 08:04:37 +0800	[diff] [blame]	607	* CFS load tracking
Paul Turner	2dac754	2012-10-04 13:18:30 +0200	[diff] [blame]	608	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	609	struct sched_avg avg;
Peter Zijlstra	2a2f5d4e	2017-05-08 16:51:41 +0200	[diff] [blame]	610	#ifndef CONFIG_64BIT
Vincent Donnefort	d05b430	2022-06-21 10:04:08 +0100	[diff] [blame]	611	u64 last_update_time_copy;
Peter Zijlstra	2a2f5d4e	2017-05-08 16:51:41 +0200	[diff] [blame]	612	#endif
Peter Zijlstra	2a2f5d4e	2017-05-08 16:51:41 +0200	[diff] [blame]	613	struct {
				614	raw_spinlock_t lock ____cacheline_aligned;
				615	int nr;
				616	unsigned long load_avg;
				617	unsigned long util_avg;
Vincent Guittot	9f68395	2020-02-24 09:52:18 +0000	[diff] [blame]	618	unsigned long runnable_avg;
Peter Zijlstra	2a2f5d4e	2017-05-08 16:51:41 +0200	[diff] [blame]	619	} removed;
Alex Shi	141965c	2013-06-26 13:05:39 +0800	[diff] [blame]	620
Paul Turner	c566e8e	2012-10-04 13:18:30 +0200	[diff] [blame]	621	#ifdef CONFIG_FAIR_GROUP_SCHED
Aaron Lu	1528c66	2023-09-12 14:58:08 +0800	[diff] [blame]	622	u64 last_update_tg_load_avg;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	623	unsigned long tg_load_avg_contrib;
				624	long propagate;
				625	long prop_runnable_sum;
Peter Zijlstra	0e2d2aa	2017-05-08 17:30:46 +0200	[diff] [blame]	626
Paul Turner	8295836	2012-10-04 13:18:31 +0200	[diff] [blame]	627	/*
				628	* h_load = weight * f(tg)
				629	*
				630	* Where f(tg) is the recursive weight fraction assigned to
				631	* this group.
				632	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	633	unsigned long h_load;
				634	u64 last_h_load_update;
				635	struct sched_entity *h_load_next;
Vladimir Davydov	6852079	2013-07-15 17:49:19 +0400	[diff] [blame]	636	#endif /* CONFIG_FAIR_GROUP_SCHED */
Paul Turner	8295836	2012-10-04 13:18:31 +0200	[diff] [blame]	637	#endif /* CONFIG_SMP */
				638
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	639	#ifdef CONFIG_FAIR_GROUP_SCHED
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	640	struct rq rq; / CPU runqueue to which this cfs_rq is attached */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	641
				642	/*
				643	* leaf cfs_rqs are those that hold tasks (lowest schedulable entity in
				644	* a hierarchy). Non-leaf lrqs hold other higher schedulable entities
				645	* (like users, containers etc.)
				646	*
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	647	* leaf_cfs_rq_list ties together list of leaf cfs_rq's in a CPU.
				648	* This list is used during load balance.
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	649	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	650	int on_list;
				651	struct list_head leaf_cfs_rq_list;
				652	struct task_group tg; / group that "owns" this runqueue */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	653
Josh Don	3040003	2021-07-29 19:00:18 -0700	[diff] [blame]	654	/* Locally cached copy of our task_group's idle value */
				655	int idle;
				656
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	657	#ifdef CONFIG_CFS_BANDWIDTH
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	658	int runtime_enabled;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	659	s64 runtime_remaining;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	660
Vincent Donnefort	e2f3e35	2022-06-21 10:04:09 +0100	[diff] [blame]	661	u64 throttled_pelt_idle;
				662	#ifndef CONFIG_64BIT
				663	u64 throttled_pelt_idle_copy;
				664	#endif
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	665	u64 throttled_clock;
Chengming Zhou	64eaf50	2022-04-08 19:53:08 +0800	[diff] [blame]	666	u64 throttled_clock_pelt;
				667	u64 throttled_clock_pelt_time;
Josh Don	677ea01	2023-06-20 11:32:47 -0700	[diff] [blame]	668	u64 throttled_clock_self;
				669	u64 throttled_clock_self_time;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	670	int throttled;
				671	int throttle_count;
				672	struct list_head throttled_list;
Josh Don	8ad075c	2022-11-16 16:54:18 -0800	[diff] [blame]	673	struct list_head throttled_csd_list;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	674	#endif /* CONFIG_CFS_BANDWIDTH */
				675	#endif /* CONFIG_FAIR_GROUP_SCHED */
				676	};
				677
				678	static inline int rt_bandwidth_enabled(void)
				679	{
					/* Non-zero iff sysctl_sched_rt_runtime is non-negative. */
				680	return sysctl_sched_rt_runtime >= 0;
				681	}
				682
Steven Rostedt	b6366f0	2015-03-18 14:49:46 -0400	[diff] [blame]	683	/* RT IPI pull logic requires IRQ_WORK */
Steven Rostedt (Red Hat)	4bdced5	2017-10-06 14:05:04 -0400	[diff] [blame]	684	#if defined(CONFIG_IRQ_WORK) && defined(CONFIG_SMP)
Steven Rostedt	b6366f0	2015-03-18 14:49:46 -0400	[diff] [blame]	685	# define HAVE_RT_PUSH_IPI
				686	#endif
				687
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	688	/* Real-Time classes' related field in a runqueue: */
					/*
					* The highest_prio cache exists when either CONFIG_SMP or
					* CONFIG_RT_GROUP_SCHED is set (its 'next' member only on SMP); the
					* rq/tg back-pointers exist only with CONFIG_RT_GROUP_SCHED.
					*/
				689	struct rt_rq {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	690	struct rt_prio_array active;
				691	unsigned int rt_nr_running;
				692	unsigned int rr_nr_running;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	693	#if defined CONFIG_SMP || defined CONFIG_RT_GROUP_SCHED
				694	struct {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	695	int curr; /* highest queued rt task prio */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	696	#ifdef CONFIG_SMP
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	697	int next; /* next highest */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	698	#endif
				699	} highest_prio;
				700	#endif
				701	#ifdef CONFIG_SMP
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	702	int overloaded;
				703	struct plist_head pushable_tasks;
Vincent Guittot	371bf42	2018-06-28 17:45:05 +0200	[diff] [blame]	704
Steven Rostedt	b6366f0	2015-03-18 14:49:46 -0400	[diff] [blame]	705	#endif /* CONFIG_SMP */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	706	int rt_queued;
Kirill Tkhai	f4ebcbc	2014-03-15 02:15:00 +0400	[diff] [blame]	707
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	708	int rt_throttled;
				709	u64 rt_time;
				710	u64 rt_runtime;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	711	/* Nests inside the rq lock: */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	712	raw_spinlock_t rt_runtime_lock;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	713
				714	#ifdef CONFIG_RT_GROUP_SCHED
Alexey Dobriyan	e6fe3f4	2021-04-22 23:02:28 +0300	[diff] [blame]	715	unsigned int rt_nr_boosted;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	716
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	717	struct rq *rq;
				718	struct task_group *tg;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	719	#endif
				720	};
				721
Vincent Guittot	296b2ff	2018-06-26 15:53:22 +0200	[diff] [blame]	722	static inline bool rt_rq_is_runnable(struct rt_rq *rt_rq)
				723	{
					/* True only when both rt_queued and rt_nr_running are non-zero. */
				724	return rt_rq->rt_queued && rt_rq->rt_nr_running;
				725	}
				726
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	727	/* Deadline class' related fields in a runqueue */
				728	struct dl_rq {
				729	/* runqueue is an rbtree, ordered by deadline */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	730	struct rb_root_cached root;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	731
Alexey Dobriyan	e6fe3f4	2021-04-22 23:02:28 +0300	[diff] [blame]	732	unsigned int dl_nr_running;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	733
				734	#ifdef CONFIG_SMP
				735	/*
				736	* Deadline values of the currently executing and the
				737	* earliest ready task on this rq. Caching these facilitates
Ingo Molnar	dfcb245	2018-12-03 10:05:56 +0100	[diff] [blame]	738	* the decision whether or not a ready but not running task
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	739	* should migrate somewhere else.
				740	*/
				741	struct {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	742	u64 curr;
				743	u64 next;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	744	} earliest_dl;
				745
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	746	int overloaded;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	747
				748	/*
				749	* Tasks on this rq that can be pushed away. They are kept in
				750	* an rb-tree, ordered by tasks' deadlines, with caching
				751	* of the leftmost (earliest deadline) element.
				752	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	753	struct rb_root_cached pushable_dl_tasks_root;
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	754	#else
					/*
					* Only present without CONFIG_SMP; on SMP builds struct root_domain
					* carries a dl_bw member instead.
					*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	755	struct dl_bw dl_bw;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	756	#endif
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	757	/*
				758	* "Active utilization" for this runqueue: increased when a
				759	* task wakes up (becomes TASK_RUNNING) and decreased when a
				760	* task blocks
				761	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	762	u64 running_bw;
Luca Abeni	4da3abc	2017-05-18 22:13:32 +0200	[diff] [blame]	763
				764	/*
Luca Abeni	8fd27231	2017-05-18 22:13:34 +0200	[diff] [blame]	765	* Utilization of the tasks "assigned" to this runqueue (including
				766	* the tasks that are in runqueue and the tasks that executed on this
				767	* CPU and blocked). Increased when a task moves to this runqueue, and
				768	* decreased when the task moves away (migrates, changes scheduling
				769	* policy, or terminates).
				770	* This is needed to compute the "inactive utilization" for the
				771	* runqueue (inactive utilization = this_bw - running_bw).
				772	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	773	u64 this_bw;
				774	u64 extra_bw;
Luca Abeni	8fd27231	2017-05-18 22:13:34 +0200	[diff] [blame]	775
				776	/*
Vineeth Pillai	6a9d623	2023-05-30 09:55:25 -0400	[diff] [blame]	777	* Maximum available bandwidth for reclaiming by SCHED_FLAG_RECLAIM
				778	* tasks of this rq. Used in calculation of reclaimable bandwidth(GRUB).
				779	*/
				780	u64 max_bw;
				781
				782	/*
Luca Abeni	4da3abc	2017-05-18 22:13:32 +0200	[diff] [blame]	783	* Inverse of the fraction of CPU utilization that can be reclaimed
				784	* by the GRUB algorithm.
				785	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	786	u64 bw_ratio;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	787	};
				788
Vincent Guittot	c079629	2018-06-28 17:45:04 +0200	[diff] [blame]	789	#ifdef CONFIG_FAIR_GROUP_SCHED
				790	/* An entity is a task if it doesn't "own" a runqueue */
					/* The argument is parenthesised so any pointer expression can be passed. */
				791	#define entity_is_task(se) (!(se)->my_q)
Vincent Guittot	0dacee1	2020-02-24 09:52:17 +0000	[diff] [blame]	792
					/*
					* For a group entity, refresh runnable_weight from the h_nr_running of
					* the runqueue it owns; task entities are left untouched.
					*/
Vincent Guittot	9f68395	2020-02-24 09:52:18 +0000	[diff] [blame]	793	static inline void se_update_runnable(struct sched_entity *se)
				794	{
				795	if (!entity_is_task(se))
				796	se->runnable_weight = se->my_q->h_nr_running;
				797	}
				798
					/*
					* Runnable contribution of @se: 1 or 0 for a task depending on on_rq,
					* the stored runnable_weight for a group entity.
					*/
				799	static inline long se_runnable(struct sched_entity *se)
				800	{
				801	if (entity_is_task(se))
				802	return !!se->on_rq;
				803	else
				804	return se->runnable_weight;
				805	}
				806
Vincent Guittot	c079629	2018-06-28 17:45:04 +0200	[diff] [blame]	807	#else
					/* Without group scheduling every entity is a task. */
				808	#define entity_is_task(se) 1
Vincent Guittot	0dacee1	2020-02-24 09:52:17 +0000	[diff] [blame]	809
Vincent Guittot	9f68395	2020-02-24 09:52:18 +0000	[diff] [blame]	810	static inline void se_update_runnable(struct sched_entity *se) {}
				811
				812	static inline long se_runnable(struct sched_entity *se)
				813	{
				814	return !!se->on_rq;
				815	}
Vincent Guittot	c079629	2018-06-28 17:45:04 +0200	[diff] [blame]	816	#endif
				817
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	818	#ifdef CONFIG_SMP
Vincent Guittot	c079629	2018-06-28 17:45:04 +0200	[diff] [blame]	819	/*
				820	* XXX we want to get rid of these helpers and use the full load resolution.
				821	*/
				822	static inline long se_weight(struct sched_entity *se)
				823	{
					/* The entity's load weight, passed through scale_load_down(). */
				824	return scale_load_down(se->load.weight);
				825	}
				826
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	827
Tim Chen	afe06ef	2016-11-22 12:23:53 -0800	[diff] [blame]	828	static inline bool sched_asym_prefer(int a, int b)
				829	{
					/* True when @a has a strictly higher arch_asym_cpu_priority() than @b; ties return false. */
				830	return arch_asym_cpu_priority(a) > arch_asym_cpu_priority(b);
				831	}
				832
Quentin Perret	6aa140f	2018-12-03 09:56:18 +0000	[diff] [blame]	833	struct perf_domain {
					/*
					* One node of the list hanging off root_domain::pd, which that member's
					* comment describes as NULL-terminated and protected by RCU; @next links
					* to the following node.
					* NOTE(review): @rcu is presumably used to defer freeing of the node; confirm.
					*/
				834	struct em_perf_domain *em_pd;
				835	struct perf_domain *next;
				836	struct rcu_head rcu;
				837	};
				838
Quentin Perret	630246a	2018-12-03 09:56:24 +0000	[diff] [blame]	839	/* Scheduling group status flags */
				840	#define SG_OVERLOAD 0x1 /* More than one runnable task on a CPU. */
Morten Rasmussen	2802bf3	2018-12-03 09:56:25 +0000	[diff] [blame]	841	#define SG_OVERUTILIZED 0x2 /* One or more CPUs are over-utilized. */
Quentin Perret	630246a	2018-12-03 09:56:24 +0000	[diff] [blame]	842
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	843	/*
				844	* We add the notion of a root-domain which will be used to define per-domain
				845	* variables. Each exclusive cpuset essentially defines an island domain by
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	846	* fully partitioning the member CPUs from any other cpuset. Whenever a new
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	847	* exclusive cpuset is created, we also create and attach a new root-domain
				848	* object.
				849	*
				850	*/
				851	struct root_domain {
					/* NOTE(review): refcount is presumably managed via sched_get_rd()/sched_put_rd(); confirm */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	852	atomic_t refcount;
				853	atomic_t rto_count;
				854	struct rcu_head rcu;
				855	cpumask_var_t span;
				856	cpumask_var_t online;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	857
Valentin Schneider	757ffdd	2018-07-04 11:17:47 +0100	[diff] [blame]	858	/*
				859	* Indicate pullable load on at least one CPU, e.g:
				860	* - More than one runnable task
				861	* - Running task is misfit
				862	*/
Valentin Schneider	575638d	2018-07-04 11:17:45 +0100	[diff] [blame]	863	int overload;
Tim Chen	4486edd	2014-06-23 12:16:49 -0700	[diff] [blame]	864
Morten Rasmussen	2802bf3	2018-12-03 09:56:25 +0000	[diff] [blame]	865	/* Indicate one or more cpus over-utilized (tipping point) */
				866	int overutilized;
				867
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	868	/*
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	869	* The bit corresponding to a CPU gets set here if such CPU has more
				870	* than one runnable -deadline task (as it is below for RT tasks).
				871	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	872	cpumask_var_t dlo_mask;
				873	atomic_t dlo_count;
				874	struct dl_bw dl_bw;
				875	struct cpudl cpudl;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	876
Peng Liu	2676242	2020-10-08 23:48:46 +0800	[diff] [blame]	877	/*
				878	* Indicate whether a root_domain's dl_bw has been checked or
				879	* updated. It's a monotonically increasing value.
				880	*
				881	* Corner cases such as 'wrap around' would be dangerous, but given
				882	* that u64 is 'big enough', that shouldn't be a concern.
				883	*/
				884	u64 visit_gen;
				885
Steven Rostedt (Red Hat)	4bdced5	2017-10-06 14:05:04 -0400	[diff] [blame]	886	#ifdef HAVE_RT_PUSH_IPI
				887	/*
				888	* For IPI pull requests, loop across the rto_mask.
				889	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	890	struct irq_work rto_push_work;
				891	raw_spinlock_t rto_lock;
Steven Rostedt (Red Hat)	4bdced5	2017-10-06 14:05:04 -0400	[diff] [blame]	892	/* These are only updated and read within rto_lock */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	893	int rto_loop;
				894	int rto_cpu;
Steven Rostedt (Red Hat)	4bdced5	2017-10-06 14:05:04 -0400	[diff] [blame]	895	/* These atomics are updated outside of a lock */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	896	atomic_t rto_loop_next;
				897	atomic_t rto_loop_start;
Steven Rostedt (Red Hat)	4bdced5	2017-10-06 14:05:04 -0400	[diff] [blame]	898	#endif
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	899	/*
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	900	* The "RT overload" flag: it gets set if a CPU has more than
				901	* one runnable RT task.
				902	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	903	cpumask_var_t rto_mask;
				904	struct cpupri cpupri;
Dietmar Eggemann	cd92bfd	2016-08-01 19:53:35 +0100	[diff] [blame]	905
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	906	unsigned long max_cpu_capacity;
Quentin Perret	6aa140f	2018-12-03 09:56:18 +0000	[diff] [blame]	907
				908	/*
				909	* NULL-terminated list of performance domains intersecting with the
				910	* CPUs of the rd. Protected by RCU.
				911	*/
Joel Fernandes (Google)	7ba7319	2019-03-20 20:34:26 -0400	[diff] [blame]	912	struct perf_domain __rcu *pd;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	913	};
				914
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	915	extern void init_defrootdomain(void);
Peter Zijlstra	8d5dc51	2017-04-25 15:29:40 +0200	[diff] [blame]	916	extern int sched_init_domains(const struct cpumask *cpu_map);
					/* Both arguments are pointers, matching sched_get_rd()/sched_put_rd() below. */
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	917	extern void rq_attach_root(struct rq *rq, struct root_domain *rd);
Steven Rostedt (VMware)	364f566	2018-01-23 20:45:38 -0500	[diff] [blame]	918	extern void sched_get_rd(struct root_domain *rd);
				919	extern void sched_put_rd(struct root_domain *rd);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	920
Steven Rostedt (Red Hat)	4bdced5	2017-10-06 14:05:04 -0400	[diff] [blame]	921	#ifdef HAVE_RT_PUSH_IPI
					/* Only declared when HAVE_RT_PUSH_IPI is defined. */
				922	extern void rto_push_irq_work_func(struct irq_work *work);
				923	#endif
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	924	#endif /* CONFIG_SMP */
				925
Patrick Bellasi	69842cb	2019-06-21 09:42:02 +0100	[diff] [blame]	926	#ifdef CONFIG_UCLAMP_TASK
				927	/*
				928	* struct uclamp_bucket - Utilization clamp bucket
				929	* @value: utilization clamp value for tasks on this clamp bucket
				930	* @tasks: number of RUNNABLE tasks on this clamp bucket
				931	*
				932	* Keep track of how many tasks are RUNNABLE for a given utilization
				933	* clamp value.
					*
					* The two bitfield widths add up to BITS_PER_LONG: @value takes
					* bits_per(SCHED_CAPACITY_SCALE) bits and @tasks takes the remainder.
				934	*/
				935	struct uclamp_bucket {
				936	unsigned long value : bits_per(SCHED_CAPACITY_SCALE);
				937	unsigned long tasks : BITS_PER_LONG - bits_per(SCHED_CAPACITY_SCALE);
				938	};
				939
				940	/*
				941	* struct uclamp_rq - rq's utilization clamp
				942	* @value: currently active clamp values for a rq
				943	* @bucket: utilization clamp buckets affecting a rq
				944	*
				945	* Keep track of RUNNABLE tasks on a rq to aggregate their clamp values.
				946	* A clamp value is affecting a rq when there is at least one task RUNNABLE
				947	* (or actually running) with that value.
				948	*
				949	* There are up to UCLAMP_CNT possible different clamp values, currently there
				950	* are only two: minimum utilization and maximum utilization.
				951	*
				952	* All utilization clamping values are MAX aggregated, since:
				953	* - for util_min: we want to run the CPU at least at the max of the minimum
				954	* utilization required by its currently RUNNABLE tasks.
				955	* - for util_max: we want to allow the CPU to run up to the max of the
				956	* maximum utilization allowed by its currently RUNNABLE tasks.
				957	*
				958	* Since on each system we expect only a limited number of different
				959	* utilization clamp values (UCLAMP_BUCKETS), use a simple array to track
				960	* the metrics required to compute all the per-rq utilization clamp values.
				961	*/
				962	struct uclamp_rq {
				963	unsigned int value;
				964	struct uclamp_bucket bucket[UCLAMP_BUCKETS];
				965	};
Qais Yousef	46609ce	2020-06-30 12:21:23 +0100	[diff] [blame]	966
				967	DECLARE_STATIC_KEY_FALSE(sched_uclamp_used);
Patrick Bellasi	69842cb	2019-06-21 09:42:02 +0100	[diff] [blame]	968	#endif /* CONFIG_UCLAMP_TASK */
				969
Kees Cook	8e5bad7	2022-10-07 17:07:58 -0700	[diff] [blame]	970	struct rq;
					/*
					* Node of a singly linked callback list (chained through @next).
					* @func is a function pointer taking the runqueue by pointer; struct rq
					* is only forward-declared here.
					*/
				971	struct balance_callback {
				972	struct balance_callback *next;
				973	void (*func)(struct rq *rq);
				974	};
				975
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	976	/*
				977	* This is the main, per-CPU runqueue data structure.
				978	*
				979	* Locking rule: those places that want to lock multiple runqueues
				980	* (such as the load balancing or the thread migration code), lock
				981	* acquire operations must be ordered by ascending &runqueue.
				982	*/
				983	struct rq {
				984	/* runqueue lock: */
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	985	raw_spinlock_t __lock;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	986
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	987	unsigned int nr_running;
Peter Zijlstra	0ec8aa0	2013-10-07 11:29:33 +0100	[diff] [blame]	988	#ifdef CONFIG_NUMA_BALANCING
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	989	unsigned int nr_numa_running;
				990	unsigned int nr_preferred_running;
Srikar Dronamraju	a4739ec	2018-09-21 23:18:56 +0530	[diff] [blame]	991	unsigned int numa_migrate_on;
Peter Zijlstra	0ec8aa0	2013-10-07 11:29:33 +0100	[diff] [blame]	992	#endif
Frederic Weisbecker	3451d02	2011-08-10 23:21:01 +0200	[diff] [blame]	993	#ifdef CONFIG_NO_HZ_COMMON
Frederic Weisbecker	9fd81dd	2016-04-19 17:36:51 +0200	[diff] [blame]	994	#ifdef CONFIG_SMP
Peter Zijlstra	e022e0d	2017-12-21 11:20:23 +0100	[diff] [blame]	995	unsigned long last_blocked_load_update_tick;
Vincent Guittot	f643ea2	2018-02-13 11:31:17 +0100	[diff] [blame]	996	unsigned int has_blocked_load;
Peter Zijlstra (Intel)	90b5363	2020-03-27 11:44:56 +0100	[diff] [blame]	997	call_single_data_t nohz_csd;
Frederic Weisbecker	9fd81dd	2016-04-19 17:36:51 +0200	[diff] [blame]	998	#endif /* CONFIG_SMP */
Peter Zijlstra	00357f5	2017-12-21 15:06:50 +0100	[diff] [blame]	999	unsigned int nohz_tick_stopped;
Peter Zijlstra (Intel)	90b5363	2020-03-27 11:44:56 +0100	[diff] [blame]	1000	atomic_t nohz_flags;
Frederic Weisbecker	9fd81dd	2016-04-19 17:36:51 +0200	[diff] [blame]	1001	#endif /* CONFIG_NO_HZ_COMMON */
Frederic Weisbecker	dcdedb2	2018-02-21 05:17:28 +0100	[diff] [blame]	1002
Peter Zijlstra	126c209	2020-05-26 18:11:03 +0200	[diff] [blame]	1003	#ifdef CONFIG_SMP
				1004	unsigned int ttwu_pending;
				1005	#endif
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1006	u64 nr_switches;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1007
Patrick Bellasi	69842cb	2019-06-21 09:42:02 +0100	[diff] [blame]	1008	#ifdef CONFIG_UCLAMP_TASK
				1009	/* Utilization clamp values based on CPU's RUNNABLE tasks */
				1010	struct uclamp_rq uclamp[UCLAMP_CNT] ____cacheline_aligned;
Patrick Bellasi	e496187	2019-06-21 09:42:04 +0100	[diff] [blame]	1011	unsigned int uclamp_flags;
				1012	#define UCLAMP_FLAG_IDLE 0x01
Patrick Bellasi	69842cb	2019-06-21 09:42:02 +0100	[diff] [blame]	1013	#endif
				1014
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1015	struct cfs_rq cfs;
				1016	struct rt_rq rt;
				1017	struct dl_rq dl;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1018
				1019	#ifdef CONFIG_FAIR_GROUP_SCHED
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1020	/* list of leaf cfs_rq on this CPU: */
				1021	struct list_head leaf_cfs_rq_list;
				1022	struct list_head *tmp_alone_branch;
Peter Zijlstra	a35b646	2012-08-08 21:46:40 +0200	[diff] [blame]	1023	#endif /* CONFIG_FAIR_GROUP_SCHED */
				1024
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1025	/*
				1026	* This is part of a global counter where only the total sum
				1027	* over all CPUs matters. A task can increase this counter on
				1028	* one CPU and if it got migrated afterwards it may decrease
				1029	* it on another CPU. Always updated under the runqueue lock:
				1030	*/
Alexey Dobriyan	e6fe3f4	2021-04-22 23:02:28 +0300	[diff] [blame]	1031	unsigned int nr_uninterruptible;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1032
Madhuparna Bhowmik	4104a56	2020-02-01 18:28:03 +0530	[diff] [blame]	1033	struct task_struct __rcu *curr;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1034	struct task_struct *idle;
				1035	struct task_struct *stop;
				1036	unsigned long next_balance;
				1037	struct mm_struct *prev_mm;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1038
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1039	unsigned int clock_update_flags;
				1040	u64 clock;
Vincent Guittot	2312729	2019-01-23 16:26:53 +0100	[diff] [blame]	1041	/* Ensure that all clocks are in the same cache line */
				1042	u64 clock_task ____cacheline_aligned;
				1043	u64 clock_pelt;
				1044	unsigned long lost_idle_time;
Vincent Donnefort	e2f3e35	2022-06-21 10:04:09 +0100	[diff] [blame]	1045	u64 clock_pelt_idle;
				1046	u64 clock_idle;
				1047	#ifndef CONFIG_64BIT
				1048	u64 clock_pelt_idle_copy;
				1049	u64 clock_idle_copy;
				1050	#endif
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1051
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1052	atomic_t nr_iowait;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1053
Paul Turner	c006fac	2021-04-16 14:29:36 -0700	[diff] [blame]	1054	#ifdef CONFIG_SCHED_DEBUG
				1055	u64 last_seen_need_resched_ns;
				1056	int ticks_without_resched;
				1057	#endif
				1058
Mathieu Desnoyers	227a4aa	2019-09-19 13:37:02 -0400	[diff] [blame]	1059	#ifdef CONFIG_MEMBARRIER
				1060	int membarrier_state;
				1061	#endif
				1062
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1063	#ifdef CONFIG_SMP
Joel Fernandes (Google)	994aeb7	2019-03-20 20:34:24 -0400	[diff] [blame]	1064	struct root_domain *rd;
				1065	struct sched_domain __rcu *sd;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1066
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1067	unsigned long cpu_capacity;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1068
Kees Cook	8e5bad7	2022-10-07 17:07:58 -0700	[diff] [blame]	1069	struct balance_callback *balance_callback;
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	1070
Peter Zijlstra	19a1f5e	2020-05-26 18:10:58 +0200	[diff] [blame]	1071	unsigned char nohz_idle_balance;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1072	unsigned char idle_balance;
				1073
Morten Rasmussen	3b1baa6	2018-07-04 11:17:40 +0100	[diff] [blame]	1074	unsigned long misfit_task_load;
				1075
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1076	/* For active balancing */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1077	int active_balance;
				1078	int push_cpu;
				1079	struct cpu_stop_work active_balance_work;
				1080
				1081	/* CPU of this runqueue: */
				1082	int cpu;
				1083	int online;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1084
Peter Zijlstra	367456c	2012-02-20 21:49:09 +0100	[diff] [blame]	1085	struct list_head cfs_tasks;
				1086
Vincent Guittot	371bf42	2018-06-28 17:45:05 +0200	[diff] [blame]	1087	struct sched_avg avg_rt;
Vincent Guittot	3727e0e	2018-06-28 17:45:07 +0200	[diff] [blame]	1088	struct sched_avg avg_dl;
Vincent Guittot	11d4afd	2018-09-25 11:17:42 +0200	[diff] [blame]	1089	#ifdef CONFIG_HAVE_SCHED_AVG_IRQ
Vincent Guittot	91c2749	2018-06-28 17:45:09 +0200	[diff] [blame]	1090	struct sched_avg avg_irq;
				1091	#endif
Thara Gopinath	7650479	2020-02-21 19:52:05 -0500	[diff] [blame]	1092	#ifdef CONFIG_SCHED_THERMAL_PRESSURE
				1093	struct sched_avg avg_thermal;
				1094	#endif
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1095	u64 idle_stamp;
				1096	u64 avg_idle;
Jason Low	9bd721c	2013-09-13 11:26:52 -0700	[diff] [blame]	1097
				1098	/* This is used to determine avg_idle's max value */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1099	u64 max_idle_balance_cost;
Thomas Gleixner	f2469a1	2020-09-14 14:47:28 +0200	[diff] [blame]	1100
				1101	#ifdef CONFIG_HOTPLUG_CPU
				1102	struct rcuwait hotplug_wait;
				1103	#endif
Peter Zijlstra (Intel)	90b5363	2020-03-27 11:44:56 +0100	[diff] [blame]	1104	#endif /* CONFIG_SMP */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1105
				1106	#ifdef CONFIG_IRQ_TIME_ACCOUNTING
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1107	u64 prev_irq_time;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1108	#endif
				1109	#ifdef CONFIG_PARAVIRT
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1110	u64 prev_steal_time;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1111	#endif
				1112	#ifdef CONFIG_PARAVIRT_TIME_ACCOUNTING
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1113	u64 prev_steal_time_rq;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1114	#endif
				1115
				1116	/* calc_load related fields */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1117	unsigned long calc_load_update;
				1118	long calc_load_active;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1119
				1120	#ifdef CONFIG_SCHED_HRTICK
				1121	#ifdef CONFIG_SMP
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1122	call_single_data_t hrtick_csd;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1123	#endif
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1124	struct hrtimer hrtick_timer;
Juri Lelli	156ec6f	2021-02-08 08:35:53 +0100	[diff] [blame]	1125	ktime_t hrtick_time;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1126	#endif
				1127
				1128	#ifdef CONFIG_SCHEDSTATS
				1129	/* latency stats */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1130	struct sched_info rq_sched_info;
				1131	unsigned long long rq_cpu_time;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1132	/* could above be rq->cfs_rq.exec_clock + rq->rt_rq.rt_runtime ? */
				1133
				1134	/* sys_sched_yield() stats */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1135	unsigned int yld_count;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1136
				1137	/* schedule() stats */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1138	unsigned int sched_count;
				1139	unsigned int sched_goidle;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1140
				1141	/* try_to_wake_up() stats */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1142	unsigned int ttwu_count;
				1143	unsigned int ttwu_local;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1144	#endif
				1145
Daniel Lezcano	442bf3a	2014-09-04 11:32:09 -0400	[diff] [blame]	1146	#ifdef CONFIG_CPU_IDLE
				1147	/* Must be inspected within a rcu lock section */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1148	struct cpuidle_state *idle_state;
Daniel Lezcano	442bf3a	2014-09-04 11:32:09 -0400	[diff] [blame]	1149	#endif
Thomas Gleixner	3015ef4	2020-08-26 14:08:10 +0200	[diff] [blame]	1150
Thomas Gleixner	74d862b6	2020-11-18 20:48:42 +0100	[diff] [blame]	1151	#ifdef CONFIG_SMP
Thomas Gleixner	3015ef4	2020-08-26 14:08:10 +0200	[diff] [blame]	1152	unsigned int nr_pinned;
				1153	#endif
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	1154	unsigned int push_busy;
				1155	struct cpu_stop_work push_work;
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1156
				1157	#ifdef CONFIG_SCHED_CORE
				1158	/* per rq */
				1159	struct rq *core;
Peter Zijlstra	539f651	2020-11-17 18:19:37 -0500	[diff] [blame]	1160	struct task_struct *core_pick;
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1161	unsigned int core_enabled;
Peter Zijlstra	539f651	2020-11-17 18:19:37 -0500	[diff] [blame]	1162	unsigned int core_sched_seq;
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1163	struct rb_root core_tree;
				1164
Peter Zijlstra	3c474b3	2021-08-19 13:09:17 +0200	[diff] [blame]	1165	/* shared state -- careful with sched_core_cpu_deactivate() */
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1166	unsigned int core_task_seq;
Peter Zijlstra	539f651	2020-11-17 18:19:37 -0500	[diff] [blame]	1167	unsigned int core_pick_seq;
				1168	unsigned long core_cookie;
Josh Don	4feee7d1	2021-10-18 13:34:28 -0700	[diff] [blame]	1169	unsigned int core_forceidle_count;
Joel Fernandes (Google)	c6047c2	2020-11-17 18:19:39 -0500	[diff] [blame]	1170	unsigned int core_forceidle_seq;
Josh Don	4feee7d1	2021-10-18 13:34:28 -0700	[diff] [blame]	1171	unsigned int core_forceidle_occupation;
				1172	u64 core_forceidle_start;
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1173	#endif
Waiman Long	da01903	2022-09-22 14:00:39 -0400	[diff] [blame]	1174
				1175	/* Scratch cpumask to be temporarily used under rq_lock */
				1176	cpumask_var_t scratch_mask;
Josh Don	8ad075c	2022-11-16 16:54:18 -0800	[diff] [blame]	1177
				1178	#if defined(CONFIG_CFS_BANDWIDTH) && defined(CONFIG_SMP)
				1179	call_single_data_t cfsb_csd;
				1180	struct list_head cfsb_csd_list;
				1181	#endif
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1182	};
				1183
Vincent Guittot	62478d9	2019-01-23 16:26:52 +0100	[diff] [blame]	1184	#ifdef CONFIG_FAIR_GROUP_SCHED
				1185
				1186	/* CPU runqueue to which this cfs_rq is attached */
				1187	static inline struct rq *rq_of(struct cfs_rq *cfs_rq)
				1188	{
				1189	return cfs_rq->rq;
				1190	}
				1191
				1192	#else
				1193
				1194	static inline struct rq *rq_of(struct cfs_rq *cfs_rq)
				1195	{
				1196	return container_of(cfs_rq, struct rq, cfs);
				1197	}
				1198	#endif
				1199
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1200	static inline int cpu_of(struct rq *rq)
				1201	{
				1202	#ifdef CONFIG_SMP
				1203	return rq->cpu;
				1204	#else
				1205	return 0;
				1206	#endif
				1207	}
				1208
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	1209	#define MDF_PUSH 0x01
				1210
				1211	static inline bool is_migration_disabled(struct task_struct *p)
				1212	{
Thomas Gleixner	74d862b6	2020-11-18 20:48:42 +0100	[diff] [blame]	1213	#ifdef CONFIG_SMP
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	1214	return p->migration_disabled;
				1215	#else
				1216	return false;
				1217	#endif
				1218	}
Peter Zijlstra	1b568f0	2016-05-09 10:38:41 +0200	[diff] [blame]	1219
Lin Shengwang	e705968	2022-10-08 10:27:09 +0800	[diff] [blame]	1220	DECLARE_PER_CPU_SHARED_ALIGNED(struct rq, runqueues);
				1221
				1222	#define cpu_rq(cpu) (&per_cpu(runqueues, (cpu)))
				1223	#define this_rq() this_cpu_ptr(&runqueues)
				1224	#define task_rq(p) cpu_rq(task_cpu(p))
				1225	#define cpu_curr(cpu) (cpu_rq(cpu)->curr)
				1226	#define raw_rq() raw_cpu_ptr(&runqueues)
				1227
Aubrey Li	97886d9	2021-03-24 17:40:13 -0400	[diff] [blame]	1228	struct sched_group;
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1229	#ifdef CONFIG_SCHED_CORE
Aubrey Li	97886d9	2021-03-24 17:40:13 -0400	[diff] [blame]	1230	static inline struct cpumask *sched_group_span(struct sched_group *sg);
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1231
				1232	DECLARE_STATIC_KEY_FALSE(__sched_core_enabled);
				1233
				1234	static inline bool sched_core_enabled(struct rq *rq)
				1235	{
				1236	return static_branch_unlikely(&__sched_core_enabled) && rq->core_enabled;
				1237	}
				1238
				1239	static inline bool sched_core_disabled(void)
				1240	{
				1241	return !static_branch_unlikely(&__sched_core_enabled);
				1242	}
				1243
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1244	/*
				1245	* Be careful with this function; not for general use. The return value isn't
				1246	* stable unless you actually hold a relevant rq->__lock.
				1247	*/
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1248	static inline raw_spinlock_t *rq_lockp(struct rq *rq)
				1249	{
				1250	if (sched_core_enabled(rq))
				1251	return &rq->core->__lock;
				1252
				1253	return &rq->__lock;
				1254	}
				1255
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1256	static inline raw_spinlock_t *__rq_lockp(struct rq *rq)
				1257	{
				1258	if (rq->core_enabled)
				1259	return &rq->core->__lock;
				1260
				1261	return &rq->__lock;
				1262	}
				1263
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	1264	bool cfs_prio_less(const struct task_struct *a, const struct task_struct *b,
				1265	bool fi);
Peter Zijlstra	22dc02f	2023-07-24 21:30:54 +0200	[diff] [blame]	1266	void task_vruntime_update(struct rq *rq, struct task_struct *p, bool in_fi);
Joel Fernandes (Google)	c6047c2	2020-11-17 18:19:39 -0500	[diff] [blame]	1267
Aubrey Li	97886d9	2021-03-24 17:40:13 -0400	[diff] [blame]	1268	/*
				1269	* Helpers to check if the CPU's core cookie matches with the task's cookie
				1270	* when core scheduling is enabled.
				1271	* A special case is that the task's cookie always matches with CPU's core
				1272	* cookie if the CPU is in an idle core.
				1273	*/
				1274	static inline bool sched_cpu_cookie_match(struct rq *rq, struct task_struct *p)
				1275	{
				1276	/* Ignore cookie match if core scheduler is not enabled on the CPU. */
				1277	if (!sched_core_enabled(rq))
				1278	return true;
				1279
				1280	return rq->core->core_cookie == p->core_cookie;
				1281	}
				1282
				1283	static inline bool sched_core_cookie_match(struct rq *rq, struct task_struct *p)
				1284	{
				1285	bool idle_core = true;
				1286	int cpu;
				1287
				1288	/* Ignore cookie match if core scheduler is not enabled on the CPU. */
				1289	if (!sched_core_enabled(rq))
				1290	return true;
				1291
				1292	for_each_cpu(cpu, cpu_smt_mask(cpu_of(rq))) {
				1293	if (!available_idle_cpu(cpu)) {
				1294	idle_core = false;
				1295	break;
				1296	}
				1297	}
				1298
				1299	/*
				1300	* A CPU in an idle core is always the best choice for tasks with
				1301	* cookies.
				1302	*/
				1303	return idle_core || rq->core->core_cookie == p->core_cookie;
				1304	}
				1305
				1306	static inline bool sched_group_cookie_match(struct rq *rq,
				1307	struct task_struct *p,
				1308	struct sched_group *group)
				1309	{
				1310	int cpu;
				1311
				1312	/* Ignore cookie match if core scheduler is not enabled on the CPU. */
				1313	if (!sched_core_enabled(rq))
				1314	return true;
				1315
				1316	for_each_cpu_and(cpu, sched_group_span(group), p->cpus_ptr) {
Lin Shengwang	e705968	2022-10-08 10:27:09 +0800	[diff] [blame]	1317	if (sched_core_cookie_match(cpu_rq(cpu), p))
Aubrey Li	97886d9	2021-03-24 17:40:13 -0400	[diff] [blame]	1318	return true;
				1319	}
				1320	return false;
				1321	}
				1322
Peter Zijlstra	6e33cad	2021-03-26 18:55:06 +0100	[diff] [blame]	1323	static inline bool sched_core_enqueued(struct task_struct *p)
				1324	{
				1325	return !RB_EMPTY_NODE(&p->core_node);
				1326	}
				1327
				1328	extern void sched_core_enqueue(struct rq *rq, struct task_struct *p);
Josh Don	4feee7d1	2021-10-18 13:34:28 -0700	[diff] [blame]	1329	extern void sched_core_dequeue(struct rq *rq, struct task_struct *p, int flags);
Peter Zijlstra	6e33cad	2021-03-26 18:55:06 +0100	[diff] [blame]	1330
				1331	extern void sched_core_get(void);
				1332	extern void sched_core_put(void);
				1333
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1334	#else /* !CONFIG_SCHED_CORE */
				1335
				1336	static inline bool sched_core_enabled(struct rq *rq)
				1337	{
				1338	return false;
				1339	}
				1340
Peter Zijlstra	d66f1b0	2021-03-02 12:16:48 +0100	[diff] [blame]	1341	static inline bool sched_core_disabled(void)
				1342	{
				1343	return true;
				1344	}
				1345
Peter Zijlstra	39d371b	2021-03-02 12:13:13 +0100	[diff] [blame]	1346	static inline raw_spinlock_t *rq_lockp(struct rq *rq)
				1347	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1348	return &rq->__lock;
Peter Zijlstra	39d371b	2021-03-02 12:13:13 +0100	[diff] [blame]	1349	}
				1350
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1351	static inline raw_spinlock_t *__rq_lockp(struct rq *rq)
				1352	{
				1353	return &rq->__lock;
				1354	}
				1355
Aubrey Li	97886d9	2021-03-24 17:40:13 -0400	[diff] [blame]	1356	static inline bool sched_cpu_cookie_match(struct rq *rq, struct task_struct *p)
				1357	{
				1358	return true;
				1359	}
				1360
				1361	static inline bool sched_core_cookie_match(struct rq *rq, struct task_struct *p)
				1362	{
				1363	return true;
				1364	}
				1365
				1366	static inline bool sched_group_cookie_match(struct rq *rq,
				1367	struct task_struct *p,
				1368	struct sched_group *group)
				1369	{
				1370	return true;
				1371	}
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	1372	#endif /* CONFIG_SCHED_CORE */
				1373
Peter Zijlstra	39d371b	2021-03-02 12:13:13 +0100	[diff] [blame]	1374	static inline void lockdep_assert_rq_held(struct rq *rq)
				1375	{
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1376	lockdep_assert_held(__rq_lockp(rq));
Peter Zijlstra	39d371b	2021-03-02 12:13:13 +0100	[diff] [blame]	1377	}
				1378
				1379	extern void raw_spin_rq_lock_nested(struct rq *rq, int subclass);
				1380	extern bool raw_spin_rq_trylock(struct rq *rq);
				1381	extern void raw_spin_rq_unlock(struct rq *rq);
				1382
				1383	static inline void raw_spin_rq_lock(struct rq *rq)
				1384	{
				1385	raw_spin_rq_lock_nested(rq, 0);
				1386	}
				1387
				1388	static inline void raw_spin_rq_lock_irq(struct rq *rq)
				1389	{
				1390	local_irq_disable();
				1391	raw_spin_rq_lock(rq);
				1392	}
				1393
				1394	static inline void raw_spin_rq_unlock_irq(struct rq *rq)
				1395	{
				1396	raw_spin_rq_unlock(rq);
				1397	local_irq_enable();
				1398	}
				1399
				1400	static inline unsigned long _raw_spin_rq_lock_irqsave(struct rq *rq)
				1401	{
				1402	unsigned long flags;
				1403	local_irq_save(flags);
				1404	raw_spin_rq_lock(rq);
				1405	return flags;
				1406	}
				1407
				1408	static inline void raw_spin_rq_unlock_irqrestore(struct rq *rq, unsigned long flags)
				1409	{
				1410	raw_spin_rq_unlock(rq);
				1411	local_irq_restore(flags);
				1412	}
				1413
				1414	#define raw_spin_rq_lock_irqsave(rq, flags) \
				1415	do { \
				1416	flags = _raw_spin_rq_lock_irqsave(rq); \
				1417	} while (0)
				1418
Peter Zijlstra	1b568f0	2016-05-09 10:38:41 +0200	[diff] [blame]	1419	#ifdef CONFIG_SCHED_SMT
Peter Zijlstra	1b568f0	2016-05-09 10:38:41 +0200	[diff] [blame]	1420	extern void __update_idle_core(struct rq *rq);
				1421
				1422	static inline void update_idle_core(struct rq *rq)
				1423	{
				1424	if (static_branch_unlikely(&sched_smt_present))
				1425	__update_idle_core(rq);
				1426	}
				1427
				1428	#else
				1429	static inline void update_idle_core(struct rq *rq) { }
				1430	#endif
				1431
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1432	#ifdef CONFIG_FAIR_GROUP_SCHED
				1433	static inline struct task_struct *task_of(struct sched_entity *se)
				1434	{
				1435	SCHED_WARN_ON(!entity_is_task(se));
				1436	return container_of(se, struct task_struct, se);
				1437	}
				1438
				1439	static inline struct cfs_rq *task_cfs_rq(struct task_struct *p)
				1440	{
				1441	return p->se.cfs_rq;
				1442	}
				1443
				1444	/* runqueue on which this entity is (to be) queued */
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	1445	static inline struct cfs_rq *cfs_rq_of(const struct sched_entity *se)
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1446	{
				1447	return se->cfs_rq;
				1448	}
				1449
				1450	/* runqueue "owned" by this group */
				1451	static inline struct cfs_rq *group_cfs_rq(struct sched_entity *grp)
				1452	{
				1453	return grp->my_q;
				1454	}
				1455
				1456	#else
				1457
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	1458	#define task_of(_se) container_of(_se, struct task_struct, se)
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1459
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	1460	static inline struct cfs_rq *task_cfs_rq(const struct task_struct *p)
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1461	{
				1462	return &task_rq(p)->cfs;
				1463	}
				1464
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	1465	static inline struct cfs_rq *cfs_rq_of(const struct sched_entity *se)
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1466	{
Matthew Wilcox (Oracle)	904cbab	2022-12-12 14:49:46 +0000	[diff] [blame]	1467	const struct task_struct *p = task_of(se);
Peter Zijlstra	8a311c7	2020-11-17 18:19:36 -0500	[diff] [blame]	1468	struct rq *rq = task_rq(p);
				1469
				1470	return &rq->cfs;
				1471	}
				1472
				1473	/* runqueue "owned" by this group */
				1474	static inline struct cfs_rq *group_cfs_rq(struct sched_entity *grp)
				1475	{
				1476	return NULL;
				1477	}
				1478	#endif
				1479
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1480	extern void update_rq_clock(struct rq *rq);
				1481
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1482	/*
				1483	* rq::clock_update_flags bits
				1484	*
				1485	* %RQCF_REQ_SKIP - will request skipping of clock update on the next
				1486	* call to __schedule(). This is an optimisation to avoid
				1487	* neighbouring rq clock updates.
				1488	*
				1489	* %RQCF_ACT_SKIP - is set from inside of __schedule() when skipping is
				1490	* in effect and calls to update_rq_clock() are being ignored.
				1491	*
				1492	* %RQCF_UPDATED - is a debug flag that indicates whether a call has been
				1493	* made to update_rq_clock() since the last time rq::lock was pinned.
				1494	*
				1495	* If inside of __schedule(), clock_update_flags will have been
				1496	* shifted left (a left shift is a cheap operation for the fast path
				1497	* to promote %RQCF_REQ_SKIP to %RQCF_ACT_SKIP), so you must use,
				1498	*
				1499	* if (rq->clock_update_flags >= RQCF_UPDATED)
				1500	*
Ingo Molnar	3b03706	2021-03-18 13:38:50 +0100	[diff] [blame]	1501	* to check if %RQCF_UPDATED is set. It'll never be shifted more than
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1502	* one position though, because the next rq_unpin_lock() will shift it
				1503	* back.
				1504	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1505	#define RQCF_REQ_SKIP 0x01
				1506	#define RQCF_ACT_SKIP 0x02
				1507	#define RQCF_UPDATED 0x04
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1508
				1509	static inline void assert_clock_updated(struct rq *rq)
				1510	{
				1511	/*
				1512	* The only reason for not seeing a clock update since the
				1513	* last rq_pin_lock() is if we're currently skipping updates.
				1514	*/
				1515	SCHED_WARN_ON(rq->clock_update_flags < RQCF_ACT_SKIP);
				1516	}
				1517
Frederic Weisbecker	78becc2	2013-04-12 01:51:02 +0200	[diff] [blame]	1518	static inline u64 rq_clock(struct rq *rq)
				1519	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1520	lockdep_assert_rq_held(rq);
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1521	assert_clock_updated(rq);
				1522
Frederic Weisbecker	78becc2	2013-04-12 01:51:02 +0200	[diff] [blame]	1523	return rq->clock;
				1524	}
				1525
				1526	static inline u64 rq_clock_task(struct rq *rq)
				1527	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1528	lockdep_assert_rq_held(rq);
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1529	assert_clock_updated(rq);
				1530
Frederic Weisbecker	78becc2	2013-04-12 01:51:02 +0200	[diff] [blame]	1531	return rq->clock_task;
				1532	}
				1533
Thara Gopinath	05289b9	2020-02-21 19:52:13 -0500	[diff] [blame]	1534	/**
				1535	* By default the decay is the default pelt decay period.
				1536	* The decay shift can change the decay period in
				1537	* multiples of 32.
				1538	* Decay shift Decay period(ms)
				1539	* 0 32
				1540	* 1 64
				1541	* 2 128
				1542	* 3 256
				1543	* 4 512
				1544	*/
				1545	extern int sched_thermal_decay_shift;
				1546
				1547	static inline u64 rq_clock_thermal(struct rq *rq)
				1548	{
				1549	return rq_clock_task(rq) >> sched_thermal_decay_shift;
				1550	}
				1551
Davidlohr Bueso	adcc8da	2018-04-04 09:15:39 -0700	[diff] [blame]	1552	static inline void rq_clock_skip_update(struct rq *rq)
Peter Zijlstra	9edfbfe	2015-01-05 11:18:11 +0100	[diff] [blame]	1553	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1554	lockdep_assert_rq_held(rq);
Davidlohr Bueso	adcc8da	2018-04-04 09:15:39 -0700	[diff] [blame]	1555	rq->clock_update_flags |= RQCF_REQ_SKIP;
				1556	}
				1557
				1558	/*
Davidlohr Bueso	595058b	2018-05-30 15:49:40 -0700	[diff] [blame]	1559	* See rt task throttling, which is the only time a skip
Ingo Molnar	3b03706	2021-03-18 13:38:50 +0100	[diff] [blame]	1560	* request is canceled.
Davidlohr Bueso	adcc8da	2018-04-04 09:15:39 -0700	[diff] [blame]	1561	*/
				1562	static inline void rq_clock_cancel_skipupdate(struct rq *rq)
				1563	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1564	lockdep_assert_rq_held(rq);
Davidlohr Bueso	adcc8da	2018-04-04 09:15:39 -0700	[diff] [blame]	1565	rq->clock_update_flags &= ~RQCF_REQ_SKIP;
Peter Zijlstra	9edfbfe	2015-01-05 11:18:11 +0100	[diff] [blame]	1566	}
				1567
Hao Jia	ebb83d8	2023-06-13 16:20:11 +0800	[diff] [blame]	1568	/*
				1569	* During cpu offlining and rq wide unthrottling, we can trigger
				1570	* an update_rq_clock() for several cfs and rt runqueues (Typically
				1571	* when using list_for_each_entry_*)
				1572	* rq_clock_start_loop_update() can be called after updating the clock
				1573	* once and before iterating over the list to prevent multiple updates.
				1574	* After the iterative traversal, we need to call rq_clock_stop_loop_update()
				1575	* to clear RQCF_ACT_SKIP of rq->clock_update_flags.
				1576	*/
				1577	static inline void rq_clock_start_loop_update(struct rq *rq)
				1578	{
				1579	lockdep_assert_rq_held(rq);
				1580	SCHED_WARN_ON(rq->clock_update_flags & RQCF_ACT_SKIP);
				1581	rq->clock_update_flags |= RQCF_ACT_SKIP;
				1582	}
				1583
				1584	static inline void rq_clock_stop_loop_update(struct rq *rq)
				1585	{
				1586	lockdep_assert_rq_held(rq);
				1587	rq->clock_update_flags &= ~RQCF_ACT_SKIP;
				1588	}
				1589
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1590	struct rq_flags {
				1591	unsigned long flags;
				1592	struct pin_cookie cookie;
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1593	#ifdef CONFIG_SCHED_DEBUG
				1594	/*
				1595	* A copy of (rq::clock_update_flags & RQCF_UPDATED) for the
				1596	* current pin context is stashed here in case it needs to be
				1597	* restored in rq_repin_lock().
				1598	*/
				1599	unsigned int clock_update_flags;
				1600	#endif
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1601	};
				1602
Kees Cook	8e5bad7	2022-10-07 17:07:58 -0700	[diff] [blame]	1603	extern struct balance_callback balance_push_callback;
Peter Zijlstra	ae79270	2020-12-10 17:14:08 +0100	[diff] [blame]	1604
Peter Zijlstra	58877d3	2020-07-02 14:52:11 +0200	[diff] [blame]	1605	/*
				1606	* Lockdep annotation that avoids accidental unlocks; it's like a
				1607	* sticky/continuous lockdep_assert_held().
				1608	*
				1609	* This avoids code that has access to 'struct rq *rq' (basically everything in
				1610	* the scheduler) from accidentally unlocking the rq if they do not also have a
				1611	* copy of the (on-stack) 'struct rq_flags rf'.
				1612	*
				1613	* Also see Documentation/locking/lockdep-design.rst.
				1614	*/
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1615	static inline void rq_pin_lock(struct rq *rq, struct rq_flags *rf)
				1616	{
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1617	rf->cookie = lockdep_pin_lock(__rq_lockp(rq));
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1618
				1619	#ifdef CONFIG_SCHED_DEBUG
				1620	rq->clock_update_flags &= (RQCF_REQ_SKIP|RQCF_ACT_SKIP);
				1621	rf->clock_update_flags = 0;
Peter Zijlstra	565790d2	2020-05-11 14:13:00 +0200	[diff] [blame]	1622	#ifdef CONFIG_SMP
Peter Zijlstra	ae79270	2020-12-10 17:14:08 +0100	[diff] [blame]	1623	SCHED_WARN_ON(rq->balance_callback && rq->balance_callback != &balance_push_callback);
				1624	#endif
Peter Zijlstra	565790d2	2020-05-11 14:13:00 +0200	[diff] [blame]	1625	#endif
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1626	}
				1627
				1628	static inline void rq_unpin_lock(struct rq *rq, struct rq_flags *rf)
				1629	{
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1630	#ifdef CONFIG_SCHED_DEBUG
				1631	if (rq->clock_update_flags > RQCF_ACT_SKIP)
				1632	rf->clock_update_flags = RQCF_UPDATED;
				1633	#endif
				1634
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1635	lockdep_unpin_lock(__rq_lockp(rq), rf->cookie);
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1636	}
				1637
				1638	static inline void rq_repin_lock(struct rq *rq, struct rq_flags *rf)
				1639	{
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	1640	lockdep_repin_lock(__rq_lockp(rq), rf->cookie);
Matt Fleming	cb42c9a	2016-09-21 14:38:13 +0100	[diff] [blame]	1641
				1642	#ifdef CONFIG_SCHED_DEBUG
				1643	/*
				1644	* Restore the value we stashed in @rf for this pin context.
				1645	*/
				1646	rq->clock_update_flags |= rf->clock_update_flags;
				1647	#endif
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1648	}
				1649
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1650	struct rq *__task_rq_lock(struct task_struct *p, struct rq_flags *rf)
				1651	__acquires(rq->lock);
				1652
				1653	struct rq *task_rq_lock(struct task_struct *p, struct rq_flags *rf)
				1654	__acquires(p->pi_lock)
				1655	__acquires(rq->lock);
				1656
				1657	static inline void __task_rq_unlock(struct rq *rq, struct rq_flags *rf)
				1658	__releases(rq->lock)
				1659	{
				1660	rq_unpin_lock(rq, rf);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1661	raw_spin_rq_unlock(rq);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1662	}
				1663
				1664	static inline void
				1665	task_rq_unlock(struct rq *rq, struct task_struct *p, struct rq_flags *rf)
				1666	__releases(rq->lock)
				1667	__releases(p->pi_lock)
				1668	{
				1669	rq_unpin_lock(rq, rf);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1670	raw_spin_rq_unlock(rq);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1671	raw_spin_unlock_irqrestore(&p->pi_lock, rf->flags);
				1672	}
				1673
Peter Zijlstra	94b548a	2023-06-09 20:52:55 +0200	[diff] [blame]	1674	DEFINE_LOCK_GUARD_1(task_rq_lock, struct task_struct,
				1675	_T->rq = task_rq_lock(_T->lock, &_T->rf),
				1676	task_rq_unlock(_T->rq, _T->lock, &_T->rf),
				1677	struct rq *rq; struct rq_flags rf)
				1678
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1679	static inline void
				1680	rq_lock_irqsave(struct rq *rq, struct rq_flags *rf)
				1681	__acquires(rq->lock)
				1682	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1683	raw_spin_rq_lock_irqsave(rq, rf->flags);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1684	rq_pin_lock(rq, rf);
				1685	}
				1686
				1687	static inline void
				1688	rq_lock_irq(struct rq *rq, struct rq_flags *rf)
				1689	__acquires(rq->lock)
				1690	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1691	raw_spin_rq_lock_irq(rq);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1692	rq_pin_lock(rq, rf);
				1693	}
				1694
				1695	static inline void
				1696	rq_lock(struct rq *rq, struct rq_flags *rf)
				1697	__acquires(rq->lock)
				1698	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1699	raw_spin_rq_lock(rq);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1700	rq_pin_lock(rq, rf);
				1701	}
				1702
				1703	static inline void
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1704	rq_unlock_irqrestore(struct rq *rq, struct rq_flags *rf)
				1705	__releases(rq->lock)
				1706	{
				1707	rq_unpin_lock(rq, rf);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1708	raw_spin_rq_unlock_irqrestore(rq, rf->flags);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1709	}
				1710
				1711	static inline void
				1712	rq_unlock_irq(struct rq *rq, struct rq_flags *rf)
				1713	__releases(rq->lock)
				1714	{
				1715	rq_unpin_lock(rq, rf);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1716	raw_spin_rq_unlock_irq(rq);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1717	}
				1718
				1719	static inline void
				1720	rq_unlock(struct rq *rq, struct rq_flags *rf)
				1721	__releases(rq->lock)
				1722	{
				1723	rq_unpin_lock(rq, rf);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1724	raw_spin_rq_unlock(rq);
Johannes Weiner	1f351d7	2018-10-26 15:06:19 -0700	[diff] [blame]	1725	}
				1726
Peter Zijlstra	4eb054f	2023-08-01 22:41:25 +0200	[diff] [blame]	1727	DEFINE_LOCK_GUARD_1(rq_lock, struct rq,
				1728	rq_lock(_T->lock, &_T->rf),
				1729	rq_unlock(_T->lock, &_T->rf),
				1730	struct rq_flags rf)
				1731
				1732	DEFINE_LOCK_GUARD_1(rq_lock_irq, struct rq,
				1733	rq_lock_irq(_T->lock, &_T->rf),
				1734	rq_unlock_irq(_T->lock, &_T->rf),
				1735	struct rq_flags rf)
				1736
				1737	DEFINE_LOCK_GUARD_1(rq_lock_irqsave, struct rq,
				1738	rq_lock_irqsave(_T->lock, &_T->rf),
				1739	rq_unlock_irqrestore(_T->lock, &_T->rf),
				1740	struct rq_flags rf)
				1741
Johannes Weiner	246b3b3	2018-10-26 15:06:23 -0700	[diff] [blame]	1742	static inline struct rq *
				1743	this_rq_lock_irq(struct rq_flags *rf)
				1744	__acquires(rq->lock)
				1745	{
				1746	struct rq *rq;
				1747
				1748	local_irq_disable();
				1749	rq = this_rq();
				1750	rq_lock(rq, rf);
				1751	return rq;
				1752	}
				1753
Rik van Riel	9942f79	2014-10-17 03:29:49 -0400	[diff] [blame]	1754	#ifdef CONFIG_NUMA
Rik van Riel	e3fe70b	2014-10-17 03:29:50 -0400	[diff] [blame]	1755	enum numa_topology_type {
				1756	NUMA_DIRECT,
				1757	NUMA_GLUELESS_MESH,
				1758	NUMA_BACKPLANE,
				1759	};
				1760	extern enum numa_topology_type sched_numa_topology_type;
Rik van Riel	9942f79	2014-10-17 03:29:49 -0400	[diff] [blame]	1761	extern int sched_max_numa_distance;
				1762	extern bool find_numa_distance(int distance);
Huang Ying	0fb3978b	2022-02-14 20:15:52 +0800	[diff] [blame]	1763	extern void sched_init_numa(int offline_node);
				1764	extern void sched_update_numa(int cpu, bool online);
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	1765	extern void sched_domains_numa_masks_set(unsigned int cpu);
				1766	extern void sched_domains_numa_masks_clear(unsigned int cpu);
Wanpeng Li	e0e8d49	2019-06-28 16:51:41 +0800	[diff] [blame]	1767	extern int sched_numa_find_closest(const struct cpumask *cpus, int cpu);
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	1768	#else
Huang Ying	0fb3978b	2022-02-14 20:15:52 +0800	[diff] [blame]	1769	static inline void sched_init_numa(int offline_node) { }
				1770	static inline void sched_update_numa(int cpu, bool online) { }
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	1771	static inline void sched_domains_numa_masks_set(unsigned int cpu) { }
				1772	static inline void sched_domains_numa_masks_clear(unsigned int cpu) { }
Wanpeng Li	e0e8d49	2019-06-28 16:51:41 +0800	[diff] [blame]	1773	static inline int sched_numa_find_closest(const struct cpumask *cpus, int cpu)
				1774	{
				1775	return nr_cpu_ids;
				1776	}
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	1777	#endif
				1778
#ifdef CONFIG_NUMA_BALANCING
/* The regions in numa_faults array from task_struct */
enum numa_faults_stats {
	NUMA_MEM = 0,
	NUMA_CPU,
	NUMA_MEMBUF,
	NUMA_CPUBUF
};

extern void sched_setnuma(struct task_struct *p, int node);
extern int migrate_task_to(struct task_struct *p, int cpu);
/* Both tasks are passed by pointer, like the other task arguments here. */
extern int migrate_swap(struct task_struct *p, struct task_struct *t,
			int cpu, int scpu);
extern void init_numa_balancing(unsigned long clone_flags, struct task_struct *p);
#else /* !CONFIG_NUMA_BALANCING */
/* Empty stub used when NUMA balancing is not configured. */
static inline void
init_numa_balancing(unsigned long clone_flags, struct task_struct *p)
{
}
#endif /* CONFIG_NUMA_BALANCING */
				1798
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1799	#ifdef CONFIG_SMP
				1800
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	1801	static inline void
				1802	queue_balance_callback(struct rq *rq,
Kees Cook	8e5bad7	2022-10-07 17:07:58 -0700	[diff] [blame]	1803	struct balance_callback *head,
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	1804	void (func)(struct rq rq))
				1805	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	1806	lockdep_assert_rq_held(rq);
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	1807
Peter Zijlstra	04193d5	2022-06-07 22:41:55 +0200	[diff] [blame]	1808	/*
				1809	* Don't (re)queue an already queued item; nor queue anything when
				1810	* balance_push() is active, see the comment with
				1811	* balance_push_callback.
				1812	*/
Peter Zijlstra	ae79270	2020-12-10 17:14:08 +0100	[diff] [blame]	1813	if (unlikely(head->next \|\| rq->balance_callback == &balance_push_callback))
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	1814	return;
				1815
Kees Cook	8e5bad7	2022-10-07 17:07:58 -0700	[diff] [blame]	1816	head->func = func;
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	1817	head->next = rq->balance_callback;
				1818	rq->balance_callback = head;
				1819	}
				1820
/*
 * rcu_dereference_check() on @p, with "sched_domains_mutex is held" as the
 * lockdep condition.
 */
#define rcu_dereference_check_sched_domain(p)				\
	rcu_dereference_check((p), lockdep_is_held(&sched_domains_mutex))

/*
 * The domain tree (rq->sd) is protected by RCU's quiescent state transition.
 * See destroy_sched_domains: call_rcu for details.
 *
 * The domain tree of any CPU may only be accessed from within
 * preempt-disabled sections.
 *
 * Iterates @__sd from cpu_rq(@cpu)->sd along ->parent until it is NULL.
 */
#define for_each_domain(cpu, __sd)					\
	for (__sd = rcu_dereference_check_sched_domain(cpu_rq(cpu)->sd); \
	     __sd;							\
	     __sd = __sd->parent)
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1835
Ricardo Neri	40b4d3d	2023-04-06 13:31:44 -0700	[diff] [blame]	1836	/* A mask of all the SD flags that have the SDF_SHARED_CHILD metaflag */
				1837	#define SD_FLAG(name, mflags) (name * !!((mflags) & SDF_SHARED_CHILD)) \|
				1838	static const unsigned int SD_SHARED_CHILD_MASK =
				1839	#include <linux/sched/sd_flags.h>
				1840	0;
				1841	#undef SD_FLAG
				1842
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1843	/**
				1844	* highest_flag_domain - Return highest sched_domain containing flag.
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1845	* @cpu: The CPU whose highest level of sched domain is to
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1846	* be returned.
				1847	* @flag: The flag to check for the highest sched_domain
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1848	* for the given CPU.
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1849	*
Ricardo Neri	40b4d3d	2023-04-06 13:31:44 -0700	[diff] [blame]	1850	* Returns the highest sched_domain of a CPU which contains @flag. If @flag has
				1851	* the SDF_SHARED_CHILD metaflag, all the children domains also have @flag.
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1852	*/
				1853	static inline struct sched_domain *highest_flag_domain(int cpu, int flag)
				1854	{
				1855	struct sched_domain sd, hsd = NULL;
				1856
				1857	for_each_domain(cpu, sd) {
Ricardo Neri	40b4d3d	2023-04-06 13:31:44 -0700	[diff] [blame]	1858	if (sd->flags & flag) {
				1859	hsd = sd;
				1860	continue;
				1861	}
				1862
				1863	/*
				1864	* Stop the search if @flag is known to be shared at lower
				1865	* levels. It will not be found further up.
				1866	*/
				1867	if (flag & SD_SHARED_CHILD_MASK)
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1868	break;
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1869	}
				1870
				1871	return hsd;
				1872	}
				1873
Mel Gorman	fb13c7e	2013-10-07 11:29:17 +0100	[diff] [blame]	1874	static inline struct sched_domain *lowest_flag_domain(int cpu, int flag)
				1875	{
				1876	struct sched_domain *sd;
				1877
				1878	for_each_domain(cpu, sd) {
				1879	if (sd->flags & flag)
				1880	break;
				1881	}
				1882
				1883	return sd;
				1884	}
				1885
Joel Fernandes (Google)	994aeb7	2019-03-20 20:34:24 -0400	[diff] [blame]	1886	DECLARE_PER_CPU(struct sched_domain __rcu *, sd_llc);
Peter Zijlstra	7d9ffa8	2013-07-04 12:56:46 +0800	[diff] [blame]	1887	DECLARE_PER_CPU(int, sd_llc_size);
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1888	DECLARE_PER_CPU(int, sd_llc_id);
Barry Song	b95303e	2023-10-19 11:33:21 +0800	[diff] [blame]	1889	DECLARE_PER_CPU(int, sd_share_id);
Joel Fernandes (Google)	994aeb7	2019-03-20 20:34:24 -0400	[diff] [blame]	1890	DECLARE_PER_CPU(struct sched_domain_shared __rcu *, sd_llc_shared);
				1891	DECLARE_PER_CPU(struct sched_domain __rcu *, sd_numa);
				1892	DECLARE_PER_CPU(struct sched_domain __rcu *, sd_asym_packing);
				1893	DECLARE_PER_CPU(struct sched_domain __rcu *, sd_asym_cpucapacity);
Morten Rasmussen	df054e8	2018-07-04 11:17:39 +0100	[diff] [blame]	1894	extern struct static_key_false sched_asym_cpucapacity;
Barry Song	8881e16	2023-10-19 11:33:22 +0800	[diff] [blame]	1895	extern struct static_key_false sched_cluster_active;
Peter Zijlstra	518cd62	2011-12-07 15:07:31 +0100	[diff] [blame]	1896
Dietmar Eggemann	740cf8a	2022-07-29 13:13:03 +0200	[diff] [blame]	1897	static __always_inline bool sched_asym_cpucap_active(void)
				1898	{
				1899	return static_branch_unlikely(&sched_asym_cpucapacity);
				1900	}
				1901
Nicolas Pitre	63b2ca3	2014-05-26 18:19:37 -0400	[diff] [blame]	1902	struct sched_group_capacity {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1903	atomic_t ref;
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1904	/*
Yuyang Du	172895e	2016-04-05 12:12:27 +0800	[diff] [blame]	1905	* CPU capacity of this group, SCHED_CAPACITY_SCALE being max capacity
Nicolas Pitre	63b2ca3	2014-05-26 18:19:37 -0400	[diff] [blame]	1906	* for a single CPU.
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1907	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1908	unsigned long capacity;
				1909	unsigned long min_capacity; /* Min per-CPU capacity in group */
Morten Rasmussen	e3d6d0c	2018-07-04 11:17:41 +0100	[diff] [blame]	1910	unsigned long max_capacity; /* Max per-CPU capacity in group */
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1911	unsigned long next_update;
				1912	int imbalance; /* XXX unrelated to capacity but shared group state */
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1913
Peter Zijlstra	005f874	2017-04-26 17:35:35 +0200	[diff] [blame]	1914	#ifdef CONFIG_SCHED_DEBUG
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1915	int id;
Peter Zijlstra	005f874	2017-04-26 17:35:35 +0200	[diff] [blame]	1916	#endif
				1917
zhuguangqing	eba9f08	2020-10-14 22:02:20 +0800	[diff] [blame]	1918	unsigned long cpumask[]; /* Balance mask */
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1919	};
				1920
				1921	struct sched_group {
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1922	struct sched_group next; / Must be a circular list */
				1923	atomic_t ref;
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1924
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1925	unsigned int group_weight;
Tim C Chen	d24cb0d	2023-07-07 15:57:01 -0700	[diff] [blame]	1926	unsigned int cores;
Nicolas Pitre	63b2ca3	2014-05-26 18:19:37 -0400	[diff] [blame]	1927	struct sched_group_capacity *sgc;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1928	int asym_prefer_cpu; /* CPU of highest priority in group */
Ricardo Neri	16d364b	2021-09-10 18:18:15 -0700	[diff] [blame]	1929	int flags;
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1930
				1931	/*
				1932	* The CPUs this group covers.
				1933	*
				1934	* NOTE: this field is variable length. (Allocated dynamically
				1935	* by attaching extra space to the end of the structure,
				1936	* depending on how many CPUs the kernel has booted up with)
				1937	*/
Gustavo A. R. Silva	04f5c36	2020-05-07 14:21:41 -0500	[diff] [blame]	1938	unsigned long cpumask[];
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1939	};
				1940
Peter Zijlstra	ae4df9d	2017-05-01 11:03:12 +0200	[diff] [blame]	1941	static inline struct cpumask sched_group_span(struct sched_group sg)
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1942	{
				1943	return to_cpumask(sg->cpumask);
				1944	}
				1945
				1946	/*
Peter Zijlstra	e5c14b1	2017-05-01 10:47:02 +0200	[diff] [blame]	1947	* See build_balance_mask().
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1948	*/
Peter Zijlstra	e5c14b1	2017-05-01 10:47:02 +0200	[diff] [blame]	1949	static inline struct cpumask group_balance_mask(struct sched_group sg)
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1950	{
Nicolas Pitre	63b2ca3	2014-05-26 18:19:37 -0400	[diff] [blame]	1951	return to_cpumask(sg->sgc->cpumask);
Li Zefan	5e6521e	2013-03-05 16:06:23 +0800	[diff] [blame]	1952	}
				1953
extern int group_balance_cpu(struct sched_group *sg);

/* The sched-domain debug hooks are empty without CONFIG_SCHED_DEBUG. */
#ifdef CONFIG_SCHED_DEBUG
void update_sched_domain_debugfs(void);
void dirty_sched_domain_sysctl(int cpu);
#else /* !CONFIG_SCHED_DEBUG */
static inline void update_sched_domain_debugfs(void) { }
static inline void dirty_sched_domain_sysctl(int cpu) { }
#endif /* CONFIG_SCHED_DEBUG */

extern int sched_update_scaling(void);
Waiman Long	8f9ea86	2022-09-22 14:00:38 -0400	[diff] [blame]	1969
				1970	static inline const struct cpumask task_user_cpus(struct task_struct p)
				1971	{
				1972	if (!p->user_cpus_ptr)
				1973	return cpu_possible_mask; /* &init_task.cpus_mask */
				1974	return p->user_cpus_ptr;
				1975	}
Thomas Gleixner	d664e39	2022-04-13 15:31:02 +0200	[diff] [blame]	1976	#endif /* CONFIG_SMP */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1977
Peter Zijlstra	391e43d	2011-11-15 17:14:39 +0100	[diff] [blame]	1978	#include "stats.h"
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	1979
#if defined(CONFIG_SCHED_CORE) && defined(CONFIG_SCHEDSTATS)

extern void __sched_core_account_forceidle(struct rq *rq);
extern void __sched_core_tick(struct rq *rq);

/* Calls __sched_core_account_forceidle() only while schedstats are enabled. */
static inline void sched_core_account_forceidle(struct rq *rq)
{
	if (!schedstat_enabled())
		return;

	__sched_core_account_forceidle(rq);
}

/*
 * Calls __sched_core_tick() only when sched_core_enabled(@rq) and
 * schedstats are both enabled.
 */
static inline void sched_core_tick(struct rq *rq)
{
	if (!sched_core_enabled(rq) || !schedstat_enabled())
		return;

	__sched_core_tick(rq);
}

#else /* !(CONFIG_SCHED_CORE && CONFIG_SCHEDSTATS) */

static inline void sched_core_account_forceidle(struct rq *rq)
{
}

static inline void sched_core_tick(struct rq *rq)
{
}

#endif /* CONFIG_SCHED_CORE && CONFIG_SCHEDSTATS */
				2005
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2006	#ifdef CONFIG_CGROUP_SCHED
				2007
				2008	/*
				2009	* Return the group to which this tasks belongs.
				2010	*
Tejun Heo	8af01f56	2013-08-08 20:11:22 -0400	[diff] [blame]	2011	* We cannot use task_css() and friends because the cgroup subsystem
				2012	* changes that value before the cgroup_subsys::attach() method is called,
				2013	* therefore we cannot pin it and might observe the wrong value.
Peter Zijlstra	8323f26	2012-06-22 13:36:05 +0200	[diff] [blame]	2014	*
				2015	* The same is true for autogroup's p->signal->autogroup->tg, the autogroup
				2016	* core changes this before calling sched_move_task().
				2017	*
				2018	* Instead we use a 'copy' which is updated from sched_move_task() while
				2019	* holding both task_struct::pi_lock and rq::lock.
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2020	*/
				2021	static inline struct task_group task_group(struct task_struct p)
				2022	{
Peter Zijlstra	8323f26	2012-06-22 13:36:05 +0200	[diff] [blame]	2023	return p->sched_task_group;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2024	}
				2025
				2026	/* Change a task's cfs_rq and parent entity if it moves across CPUs/groups */
				2027	static inline void set_task_rq(struct task_struct *p, unsigned int cpu)
				2028	{
				2029	#if defined(CONFIG_FAIR_GROUP_SCHED) \|\| defined(CONFIG_RT_GROUP_SCHED)
				2030	struct task_group *tg = task_group(p);
				2031	#endif
				2032
				2033	#ifdef CONFIG_FAIR_GROUP_SCHED
Byungchul Park	ad936d8	2015-10-24 01:16:19 +0900	[diff] [blame]	2034	set_task_rq_fair(&p->se, p->se.cfs_rq, tg->cfs_rq[cpu]);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2035	p->se.cfs_rq = tg->cfs_rq[cpu];
				2036	p->se.parent = tg->se[cpu];
Chengming Zhou	78b6b15	2022-08-18 20:47:57 +0800	[diff] [blame]	2037	p->se.depth = tg->se[cpu] ? tg->se[cpu]->depth + 1 : 0;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2038	#endif
				2039
				2040	#ifdef CONFIG_RT_GROUP_SCHED
				2041	p->rt.rt_rq = tg->rt_rq[cpu];
				2042	p->rt.parent = tg->rt_se[cpu];
				2043	#endif
				2044	}
				2045
				2046	#else /* CONFIG_CGROUP_SCHED */
				2047
				2048	static inline void set_task_rq(struct task_struct *p, unsigned int cpu) { }
				2049	static inline struct task_group task_group(struct task_struct p)
				2050	{
				2051	return NULL;
				2052	}
				2053
				2054	#endif /* CONFIG_CGROUP_SCHED */
				2055
				2056	static inline void __set_task_cpu(struct task_struct *p, unsigned int cpu)
				2057	{
				2058	set_task_rq(p, cpu);
				2059	#ifdef CONFIG_SMP
				2060	/*
				2061	* After ->cpu is set up to a new value, task_rq_lock(p, ...) can be
Ingo Molnar	dfcb245	2018-12-03 10:05:56 +0100	[diff] [blame]	2062	* successfully executed on another CPU. We must ensure that updates of
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2063	* per-task data have been completed by this moment.
				2064	*/
				2065	smp_wmb();
Andrea Parri	c546951	2019-01-21 16:52:40 +0100	[diff] [blame]	2066	WRITE_ONCE(task_thread_info(p)->cpu, cpu);
Peter Zijlstra	ac66f54	2013-10-07 11:29:16 +0100	[diff] [blame]	2067	p->wake_cpu = cpu;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2068	#endif
				2069	}
				2070
				2071	/*
				2072	* Tunables that become constants when CONFIG_SCHED_DEBUG is off:
				2073	*/
				2074	#ifdef CONFIG_SCHED_DEBUG
				2075	# define const_debug __read_mostly
				2076	#else
				2077	# define const_debug const
				2078	#endif
				2079
/*
 * Build one __SCHED_FEAT_<name> enumerator per SCHED_FEAT() entry in
 * features.h; __SCHED_FEAT_NR follows the last of them.
 */
#define SCHED_FEAT(name, enabled)	\
	__SCHED_FEAT_##name ,

enum {
#include "features.h"
	__SCHED_FEAT_NR,
};

#undef SCHED_FEAT
				2089
Juri Lelli	a73f863	2020-10-13 07:31:14 +0200	[diff] [blame]	2090	#ifdef CONFIG_SCHED_DEBUG
Patrick Bellasi	765cc3a	2017-11-08 18:41:01 +0000	[diff] [blame]	2091
				2092	/*
				2093	* To support run-time toggling of sched features, all the translation units
				2094	* (but core.c) reference the sysctl_sched_features defined in core.c.
				2095	*/
				2096	extern const_debug unsigned int sysctl_sched_features;
				2097
Juri Lelli	a73f863	2020-10-13 07:31:14 +0200	[diff] [blame]	2098	#ifdef CONFIG_JUMP_LABEL
Peter Zijlstra	f8b6d1c	2011-07-06 14:20:14 +0200	[diff] [blame]	2099	#define SCHED_FEAT(name, enabled) \
Ingo Molnar	c5905af	2012-02-24 08:31:31 +0100	[diff] [blame]	2100	static __always_inline bool static_branch_##name(struct static_key *key) \
Peter Zijlstra	f8b6d1c	2011-07-06 14:20:14 +0200	[diff] [blame]	2101	{ \
Jason Baron	6e76ea8	2014-07-02 15:52:41 +0000	[diff] [blame]	2102	return static_key_##enabled(key); \
Peter Zijlstra	f8b6d1c	2011-07-06 14:20:14 +0200	[diff] [blame]	2103	}
				2104
				2105	#include "features.h"
Peter Zijlstra	f8b6d1c	2011-07-06 14:20:14 +0200	[diff] [blame]	2106	#undef SCHED_FEAT
				2107
Ingo Molnar	c5905af	2012-02-24 08:31:31 +0100	[diff] [blame]	2108	extern struct static_key sched_feat_keys[__SCHED_FEAT_NR];
Peter Zijlstra	f8b6d1c	2011-07-06 14:20:14 +0200	[diff] [blame]	2109	#define sched_feat(x) (static_branch_##x(&sched_feat_keys[__SCHED_FEAT_##x]))
Patrick Bellasi	765cc3a	2017-11-08 18:41:01 +0000	[diff] [blame]	2110
Juri Lelli	a73f863	2020-10-13 07:31:14 +0200	[diff] [blame]	2111	#else /* !CONFIG_JUMP_LABEL */
				2112
				2113	#define sched_feat(x) (sysctl_sched_features & (1UL << __SCHED_FEAT_##x))
				2114
				2115	#endif /* CONFIG_JUMP_LABEL */
				2116
				2117	#else /* !SCHED_DEBUG */
Patrick Bellasi	765cc3a	2017-11-08 18:41:01 +0000	[diff] [blame]	2118
				2119	/*
				2120	* Each translation unit has its own copy of sysctl_sched_features to allow
				2121	* constants propagation at compile time and compiler optimization based on
				2122	* features default.
				2123	*/
				2124	#define SCHED_FEAT(name, enabled) \
				2125	(1UL << __SCHED_FEAT_##name) * enabled \|
				2126	static const_debug __maybe_unused unsigned int sysctl_sched_features =
				2127	#include "features.h"
				2128	0;
				2129	#undef SCHED_FEAT
				2130
Peter Zijlstra	7e6f4c5	2018-08-29 11:45:21 +0200	[diff] [blame]	2131	#define sched_feat(x) !!(sysctl_sched_features & (1UL << __SCHED_FEAT_##x))
Patrick Bellasi	765cc3a	2017-11-08 18:41:01 +0000	[diff] [blame]	2132
Juri Lelli	a73f863	2020-10-13 07:31:14 +0200	[diff] [blame]	2133	#endif /* SCHED_DEBUG */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2134
/* Static keys defined outside this header. */
extern struct static_key_false sched_numa_balancing;
extern struct static_key_false sched_schedstats;
Peter Zijlstra	cbee9f8	2012-10-25 14:16:43 +0200	[diff] [blame]	2137
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2138	static inline u64 global_rt_period(void)
				2139	{
				2140	return (u64)sysctl_sched_rt_period * NSEC_PER_USEC;
				2141	}
				2142
				2143	static inline u64 global_rt_runtime(void)
				2144	{
				2145	if (sysctl_sched_rt_runtime < 0)
				2146	return RUNTIME_INF;
				2147
				2148	return (u64)sysctl_sched_rt_runtime * NSEC_PER_USEC;
				2149	}
				2150
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2151	static inline int task_current(struct rq rq, struct task_struct p)
				2152	{
				2153	return rq->curr == p;
				2154	}
				2155
/*
 * On SMP this returns @p->on_cpu; on UP it falls back to
 * task_current(@rq, @p).
 */
static inline int task_on_cpu(struct rq *rq, struct task_struct *p)
{
#ifdef CONFIG_SMP
	return p->on_cpu;
#else
	return task_current(rq, p);
#endif
}
				2164
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	2165	static inline int task_on_rq_queued(struct task_struct *p)
				2166	{
				2167	return p->on_rq == TASK_ON_RQ_QUEUED;
				2168	}
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2169
Kirill Tkhai	cca26e8	2014-08-20 13:47:42 +0400	[diff] [blame]	2170	static inline int task_on_rq_migrating(struct task_struct *p)
				2171	{
Andrea Parri	c546951	2019-01-21 16:52:40 +0100	[diff] [blame]	2172	return READ_ONCE(p->on_rq) == TASK_ON_RQ_MIGRATING;
Kirill Tkhai	cca26e8	2014-08-20 13:47:42 +0400	[diff] [blame]	2173	}
				2174
/* Wake flags. The first three directly map to some SD flag value */
#define WF_EXEC		0x02	/* Wakeup after exec; maps to SD_BALANCE_EXEC */
#define WF_FORK		0x04	/* Wakeup after fork; maps to SD_BALANCE_FORK */
#define WF_TTWU		0x08	/* Wakeup;            maps to SD_BALANCE_WAKE */

#define WF_SYNC		0x10	/* Waker goes to sleep after wakeup */
#define WF_MIGRATED	0x20	/* Internal use, task got migrated */
#define WF_CURRENT_CPU	0x40	/* Prefer to move the wakee to the current CPU. */

/* The WF_* <-> SD_BALANCE_* mapping is checked at build time on SMP. */
#ifdef CONFIG_SMP
static_assert(WF_EXEC == SD_BALANCE_EXEC);
static_assert(WF_FORK == SD_BALANCE_FORK);
static_assert(WF_TTWU == SD_BALANCE_WAKE);
#endif
Li Zefan	b13095f	2013-03-05 16:06:38 +0800	[diff] [blame]	2189
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2190	/*
				2191	* To aid in avoiding the subversion of "niceness" due to uneven distribution
				2192	* of tasks with abnormal "nice" values across CPUs the contribution that
				2193	* each task makes to its run queue's load is weighted according to its
				2194	* scheduling class and "nice" value. For SCHED_NORMAL tasks this is just a
				2195	* scaled version of the new time slice allocation that they receive on time
				2196	* slice expiry etc.
				2197	*/
				2198
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2199	#define WEIGHT_IDLEPRIO 3
				2200	#define WMULT_IDLEPRIO 1431655765
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2201
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2202	extern const int sched_prio_to_weight[40];
				2203	extern const u32 sched_prio_to_wmult[40];
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2204
/*
 * {de,en}queue flags:
 *
 * DEQUEUE_SLEEP  - task is no longer runnable
 * ENQUEUE_WAKEUP - task just became runnable
 *
 * SAVE/RESTORE - an otherwise spurious dequeue/enqueue, done to ensure tasks
 *                are in a known state which allows modification. Such pairs
 *                should preserve as much state as possible.
 *
 * MOVE - paired with SAVE/RESTORE, explicitly does not preserve the location
 *        in the runqueue.
 *
 * NOCLOCK - skip the update_rq_clock() (avoids double updates)
 *
 * MIGRATING - p->on_rq == TASK_ON_RQ_MIGRATING (used for DEADLINE)
 *
 * ENQUEUE_HEAD      - place at front of runqueue (tail if not specified)
 * ENQUEUE_REPLENISH - CBS (replenish runtime and postpone deadline)
 * ENQUEUE_MIGRATED  - the task was migrated during wakeup
 *
 */

#define DEQUEUE_SLEEP		0x01
#define DEQUEUE_SAVE		0x02 /* Matches ENQUEUE_RESTORE */
#define DEQUEUE_MOVE		0x04 /* Matches ENQUEUE_MOVE */
#define DEQUEUE_NOCLOCK		0x08 /* Matches ENQUEUE_NOCLOCK */
#define DEQUEUE_MIGRATING	0x100 /* Matches ENQUEUE_MIGRATING */

#define ENQUEUE_WAKEUP		0x01
#define ENQUEUE_RESTORE		0x02
#define ENQUEUE_MOVE		0x04
#define ENQUEUE_NOCLOCK		0x08

#define ENQUEUE_HEAD		0x10
#define ENQUEUE_REPLENISH	0x20
/* ENQUEUE_MIGRATED is a zero (no-op) flag on !SMP builds. */
#ifdef CONFIG_SMP
#define ENQUEUE_MIGRATED	0x40
#else
#define ENQUEUE_MIGRATED	0x00
#endif
#define ENQUEUE_INITIAL		0x80
#define ENQUEUE_MIGRATING	0x100

#define RETRY_TASK		((void *)-1UL)
				2250
/* Argument bundle handed to sched_class::set_cpus_allowed(). */
struct affinity_context {
	const struct cpumask	*new_mask;
	struct cpumask		*user_mask;
	unsigned int		flags;
};
				2256
Peter Zijlstra	5d69eca	2023-11-04 11:59:18 +0100	[diff] [blame]	2257	extern s64 update_curr_common(struct rq *rq);
				2258
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2259	struct sched_class {
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2260
Patrick Bellasi	69842cb	2019-06-21 09:42:02 +0100	[diff] [blame]	2261	#ifdef CONFIG_UCLAMP_TASK
				2262	int uclamp_enabled;
				2263	#endif
				2264
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2265	void (enqueue_task) (struct rq rq, struct task_struct *p, int flags);
				2266	void (dequeue_task) (struct rq rq, struct task_struct *p, int flags);
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2267	void (yield_task) (struct rq rq);
Dietmar Eggemann	0900acf	2020-06-03 10:03:02 +0200	[diff] [blame]	2268	bool (yield_to_task)(struct rq rq, struct task_struct *p);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2269
Ingo Molnar	e23edc8	2023-09-19 10:38:21 +0200	[diff] [blame]	2270	void (wakeup_preempt)(struct rq rq, struct task_struct *p, int flags);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2271
Peter Zijlstra	98c2f70	2019-11-08 14:15:58 +0100	[diff] [blame]	2272	struct task_struct (pick_next_task)(struct rq *rq);
				2273
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2274	void (put_prev_task)(struct rq rq, struct task_struct *p);
Peter Zijlstra	a0e813f	2019-11-08 14:16:00 +0100	[diff] [blame]	2275	void (set_next_task)(struct rq rq, struct task_struct *p, bool first);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2276
				2277	#ifdef CONFIG_SMP
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2278	int (balance)(struct rq rq, struct task_struct prev, struct rq_flags rf);
Valentin Schneider	3aef1551	2020-11-02 18:45:13 +0000	[diff] [blame]	2279	int (select_task_rq)(struct task_struct p, int task_cpu, int flags);
Peter Zijlstra	21f56ffe	2020-11-17 18:19:32 -0500	[diff] [blame]	2280
				2281	struct task_struct * (pick_task)(struct rq rq);
				2282
Srikar Dronamraju	1327237a5	2018-09-21 23:18:57 +0530	[diff] [blame]	2283	void (migrate_task_rq)(struct task_struct p, int new_cpu);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2284
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2285	void (task_woken)(struct rq this_rq, struct task_struct *task);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2286
Waiman Long	713a2e2	2022-09-22 14:00:40 -0400	[diff] [blame]	2287	void (set_cpus_allowed)(struct task_struct p, struct affinity_context *ctx);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2288
				2289	void (rq_online)(struct rq rq);
				2290	void (rq_offline)(struct rq rq);
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	2291
				2292	struct rq (find_lock_rq)(struct task_struct p, struct rq rq);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2293	#endif
				2294
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2295	void (task_tick)(struct rq rq, struct task_struct *p, int queued);
				2296	void (task_fork)(struct task_struct p);
				2297	void (task_dead)(struct task_struct p);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2298
Kirill Tkhai	67dfa1b	2014-10-27 17:40:52 +0300	[diff] [blame]	2299	/*
				2300	* The switched_from() call is allowed to drop rq->lock, therefore we
Ingo Molnar	3b03706	2021-03-18 13:38:50 +0100	[diff] [blame]	2301	* cannot assume the switched_from/switched_to pair is serialized by
Kirill Tkhai	67dfa1b	2014-10-27 17:40:52 +0300	[diff] [blame]	2302	* rq->lock. They are however serialized by p->pi_lock.
				2303	*/
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2304	void (switched_from)(struct rq this_rq, struct task_struct *task);
				2305	void (switched_to) (struct rq this_rq, struct task_struct *task);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2306	void (prio_changed) (struct rq this_rq, struct task_struct *task,
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2307	int oldprio);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2308
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2309	unsigned int (get_rr_interval)(struct rq rq,
				2310	struct task_struct *task);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2311
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2312	void (update_curr)(struct rq rq);
Stanislaw Gruszka	6e99891	2014-11-12 16:58:44 +0100	[diff] [blame]	2313
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2314	#ifdef CONFIG_FAIR_GROUP_SCHED
Chengming Zhou	39c4261	2022-08-18 20:47:58 +0800	[diff] [blame]	2315	void (task_change_group)(struct task_struct p);
Li Zefan	c82ba9f	2013-03-05 16:06:55 +0800	[diff] [blame]	2316	#endif
Hao Jia	530bfad	2023-03-16 16:18:06 +0800	[diff] [blame]	2317
				2318	#ifdef CONFIG_SCHED_CORE
				2319	int (task_is_throttled)(struct task_struct p, int cpu);
				2320	#endif
Peter Zijlstra	43c31ac	2020-10-21 15:45:33 +0200	[diff] [blame]	2321	};
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2322
Peter Zijlstra	3f1d2a3	2014-02-12 10:49:30 +0100	[diff] [blame]	2323	static inline void put_prev_task(struct rq rq, struct task_struct prev)
				2324	{
Peter Zijlstra	10e7071	2019-08-06 15:13:17 +0200	[diff] [blame]	2325	WARN_ON_ONCE(rq->curr != prev);
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2326	prev->sched_class->put_prev_task(rq, prev);
Peter Zijlstra	3f1d2a3	2014-02-12 10:49:30 +0100	[diff] [blame]	2327	}
				2328
Peter Zijlstra	03b7fad	2019-05-29 20:36:41 +0000	[diff] [blame]	2329	static inline void set_next_task(struct rq rq, struct task_struct next)
Peter Zijlstra	b2bf6c3	2016-09-20 22:00:38 +0200	[diff] [blame]	2330	{
Peter Zijlstra	a0e813f	2019-11-08 14:16:00 +0100	[diff] [blame]	2331	next->sched_class->set_next_task(rq, next, false);
Peter Zijlstra	b2bf6c3	2016-09-20 22:00:38 +0200	[diff] [blame]	2332	}
				2333
Peter Zijlstra	43c31ac	2020-10-21 15:45:33 +0200	[diff] [blame]	2334
				2335	/*
				2336	* Helper to define a sched_class instance; each one is placed in a separate
				2337	* section which is ordered by the linker script:
				2338	*
				2339	* include/asm-generic/vmlinux.lds.h
				2340	*
Peter Zijlstra	546a3fe	2022-05-17 13:46:54 +0200	[diff] [blame]	2341	* CAREFUL they are laid out in REVERSE order!!!
				2342	*
Peter Zijlstra	43c31ac	2020-10-21 15:45:33 +0200	[diff] [blame]	2343	* Also enforce alignment on the instance, not the type, to guarantee layout.
				2344	*/
				2345	#define DEFINE_SCHED_CLASS(name) \
				2346	const struct sched_class name##_sched_class \
				2347	__aligned(__alignof__(struct sched_class)) \
				2348	__section("__" #name "_sched_class")
				2349
Steven Rostedt (VMware)	c3a340f	2019-12-19 16:44:53 -0500	[diff] [blame]	2350	/* Defined in include/asm-generic/vmlinux.lds.h */
Peter Zijlstra	546a3fe	2022-05-17 13:46:54 +0200	[diff] [blame]	2351	extern struct sched_class __sched_class_highest[];
				2352	extern struct sched_class __sched_class_lowest[];
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2353
				2354	#define for_class_range(class, _from, _to) \
Peter Zijlstra	546a3fe	2022-05-17 13:46:54 +0200	[diff] [blame]	2355	for (class = (_from); class < (_to); class++)
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2356
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2357	#define for_each_class(class) \
Peter Zijlstra	546a3fe	2022-05-17 13:46:54 +0200	[diff] [blame]	2358	for_class_range(class, __sched_class_highest, __sched_class_lowest)
				2359
				2360	#define sched_class_above(_a, _b) ((_a) < (_b))
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2361
				2362	extern const struct sched_class stop_sched_class;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2363	extern const struct sched_class dl_sched_class;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2364	extern const struct sched_class rt_sched_class;
				2365	extern const struct sched_class fair_sched_class;
				2366	extern const struct sched_class idle_sched_class;
				2367
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2368	static inline bool sched_stop_runnable(struct rq *rq)
				2369	{
				2370	return rq->stop && task_on_rq_queued(rq->stop);
				2371	}
				2372
				2373	static inline bool sched_dl_runnable(struct rq *rq)
				2374	{
				2375	return rq->dl.dl_nr_running > 0;
				2376	}
				2377
				2378	static inline bool sched_rt_runnable(struct rq *rq)
				2379	{
				2380	return rq->rt.rt_queued > 0;
				2381	}
				2382
				2383	static inline bool sched_fair_runnable(struct rq *rq)
				2384	{
				2385	return rq->cfs.nr_running > 0;
				2386	}
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2387
Peter Zijlstra	5d7d605	2019-11-08 14:15:57 +0100	[diff] [blame]	2388	extern struct task_struct pick_next_task_fair(struct rq rq, struct task_struct prev, struct rq_flags rf);
Peter Zijlstra	98c2f70	2019-11-08 14:15:58 +0100	[diff] [blame]	2389	extern struct task_struct pick_next_task_idle(struct rq rq);
Peter Zijlstra	5d7d605	2019-11-08 14:15:57 +0100	[diff] [blame]	2390
Peter Zijlstra	af44990	2020-09-17 10:38:30 +0200	[diff] [blame]	2391	#define SCA_CHECK 0x01
				2392	#define SCA_MIGRATE_DISABLE 0x02
				2393	#define SCA_MIGRATE_ENABLE 0x04
Will Deacon	07ec77a	2021-07-30 12:24:35 +0100	[diff] [blame]	2394	#define SCA_USER 0x08
Peter Zijlstra	af44990	2020-09-17 10:38:30 +0200	[diff] [blame]	2395
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2396	#ifdef CONFIG_SMP
				2397
Nicolas Pitre	63b2ca3	2014-05-26 18:19:37 -0400	[diff] [blame]	2398	extern void update_group_capacity(struct sched_domain *sd, int cpu);
Li Zefan	b719203	2013-03-07 10:00:26 +0800	[diff] [blame]	2399
Daniel Lezcano	7caff66	2014-01-06 12:34:38 +0100	[diff] [blame]	2400	extern void trigger_load_balance(struct rq *rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2401
Waiman Long	713a2e2	2022-09-22 14:00:40 -0400	[diff] [blame]	2402	extern void set_cpus_allowed_common(struct task_struct p, struct affinity_context ctx);
Peter Zijlstra	c5b2803	2015-05-15 17:43:35 +0200	[diff] [blame]	2403
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	2404	static inline struct task_struct get_push_task(struct rq rq)
				2405	{
				2406	struct task_struct *p = rq->curr;
				2407
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2408	lockdep_assert_rq_held(rq);
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	2409
				2410	if (rq->push_busy)
				2411	return NULL;
				2412
				2413	if (p->nr_cpus_allowed == 1)
				2414	return NULL;
				2415
Sebastian Andrzej Siewior	e681dcb	2021-08-26 15:37:38 +0200	[diff] [blame]	2416	if (p->migration_disabled)
				2417	return NULL;
				2418
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame]	2419	rq->push_busy = true;
				2420	return get_task_struct(p);
				2421	}
				2422
				2423	extern int push_cpu_stop(void *arg);
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	2424
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2425	#endif
				2426
Daniel Lezcano	442bf3a	2014-09-04 11:32:09 -0400	[diff] [blame]	2427	#ifdef CONFIG_CPU_IDLE
				2428	static inline void idle_set_state(struct rq *rq,
				2429	struct cpuidle_state *idle_state)
				2430	{
				2431	rq->idle_state = idle_state;
				2432	}
				2433
				2434	static inline struct cpuidle_state idle_get_state(struct rq rq)
				2435	{
Peter Zijlstra	9148a3a	2016-09-20 22:34:51 +0200	[diff] [blame]	2436	SCHED_WARN_ON(!rcu_read_lock_held());
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2437
Daniel Lezcano	442bf3a	2014-09-04 11:32:09 -0400	[diff] [blame]	2438	return rq->idle_state;
				2439	}
				2440	#else
				2441	static inline void idle_set_state(struct rq *rq,
				2442	struct cpuidle_state *idle_state)
				2443	{
				2444	}
				2445
				2446	static inline struct cpuidle_state idle_get_state(struct rq rq)
				2447	{
				2448	return NULL;
				2449	}
				2450	#endif
				2451
Steven Rostedt (VMware)	8663eff	2017-04-14 08:48:09 -0400	[diff] [blame]	2452	extern void schedule_idle(void);
Peter Zijlstra	22dc02f	2023-07-24 21:30:54 +0200	[diff] [blame]	2453	asmlinkage void schedule_user(void);
Steven Rostedt (VMware)	8663eff	2017-04-14 08:48:09 -0400	[diff] [blame]	2454
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2455	extern void sysrq_sched_debug_show(void);
				2456	extern void sched_init_granularity(void);
				2457	extern void update_max_interval(void);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2458
				2459	extern void init_sched_dl_class(void);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2460	extern void init_sched_rt_class(void);
				2461	extern void init_sched_fair_class(void);
				2462
Vincent Guittot	9059393	2017-05-17 11:50:45 +0200	[diff] [blame]	2463	extern void reweight_task(struct task_struct *p, int prio);
				2464
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	2465	extern void resched_curr(struct rq *rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2466	extern void resched_cpu(int cpu);
				2467
				2468	extern struct rt_bandwidth def_rt_bandwidth;
				2469	extern void init_rt_bandwidth(struct rt_bandwidth *rt_b, u64 period, u64 runtime);
Thomas Gleixner	d664e39	2022-04-13 15:31:02 +0200	[diff] [blame]	2470	extern bool sched_rt_bandwidth_account(struct rt_rq *rt_rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2471
Peter Zijlstra	9e07d45	2023-11-04 11:59:19 +0100	[diff] [blame]	2472	extern void init_dl_entity(struct sched_dl_entity *dl_se);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2473
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2474	#define BW_SHIFT 20
				2475	#define BW_UNIT (1 << BW_SHIFT)
				2476	#define RATIO_SHIFT 8
Huaixin Chang	d505b8a	2020-04-25 18:52:48 +0800	[diff] [blame]	2477	#define MAX_BW_BITS (64 - BW_SHIFT)
				2478	#define MAX_BW ((1ULL << MAX_BW_BITS) - 1)
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	2479	unsigned long to_ratio(u64 period, u64 runtime);
				2480
Yuyang Du	540247f	2015-07-15 08:04:39 +0800	[diff] [blame]	2481	extern void init_entity_runnable_average(struct sched_entity *se);
Dietmar Eggemann	d0fe0b9	2019-01-22 16:25:01 +0000	[diff] [blame]	2482	extern void post_init_entity_util_avg(struct task_struct *p);
Alex Shi	a75cdaa	2013-06-20 10:18:47 +0800	[diff] [blame]	2483
Frederic Weisbecker	76d92ac	2015-07-17 22:25:49 +0200	[diff] [blame]	2484	#ifdef CONFIG_NO_HZ_FULL
				2485	extern bool sched_can_stop_tick(struct rq *rq);
Frederic Weisbecker	d84b313	2018-02-21 05:17:27 +0100	[diff] [blame]	2486	extern int __init sched_tick_offload_init(void);
Frederic Weisbecker	76d92ac	2015-07-17 22:25:49 +0200	[diff] [blame]	2487
				2488	/*
				2489	* Tick may be needed by tasks in the runqueue depending on their policy and
				2490	* requirements. If tick is needed, let's send the target an IPI to kick it out of
				2491	* nohz mode if necessary.
				2492	*/
				2493	static inline void sched_update_tick_dependency(struct rq *rq)
				2494	{
Miaohe Lin	21a6ee1	2020-07-28 19:17:55 +0800	[diff] [blame]	2495	int cpu = cpu_of(rq);
Frederic Weisbecker	76d92ac	2015-07-17 22:25:49 +0200	[diff] [blame]	2496
				2497	if (!tick_nohz_full_cpu(cpu))
				2498	return;
				2499
				2500	if (sched_can_stop_tick(rq))
				2501	tick_nohz_dep_clear_cpu(cpu, TICK_DEP_BIT_SCHED);
				2502	else
				2503	tick_nohz_dep_set_cpu(cpu, TICK_DEP_BIT_SCHED);
				2504	}
				2505	#else
Frederic Weisbecker	d84b313	2018-02-21 05:17:27 +0100	[diff] [blame]	2506	static inline int sched_tick_offload_init(void) { return 0; }
Frederic Weisbecker	76d92ac	2015-07-17 22:25:49 +0200	[diff] [blame]	2507	static inline void sched_update_tick_dependency(struct rq *rq) { }
				2508	#endif
				2509
Kirill Tkhai	7246544	2014-05-09 03:00:14 +0400	[diff] [blame]	2510	static inline void add_nr_running(struct rq *rq, unsigned count)
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2511	{
Kirill Tkhai	7246544	2014-05-09 03:00:14 +0400	[diff] [blame]	2512	unsigned prev_nr = rq->nr_running;
				2513
				2514	rq->nr_running = prev_nr + count;
Phil Auld	9d24605	2020-06-29 15:23:03 -0400	[diff] [blame]	2515	if (trace_sched_update_nr_running_tp_enabled()) {
				2516	call_trace_sched_update_nr_running(rq, count);
				2517	}
Frederic Weisbecker	9f3660c	2013-04-20 14:35:09 +0200	[diff] [blame]	2518
Tim Chen	4486edd	2014-06-23 12:16:49 -0700	[diff] [blame]	2519	#ifdef CONFIG_SMP
Viresh Kumar	3e18450	2018-11-06 11:12:57 +0530	[diff] [blame]	2520	if (prev_nr < 2 && rq->nr_running >= 2) {
Valentin Schneider	e90c8fe	2018-07-04 11:17:46 +0100	[diff] [blame]	2521	if (!READ_ONCE(rq->rd->overload))
				2522	WRITE_ONCE(rq->rd->overload, 1);
Tim Chen	4486edd	2014-06-23 12:16:49 -0700	[diff] [blame]	2523	}
Viresh Kumar	3e18450	2018-11-06 11:12:57 +0530	[diff] [blame]	2524	#endif
Frederic Weisbecker	76d92ac	2015-07-17 22:25:49 +0200	[diff] [blame]	2525
				2526	sched_update_tick_dependency(rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2527	}
				2528
Kirill Tkhai	7246544	2014-05-09 03:00:14 +0400	[diff] [blame]	2529	static inline void sub_nr_running(struct rq *rq, unsigned count)
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2530	{
Kirill Tkhai	7246544	2014-05-09 03:00:14 +0400	[diff] [blame]	2531	rq->nr_running -= count;
Phil Auld	9d24605	2020-06-29 15:23:03 -0400	[diff] [blame]	2532	if (trace_sched_update_nr_running_tp_enabled()) {
Phil Auld	a1bd068	2020-08-05 16:31:38 -0400	[diff] [blame]	2533	call_trace_sched_update_nr_running(rq, -count);
Phil Auld	9d24605	2020-06-29 15:23:03 -0400	[diff] [blame]	2534	}
				2535
Frederic Weisbecker	76d92ac	2015-07-17 22:25:49 +0200	[diff] [blame]	2536	/* Check if we still need preemption */
				2537	sched_update_tick_dependency(rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2538	}
				2539
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2540	extern void activate_task(struct rq rq, struct task_struct p, int flags);
				2541	extern void deactivate_task(struct rq rq, struct task_struct p, int flags);
				2542
Ingo Molnar	e23edc8	2023-09-19 10:38:21 +0200	[diff] [blame]	2543	extern void wakeup_preempt(struct rq rq, struct task_struct p, int flags);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2544
Vincent Guittot	c59862f	2022-08-25 14:27:24 +0200	[diff] [blame]	2545	#ifdef CONFIG_PREEMPT_RT
				2546	#define SCHED_NR_MIGRATE_BREAK 8
				2547	#else
				2548	#define SCHED_NR_MIGRATE_BREAK 32
				2549	#endif
				2550
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2551	extern const_debug unsigned int sysctl_sched_nr_migrate;
				2552	extern const_debug unsigned int sysctl_sched_migration_cost;
				2553
Peter Zijlstra	e4ec331	2023-05-31 13:58:48 +0200	[diff] [blame]	2554	extern unsigned int sysctl_sched_base_slice;
Peter Zijlstra	147f3ef	2023-05-31 13:58:44 +0200	[diff] [blame]	2555
Hailong Liu	1876544	2021-06-06 19:54:51 +0800	[diff] [blame]	2556	#ifdef CONFIG_SCHED_DEBUG
Hailong Liu	1876544	2021-06-06 19:54:51 +0800	[diff] [blame]	2557	extern int sysctl_resched_latency_warn_ms;
				2558	extern int sysctl_resched_latency_warn_once;
				2559
				2560	extern unsigned int sysctl_sched_tunable_scaling;
				2561
				2562	extern unsigned int sysctl_numa_balancing_scan_delay;
				2563	extern unsigned int sysctl_numa_balancing_scan_period_min;
				2564	extern unsigned int sysctl_numa_balancing_scan_period_max;
				2565	extern unsigned int sysctl_numa_balancing_scan_size;
Huang Ying	3302453	2022-07-13 16:39:51 +0800	[diff] [blame]	2566	extern unsigned int sysctl_numa_balancing_hot_threshold;
Hailong Liu	1876544	2021-06-06 19:54:51 +0800	[diff] [blame]	2567	#endif
				2568
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2569	#ifdef CONFIG_SCHED_HRTICK
				2570
				2571	/*
				2572	* Use hrtick when:
				2573	* - enabled by features
				2574	* - hrtimer is actually high res
				2575	*/
				2576	static inline int hrtick_enabled(struct rq *rq)
				2577	{
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2578	if (!cpu_active(cpu_of(rq)))
				2579	return 0;
				2580	return hrtimer_is_hres_active(&rq->hrtick_timer);
				2581	}
				2582
Juri Lelli	e0ee463	2021-02-08 08:35:54 +0100	[diff] [blame]	2583	static inline int hrtick_enabled_fair(struct rq *rq)
				2584	{
				2585	if (!sched_feat(HRTICK))
				2586	return 0;
				2587	return hrtick_enabled(rq);
				2588	}
				2589
				2590	static inline int hrtick_enabled_dl(struct rq *rq)
				2591	{
				2592	if (!sched_feat(HRTICK_DL))
				2593	return 0;
				2594	return hrtick_enabled(rq);
				2595	}
				2596
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2597	void hrtick_start(struct rq *rq, u64 delay);
				2598
Mike Galbraith	b39e66e	2011-11-22 15:20:07 +0100	[diff] [blame]	2599	#else
				2600
Juri Lelli	e0ee463	2021-02-08 08:35:54 +0100	[diff] [blame]	2601	static inline int hrtick_enabled_fair(struct rq *rq)
				2602	{
				2603	return 0;
				2604	}
				2605
				2606	static inline int hrtick_enabled_dl(struct rq *rq)
				2607	{
				2608	return 0;
				2609	}
				2610
Mike Galbraith	b39e66e	2011-11-22 15:20:07 +0100	[diff] [blame]	2611	static inline int hrtick_enabled(struct rq *rq)
				2612	{
				2613	return 0;
				2614	}
				2615
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2616	#endif /* CONFIG_SCHED_HRTICK */
				2617
Giovanni Gherdovich	1567c3e3	2020-01-22 16:16:12 +0100	[diff] [blame]	2618	#ifndef arch_scale_freq_tick
				2619	static __always_inline
				2620	void arch_scale_freq_tick(void)
				2621	{
				2622	}
				2623	#endif
				2624
Peter Zijlstra	dfbca41	2015-03-23 14:19:05 +0100	[diff] [blame]	2625	#ifndef arch_scale_freq_capacity
Valentin Schneider	f4470cd	2020-07-31 20:20:14 +0100	[diff] [blame]	2626	/**
				2627	* arch_scale_freq_capacity - get the frequency scale factor of a given CPU.
				2628	* @cpu: the CPU in question.
				2629	*
				2630	* Return: the frequency scale factor normalized against SCHED_CAPACITY_SCALE, i.e.
				2631	*
				2632	* f_curr
				2633	* ------ * SCHED_CAPACITY_SCALE
				2634	* f_max
				2635	*/
Peter Zijlstra	dfbca41	2015-03-23 14:19:05 +0100	[diff] [blame]	2636	static __always_inline
Juri Lelli	7673c8a	2017-12-04 11:23:23 +0100	[diff] [blame]	2637	unsigned long arch_scale_freq_capacity(int cpu)
Peter Zijlstra	dfbca41	2015-03-23 14:19:05 +0100	[diff] [blame]	2638	{
				2639	return SCHED_CAPACITY_SCALE;
				2640	}
				2641	#endif
Vincent Guittot	b5b4860	2015-02-27 16:54:08 +0100	[diff] [blame]	2642
Hao Jia	2679a83	2022-04-30 16:58:42 +0800	[diff] [blame]	2643	#ifdef CONFIG_SCHED_DEBUG
				2644	/*
				2645	* In double_lock_balance()/double_rq_lock(), we use raw_spin_rq_lock() to
				2646	* acquire rq lock instead of rq_lock(). So at the end of these two functions
				2647	* we need to call double_rq_clock_clear_update() to clear RQCF_UPDATED of
				2648	* rq->clock_update_flags to avoid the WARN_DOUBLE_CLOCK warning.
				2649	*/
				2650	static inline void double_rq_clock_clear_update(struct rq rq1, struct rq rq2)
				2651	{
				2652	rq1->clock_update_flags &= (RQCF_REQ_SKIP|RQCF_ACT_SKIP);
				2653	/* rq1 == rq2 for !CONFIG_SMP, so just clear RQCF_UPDATED once. */
				2654	#ifdef CONFIG_SMP
				2655	rq2->clock_update_flags &= (RQCF_REQ_SKIP|RQCF_ACT_SKIP);
				2656	#endif
				2657	}
				2658	#else
				2659	static inline void double_rq_clock_clear_update(struct rq rq1, struct rq rq2) {}
				2660	#endif
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2661
Peter Zijlstra	5bb76f1	2023-08-01 22:41:24 +0200	[diff] [blame]	2662	#define DEFINE_LOCK_GUARD_2(name, type, _lock, _unlock, ...) \
				2663	__DEFINE_UNLOCK_GUARD(name, type, _unlock, type *lock2; __VA_ARGS__) \
				2664	static inline class_##name##_t class_##name##_constructor(type lock, type lock2) \
				2665	{ class_##name##_t _t = { .lock = lock, .lock2 = lock2 }, *_T = &_t; \
				2666	_lock; return _t; }
				2667
Peter Zijlstra	d66f1b0	2021-03-02 12:16:48 +0100	[diff] [blame]	2668	#ifdef CONFIG_SMP
				2669
				2670	static inline bool rq_order_less(struct rq rq1, struct rq rq2)
				2671	{
Peter Zijlstra	9edeaea	2020-11-17 18:19:34 -0500	[diff] [blame]	2672	#ifdef CONFIG_SCHED_CORE
				2673	/*
				2674	* In order to not have {0,2},{1,3} turn into an AB-BA,
				2675	* order by core-id first and cpu-id second.
				2676	*
				2677	* Notably:
				2678	*
				2679	* double_rq_lock(0,3); will take core-0, core-1 lock
				2680	* double_rq_lock(1,2); will take core-1, core-0 lock
				2681	*
				2682	* when only cpu-id is considered.
				2683	*/
				2684	if (rq1->core->cpu < rq2->core->cpu)
				2685	return true;
				2686	if (rq1->core->cpu > rq2->core->cpu)
				2687	return false;
				2688
				2689	/*
				2690	* __sched_core_flip() relies on SMT having cpu-id lock order.
				2691	*/
				2692	#endif
Peter Zijlstra	d66f1b0	2021-03-02 12:16:48 +0100	[diff] [blame]	2693	return rq1->cpu < rq2->cpu;
				2694	}
				2695
				2696	extern void double_rq_lock(struct rq rq1, struct rq rq2);
				2697
				2698	#ifdef CONFIG_PREEMPTION
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2699
				2700	/*
				2701	* fair double_lock_balance: Safely acquires both rq->locks in a fair
				2702	* way at the expense of forcing extra atomic operations in all
				2703	* invocations. This assures that the double_lock is acquired using the
				2704	* same underlying policy as the spinlock_t on this architecture, which
				2705	* reduces latency compared to the unfair variant below. However, it
				2706	* also adds more overhead and therefore may reduce throughput.
				2707	*/
				2708	static inline int _double_lock_balance(struct rq this_rq, struct rq busiest)
				2709	__releases(this_rq->lock)
				2710	__acquires(busiest->lock)
				2711	__acquires(this_rq->lock)
				2712	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2713	raw_spin_rq_unlock(this_rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2714	double_rq_lock(this_rq, busiest);
				2715
				2716	return 1;
				2717	}
				2718
				2719	#else
				2720	/*
				2721	* Unfair double_lock_balance: Optimizes throughput at the expense of
				2722	* latency by eliminating extra atomic operations when the locks are
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2723	* already in proper order on entry. This favors lower CPU-ids and will
				2724	* grant the double lock to lower CPUs over higher ids under contention,
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2725	* regardless of entry order into the function.
				2726	*/
				2727	static inline int _double_lock_balance(struct rq this_rq, struct rq busiest)
				2728	__releases(this_rq->lock)
				2729	__acquires(busiest->lock)
				2730	__acquires(this_rq->lock)
				2731	{
Hao Jia	2679a83	2022-04-30 16:58:42 +0800	[diff] [blame]	2732	if (__rq_lockp(this_rq) == __rq_lockp(busiest) ||
				2733	likely(raw_spin_rq_trylock(busiest))) {
				2734	double_rq_clock_clear_update(this_rq, busiest);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2735	return 0;
Hao Jia	2679a83	2022-04-30 16:58:42 +0800	[diff] [blame]	2736	}
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2737
Peter Zijlstra	d66f1b0	2021-03-02 12:16:48 +0100	[diff] [blame]	2738	if (rq_order_less(this_rq, busiest)) {
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2739	raw_spin_rq_lock_nested(busiest, SINGLE_DEPTH_NESTING);
Hao Jia	2679a83	2022-04-30 16:58:42 +0800	[diff] [blame]	2740	double_rq_clock_clear_update(this_rq, busiest);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2741	return 0;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2742	}
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2743
				2744	raw_spin_rq_unlock(this_rq);
Peter Zijlstra	d66f1b0	2021-03-02 12:16:48 +0100	[diff] [blame]	2745	double_rq_lock(this_rq, busiest);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2746
				2747	return 1;
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2748	}
				2749
Thomas Gleixner	c1a280b	2019-07-26 23:19:37 +0200	[diff] [blame]	2750	#endif /* CONFIG_PREEMPTION */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2751
				2752	/*
				2753	* double_lock_balance - lock the busiest runqueue, this_rq is locked already.
				2754	*/
				2755	static inline int double_lock_balance(struct rq this_rq, struct rq busiest)
				2756	{
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2757	lockdep_assert_irqs_disabled();
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2758
				2759	return _double_lock_balance(this_rq, busiest);
				2760	}
				2761
				2762	static inline void double_unlock_balance(struct rq this_rq, struct rq busiest)
				2763	__releases(busiest->lock)
				2764	{
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	2765	if (__rq_lockp(this_rq) != __rq_lockp(busiest))
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2766	raw_spin_rq_unlock(busiest);
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	2767	lock_set_subclass(&__rq_lockp(this_rq)->dep_map, 0, _RET_IP_);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2768	}
				2769
Peter Zijlstra	7460231	2013-10-10 20:17:22 +0200	[diff] [blame]	2770	static inline void double_lock(spinlock_t l1, spinlock_t l2)
				2771	{
				2772	if (l1 > l2)
				2773	swap(l1, l2);
				2774
				2775	spin_lock(l1);
				2776	spin_lock_nested(l2, SINGLE_DEPTH_NESTING);
				2777	}
				2778
Mike Galbraith	60e69ee	2014-04-07 10:55:15 +0200	[diff] [blame]	2779	static inline void double_lock_irq(spinlock_t l1, spinlock_t l2)
				2780	{
				2781	if (l1 > l2)
				2782	swap(l1, l2);
				2783
				2784	spin_lock_irq(l1);
				2785	spin_lock_nested(l2, SINGLE_DEPTH_NESTING);
				2786	}
				2787
Peter Zijlstra	7460231	2013-10-10 20:17:22 +0200	[diff] [blame]	2788	static inline void double_raw_lock(raw_spinlock_t l1, raw_spinlock_t l2)
				2789	{
				2790	if (l1 > l2)
				2791	swap(l1, l2);
				2792
				2793	raw_spin_lock(l1);
				2794	raw_spin_lock_nested(l2, SINGLE_DEPTH_NESTING);
				2795	}
				2796
Peter Zijlstra	5bb76f1	2023-08-01 22:41:24 +0200	[diff] [blame]	2797	static inline void double_raw_unlock(raw_spinlock_t l1, raw_spinlock_t l2)
				2798	{
				2799	raw_spin_unlock(l1);
				2800	raw_spin_unlock(l2);
				2801	}
				2802
				2803	DEFINE_LOCK_GUARD_2(double_raw_spinlock, raw_spinlock_t,
				2804	double_raw_lock(_T->lock, _T->lock2),
				2805	double_raw_unlock(_T->lock, _T->lock2))
				2806
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2807	/*
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2808	* double_rq_unlock - safely unlock two runqueues
				2809	*
				2810	* Note this does not restore interrupts like task_rq_unlock,
				2811	* you need to do so manually after calling.
				2812	*/
				2813	static inline void double_rq_unlock(struct rq rq1, struct rq rq2)
				2814	__releases(rq1->lock)
				2815	__releases(rq2->lock)
				2816	{
Peter Zijlstra	9ef7e7e	2021-03-03 16:45:41 +0100	[diff] [blame]	2817	if (__rq_lockp(rq1) != __rq_lockp(rq2))
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2818	raw_spin_rq_unlock(rq2);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2819	else
				2820	__release(rq2->lock);
Peter Zijlstra	d66f1b0	2021-03-02 12:16:48 +0100	[diff] [blame]	2821	raw_spin_rq_unlock(rq1);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2822	}
				2823
Ingo Molnar	f2cb136	2017-02-01 13:10:18 +0100	[diff] [blame]	2824	extern void set_rq_online (struct rq *rq);
				2825	extern void set_rq_offline(struct rq *rq);
				2826	extern bool sched_smp_initialized;
				2827
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2828	#else /* CONFIG_SMP */
				2829
				2830	/*
				2831	* double_rq_lock - safely lock two runqueues
				2832	*
				2833	* Note this does not disable interrupts like task_rq_lock,
				2834	* you need to do so manually before calling.
				2835	*/
				2836	static inline void double_rq_lock(struct rq rq1, struct rq rq2)
				2837	__acquires(rq1->lock)
				2838	__acquires(rq2->lock)
				2839	{
Ingo Molnar	09348d7	2022-08-11 08:54:52 +0200	[diff] [blame]	2840	WARN_ON_ONCE(!irqs_disabled());
				2841	WARN_ON_ONCE(rq1 != rq2);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2842	raw_spin_rq_lock(rq1);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2843	__acquire(rq2->lock); /* Fake it out ;) */
Hao Jia	2679a83	2022-04-30 16:58:42 +0800	[diff] [blame]	2844	double_rq_clock_clear_update(rq1, rq2);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2845	}
				2846
				2847	/*
				2848	* double_rq_unlock - safely unlock two runqueues
				2849	*
				2850	* Note this does not restore interrupts like task_rq_unlock,
				2851	* you need to do so manually after calling.
				2852	*/
				2853	static inline void double_rq_unlock(struct rq rq1, struct rq rq2)
				2854	__releases(rq1->lock)
				2855	__releases(rq2->lock)
				2856	{
Ingo Molnar	09348d7	2022-08-11 08:54:52 +0200	[diff] [blame]	2857	WARN_ON_ONCE(rq1 != rq2);
Peter Zijlstra	5cb9eaa	2020-11-17 18:19:31 -0500	[diff] [blame]	2858	raw_spin_rq_unlock(rq1);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2859	__release(rq2->lock);
				2860	}
				2861
				2862	#endif
				2863
Peter Zijlstra	5bb76f1	2023-08-01 22:41:24 +0200	[diff] [blame]	2864	DEFINE_LOCK_GUARD_2(double_rq_lock, struct rq,
				2865	double_rq_lock(_T->lock, _T->lock2),
				2866	double_rq_unlock(_T->lock, _T->lock2))
				2867
Abel Wu	2227a95	2023-11-15 11:36:45 +0800	[diff] [blame]	2868	extern struct sched_entity __pick_root_entity(struct cfs_rq cfs_rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2869	extern struct sched_entity __pick_first_entity(struct cfs_rq cfs_rq);
				2870	extern struct sched_entity __pick_last_entity(struct cfs_rq cfs_rq);
Srikar Dronamraju	6b55c96	2015-06-25 22:51:41 +0530	[diff] [blame]	2871
				2872	#ifdef CONFIG_SCHED_DEBUG
Peter Zijlstra	9406415	2021-04-15 18:23:17 +0200	[diff] [blame]	2873	extern bool sched_debug_verbose;
Peter Zijlstra	9469eb0	2017-09-07 17:03:53 +0200	[diff] [blame]	2874
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2875	extern void print_cfs_stats(struct seq_file *m, int cpu);
				2876	extern void print_rt_stats(struct seq_file *m, int cpu);
Wanpeng Li	acb3213	2014-10-31 06:39:33 +0800	[diff] [blame]	2877	extern void print_dl_stats(struct seq_file *m, int cpu);
Mathieu Malaterre	f6a34630	2018-05-16 21:53:47 +0200	[diff] [blame]	2878	extern void print_cfs_rq(struct seq_file m, int cpu, struct cfs_rq cfs_rq);
				2879	extern void print_rt_rq(struct seq_file m, int cpu, struct rt_rq rt_rq);
				2880	extern void print_dl_rq(struct seq_file m, int cpu, struct dl_rq dl_rq);
Paul Turner	c006fac	2021-04-16 14:29:36 -0700	[diff] [blame]	2881
				2882	extern void resched_latency_warn(int cpu, u64 latency);
Srikar Dronamraju	397f237	2015-06-25 22:51:43 +0530	[diff] [blame]	2883	#ifdef CONFIG_NUMA_BALANCING
				2884	extern void
				2885	show_numa_stats(struct task_struct p, struct seq_file m);
				2886	extern void
				2887	print_numa_stats(struct seq_file *m, int node, unsigned long tsf,
				2888	unsigned long tpf, unsigned long gsf, unsigned long gpf);
				2889	#endif /* CONFIG_NUMA_BALANCING */
Paul Turner	c006fac	2021-04-16 14:29:36 -0700	[diff] [blame]	2890	#else
				2891	static inline void resched_latency_warn(int cpu, u64 latency) {}
Srikar Dronamraju	397f237	2015-06-25 22:51:43 +0530	[diff] [blame]	2892	#endif /* CONFIG_SCHED_DEBUG */
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2893
				2894	extern void init_cfs_rq(struct cfs_rq *cfs_rq);
Abel Vesa	07c54f7	2015-03-03 13:50:27 +0200	[diff] [blame]	2895	extern void init_rt_rq(struct rt_rq *rt_rq);
				2896	extern void init_dl_rq(struct dl_rq *dl_rq);
Peter Zijlstra	029632f	2011-10-25 10:00:11 +0200	[diff] [blame]	2897
Ben Segall	1ee14e6	2013-10-16 11:16:12 -0700	[diff] [blame]	2898	extern void cfs_bandwidth_usage_inc(void);
				2899	extern void cfs_bandwidth_usage_dec(void);
Suresh Siddha	1c792db	2011-12-01 17:07:32 -0800	[diff] [blame]	2900
Frederic Weisbecker	3451d02	2011-08-10 23:21:01 +0200	[diff] [blame]	2901	#ifdef CONFIG_NO_HZ_COMMON
/* Bit numbers of the NOHZ_*_KICK flags defined below. */
#define NOHZ_BALANCE_KICK_BIT	0
#define NOHZ_STATS_KICK_BIT	1
#define NOHZ_NEWILB_KICK_BIT	2
#define NOHZ_NEXT_KICK_BIT	3

/* Run rebalance_domains() */
#define NOHZ_BALANCE_KICK	BIT(NOHZ_BALANCE_KICK_BIT)
/* Update blocked load */
#define NOHZ_STATS_KICK		BIT(NOHZ_STATS_KICK_BIT)
/* Update blocked load when entering idle */
#define NOHZ_NEWILB_KICK	BIT(NOHZ_NEWILB_KICK_BIT)
/* Update nohz.next_balance */
#define NOHZ_NEXT_KICK		BIT(NOHZ_NEXT_KICK_BIT)
Peter Zijlstra	b7031a0	2017-12-21 10:11:09 +0100	[diff] [blame]	2915
/*
 * Union of the balance, stats and next-balance kick flags.
 * NOHZ_NEWILB_KICK is deliberately not part of this mask.
 */
#define NOHZ_KICK_MASK	(NOHZ_BALANCE_KICK | NOHZ_STATS_KICK | NOHZ_NEXT_KICK)
Suresh Siddha	1c792db	2011-12-01 17:07:32 -0800	[diff] [blame]	2917
				2918	#define nohz_flags(cpu) (&cpu_rq(cpu)->nohz_flags)
Thomas Gleixner	20a5c8c	2016-03-10 12:54:20 +0100	[diff] [blame]	2919
Peter Zijlstra	00357f5	2017-12-21 15:06:50 +0100	[diff] [blame]	2920	extern void nohz_balance_exit_idle(struct rq *rq);
Thomas Gleixner	20a5c8c	2016-03-10 12:54:20 +0100	[diff] [blame]	2921	#else
Peter Zijlstra	00357f5	2017-12-21 15:06:50 +0100	[diff] [blame]	2922	static inline void nohz_balance_exit_idle(struct rq *rq) { }
Suresh Siddha	1c792db	2011-12-01 17:07:32 -0800	[diff] [blame]	2923	#endif
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2924
Vincent Guittot	c6f8865	2021-02-24 14:30:06 +0100	[diff] [blame]	2925	#if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON)
				2926	extern void nohz_run_idle_balance(int cpu);
				2927	#else
				2928	static inline void nohz_run_idle_balance(int cpu) { }
				2929	#endif
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	2930
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2931	#ifdef CONFIG_IRQ_TIME_ACCOUNTING
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2932	struct irqtime {
Frederic Weisbecker	25e2d8c	2017-04-25 16:10:48 +0200	[diff] [blame]	2933	u64 total;
Frederic Weisbecker	a499a5a	2017-01-31 04:09:32 +0100	[diff] [blame]	2934	u64 tick_delta;
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2935	u64 irq_start_time;
				2936	struct u64_stats_sync sync;
				2937	};
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2938
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2939	DECLARE_PER_CPU(struct irqtime, cpu_irqtime);
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2940
Frederic Weisbecker	25e2d8c	2017-04-25 16:10:48 +0200	[diff] [blame]	2941	/*
				2942	* Returns the irqtime minus the softirq time computed by ksoftirqd.
Ingo Molnar	3b03706	2021-03-18 13:38:50 +0100	[diff] [blame]	2943	* Otherwise ksoftirqd's sum_exec_runtime is subtracted its own runtime
Frederic Weisbecker	25e2d8c	2017-04-25 16:10:48 +0200	[diff] [blame]	2944	* and never move forward.
				2945	*/
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2946	static inline u64 irq_time_read(int cpu)
				2947	{
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2948	struct irqtime *irqtime = &per_cpu(cpu_irqtime, cpu);
				2949	unsigned int seq;
				2950	u64 total;
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2951
				2952	do {
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2953	seq = __u64_stats_fetch_begin(&irqtime->sync);
Frederic Weisbecker	25e2d8c	2017-04-25 16:10:48 +0200	[diff] [blame]	2954	total = irqtime->total;
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2955	} while (__u64_stats_fetch_retry(&irqtime->sync, seq));
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2956
Frederic Weisbecker	19d23dbf	2016-09-26 02:29:20 +0200	[diff] [blame]	2957	return total;
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2958	}
Frederic Weisbecker	73fbec6	2012-06-16 15:57:37 +0200	[diff] [blame]	2959	#endif /* CONFIG_IRQ_TIME_ACCOUNTING */
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2960
				2961	#ifdef CONFIG_CPU_FREQ
Joel Fernandes (Google)	b10abd0	2019-03-20 20:34:23 -0400	[diff] [blame]	2962	DECLARE_PER_CPU(struct update_util_data __rcu *, cpufreq_update_util_data);
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2963
				2964	/**
				2965	* cpufreq_update_util - Take a note about CPU utilization changes.
Rafael J. Wysocki	12bde33	2016-08-10 03:11:17 +0200	[diff] [blame]	2966	* @rq: Runqueue to carry out the update for.
Rafael J. Wysocki	58919e8	2016-08-16 22:14:55 +0200	[diff] [blame]	2967	* @flags: Update reason flags.
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2968	*
Rafael J. Wysocki	58919e8	2016-08-16 22:14:55 +0200	[diff] [blame]	2969	* This function is called by the scheduler on the CPU whose utilization is
				2970	* being updated.
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2971	*
				2972	* It can only be called from RCU-sched read-side critical sections.
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2973	*
				2974	* The way cpufreq is currently arranged requires it to evaluate the CPU
				2975	* performance state (frequency/voltage) on a regular basis to prevent it from
				2976	* being stuck in a completely inadequate performance level for too long.
Juri Lelli	e0367b1	2017-12-04 11:23:19 +0100	[diff] [blame]	2977	* That is not guaranteed to happen if the updates are only triggered from CFS
				2978	* and DL, though, because they may not be coming in if only RT tasks are
				2979	* active all the time (or there are RT tasks only).
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2980	*
Juri Lelli	e0367b1	2017-12-04 11:23:19 +0100	[diff] [blame]	2981	* As a workaround for that issue, this function is called periodically by the
				2982	* RT sched class to trigger extra cpufreq updates to prevent it from stalling,
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2983	* but that really is a band-aid. Going forward it should be replaced with
Juri Lelli	e0367b1	2017-12-04 11:23:19 +0100	[diff] [blame]	2984	* solutions targeted more specifically at RT tasks.
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2985	*/
Rafael J. Wysocki	12bde33	2016-08-10 03:11:17 +0200	[diff] [blame]	2986	static inline void cpufreq_update_util(struct rq *rq, unsigned int flags)
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2987	{
Rafael J. Wysocki	58919e8	2016-08-16 22:14:55 +0200	[diff] [blame]	2988	struct update_util_data *data;
				2989
Viresh Kumar	674e754	2017-07-28 12:16:38 +0530	[diff] [blame]	2990	data = rcu_dereference_sched(*per_cpu_ptr(&cpufreq_update_util_data,
				2991	cpu_of(rq)));
Rafael J. Wysocki	58919e8	2016-08-16 22:14:55 +0200	[diff] [blame]	2992	if (data)
Rafael J. Wysocki	12bde33	2016-08-10 03:11:17 +0200	[diff] [blame]	2993	data->func(data, rq_clock(rq), flags);
				2994	}
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2995	#else
/* !CONFIG_CPU_FREQ: utilization updates are a no-op. */
static inline void cpufreq_update_util(struct rq *rq, unsigned int flags)
{
}
Rafael J. Wysocki	adaf9fc	2016-03-10 20:44:47 +0100	[diff] [blame]	2997	#endif /* CONFIG_CPU_FREQ */
Linus Torvalds	be53f58	2016-03-24 09:42:50 -0700	[diff] [blame]	2998
/*
 * arch_scale_freq_invariant() evaluates to false when the architecture does
 * not define arch_scale_freq_capacity.  When it does, the architecture's own
 * arch_scale_freq_invariant is used if present, otherwise it defaults to true.
 */
#if defined(arch_scale_freq_capacity)
# if !defined(arch_scale_freq_invariant)
#  define arch_scale_freq_invariant()	true
# endif
#else
# define arch_scale_freq_invariant()	false
#endif
Juri Lelli	d4edd66	2017-12-04 11:23:18 +0100	[diff] [blame]	3006
Vincent Guittot	10a35e6	2019-01-23 16:26:54 +0100	[diff] [blame]	3007	#ifdef CONFIG_SMP
Viresh Kumar	a5418be	2020-12-08 09:46:56 +0530	[diff] [blame]	3008	unsigned long effective_cpu_util(int cpu, unsigned long util_cfs,
Vincent Guittot	9c0b4bb	2023-11-22 14:39:03 +0100	[diff] [blame]	3009	unsigned long *min,
				3010	unsigned long *max);
				3011
				3012	unsigned long sugov_effective_cpu_perf(int cpu, unsigned long actual,
				3013	unsigned long min,
				3014	unsigned long max);
				3015
Quentin Perret	938e5e4	2018-12-03 09:56:15 +0000	[diff] [blame]	3016
Dietmar Eggemann	b3f53da	2022-07-29 13:13:05 +0200	[diff] [blame]	3017	/*
				3018	* Verify the fitness of task @p to run on @cpu taking into account the
				3019	* CPU original capacity and the runtime/deadline ratio of the task.
				3020	*
				3021	* The function will return true if the original capacity of @cpu is
				3022	* greater than or equal to task's deadline density right shifted by
				3023	* (BW_SHIFT - SCHED_CAPACITY_SHIFT) and false otherwise.
				3024	*/
				3025	static inline bool dl_task_fits_capacity(struct task_struct *p, int cpu)
				3026	{
				3027	unsigned long cap = arch_scale_cpu_capacity(cpu);
				3028
				3029	return cap >= p->dl.dl_density >> (BW_SHIFT - SCHED_CAPACITY_SHIFT);
				3030	}
				3031
Vincent Guittot	8cc9051	2018-06-28 17:45:08 +0200	[diff] [blame]	3032	static inline unsigned long cpu_bw_dl(struct rq *rq)
Juri Lelli	d4edd66	2017-12-04 11:23:18 +0100	[diff] [blame]	3033	{
				3034	return (rq->dl.running_bw * SCHED_CAPACITY_SCALE) >> BW_SHIFT;
				3035	}
				3036
Vincent Guittot	8cc9051	2018-06-28 17:45:08 +0200	[diff] [blame]	3037	static inline unsigned long cpu_util_dl(struct rq *rq)
				3038	{
				3039	return READ_ONCE(rq->avg_dl.util_avg);
				3040	}
				3041
Dietmar Eggemann	82762d2	2021-11-18 17:42:40 +0100	[diff] [blame]	3042
Dietmar Eggemann	3eb6d6e	2023-05-15 13:57:34 +0200	[diff] [blame]	3043	extern unsigned long cpu_util_cfs(int cpu);
Dietmar Eggemann	7d0583c	2023-05-15 13:57:35 +0200	[diff] [blame]	3044	extern unsigned long cpu_util_cfs_boost(int cpu);
Vincent Guittot	371bf42	2018-06-28 17:45:05 +0200	[diff] [blame]	3045
				3046	static inline unsigned long cpu_util_rt(struct rq *rq)
				3047	{
Vincent Guittot	dfa444d	2018-06-28 17:45:11 +0200	[diff] [blame]	3048	return READ_ONCE(rq->avg_rt.util_avg);
Vincent Guittot	371bf42	2018-06-28 17:45:05 +0200	[diff] [blame]	3049	}
Viresh Kumar	7d6a905f	2020-12-08 09:46:55 +0530	[diff] [blame]	3050	#endif
Vincent Guittot	9033ea1	2018-06-28 17:45:10 +0200	[diff] [blame]	3051
Qais Yousef	7a17e1d	2021-12-16 22:53:19 +0000	[diff] [blame]	3052	#ifdef CONFIG_UCLAMP_TASK
				3053	unsigned long uclamp_eff_value(struct task_struct *p, enum uclamp_id clamp_id);
				3054
Qais Yousef	2442260	2022-08-04 15:36:03 +0100	[diff] [blame]	3055	static inline unsigned long uclamp_rq_get(struct rq *rq,
				3056	enum uclamp_id clamp_id)
				3057	{
				3058	return READ_ONCE(rq->uclamp[clamp_id].value);
				3059	}
				3060
				3061	static inline void uclamp_rq_set(struct rq *rq, enum uclamp_id clamp_id,
				3062	unsigned int value)
				3063	{
				3064	WRITE_ONCE(rq->uclamp[clamp_id].value, value);
				3065	}
				3066
				3067	static inline bool uclamp_rq_is_idle(struct rq *rq)
				3068	{
				3069	return rq->uclamp_flags & UCLAMP_FLAG_IDLE;
				3070	}
				3071
Qais Yousef	7a17e1d	2021-12-16 22:53:19 +0000	[diff] [blame]	3072	/* Is the rq being capped/throttled by uclamp_max? */
				3073	static inline bool uclamp_rq_is_capped(struct rq *rq)
				3074	{
				3075	unsigned long rq_util;
				3076	unsigned long max_util;
				3077
				3078	if (!static_branch_likely(&sched_uclamp_used))
				3079	return false;
				3080
				3081	rq_util = cpu_util_cfs(cpu_of(rq)) + cpu_util_rt(rq);
				3082	max_util = READ_ONCE(rq->uclamp[UCLAMP_MAX].value);
				3083
				3084	return max_util != SCHED_CAPACITY_SCALE && rq_util >= max_util;
				3085	}
				3086
				3087	/*
				3088	* When uclamp is compiled in, the aggregation at rq level is 'turned off'
				3089	* by default in the fast path and only gets turned on once userspace performs
				3090	* an operation that requires it.
				3091	*
				3092	* Returns true if userspace opted-in to use uclamp and aggregation at rq level
				3093	* hence is active.
				3094	*/
				3095	static inline bool uclamp_is_used(void)
				3096	{
				3097	return static_branch_likely(&sched_uclamp_used);
				3098	}
				3099	#else /* CONFIG_UCLAMP_TASK */
Qais Yousef	b48e16a	2022-08-04 15:36:02 +0100	[diff] [blame]	3100	static inline unsigned long uclamp_eff_value(struct task_struct *p,
				3101	enum uclamp_id clamp_id)
				3102	{
				3103	if (clamp_id == UCLAMP_MIN)
				3104	return 0;
				3105
				3106	return SCHED_CAPACITY_SCALE;
				3107	}
				3108
/* !CONFIG_UCLAMP_TASK: a runqueue is never capped by uclamp. */
static inline bool uclamp_rq_is_capped(struct rq *rq)
{
	return false;
}

/* !CONFIG_UCLAMP_TASK: uclamp can never be in use. */
static inline bool uclamp_is_used(void) { return false; }
Qais Yousef	2442260	2022-08-04 15:36:03 +0100	[diff] [blame]	3115
				3116	static inline unsigned long uclamp_rq_get(struct rq *rq,
				3117	enum uclamp_id clamp_id)
				3118	{
				3119	if (clamp_id == UCLAMP_MIN)
				3120	return 0;
				3121
				3122	return SCHED_CAPACITY_SCALE;
				3123	}
				3124
				3125	static inline void uclamp_rq_set(struct rq *rq, enum uclamp_id clamp_id,
				3126	unsigned int value)
				3127	{
				3128	}
				3129
				3130	static inline bool uclamp_rq_is_idle(struct rq *rq)
				3131	{
				3132	return false;
				3133	}
Qais Yousef	7a17e1d	2021-12-16 22:53:19 +0000	[diff] [blame]	3134	#endif /* CONFIG_UCLAMP_TASK */
				3135
Vincent Guittot	11d4afd	2018-09-25 11:17:42 +0200	[diff] [blame]	3136	#ifdef CONFIG_HAVE_SCHED_AVG_IRQ
Vincent Guittot	9033ea1	2018-06-28 17:45:10 +0200	[diff] [blame]	3137	static inline unsigned long cpu_util_irq(struct rq *rq)
				3138	{
				3139	return rq->avg_irq.util_avg;
				3140	}
Vincent Guittot	2e62c47	2018-07-19 14:00:06 +0200	[diff] [blame]	3141
				3142	static inline
				3143	unsigned long scale_irq_capacity(unsigned long util, unsigned long irq, unsigned long max)
				3144	{
				3145	util *= (max - irq);
				3146	util /= max;
				3147
				3148	return util;
				3149
				3150	}
Vincent Guittot	9033ea1	2018-06-28 17:45:10 +0200	[diff] [blame]	3151	#else
				3152	static inline unsigned long cpu_util_irq(struct rq *rq)
				3153	{
				3154	return 0;
				3155	}
				3156
Vincent Guittot	2e62c47	2018-07-19 14:00:06 +0200	[diff] [blame]	3157	static inline
				3158	unsigned long scale_irq_capacity(unsigned long util, unsigned long irq, unsigned long max)
				3159	{
				3160	return util;
				3161	}
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	3162	#endif
Quentin Perret	6aa140f	2018-12-03 09:56:18 +0000	[diff] [blame]	3163
#if defined(CONFIG_ENERGY_MODEL) && defined(CONFIG_CPU_FREQ_GOV_SCHEDUTIL)

/* The CPUs of performance domain @pd, wrapped by to_cpumask(). */
#define perf_domain_span(pd)	to_cpumask((pd)->em_pd->cpus)

DECLARE_STATIC_KEY_FALSE(sched_energy_present);

/* True once the sched_energy_present static key has been enabled. */
static inline bool sched_energy_enabled(void)
{
	return static_branch_unlikely(&sched_energy_present);
}

extern struct cpufreq_governor schedutil_gov;

#else /* ! (CONFIG_ENERGY_MODEL && CONFIG_CPU_FREQ_GOV_SCHEDUTIL) */

/* Without both options there are no performance domains to span. */
#define perf_domain_span(pd)	NULL

static inline bool sched_energy_enabled(void)
{
	return false;
}

#endif /* CONFIG_ENERGY_MODEL && CONFIG_CPU_FREQ_GOV_SCHEDUTIL */
Mathieu Desnoyers	227a4aa	2019-09-19 13:37:02 -0400	[diff] [blame]	3183
				3184	#ifdef CONFIG_MEMBARRIER
				3185	/*
				3186	* The scheduler provides memory barriers required by membarrier between:
				3187	* - prior user-space memory accesses and store to rq->membarrier_state,
				3188	* - store to rq->membarrier_state and following user-space memory accesses.
				3189	* In the same way it provides those guarantees around store to rq->curr.
				3190	*/
				3191	static inline void membarrier_switch_mm(struct rq *rq,
				3192	struct mm_struct *prev_mm,
				3193	struct mm_struct *next_mm)
				3194	{
				3195	int membarrier_state;
				3196
				3197	if (prev_mm == next_mm)
				3198	return;
				3199
				3200	membarrier_state = atomic_read(&next_mm->membarrier_state);
				3201	if (READ_ONCE(rq->membarrier_state) == membarrier_state)
				3202	return;
				3203
				3204	WRITE_ONCE(rq->membarrier_state, membarrier_state);
				3205	}
				3206	#else
				3207	static inline void membarrier_switch_mm(struct rq *rq,
				3208	struct mm_struct *prev_mm,
				3209	struct mm_struct *next_mm)
				3210	{
				3211	}
				3212	#endif
Mel Gorman	52262ee	2020-01-28 15:40:06 +0000	[diff] [blame]	3213
				3214	#ifdef CONFIG_SMP
				3215	static inline bool is_per_cpu_kthread(struct task_struct *p)
				3216	{
				3217	if (!(p->flags & PF_KTHREAD))
				3218	return false;
				3219
				3220	if (p->nr_cpus_allowed != 1)
				3221	return false;
				3222
				3223	return true;
				3224	}
				3225	#endif
Thomas Gleixner	b3212fe	2020-03-21 12:25:59 +0100	[diff] [blame]	3226
Peter Zijlstra	1011dcc	2021-03-25 12:21:38 +0100	[diff] [blame]	3227	extern void swake_up_all_locked(struct swait_queue_head *q);
				3228	extern void __prepare_to_swait(struct swait_queue_head q, struct swait_queue wait);
				3229
Peter Oskolkov	ab83f45	2023-03-07 23:31:57 -0800	[diff] [blame]	3230	extern int try_to_wake_up(struct task_struct *tsk, unsigned int state, int wake_flags);
				3231
Peter Zijlstra	1011dcc	2021-03-25 12:21:38 +0100	[diff] [blame]	3232	#ifdef CONFIG_PREEMPT_DYNAMIC
				3233	extern int preempt_dynamic_mode;
				3234	extern int sched_dynamic_mode(const char *str);
				3235	extern void sched_dynamic_update(int mode);
				3236	#endif
				3237
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3238	#ifdef CONFIG_SCHED_MM_CID
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3239
				3240	#define SCHED_MM_CID_PERIOD_NS (100ULL * 1000000) /* 100ms */
				3241	#define MM_CID_SCAN_DELAY 100 /* 100ms */
				3242
				3243	extern raw_spinlock_t cid_lock;
				3244	extern int use_cid_lock;
				3245
				3246	extern void sched_mm_cid_migrate_from(struct task_struct *t);
				3247	extern void sched_mm_cid_migrate_to(struct rq dst_rq, struct task_struct t);
				3248	extern void task_tick_mm_cid(struct rq rq, struct task_struct curr);
				3249	extern void init_sched_mm_cid(struct task_struct *t);
				3250
				3251	static inline void __mm_cid_put(struct mm_struct *mm, int cid)
				3252	{
				3253	if (cid < 0)
				3254	return;
				3255	cpumask_clear_cpu(cid, mm_cidmask(mm));
				3256	}
				3257
				3258	/*
				3259	* The per-mm/cpu cid can have the MM_CID_LAZY_PUT flag set or transition to
				3260	* the MM_CID_UNSET state without holding the rq lock, but the rq lock needs to
				3261	* be held to transition to other states.
				3262	*
				3263	* State transitions synchronized with cmpxchg or try_cmpxchg need to be
				3264	* consistent across cpus, which prevents use of this_cpu_cmpxchg.
				3265	*/
				3266	static inline void mm_cid_put_lazy(struct task_struct *t)
				3267	{
				3268	struct mm_struct *mm = t->mm;
				3269	struct mm_cid __percpu *pcpu_cid = mm->pcpu_cid;
				3270	int cid;
				3271
				3272	lockdep_assert_irqs_disabled();
				3273	cid = __this_cpu_read(pcpu_cid->cid);
				3274	if (!mm_cid_is_lazy_put(cid) \|\|
				3275	!try_cmpxchg(&this_cpu_ptr(pcpu_cid)->cid, &cid, MM_CID_UNSET))
				3276	return;
				3277	__mm_cid_put(mm, mm_cid_clear_lazy_put(cid));
				3278	}
				3279
				3280	static inline int mm_cid_pcpu_unset(struct mm_struct *mm)
				3281	{
				3282	struct mm_cid __percpu *pcpu_cid = mm->pcpu_cid;
				3283	int cid, res;
				3284
				3285	lockdep_assert_irqs_disabled();
				3286	cid = __this_cpu_read(pcpu_cid->cid);
				3287	for (;;) {
				3288	if (mm_cid_is_unset(cid))
				3289	return MM_CID_UNSET;
				3290	/*
				3291	* Attempt transition from valid or lazy-put to unset.
				3292	*/
				3293	res = cmpxchg(&this_cpu_ptr(pcpu_cid)->cid, cid, MM_CID_UNSET);
				3294	if (res == cid)
				3295	break;
				3296	cid = res;
				3297	}
				3298	return cid;
				3299	}
				3300
				3301	static inline void mm_cid_put(struct mm_struct *mm)
				3302	{
				3303	int cid;
				3304
				3305	lockdep_assert_irqs_disabled();
				3306	cid = mm_cid_pcpu_unset(mm);
				3307	if (cid == MM_CID_UNSET)
				3308	return;
				3309	__mm_cid_put(mm, mm_cid_clear_lazy_put(cid));
				3310	}
				3311
				3312	static inline int __mm_cid_try_get(struct mm_struct *mm)
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3313	{
				3314	struct cpumask *cpumask;
				3315	int cid;
				3316
				3317	cpumask = mm_cidmask(mm);
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3318	/*
				3319	* Retry finding first zero bit if the mask is temporarily
				3320	* filled. This only happens during concurrent remote-clear
				3321	* which owns a cid without holding a rq lock.
				3322	*/
				3323	for (;;) {
				3324	cid = cpumask_first_zero(cpumask);
				3325	if (cid < nr_cpu_ids)
				3326	break;
				3327	cpu_relax();
				3328	}
				3329	if (cpumask_test_and_set_cpu(cid, cpumask))
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3330	return -1;
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3331	return cid;
				3332	}
				3333
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3334	/*
				3335	* Save a snapshot of the current runqueue time of this cpu
				3336	* with the per-cpu cid value, allowing to estimate how recently it was used.
				3337	*/
				3338	static inline void mm_cid_snapshot_time(struct rq rq, struct mm_struct mm)
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3339	{
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3340	struct mm_cid *pcpu_cid = per_cpu_ptr(mm->pcpu_cid, cpu_of(rq));
				3341
				3342	lockdep_assert_rq_held(rq);
				3343	WRITE_ONCE(pcpu_cid->time, rq->clock);
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3344	}
				3345
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3346	static inline int __mm_cid_get(struct rq rq, struct mm_struct mm)
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3347	{
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3348	int cid;
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3349
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3350	/*
				3351	* All allocations (even those using the cid_lock) are lock-free. If
				3352	* use_cid_lock is set, hold the cid_lock to perform cid allocation to
				3353	* guarantee forward progress.
				3354	*/
				3355	if (!READ_ONCE(use_cid_lock)) {
				3356	cid = __mm_cid_try_get(mm);
				3357	if (cid >= 0)
				3358	goto end;
				3359	raw_spin_lock(&cid_lock);
				3360	} else {
				3361	raw_spin_lock(&cid_lock);
				3362	cid = __mm_cid_try_get(mm);
				3363	if (cid >= 0)
				3364	goto unlock;
				3365	}
				3366
				3367	/*
				3368	* cid concurrently allocated. Retry while forcing following
				3369	* allocations to use the cid_lock to ensure forward progress.
				3370	*/
				3371	WRITE_ONCE(use_cid_lock, 1);
				3372	/*
				3373	* Set use_cid_lock before allocation. Only care about program order
				3374	* because this is only required for forward progress.
				3375	*/
				3376	barrier();
				3377	/*
				3378	* Retry until it succeeds. It is guaranteed to eventually succeed once
				3379	* all newcoming allocations observe the use_cid_lock flag set.
				3380	*/
				3381	do {
				3382	cid = __mm_cid_try_get(mm);
				3383	cpu_relax();
				3384	} while (cid < 0);
				3385	/*
				3386	* Allocate before clearing use_cid_lock. Only care about
				3387	* program order because this is for forward progress.
				3388	*/
				3389	barrier();
				3390	WRITE_ONCE(use_cid_lock, 0);
				3391	unlock:
				3392	raw_spin_unlock(&cid_lock);
				3393	end:
				3394	mm_cid_snapshot_time(rq, mm);
				3395	return cid;
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3396	}
				3397
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3398	static inline int mm_cid_get(struct rq rq, struct mm_struct mm)
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3399	{
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3400	struct mm_cid __percpu *pcpu_cid = mm->pcpu_cid;
				3401	struct cpumask *cpumask;
				3402	int cid;
				3403
				3404	lockdep_assert_rq_held(rq);
				3405	cpumask = mm_cidmask(mm);
				3406	cid = __this_cpu_read(pcpu_cid->cid);
				3407	if (mm_cid_is_valid(cid)) {
				3408	mm_cid_snapshot_time(rq, mm);
				3409	return cid;
				3410	}
				3411	if (mm_cid_is_lazy_put(cid)) {
				3412	if (try_cmpxchg(&this_cpu_ptr(pcpu_cid)->cid, &cid, MM_CID_UNSET))
				3413	__mm_cid_put(mm, mm_cid_clear_lazy_put(cid));
				3414	}
				3415	cid = __mm_cid_get(rq, mm);
				3416	__this_cpu_write(pcpu_cid->cid, cid);
				3417	return cid;
				3418	}
				3419
				3420	static inline void switch_mm_cid(struct rq *rq,
				3421	struct task_struct *prev,
				3422	struct task_struct *next)
				3423	{
				3424	/*
				3425	* Provide a memory barrier between rq->curr store and load of
				3426	* {prev,next}->mm->pcpu_cid[cpu] on rq->curr->mm transition.
				3427	*
				3428	* Should be adapted if context_switch() is modified.
				3429	*/
				3430	if (!next->mm) { // to kernel
				3431	/*
				3432	* user -> kernel transition does not guarantee a barrier, but
				3433	* we can use the fact that it performs an atomic operation in
				3434	* mmgrab().
				3435	*/
				3436	if (prev->mm) // from user
				3437	smp_mb__after_mmgrab();
				3438	/*
				3439	* kernel -> kernel transition does not change rq->curr->mm
				3440	* state. It stays NULL.
				3441	*/
				3442	} else { // to user
				3443	/*
				3444	* kernel -> user transition does not provide a barrier
				3445	* between rq->curr store and load of {prev,next}->mm->pcpu_cid[cpu].
				3446	* Provide it here.
				3447	*/
				3448	if (!prev->mm) // from kernel
				3449	smp_mb();
				3450	/*
				3451	* user -> user transition guarantees a memory barrier through
				3452	* switch_mm() when current->mm changes. If current->mm is
				3453	* unchanged, no barrier is needed.
				3454	*/
				3455	}
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3456	if (prev->mm_cid_active) {
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3457	mm_cid_snapshot_time(rq, prev->mm);
				3458	mm_cid_put_lazy(prev);
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3459	prev->mm_cid = -1;
				3460	}
				3461	if (next->mm_cid_active)
Mathieu Desnoyers	223baf9	2023-04-20 10:55:48 -0400	[diff] [blame]	3462	next->last_mm_cid = next->mm_cid = mm_cid_get(rq, next->mm);
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3463	}
				3464
				3465	#else
/* !CONFIG_SCHED_MM_CID: every mm_cid hook is a no-op taking the same pointer arguments. */
static inline void switch_mm_cid(struct rq *rq, struct task_struct *prev, struct task_struct *next) { }
static inline void sched_mm_cid_migrate_from(struct task_struct *t) { }
static inline void sched_mm_cid_migrate_to(struct rq *dst_rq, struct task_struct *t) { }
static inline void task_tick_mm_cid(struct rq *rq, struct task_struct *curr) { }
static inline void init_sched_mm_cid(struct task_struct *t) { }
Mathieu Desnoyers	af7f588	2022-11-22 15:39:09 -0500	[diff] [blame]	3471	#endif
				3472
Peter Zijlstra	af4cf40	2023-05-31 13:58:40 +0200	[diff] [blame]	3473	extern u64 avg_vruntime(struct cfs_rq *cfs_rq);
/* The cfs_rq and the entity are both passed by reference. */
extern int entity_eligible(struct cfs_rq *cfs_rq, struct sched_entity *se);
Peter Zijlstra	af4cf40	2023-05-31 13:58:40 +0200	[diff] [blame]	3475
Ingo Molnar	9545847	2022-02-22 14:50:43 +0100	[diff] [blame]	3476	#endif /* _KERNEL_SCHED_SCHED_H */