Blame - kernel/sched/deadline.c - SHIFTPHONES/mainline/linux

blob: eed2e449b3131c7326f97ed8c7928d31fb509457 [file] [log] [blame]

Greg Kroah-Hartman	b244131	2017-11-01 15:07:57 +0100	[diff] [blame]	1	// SPDX-License-Identifier: GPL-2.0
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2	/*
				3	* Deadline Scheduling Class (SCHED_DEADLINE)
				4	*
				5	* Earliest Deadline First (EDF) + Constant Bandwidth Server (CBS).
				6	*
				7	* Tasks that periodically executes their instances for less than their
				8	* runtime won't miss any of their deadlines.
				9	* Tasks that are not periodic or sporadic or that tries to execute more
				10	* than their reserved bandwidth will be slowed down (and may potentially
				11	* miss some of their deadlines), and won't affect any other task.
				12	*
				13	* Copyright (C) 2012 Dario Faggioli <raistlin@linux.it>,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	14	* Juri Lelli <juri.lelli@gmail.com>,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	15	* Michael Trimarchi <michael@amarulasolutions.com>,
				16	* Fabio Checconi <fchecconi@gmail.com>
				17	*/
				18	#include "sched.h"
Vincent Guittot	3727e0e	2018-06-28 17:45:07 +0200	[diff] [blame]	19	#include "pelt.h"
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	20
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	21	struct dl_bandwidth def_dl_bandwidth;
				22
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	23	static inline struct task_struct dl_task_of(struct sched_dl_entity dl_se)
				24	{
				25	return container_of(dl_se, struct task_struct, dl);
				26	}
				27
				28	static inline struct rq rq_of_dl_rq(struct dl_rq dl_rq)
				29	{
				30	return container_of(dl_rq, struct rq, dl);
				31	}
				32
				33	static inline struct dl_rq dl_rq_of_se(struct sched_dl_entity dl_se)
				34	{
				35	struct task_struct *p = dl_task_of(dl_se);
				36	struct rq *rq = task_rq(p);
				37
				38	return &rq->dl;
				39	}
				40
				41	static inline int on_dl_rq(struct sched_dl_entity *dl_se)
				42	{
				43	return !RB_EMPTY_NODE(&dl_se->rb_node);
				44	}
				45
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	46	#ifdef CONFIG_SMP
				47	static inline struct dl_bw *dl_bw_of(int i)
				48	{
				49	RCU_LOCKDEP_WARN(!rcu_read_lock_sched_held(),
				50	"sched RCU must be held");
				51	return &cpu_rq(i)->rd->dl_bw;
				52	}
				53
				54	static inline int dl_bw_cpus(int i)
				55	{
				56	struct root_domain *rd = cpu_rq(i)->rd;
Dietmar Eggemann	c81b893	2020-05-20 15:42:39 +0200	[diff] [blame]	57	int cpus;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	58
				59	RCU_LOCKDEP_WARN(!rcu_read_lock_sched_held(),
				60	"sched RCU must be held");
Dietmar Eggemann	c81b893	2020-05-20 15:42:39 +0200	[diff] [blame]	61
				62	if (cpumask_subset(rd->span, cpu_active_mask))
				63	return cpumask_weight(rd->span);
				64
				65	cpus = 0;
				66
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	67	for_each_cpu_and(i, rd->span, cpu_active_mask)
				68	cpus++;
				69
				70	return cpus;
				71	}
Dietmar Eggemann	fc9dc69	2020-05-20 15:42:40 +0200	[diff] [blame]	72
				73	static inline unsigned long __dl_bw_capacity(int i)
				74	{
				75	struct root_domain *rd = cpu_rq(i)->rd;
				76	unsigned long cap = 0;
				77
				78	RCU_LOCKDEP_WARN(!rcu_read_lock_sched_held(),
				79	"sched RCU must be held");
				80
				81	for_each_cpu_and(i, rd->span, cpu_active_mask)
				82	cap += capacity_orig_of(i);
				83
				84	return cap;
				85	}
				86
				87	/*
				88	* XXX Fix: If 'rq->rd == def_root_domain' perform AC against capacity
				89	* of the CPU the task is running on rather rd's \Sum CPU capacity.
				90	*/
				91	static inline unsigned long dl_bw_capacity(int i)
				92	{
				93	if (!static_branch_unlikely(&sched_asym_cpucapacity) &&
				94	capacity_orig_of(i) == SCHED_CAPACITY_SCALE) {
				95	return dl_bw_cpus(i) << SCHED_CAPACITY_SHIFT;
				96	} else {
				97	return __dl_bw_capacity(i);
				98	}
				99	}
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	100	#else
				101	static inline struct dl_bw *dl_bw_of(int i)
				102	{
				103	return &cpu_rq(i)->dl.dl_bw;
				104	}
				105
				106	static inline int dl_bw_cpus(int i)
				107	{
				108	return 1;
				109	}
Dietmar Eggemann	fc9dc69	2020-05-20 15:42:40 +0200	[diff] [blame]	110
				111	static inline unsigned long dl_bw_capacity(int i)
				112	{
				113	return SCHED_CAPACITY_SCALE;
				114	}
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	115	#endif
				116
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	117	static inline
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	118	void __add_running_bw(u64 dl_bw, struct dl_rq *dl_rq)
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	119	{
				120	u64 old = dl_rq->running_bw;
				121
				122	lockdep_assert_held(&(rq_of_dl_rq(dl_rq))->lock);
				123	dl_rq->running_bw += dl_bw;
				124	SCHED_WARN_ON(dl_rq->running_bw < old); /* overflow */
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	125	SCHED_WARN_ON(dl_rq->running_bw > dl_rq->this_bw);
Juri Lelli	e0367b1	2017-12-04 11:23:19 +0100	[diff] [blame]	126	/* kick cpufreq (see the comment in kernel/sched/sched.h). */
Peter Zijlstra	4042d003	2017-12-20 15:37:26 +0100	[diff] [blame]	127	cpufreq_update_util(rq_of_dl_rq(dl_rq), 0);
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	128	}
				129
				130	static inline
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	131	void __sub_running_bw(u64 dl_bw, struct dl_rq *dl_rq)
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	132	{
				133	u64 old = dl_rq->running_bw;
				134
				135	lockdep_assert_held(&(rq_of_dl_rq(dl_rq))->lock);
				136	dl_rq->running_bw -= dl_bw;
				137	SCHED_WARN_ON(dl_rq->running_bw > old); /* underflow */
				138	if (dl_rq->running_bw > old)
				139	dl_rq->running_bw = 0;
Juri Lelli	e0367b1	2017-12-04 11:23:19 +0100	[diff] [blame]	140	/* kick cpufreq (see the comment in kernel/sched/sched.h). */
Peter Zijlstra	4042d003	2017-12-20 15:37:26 +0100	[diff] [blame]	141	cpufreq_update_util(rq_of_dl_rq(dl_rq), 0);
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	142	}
				143
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	144	static inline
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	145	void __add_rq_bw(u64 dl_bw, struct dl_rq *dl_rq)
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	146	{
				147	u64 old = dl_rq->this_bw;
				148
				149	lockdep_assert_held(&(rq_of_dl_rq(dl_rq))->lock);
				150	dl_rq->this_bw += dl_bw;
				151	SCHED_WARN_ON(dl_rq->this_bw < old); /* overflow */
				152	}
				153
				154	static inline
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	155	void __sub_rq_bw(u64 dl_bw, struct dl_rq *dl_rq)
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	156	{
				157	u64 old = dl_rq->this_bw;
				158
				159	lockdep_assert_held(&(rq_of_dl_rq(dl_rq))->lock);
				160	dl_rq->this_bw -= dl_bw;
				161	SCHED_WARN_ON(dl_rq->this_bw > old); /* underflow */
				162	if (dl_rq->this_bw > old)
				163	dl_rq->this_bw = 0;
				164	SCHED_WARN_ON(dl_rq->running_bw > dl_rq->this_bw);
				165	}
				166
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	167	static inline
				168	void add_rq_bw(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				169	{
				170	if (!dl_entity_is_special(dl_se))
				171	__add_rq_bw(dl_se->dl_bw, dl_rq);
				172	}
				173
				174	static inline
				175	void sub_rq_bw(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				176	{
				177	if (!dl_entity_is_special(dl_se))
				178	__sub_rq_bw(dl_se->dl_bw, dl_rq);
				179	}
				180
				181	static inline
				182	void add_running_bw(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				183	{
				184	if (!dl_entity_is_special(dl_se))
				185	__add_running_bw(dl_se->dl_bw, dl_rq);
				186	}
				187
				188	static inline
				189	void sub_running_bw(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				190	{
				191	if (!dl_entity_is_special(dl_se))
				192	__sub_running_bw(dl_se->dl_bw, dl_rq);
				193	}
				194
Yu Chen	ba4f7bc	2020-02-28 18:03:29 +0800	[diff] [blame]	195	static void dl_change_utilization(struct task_struct *p, u64 new_bw)
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	196	{
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	197	struct rq *rq;
				198
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	199	BUG_ON(p->dl.flags & SCHED_FLAG_SUGOV);
				200
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	201	if (task_on_rq_queued(p))
				202	return;
				203
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	204	rq = task_rq(p);
				205	if (p->dl.dl_non_contending) {
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	206	sub_running_bw(&p->dl, &rq->dl);
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	207	p->dl.dl_non_contending = 0;
				208	/*
				209	* If the timer handler is currently running and the
				210	* timer cannot be cancelled, inactive_task_timer()
				211	* will see that dl_not_contending is not set, and
				212	* will not touch the rq's active utilization,
				213	* so we are still safe.
				214	*/
				215	if (hrtimer_try_to_cancel(&p->dl.inactive_timer) == 1)
				216	put_task_struct(p);
				217	}
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	218	__sub_rq_bw(p->dl.dl_bw, &rq->dl);
				219	__add_rq_bw(new_bw, &rq->dl);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	220	}
				221
				222	/*
				223	* The utilization of a task cannot be immediately removed from
				224	* the rq active utilization (running_bw) when the task blocks.
				225	* Instead, we have to wait for the so called "0-lag time".
				226	*
				227	* If a task blocks before the "0-lag time", a timer (the inactive
				228	* timer) is armed, and running_bw is decreased when the timer
				229	* fires.
				230	*
				231	* If the task wakes up again before the inactive timer fires,
				232	* the timer is cancelled, whereas if the task wakes up after the
				233	* inactive timer fired (and running_bw has been decreased) the
				234	* task's utilization has to be added to running_bw again.
				235	* A flag in the deadline scheduling entity (dl_non_contending)
				236	* is used to avoid race conditions between the inactive timer handler
				237	* and task wakeups.
				238	*
				239	* The following diagram shows how running_bw is updated. A task is
				240	* "ACTIVE" when its utilization contributes to running_bw; an
				241	* "ACTIVE contending" task is in the TASK_RUNNING state, while an
				242	* "ACTIVE non contending" task is a blocked task for which the "0-lag time"
				243	* has not passed yet. An "INACTIVE" task is a task for which the "0-lag"
				244	* time already passed, which does not contribute to running_bw anymore.
				245	* +------------------+
				246	* wakeup \| ACTIVE \|
				247	* +------------------>+ contending \|
				248	* \| add_running_bw \| \|
				249	* \| +----+------+------+
				250	* \| \| ^
				251	* \| dequeue \| \|
				252	* +--------+-------+ \| \|
				253	* \| \| t >= 0-lag \| \| wakeup
				254	* \| INACTIVE \|<---------------+ \|
				255	* \| \| sub_running_bw \| \|
				256	* +--------+-------+ \| \|
				257	* ^ \| \|
				258	* \| t < 0-lag \| \|
				259	* \| \| \|
				260	* \| V \|
				261	* \| +----+------+------+
				262	* \| sub_running_bw \| ACTIVE \|
				263	* +-------------------+ \|
				264	* inactive timer \| non contending \|
				265	* fired +------------------+
				266	*
				267	* The task_non_contending() function is invoked when a task
				268	* blocks, and checks if the 0-lag time already passed or
				269	* not (in the first case, it directly updates running_bw;
				270	* in the second case, it arms the inactive timer).
				271	*
				272	* The task_contending() function is invoked when a task wakes
				273	* up, and checks if the task is still in the "ACTIVE non contending"
				274	* state or not (in the second case, it updates running_bw).
				275	*/
				276	static void task_non_contending(struct task_struct *p)
				277	{
				278	struct sched_dl_entity *dl_se = &p->dl;
				279	struct hrtimer *timer = &dl_se->inactive_timer;
				280	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				281	struct rq *rq = rq_of_dl_rq(dl_rq);
				282	s64 zerolag_time;
				283
				284	/*
				285	* If this is a non-deadline task that has been boosted,
				286	* do nothing
				287	*/
				288	if (dl_se->dl_runtime == 0)
				289	return;
				290
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	291	if (dl_entity_is_special(dl_se))
				292	return;
				293
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	294	WARN_ON(dl_se->dl_non_contending);
				295
				296	zerolag_time = dl_se->deadline -
				297	div64_long((dl_se->runtime * dl_se->dl_period),
				298	dl_se->dl_runtime);
				299
				300	/*
				301	* Using relative times instead of the absolute "0-lag time"
				302	* allows to simplify the code
				303	*/
				304	zerolag_time -= rq_clock(rq);
				305
				306	/*
				307	* If the "0-lag time" already passed, decrease the active
				308	* utilization now, instead of starting a timer
				309	*/
luca abeni	1b02cd6	2019-03-25 14:15:30 +0100	[diff] [blame]	310	if ((zerolag_time < 0) \|\| hrtimer_active(&dl_se->inactive_timer)) {
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	311	if (dl_task(p))
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	312	sub_running_bw(dl_se, dl_rq);
Luca Abeni	387e313	2017-05-18 22:13:30 +0200	[diff] [blame]	313	if (!dl_task(p) \|\| p->state == TASK_DEAD) {
				314	struct dl_bw *dl_b = dl_bw_of(task_cpu(p));
				315
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	316	if (p->state == TASK_DEAD)
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	317	sub_rq_bw(&p->dl, &rq->dl);
Luca Abeni	387e313	2017-05-18 22:13:30 +0200	[diff] [blame]	318	raw_spin_lock(&dl_b->lock);
Peter Zijlstra	8c0944ce	2017-09-07 12:09:30 +0200	[diff] [blame]	319	__dl_sub(dl_b, p->dl.dl_bw, dl_bw_cpus(task_cpu(p)));
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	320	__dl_clear_params(p);
Luca Abeni	387e313	2017-05-18 22:13:30 +0200	[diff] [blame]	321	raw_spin_unlock(&dl_b->lock);
				322	}
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	323
				324	return;
				325	}
				326
				327	dl_se->dl_non_contending = 1;
				328	get_task_struct(p);
Juri Lelli	850377a	2019-07-31 12:37:15 +0200	[diff] [blame]	329	hrtimer_start(timer, ns_to_ktime(zerolag_time), HRTIMER_MODE_REL_HARD);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	330	}
				331
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	332	static void task_contending(struct sched_dl_entity *dl_se, int flags)
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	333	{
				334	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				335
				336	/*
				337	* If this is a non-deadline task that has been boosted,
				338	* do nothing
				339	*/
				340	if (dl_se->dl_runtime == 0)
				341	return;
				342
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	343	if (flags & ENQUEUE_MIGRATED)
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	344	add_rq_bw(dl_se, dl_rq);
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	345
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	346	if (dl_se->dl_non_contending) {
				347	dl_se->dl_non_contending = 0;
				348	/*
				349	* If the timer handler is currently running and the
				350	* timer cannot be cancelled, inactive_task_timer()
				351	* will see that dl_not_contending is not set, and
				352	* will not touch the rq's active utilization,
				353	* so we are still safe.
				354	*/
				355	if (hrtimer_try_to_cancel(&dl_se->inactive_timer) == 1)
				356	put_task_struct(dl_task_of(dl_se));
				357	} else {
				358	/*
				359	* Since "dl_non_contending" is not set, the
				360	* task's utilization has already been removed from
				361	* active utilization (either when the task blocked,
				362	* when the "inactive timer" fired).
				363	* So, add it back.
				364	*/
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	365	add_running_bw(dl_se, dl_rq);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	366	}
				367	}
				368
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	369	static inline int is_leftmost(struct task_struct p, struct dl_rq dl_rq)
				370	{
				371	struct sched_dl_entity *dl_se = &p->dl;
				372
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	373	return dl_rq->root.rb_leftmost == &dl_se->rb_node;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	374	}
				375
Yu Chen	ba4f7bc	2020-02-28 18:03:29 +0800	[diff] [blame]	376	static void init_dl_rq_bw_ratio(struct dl_rq *dl_rq);
				377
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	378	void init_dl_bandwidth(struct dl_bandwidth *dl_b, u64 period, u64 runtime)
				379	{
				380	raw_spin_lock_init(&dl_b->dl_runtime_lock);
				381	dl_b->dl_period = period;
				382	dl_b->dl_runtime = runtime;
				383	}
				384
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	385	void init_dl_bw(struct dl_bw *dl_b)
				386	{
				387	raw_spin_lock_init(&dl_b->lock);
				388	raw_spin_lock(&def_dl_bandwidth.dl_runtime_lock);
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	389	if (global_rt_runtime() == RUNTIME_INF)
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	390	dl_b->bw = -1;
				391	else
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	392	dl_b->bw = to_ratio(global_rt_period(), global_rt_runtime());
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	393	raw_spin_unlock(&def_dl_bandwidth.dl_runtime_lock);
				394	dl_b->total_bw = 0;
				395	}
				396
Abel Vesa	07c54f7	2015-03-03 13:50:27 +0200	[diff] [blame]	397	void init_dl_rq(struct dl_rq *dl_rq)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	398	{
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	399	dl_rq->root = RB_ROOT_CACHED;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	400
				401	#ifdef CONFIG_SMP
				402	/* zero means no -deadline tasks */
				403	dl_rq->earliest_dl.curr = dl_rq->earliest_dl.next = 0;
				404
				405	dl_rq->dl_nr_migratory = 0;
				406	dl_rq->overloaded = 0;
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	407	dl_rq->pushable_dl_tasks_root = RB_ROOT_CACHED;
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	408	#else
				409	init_dl_bw(&dl_rq->dl_bw);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	410	#endif
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	411
				412	dl_rq->running_bw = 0;
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	413	dl_rq->this_bw = 0;
Luca Abeni	4da3abc	2017-05-18 22:13:32 +0200	[diff] [blame]	414	init_dl_rq_bw_ratio(dl_rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	415	}
				416
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	417	#ifdef CONFIG_SMP
				418
				419	static inline int dl_overloaded(struct rq *rq)
				420	{
				421	return atomic_read(&rq->rd->dlo_count);
				422	}
				423
				424	static inline void dl_set_overload(struct rq *rq)
				425	{
				426	if (!rq->online)
				427	return;
				428
				429	cpumask_set_cpu(rq->cpu, rq->rd->dlo_mask);
				430	/*
				431	* Must be visible before the overload count is
				432	* set (as in sched_rt.c).
				433	*
				434	* Matched by the barrier in pull_dl_task().
				435	*/
				436	smp_wmb();
				437	atomic_inc(&rq->rd->dlo_count);
				438	}
				439
				440	static inline void dl_clear_overload(struct rq *rq)
				441	{
				442	if (!rq->online)
				443	return;
				444
				445	atomic_dec(&rq->rd->dlo_count);
				446	cpumask_clear_cpu(rq->cpu, rq->rd->dlo_mask);
				447	}
				448
				449	static void update_dl_migration(struct dl_rq *dl_rq)
				450	{
Kirill Tkhai	995b9ea	2014-02-18 02:24:13 +0400	[diff] [blame]	451	if (dl_rq->dl_nr_migratory && dl_rq->dl_nr_running > 1) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	452	if (!dl_rq->overloaded) {
				453	dl_set_overload(rq_of_dl_rq(dl_rq));
				454	dl_rq->overloaded = 1;
				455	}
				456	} else if (dl_rq->overloaded) {
				457	dl_clear_overload(rq_of_dl_rq(dl_rq));
				458	dl_rq->overloaded = 0;
				459	}
				460	}
				461
				462	static void inc_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				463	{
				464	struct task_struct *p = dl_task_of(dl_se);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	465
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	466	if (p->nr_cpus_allowed > 1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	467	dl_rq->dl_nr_migratory++;
				468
				469	update_dl_migration(dl_rq);
				470	}
				471
				472	static void dec_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				473	{
				474	struct task_struct *p = dl_task_of(dl_se);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	475
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	476	if (p->nr_cpus_allowed > 1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	477	dl_rq->dl_nr_migratory--;
				478
				479	update_dl_migration(dl_rq);
				480	}
				481
				482	/*
				483	* The list of pushable -deadline task is not a plist, like in
				484	* sched_rt.c, it is an rb-tree with tasks ordered by deadline.
				485	*/
				486	static void enqueue_pushable_dl_task(struct rq rq, struct task_struct p)
				487	{
				488	struct dl_rq *dl_rq = &rq->dl;
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	489	struct rb_node **link = &dl_rq->pushable_dl_tasks_root.rb_root.rb_node;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	490	struct rb_node *parent = NULL;
				491	struct task_struct *entry;
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	492	bool leftmost = true;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	493
				494	BUG_ON(!RB_EMPTY_NODE(&p->pushable_dl_tasks));
				495
				496	while (*link) {
				497	parent = *link;
				498	entry = rb_entry(parent, struct task_struct,
				499	pushable_dl_tasks);
				500	if (dl_entity_preempt(&p->dl, &entry->dl))
				501	link = &parent->rb_left;
				502	else {
				503	link = &parent->rb_right;
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	504	leftmost = false;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	505	}
				506	}
				507
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	508	if (leftmost)
Wanpeng Li	7d92de3	2015-12-03 17:42:10 +0800	[diff] [blame]	509	dl_rq->earliest_dl.next = p->dl.deadline;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	510
				511	rb_link_node(&p->pushable_dl_tasks, parent, link);
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	512	rb_insert_color_cached(&p->pushable_dl_tasks,
				513	&dl_rq->pushable_dl_tasks_root, leftmost);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	514	}
				515
				516	static void dequeue_pushable_dl_task(struct rq rq, struct task_struct p)
				517	{
				518	struct dl_rq *dl_rq = &rq->dl;
				519
				520	if (RB_EMPTY_NODE(&p->pushable_dl_tasks))
				521	return;
				522
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	523	if (dl_rq->pushable_dl_tasks_root.rb_leftmost == &p->pushable_dl_tasks) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	524	struct rb_node *next_node;
				525
				526	next_node = rb_next(&p->pushable_dl_tasks);
Wanpeng Li	7d92de3	2015-12-03 17:42:10 +0800	[diff] [blame]	527	if (next_node) {
				528	dl_rq->earliest_dl.next = rb_entry(next_node,
				529	struct task_struct, pushable_dl_tasks)->dl.deadline;
				530	}
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	531	}
				532
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	533	rb_erase_cached(&p->pushable_dl_tasks, &dl_rq->pushable_dl_tasks_root);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	534	RB_CLEAR_NODE(&p->pushable_dl_tasks);
				535	}
				536
				537	static inline int has_pushable_dl_tasks(struct rq *rq)
				538	{
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	539	return !RB_EMPTY_ROOT(&rq->dl.pushable_dl_tasks_root.rb_root);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	540	}
				541
				542	static int push_dl_task(struct rq *rq);
				543
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	544	static inline bool need_pull_dl_task(struct rq rq, struct task_struct prev)
				545	{
Peter Zijlstra	120455c	2020-09-25 16:42:31 +0200	[diff] [blame]	546	return rq->online && dl_task(prev);
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	547	}
				548
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	549	static DEFINE_PER_CPU(struct callback_head, dl_push_head);
				550	static DEFINE_PER_CPU(struct callback_head, dl_pull_head);
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	551
				552	static void push_dl_tasks(struct rq *);
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	553	static void pull_dl_task(struct rq *);
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	554
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	555	static inline void deadline_queue_push_tasks(struct rq *rq)
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	556	{
Peter Zijlstra	e3fca9e	2015-06-11 14:46:37 +0200	[diff] [blame]	557	if (!has_pushable_dl_tasks(rq))
				558	return;
				559
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	560	queue_balance_callback(rq, &per_cpu(dl_push_head, rq->cpu), push_dl_tasks);
				561	}
				562
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	563	static inline void deadline_queue_pull_task(struct rq *rq)
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	564	{
				565	queue_balance_callback(rq, &per_cpu(dl_pull_head, rq->cpu), pull_dl_task);
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	566	}
				567
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	568	static struct rq find_lock_later_rq(struct task_struct task, struct rq *rq);
				569
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	570	static struct rq dl_task_offline_migration(struct rq rq, struct task_struct *p)
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	571	{
				572	struct rq *later_rq = NULL;
Juri Lelli	59d06ce	2019-07-19 15:59:56 +0200	[diff] [blame]	573	struct dl_bw *dl_b;
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	574
				575	later_rq = find_lock_later_rq(p, rq);
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	576	if (!later_rq) {
				577	int cpu;
				578
				579	/*
				580	* If we cannot preempt any rq, fall back to pick any
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	581	* online CPU:
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	582	*/
Sebastian Andrzej Siewior	3bd3706	2019-04-23 16:26:36 +0200	[diff] [blame]	583	cpu = cpumask_any_and(cpu_active_mask, p->cpus_ptr);
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	584	if (cpu >= nr_cpu_ids) {
				585	/*
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	586	* Failed to find any suitable CPU.
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	587	* The task will never come back!
				588	*/
				589	BUG_ON(dl_bandwidth_enabled());
				590
				591	/*
				592	* If admission control is disabled we
				593	* try a little harder to let the task
				594	* run.
				595	*/
				596	cpu = cpumask_any(cpu_active_mask);
				597	}
				598	later_rq = cpu_rq(cpu);
				599	double_lock_balance(rq, later_rq);
				600	}
				601
Juri Lelli	59d06ce	2019-07-19 15:59:56 +0200	[diff] [blame]	602	if (p->dl.dl_non_contending \|\| p->dl.dl_throttled) {
				603	/*
				604	* Inactive timer is armed (or callback is running, but
				605	* waiting for us to release rq locks). In any case, when it
				606	* will fire (or continue), it will see running_bw of this
				607	* task migrated to later_rq (and correctly handle it).
				608	*/
				609	sub_running_bw(&p->dl, &rq->dl);
				610	sub_rq_bw(&p->dl, &rq->dl);
				611
				612	add_rq_bw(&p->dl, &later_rq->dl);
				613	add_running_bw(&p->dl, &later_rq->dl);
				614	} else {
				615	sub_rq_bw(&p->dl, &rq->dl);
				616	add_rq_bw(&p->dl, &later_rq->dl);
				617	}
				618
				619	/*
				620	* And we finally need to fixup root_domain(s) bandwidth accounting,
				621	* since p is still hanging out in the old (now moved to default) root
				622	* domain.
				623	*/
				624	dl_b = &rq->rd->dl_bw;
				625	raw_spin_lock(&dl_b->lock);
				626	__dl_sub(dl_b, p->dl.dl_bw, cpumask_weight(rq->rd->span));
				627	raw_spin_unlock(&dl_b->lock);
				628
				629	dl_b = &later_rq->rd->dl_bw;
				630	raw_spin_lock(&dl_b->lock);
				631	__dl_add(dl_b, p->dl.dl_bw, cpumask_weight(later_rq->rd->span));
				632	raw_spin_unlock(&dl_b->lock);
				633
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	634	set_task_cpu(p, later_rq->cpu);
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	635	double_unlock_balance(later_rq, rq);
				636
				637	return later_rq;
Wanpeng Li	fa9c9d1	2015-03-27 07:08:35 +0800	[diff] [blame]	638	}
				639
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	640	#else
				641
				642	static inline
				643	void enqueue_pushable_dl_task(struct rq rq, struct task_struct p)
				644	{
				645	}
				646
				647	static inline
				648	void dequeue_pushable_dl_task(struct rq rq, struct task_struct p)
				649	{
				650	}
				651
				652	static inline
				653	void inc_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				654	{
				655	}
				656
				657	static inline
				658	void dec_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				659	{
				660	}
				661
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	662	static inline bool need_pull_dl_task(struct rq rq, struct task_struct prev)
				663	{
				664	return false;
				665	}
				666
Peter Zijlstra	0ea60c2	2015-06-11 14:46:42 +0200	[diff] [blame]	667	static inline void pull_dl_task(struct rq *rq)
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	668	{
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	669	}
				670
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	671	static inline void deadline_queue_push_tasks(struct rq *rq)
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	672	{
				673	}
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	674
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	675	static inline void deadline_queue_pull_task(struct rq *rq)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	676	{
				677	}
				678	#endif /* CONFIG_SMP */
				679
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	680	static void enqueue_task_dl(struct rq rq, struct task_struct p, int flags);
				681	static void __dequeue_task_dl(struct rq rq, struct task_struct p, int flags);
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	682	static void check_preempt_curr_dl(struct rq rq, struct task_struct p, int flags);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	683
				684	/*
				685	* We are being explicitly informed that a new instance is starting,
				686	* and this means that:
				687	* - the absolute deadline of the entity has to be placed at
				688	* current time + relative deadline;
				689	* - the runtime of the entity has to be set to the maximum value.
				690	*
				691	* The capability of specifying such event is useful whenever a -deadline
				692	* entity wants to (try to!) synchronize its behaviour with the scheduler's
				693	* one, and to (try to!) reconcile itself with its own scheduling
				694	* parameters.
				695	*/
Juri Lelli	98b0a85	2016-08-05 16:07:55 +0100	[diff] [blame]	696	static inline void setup_new_dl_entity(struct sched_dl_entity *dl_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	697	{
				698	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				699	struct rq *rq = rq_of_dl_rq(dl_rq);
				700
Juri Lelli	98b0a85	2016-08-05 16:07:55 +0100	[diff] [blame]	701	WARN_ON(dl_se->dl_boosted);
Luca Abeni	72f9f3f	2016-03-07 12:27:04 +0100	[diff] [blame]	702	WARN_ON(dl_time_before(rq_clock(rq), dl_se->deadline));
				703
				704	/*
				705	* We are racing with the deadline timer. So, do nothing because
				706	* the deadline timer handler will take care of properly recharging
				707	* the runtime and postponing the deadline
				708	*/
				709	if (dl_se->dl_throttled)
				710	return;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	711
				712	/*
				713	* We use the regular wall clock time to set deadlines in the
				714	* future; in fact, we must consider execution overheads (time
				715	* spent on hardirq context, etc.).
				716	*/
Juri Lelli	98b0a85	2016-08-05 16:07:55 +0100	[diff] [blame]	717	dl_se->deadline = rq_clock(rq) + dl_se->dl_deadline;
				718	dl_se->runtime = dl_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	719	}
				720
				721	/*
				722	* Pure Earliest Deadline First (EDF) scheduling does not deal with the
				723	* possibility of a entity lasting more than what it declared, and thus
				724	* exhausting its runtime.
				725	*
				726	* Here we are interested in making runtime overrun possible, but we do
				727	* not want a entity which is misbehaving to affect the scheduling of all
				728	* other entities.
				729	* Therefore, a budgeting strategy called Constant Bandwidth Server (CBS)
				730	* is used, in order to confine each entity within its own bandwidth.
				731	*
				732	* This function deals exactly with that, and ensures that when the runtime
				733	* of a entity is replenished, its deadline is also postponed. That ensures
				734	* the overrunning entity can't interfere with other entity in the system and
				735	* can't make them miss their deadlines. Reasons why this kind of overruns
				736	* could happen are, typically, a entity voluntarily trying to overcome its
xiaofeng.yan	1b09d29	2014-07-07 05:59:04 +0000	[diff] [blame]	737	* runtime, or it just underestimated it during sched_setattr().
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	738	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	739	static void replenish_dl_entity(struct sched_dl_entity *dl_se,
				740	struct sched_dl_entity *pi_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	741	{
				742	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				743	struct rq *rq = rq_of_dl_rq(dl_rq);
				744
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	745	BUG_ON(pi_se->dl_runtime <= 0);
				746
				747	/*
				748	* This could be the case for a !-dl task that is boosted.
				749	* Just go with full inherited parameters.
				750	*/
				751	if (dl_se->dl_deadline == 0) {
				752	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				753	dl_se->runtime = pi_se->dl_runtime;
				754	}
				755
Peter Zijlstra	48be3a6	2016-02-23 13:28:22 +0100	[diff] [blame]	756	if (dl_se->dl_yielded && dl_se->runtime > 0)
				757	dl_se->runtime = 0;
				758
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	759	/*
				760	* We keep moving the deadline away until we get some
				761	* available runtime for the entity. This ensures correct
				762	* handling of situations where the runtime overrun is
				763	* arbitrary large.
				764	*/
				765	while (dl_se->runtime <= 0) {
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	766	dl_se->deadline += pi_se->dl_period;
				767	dl_se->runtime += pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	768	}
				769
				770	/*
				771	* At this point, the deadline really should be "in
				772	* the future" with respect to rq->clock. If it's
				773	* not, we are, for some reason, lagging too much!
				774	* Anyway, after having warn userspace abut that,
				775	* we still try to keep the things running by
				776	* resetting the deadline and the budget of the
				777	* entity.
				778	*/
				779	if (dl_time_before(dl_se->deadline, rq_clock(rq))) {
Steven Rostedt	c219b7d	2016-02-10 12:04:22 -0500	[diff] [blame]	780	printk_deferred_once("sched: DL replenish lagged too much\n");
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	781	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				782	dl_se->runtime = pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	783	}
Peter Zijlstra	1019a35	2014-11-26 08:44:03 +0800	[diff] [blame]	784
				785	if (dl_se->dl_yielded)
				786	dl_se->dl_yielded = 0;
				787	if (dl_se->dl_throttled)
				788	dl_se->dl_throttled = 0;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	789	}
				790
				791	/*
				792	* Here we check if --at time t-- an entity (which is probably being
				793	* [re]activated or, in general, enqueued) can use its remaining runtime
				794	* and its current deadline _without_ exceeding the bandwidth it is
				795	* assigned (function returns true if it can't). We are in fact applying
				796	* one of the CBS rules: when a task wakes up, if the residual runtime
				797	* over residual deadline fits within the allocated bandwidth, then we
				798	* can keep the current (absolute) deadline and residual budget without
				799	* disrupting the schedulability of the system. Otherwise, we should
				800	* refill the runtime and set the deadline a period in the future,
				801	* because keeping the current (absolute) deadline of the task would
Dario Faggioli	712e5e3	2014-01-27 12:20:15 +0100	[diff] [blame]	802	* result in breaking guarantees promised to other tasks (refer to
Mauro Carvalho Chehab	d6a3b24	2019-06-12 14:53:03 -0300	[diff] [blame]	803	* Documentation/scheduler/sched-deadline.rst for more information).
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	804	*
				805	* This function returns true if:
				806	*
Steven Rostedt (VMware)	2317d5f	2017-03-02 15:10:59 +0100	[diff] [blame]	807	* runtime / (deadline - t) > dl_runtime / dl_deadline ,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	808	*
				809	* IOW we can't recycle current parameters.
Harald Gustafsson	755378a	2013-11-07 14:43:40 +0100	[diff] [blame]	810	*
Steven Rostedt (VMware)	2317d5f	2017-03-02 15:10:59 +0100	[diff] [blame]	811	* Notice that the bandwidth check is done against the deadline. For
Harald Gustafsson	755378a	2013-11-07 14:43:40 +0100	[diff] [blame]	812	* task with deadline equal to period this is the same of using
Steven Rostedt (VMware)	2317d5f	2017-03-02 15:10:59 +0100	[diff] [blame]	813	* dl_period instead of dl_deadline in the equation above.
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	814	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	815	static bool dl_entity_overflow(struct sched_dl_entity *dl_se,
				816	struct sched_dl_entity *pi_se, u64 t)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	817	{
				818	u64 left, right;
				819
				820	/*
				821	* left and right are the two sides of the equation above,
				822	* after a bit of shuffling to use multiplications instead
				823	* of divisions.
				824	*
				825	* Note that none of the time values involved in the two
				826	* multiplications are absolute: dl_deadline and dl_runtime
				827	* are the relative deadline and the maximum runtime of each
				828	* instance, runtime is the runtime left for the last instance
				829	* and (deadline - t), since t is rq->clock, is the time left
				830	* to the (absolute) deadline. Even if overflowing the u64 type
				831	* is very unlikely to occur in both cases, here we scale down
				832	* as we want to avoid that risk at all. Scaling down by 10
				833	* means that we reduce granularity to 1us. We are fine with it,
				834	* since this is only a true/false check and, anyway, thinking
				835	* of anything below microseconds resolution is actually fiction
				836	* (but still we want to give the user that illusion >;).
				837	*/
Steven Rostedt (VMware)	2317d5f	2017-03-02 15:10:59 +0100	[diff] [blame]	838	left = (pi_se->dl_deadline >> DL_SCALE) * (dl_se->runtime >> DL_SCALE);
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	839	right = ((dl_se->deadline - t) >> DL_SCALE) *
				840	(pi_se->dl_runtime >> DL_SCALE);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	841
				842	return dl_time_before(right, left);
				843	}
				844
				845	/*
Daniel Bristot de Oliveira	3effcb4	2017-05-29 16:24:03 +0200	[diff] [blame]	846	* Revised wakeup rule [1]: For self-suspending tasks, rather then
				847	* re-initializing task's runtime and deadline, the revised wakeup
				848	* rule adjusts the task's runtime to avoid the task to overrun its
				849	* density.
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	850	*
Daniel Bristot de Oliveira	3effcb4	2017-05-29 16:24:03 +0200	[diff] [blame]	851	* Reasoning: a task may overrun the density if:
				852	* runtime / (deadline - t) > dl_runtime / dl_deadline
				853	*
				854	* Therefore, runtime can be adjusted to:
				855	* runtime = (dl_runtime / dl_deadline) * (deadline - t)
				856	*
				857	* In such way that runtime will be equal to the maximum density
				858	* the task can use without breaking any rule.
				859	*
				860	* [1] Luca Abeni, Giuseppe Lipari, and Juri Lelli. 2015. Constant
				861	* bandwidth server revisited. SIGBED Rev. 11, 4 (January 2015), 19-24.
				862	*/
				863	static void
				864	update_dl_revised_wakeup(struct sched_dl_entity dl_se, struct rq rq)
				865	{
				866	u64 laxity = dl_se->deadline - rq_clock(rq);
				867
				868	/*
				869	* If the task has deadline < period, and the deadline is in the past,
				870	* it should already be throttled before this check.
				871	*
				872	* See update_dl_entity() comments for further details.
				873	*/
				874	WARN_ON(dl_time_before(dl_se->deadline, rq_clock(rq)));
				875
				876	dl_se->runtime = (dl_se->dl_density * laxity) >> BW_SHIFT;
				877	}
				878
				879	/*
				880	* Regarding the deadline, a task with implicit deadline has a relative
				881	* deadline == relative period. A task with constrained deadline has a
				882	* relative deadline <= relative period.
				883	*
				884	* We support constrained deadline tasks. However, there are some restrictions
				885	* applied only for tasks which do not have an implicit deadline. See
				886	* update_dl_entity() to know more about such restrictions.
				887	*
				888	* The dl_is_implicit() returns true if the task has an implicit deadline.
				889	*/
				890	static inline bool dl_is_implicit(struct sched_dl_entity *dl_se)
				891	{
				892	return dl_se->dl_deadline == dl_se->dl_period;
				893	}
				894
				895	/*
				896	* When a deadline entity is placed in the runqueue, its runtime and deadline
				897	* might need to be updated. This is done by a CBS wake up rule. There are two
				898	* different rules: 1) the original CBS; and 2) the Revisited CBS.
				899	*
				900	* When the task is starting a new period, the Original CBS is used. In this
				901	* case, the runtime is replenished and a new absolute deadline is set.
				902	*
				903	* When a task is queued before the begin of the next period, using the
				904	* remaining runtime and deadline could make the entity to overflow, see
				905	* dl_entity_overflow() to find more about runtime overflow. When such case
				906	* is detected, the runtime and deadline need to be updated.
				907	*
				908	* If the task has an implicit deadline, i.e., deadline == period, the Original
				909	* CBS is applied. the runtime is replenished and a new absolute deadline is
				910	* set, as in the previous cases.
				911	*
				912	* However, the Original CBS does not work properly for tasks with
				913	* deadline < period, which are said to have a constrained deadline. By
				914	* applying the Original CBS, a constrained deadline task would be able to run
				915	* runtime/deadline in a period. With deadline < period, the task would
				916	* overrun the runtime/period allowed bandwidth, breaking the admission test.
				917	*
				918	* In order to prevent this misbehave, the Revisited CBS is used for
				919	* constrained deadline tasks when a runtime overflow is detected. In the
				920	* Revisited CBS, rather than replenishing & setting a new absolute deadline,
				921	* the remaining runtime of the task is reduced to avoid runtime overflow.
				922	* Please refer to the comments update_dl_revised_wakeup() function to find
				923	* more about the Revised CBS rule.
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	924	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	925	static void update_dl_entity(struct sched_dl_entity *dl_se,
				926	struct sched_dl_entity *pi_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	927	{
				928	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				929	struct rq *rq = rq_of_dl_rq(dl_rq);
				930
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	931	if (dl_time_before(dl_se->deadline, rq_clock(rq)) \|\|
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	932	dl_entity_overflow(dl_se, pi_se, rq_clock(rq))) {
Daniel Bristot de Oliveira	3effcb4	2017-05-29 16:24:03 +0200	[diff] [blame]	933
				934	if (unlikely(!dl_is_implicit(dl_se) &&
				935	!dl_time_before(dl_se->deadline, rq_clock(rq)) &&
				936	!dl_se->dl_boosted)){
				937	update_dl_revised_wakeup(dl_se, rq);
				938	return;
				939	}
				940
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	941	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				942	dl_se->runtime = pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	943	}
				944	}
				945
Daniel Bristot de Oliveira	5ac69d3	2017-03-02 15:10:57 +0100	[diff] [blame]	946	static inline u64 dl_next_period(struct sched_dl_entity *dl_se)
				947	{
				948	return dl_se->deadline - dl_se->dl_deadline + dl_se->dl_period;
				949	}
				950
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	951	/*
				952	* If the entity depleted all its runtime, and if we want it to sleep
				953	* while waiting for some new execution time to become available, we
Daniel Bristot de Oliveira	5ac69d3	2017-03-02 15:10:57 +0100	[diff] [blame]	954	* set the bandwidth replenishment timer to the replenishment instant
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	955	* and try to activate it.
				956	*
				957	* Notice that it is important for the caller to know if the timer
				958	* actually started or not (i.e., the replenishment instant is in
				959	* the future or in the past).
				960	*/
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	961	static int start_dl_timer(struct task_struct *p)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	962	{
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	963	struct sched_dl_entity *dl_se = &p->dl;
				964	struct hrtimer *timer = &dl_se->dl_timer;
				965	struct rq *rq = task_rq(p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	966	ktime_t now, act;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	967	s64 delta;
				968
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	969	lockdep_assert_held(&rq->lock);
				970
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	971	/*
				972	* We want the timer to fire at the deadline, but considering
				973	* that it is actually coming from rq->clock and not from
				974	* hrtimer's time base reading.
				975	*/
Daniel Bristot de Oliveira	5ac69d3	2017-03-02 15:10:57 +0100	[diff] [blame]	976	act = ns_to_ktime(dl_next_period(dl_se));
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	977	now = hrtimer_cb_get_time(timer);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	978	delta = ktime_to_ns(now) - rq_clock(rq);
				979	act = ktime_add_ns(act, delta);
				980
				981	/*
				982	* If the expiry time already passed, e.g., because the value
				983	* chosen as the deadline is too small, don't even try to
				984	* start the timer in the past!
				985	*/
				986	if (ktime_us_delta(act, now) < 0)
				987	return 0;
				988
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	989	/*
				990	* !enqueued will guarantee another callback; even if one is already in
				991	* progress. This ensures a balanced {get,put}_task_struct().
				992	*
				993	* The race against __run_timer() clearing the enqueued state is
				994	* harmless because we're holding task_rq()->lock, therefore the timer
				995	* expiring after we've done the check will wait on its task_rq_lock()
				996	* and observe our state.
				997	*/
				998	if (!hrtimer_is_queued(timer)) {
				999	get_task_struct(p);
Sebastian Andrzej Siewior	d5096aa	2019-07-26 20:30:52 +0200	[diff] [blame]	1000	hrtimer_start(timer, act, HRTIMER_MODE_ABS_HARD);
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1001	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1002
Thomas Gleixner	cc9684d	2015-04-14 21:09:06 +0000	[diff] [blame]	1003	return 1;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1004	}
				1005
				1006	/*
				1007	* This is the bandwidth enforcement timer callback. If here, we know
				1008	* a task is not on its dl_rq, since the fact that the timer was running
				1009	* means the task is throttled and needs a runtime replenishment.
				1010	*
				1011	* However, what we actually do depends on the fact the task is active,
				1012	* (it is on its rq) or has been removed from there by a call to
				1013	* dequeue_task_dl(). In the former case we must issue the runtime
				1014	* replenishment and add the task back to the dl_rq; in the latter, we just
				1015	* do nothing but clearing dl_throttled, so that runtime and deadline
				1016	* updating (and the queueing back to dl_rq) will be done by the
				1017	* next call to enqueue_task_dl().
				1018	*/
				1019	static enum hrtimer_restart dl_task_timer(struct hrtimer *timer)
				1020	{
				1021	struct sched_dl_entity *dl_se = container_of(timer,
				1022	struct sched_dl_entity,
				1023	dl_timer);
				1024	struct task_struct *p = dl_task_of(dl_se);
Peter Zijlstra	eb58075	2015-07-31 21:28:18 +0200	[diff] [blame]	1025	struct rq_flags rf;
Kirill Tkhai	0f397f2	2014-05-20 13:33:42 +0400	[diff] [blame]	1026	struct rq *rq;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1027
Peter Zijlstra	eb58075	2015-07-31 21:28:18 +0200	[diff] [blame]	1028	rq = task_rq_lock(p, &rf);
Kirill Tkhai	0f397f2	2014-05-20 13:33:42 +0400	[diff] [blame]	1029
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1030	/*
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1031	* The task might have changed its scheduling policy to something
Daniel Bristot de Oliveira	9846d50	2016-11-08 11:15:23 +0100	[diff] [blame]	1032	* different than SCHED_DEADLINE (through switched_from_dl()).
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1033	*/
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1034	if (!dl_task(p))
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1035	goto unlock;
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1036
				1037	/*
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1038	* The task might have been boosted by someone else and might be in the
				1039	* boosting/deboosting path, its not throttled.
				1040	*/
				1041	if (dl_se->dl_boosted)
				1042	goto unlock;
				1043
				1044	/*
				1045	* Spurious timer due to start_dl_timer() race; or we already received
				1046	* a replenishment from rt_mutex_setprio().
				1047	*/
				1048	if (!dl_se->dl_throttled)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1049	goto unlock;
				1050
				1051	sched_clock_tick();
				1052	update_rq_clock(rq);
Kirill Tkhai	a79ec89	2015-02-16 15:38:34 +0300	[diff] [blame]	1053
				1054	/*
				1055	* If the throttle happened during sched-out; like:
				1056	*
				1057	* schedule()
				1058	* deactivate_task()
				1059	* dequeue_task_dl()
				1060	* update_curr_dl()
				1061	* start_dl_timer()
				1062	* __dequeue_task_dl()
				1063	* prev->on_rq = 0;
				1064	*
				1065	* We can be both throttled and !queued. Replenish the counter
				1066	* but do not enqueue -- wait for our wakeup to do that.
				1067	*/
				1068	if (!task_on_rq_queued(p)) {
				1069	replenish_dl_entity(dl_se, dl_se);
				1070	goto unlock;
				1071	}
				1072
Wanpeng Li	61c7aca	2016-08-31 18:27:44 +0800	[diff] [blame]	1073	#ifdef CONFIG_SMP
				1074	if (unlikely(!rq->online)) {
				1075	/*
				1076	* If the runqueue is no longer available, migrate the
				1077	* task elsewhere. This necessarily changes rq.
				1078	*/
				1079	lockdep_unpin_lock(&rq->lock, rf.cookie);
				1080	rq = dl_task_offline_migration(rq, p);
				1081	rf.cookie = lockdep_pin_lock(&rq->lock);
Wanpeng Li	dcc3b5f	2017-03-06 21:51:28 -0800	[diff] [blame]	1082	update_rq_clock(rq);
Wanpeng Li	61c7aca	2016-08-31 18:27:44 +0800	[diff] [blame]	1083
				1084	/*
				1085	* Now that the task has been migrated to the new RQ and we
				1086	* have that locked, proceed as normal and enqueue the task
				1087	* there.
				1088	*/
				1089	}
				1090	#endif
				1091
Peter Zijlstra	1019a35	2014-11-26 08:44:03 +0800	[diff] [blame]	1092	enqueue_task_dl(rq, p, ENQUEUE_REPLENISH);
				1093	if (dl_task(rq->curr))
				1094	check_preempt_curr_dl(rq, p, 0);
				1095	else
				1096	resched_curr(rq);
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1097
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1098	#ifdef CONFIG_SMP
Peter Zijlstra	1019a35	2014-11-26 08:44:03 +0800	[diff] [blame]	1099	/*
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1100	* Queueing this task back might have overloaded rq, check if we need
				1101	* to kick someone away.
Peter Zijlstra	1019a35	2014-11-26 08:44:03 +0800	[diff] [blame]	1102	*/
Peter Zijlstra	0aaafaa	2015-10-23 11:50:08 +0200	[diff] [blame]	1103	if (has_pushable_dl_tasks(rq)) {
				1104	/*
				1105	* Nothing relies on rq->lock after this, so its safe to drop
				1106	* rq->lock.
				1107	*/
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1108	rq_unpin_lock(rq, &rf);
Peter Zijlstra	1019a35	2014-11-26 08:44:03 +0800	[diff] [blame]	1109	push_dl_task(rq);
Matt Fleming	d8ac897	2016-09-21 14:38:10 +0100	[diff] [blame]	1110	rq_repin_lock(rq, &rf);
Peter Zijlstra	0aaafaa	2015-10-23 11:50:08 +0200	[diff] [blame]	1111	}
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1112	#endif
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1113
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1114	unlock:
Peter Zijlstra	eb58075	2015-07-31 21:28:18 +0200	[diff] [blame]	1115	task_rq_unlock(rq, p, &rf);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1116
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1117	/*
				1118	* This can free the task_struct, including this hrtimer, do not touch
				1119	* anything related to that after this.
				1120	*/
				1121	put_task_struct(p);
				1122
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1123	return HRTIMER_NORESTART;
				1124	}
				1125
				1126	void init_dl_task_timer(struct sched_dl_entity *dl_se)
				1127	{
				1128	struct hrtimer *timer = &dl_se->dl_timer;
				1129
Sebastian Andrzej Siewior	d5096aa	2019-07-26 20:30:52 +0200	[diff] [blame]	1130	hrtimer_init(timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL_HARD);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1131	timer->function = dl_task_timer;
				1132	}
				1133
Daniel Bristot de Oliveira	df8eac8	2017-03-02 15:10:58 +0100	[diff] [blame]	1134	/*
				1135	* During the activation, CBS checks if it can reuse the current task's
				1136	* runtime and period. If the deadline of the task is in the past, CBS
				1137	* cannot use the runtime, and so it replenishes the task. This rule
				1138	* works fine for implicit deadline tasks (deadline == period), and the
				1139	* CBS was designed for implicit deadline tasks. However, a task with
Christophe JAILLET	c496941	2020-06-02 21:50:02 +0200	[diff] [blame]	1140	* constrained deadline (deadline < period) might be awakened after the
Daniel Bristot de Oliveira	df8eac8	2017-03-02 15:10:58 +0100	[diff] [blame]	1141	* deadline, but before the next period. In this case, replenishing the
				1142	* task would allow it to run for runtime / deadline. As in this case
				1143	* deadline < period, CBS enables a task to run for more than the
				1144	* runtime / period. In a very loaded system, this can cause a domino
				1145	* effect, making other tasks miss their deadlines.
				1146	*
				1147	* To avoid this problem, in the activation of a constrained deadline
				1148	* task after the deadline but before the next period, throttle the
				1149	* task and set the replenishing timer to the begin of the next period,
				1150	* unless it is boosted.
				1151	*/
				1152	static inline void dl_check_constrained_dl(struct sched_dl_entity *dl_se)
				1153	{
				1154	struct task_struct *p = dl_task_of(dl_se);
				1155	struct rq *rq = rq_of_dl_rq(dl_rq_of_se(dl_se));
				1156
				1157	if (dl_time_before(dl_se->deadline, rq_clock(rq)) &&
				1158	dl_time_before(rq_clock(rq), dl_next_period(dl_se))) {
				1159	if (unlikely(dl_se->dl_boosted \|\| !start_dl_timer(p)))
				1160	return;
				1161	dl_se->dl_throttled = 1;
Xunlei Pang	ae83b56	2017-05-10 21:03:37 +0800	[diff] [blame]	1162	if (dl_se->runtime > 0)
				1163	dl_se->runtime = 0;
Daniel Bristot de Oliveira	df8eac8	2017-03-02 15:10:58 +0100	[diff] [blame]	1164	}
				1165	}
				1166
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1167	static
Zhiqiang Zhang	6fab541	2015-06-15 11:15:20 +0800	[diff] [blame]	1168	int dl_runtime_exceeded(struct sched_dl_entity *dl_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1169	{
Luca Abeni	269ad80	2014-12-17 11:50:32 +0100	[diff] [blame]	1170	return (dl_se->runtime <= 0);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1171	}
				1172
Juri Lelli	faa5993	2014-02-21 11:37:15 +0100	[diff] [blame]	1173	extern bool sched_rt_bandwidth_account(struct rt_rq *rt_rq);
				1174
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1175	/*
Luca Abeni	c52f14d	2017-05-18 22:13:31 +0200	[diff] [blame]	1176	* This function implements the GRUB accounting rule:
				1177	* according to the GRUB reclaiming algorithm, the runtime is
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	1178	* not decreased as "dq = -dt", but as
				1179	* "dq = -max{u / Umax, (1 - Uinact - Uextra)} dt",
				1180	* where u is the utilization of the task, Umax is the maximum reclaimable
				1181	* utilization, Uinact is the (per-runqueue) inactive utilization, computed
				1182	* as the difference between the "total runqueue utilization" and the
				1183	* runqueue active utilization, and Uextra is the (per runqueue) extra
				1184	* reclaimable utilization.
Luca Abeni	9f0d1a5	2017-05-18 22:13:35 +0200	[diff] [blame]	1185	* Since rq->dl.running_bw and rq->dl.this_bw contain utilizations
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	1186	* multiplied by 2^BW_SHIFT, the result has to be shifted right by
				1187	* BW_SHIFT.
				1188	* Since rq->dl.bw_ratio contains 1 / Umax multipled by 2^RATIO_SHIFT,
				1189	* dl_bw is multiped by rq->dl.bw_ratio and shifted right by RATIO_SHIFT.
				1190	* Since delta is a 64 bit variable, to have an overflow its value
				1191	* should be larger than 2^(64 - 20 - 8), which is more than 64 seconds.
				1192	* So, overflow is not an issue here.
Luca Abeni	c52f14d	2017-05-18 22:13:31 +0200	[diff] [blame]	1193	*/
Mathieu Malaterre	3febfc8a	2018-05-16 22:09:02 +0200	[diff] [blame]	1194	static u64 grub_reclaim(u64 delta, struct rq rq, struct sched_dl_entity dl_se)
Luca Abeni	c52f14d	2017-05-18 22:13:31 +0200	[diff] [blame]	1195	{
Luca Abeni	9f0d1a5	2017-05-18 22:13:35 +0200	[diff] [blame]	1196	u64 u_inact = rq->dl.this_bw - rq->dl.running_bw; /* Utot - Uact */
				1197	u64 u_act;
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	1198	u64 u_act_min = (dl_se->dl_bw * rq->dl.bw_ratio) >> RATIO_SHIFT;
Luca Abeni	c52f14d	2017-05-18 22:13:31 +0200	[diff] [blame]	1199
Luca Abeni	9f0d1a5	2017-05-18 22:13:35 +0200	[diff] [blame]	1200	/*
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	1201	* Instead of computing max{u * bw_ratio, (1 - u_inact - u_extra)},
				1202	* we compare u_inact + rq->dl.extra_bw with
				1203	* 1 - (u * rq->dl.bw_ratio >> RATIO_SHIFT), because
				1204	* u_inact + rq->dl.extra_bw can be larger than
				1205	* 1 * (so, 1 - u_inact - rq->dl.extra_bw would be negative
				1206	* leading to wrong results)
Luca Abeni	9f0d1a5	2017-05-18 22:13:35 +0200	[diff] [blame]	1207	*/
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	1208	if (u_inact + rq->dl.extra_bw > BW_UNIT - u_act_min)
				1209	u_act = u_act_min;
Luca Abeni	9f0d1a5	2017-05-18 22:13:35 +0200	[diff] [blame]	1210	else
Luca Abeni	daec579	2017-05-18 22:13:36 +0200	[diff] [blame]	1211	u_act = BW_UNIT - u_inact - rq->dl.extra_bw;
Luca Abeni	9f0d1a5	2017-05-18 22:13:35 +0200	[diff] [blame]	1212
				1213	return (delta * u_act) >> BW_SHIFT;
Luca Abeni	c52f14d	2017-05-18 22:13:31 +0200	[diff] [blame]	1214	}
				1215
				1216	/*
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1217	* Update the current task's runtime statistics (provided it is still
				1218	* a -deadline task and has not been removed from the dl_rq).
				1219	*/
				1220	static void update_curr_dl(struct rq *rq)
				1221	{
				1222	struct task_struct *curr = rq->curr;
				1223	struct sched_dl_entity *dl_se = &curr->dl;
Juri Lelli	0788116	2017-12-04 11:23:25 +0100	[diff] [blame]	1224	u64 delta_exec, scaled_delta_exec;
				1225	int cpu = cpu_of(rq);
Wen Yang	6fe0ce1	2018-02-06 09:55:48 +0800	[diff] [blame]	1226	u64 now;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1227
				1228	if (!dl_task(curr) \|\| !on_dl_rq(dl_se))
				1229	return;
				1230
				1231	/*
				1232	* Consumed budget is computed considering the time as
				1233	* observed by schedulable tasks (excluding time spent
				1234	* in hardirq context, etc.). Deadlines are instead
				1235	* computed using hard walltime. This seems to be the more
				1236	* natural solution, but the full ramifications of this
				1237	* approach need further study.
				1238	*/
Wen Yang	6fe0ce1	2018-02-06 09:55:48 +0800	[diff] [blame]	1239	now = rq_clock_task(rq);
				1240	delta_exec = now - curr->se.exec_start;
Peter Zijlstra	48be3a6	2016-02-23 13:28:22 +0100	[diff] [blame]	1241	if (unlikely((s64)delta_exec <= 0)) {
				1242	if (unlikely(dl_se->dl_yielded))
				1243	goto throttle;
Kirill Tkhai	734ff2a	2014-03-04 19:25:46 +0400	[diff] [blame]	1244	return;
Peter Zijlstra	48be3a6	2016-02-23 13:28:22 +0100	[diff] [blame]	1245	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1246
				1247	schedstat_set(curr->se.statistics.exec_max,
				1248	max(curr->se.statistics.exec_max, delta_exec));
				1249
				1250	curr->se.sum_exec_runtime += delta_exec;
				1251	account_group_exec_runtime(curr, delta_exec);
				1252
Wen Yang	6fe0ce1	2018-02-06 09:55:48 +0800	[diff] [blame]	1253	curr->se.exec_start = now;
Tejun Heo	d2cc5ed	2017-09-25 08:12:04 -0700	[diff] [blame]	1254	cgroup_account_cputime(curr, delta_exec);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1255
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1256	if (dl_entity_is_special(dl_se))
				1257	return;
				1258
Juri Lelli	0788116	2017-12-04 11:23:25 +0100	[diff] [blame]	1259	/*
				1260	* For tasks that participate in GRUB, we implement GRUB-PA: the
				1261	* spare reclaimed bandwidth is used to clock down frequency.
				1262	*
				1263	* For the others, we still need to scale reservation parameters
				1264	* according to current frequency and CPU maximum capacity.
				1265	*/
				1266	if (unlikely(dl_se->flags & SCHED_FLAG_RECLAIM)) {
				1267	scaled_delta_exec = grub_reclaim(delta_exec,
				1268	rq,
				1269	&curr->dl);
				1270	} else {
				1271	unsigned long scale_freq = arch_scale_freq_capacity(cpu);
Vincent Guittot	8ec59c0	2019-06-17 17:00:17 +0200	[diff] [blame]	1272	unsigned long scale_cpu = arch_scale_cpu_capacity(cpu);
Juri Lelli	0788116	2017-12-04 11:23:25 +0100	[diff] [blame]	1273
				1274	scaled_delta_exec = cap_scale(delta_exec, scale_freq);
				1275	scaled_delta_exec = cap_scale(scaled_delta_exec, scale_cpu);
				1276	}
				1277
				1278	dl_se->runtime -= scaled_delta_exec;
Peter Zijlstra	48be3a6	2016-02-23 13:28:22 +0100	[diff] [blame]	1279
				1280	throttle:
				1281	if (dl_runtime_exceeded(dl_se) \|\| dl_se->dl_yielded) {
Peter Zijlstra	1019a35	2014-11-26 08:44:03 +0800	[diff] [blame]	1282	dl_se->dl_throttled = 1;
Juri Lelli	34be393	2017-12-12 12:10:24 +0100	[diff] [blame]	1283
				1284	/* If requested, inform the user about runtime overruns. */
				1285	if (dl_runtime_exceeded(dl_se) &&
				1286	(dl_se->flags & SCHED_FLAG_DL_OVERRUN))
				1287	dl_se->dl_overrun = 1;
				1288
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1289	__dequeue_task_dl(rq, curr, 0);
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	1290	if (unlikely(dl_se->dl_boosted \|\| !start_dl_timer(curr)))
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1291	enqueue_task_dl(rq, curr, ENQUEUE_REPLENISH);
				1292
				1293	if (!is_leftmost(curr, &rq->dl))
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	1294	resched_curr(rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1295	}
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	1296
				1297	/*
				1298	* Because -- for now -- we share the rt bandwidth, we need to
				1299	* account our runtime there too, otherwise actual rt tasks
				1300	* would be able to exceed the shared quota.
				1301	*
				1302	* Account to the root rt group for now.
				1303	*
				1304	* The solution we're working towards is having the RT groups scheduled
				1305	* using deadline servers -- however there's a few nasties to figure
				1306	* out before that can happen.
				1307	*/
				1308	if (rt_bandwidth_enabled()) {
				1309	struct rt_rq *rt_rq = &rq->rt;
				1310
				1311	raw_spin_lock(&rt_rq->rt_runtime_lock);
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	1312	/*
				1313	* We'll let actual RT tasks worry about the overflow here, we
Juri Lelli	faa5993	2014-02-21 11:37:15 +0100	[diff] [blame]	1314	* have our own CBS to keep us inline; only account when RT
				1315	* bandwidth is relevant.
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	1316	*/
Juri Lelli	faa5993	2014-02-21 11:37:15 +0100	[diff] [blame]	1317	if (sched_rt_bandwidth_account(rt_rq))
				1318	rt_rq->rt_time += delta_exec;
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	1319	raw_spin_unlock(&rt_rq->rt_runtime_lock);
				1320	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1321	}
				1322
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1323	static enum hrtimer_restart inactive_task_timer(struct hrtimer *timer)
				1324	{
				1325	struct sched_dl_entity *dl_se = container_of(timer,
				1326	struct sched_dl_entity,
				1327	inactive_timer);
				1328	struct task_struct *p = dl_task_of(dl_se);
				1329	struct rq_flags rf;
				1330	struct rq *rq;
				1331
				1332	rq = task_rq_lock(p, &rf);
				1333
Juri Lelli	ecda2b6	2018-05-30 18:08:09 +0200	[diff] [blame]	1334	sched_clock_tick();
				1335	update_rq_clock(rq);
				1336
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1337	if (!dl_task(p) \|\| p->state == TASK_DEAD) {
Luca Abeni	387e313	2017-05-18 22:13:30 +0200	[diff] [blame]	1338	struct dl_bw *dl_b = dl_bw_of(task_cpu(p));
				1339
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1340	if (p->state == TASK_DEAD && dl_se->dl_non_contending) {
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1341	sub_running_bw(&p->dl, dl_rq_of_se(&p->dl));
				1342	sub_rq_bw(&p->dl, dl_rq_of_se(&p->dl));
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1343	dl_se->dl_non_contending = 0;
				1344	}
Luca Abeni	387e313	2017-05-18 22:13:30 +0200	[diff] [blame]	1345
				1346	raw_spin_lock(&dl_b->lock);
Peter Zijlstra	8c0944ce	2017-09-07 12:09:30 +0200	[diff] [blame]	1347	__dl_sub(dl_b, p->dl.dl_bw, dl_bw_cpus(task_cpu(p)));
Luca Abeni	387e313	2017-05-18 22:13:30 +0200	[diff] [blame]	1348	raw_spin_unlock(&dl_b->lock);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1349	__dl_clear_params(p);
				1350
				1351	goto unlock;
				1352	}
				1353	if (dl_se->dl_non_contending == 0)
				1354	goto unlock;
				1355
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1356	sub_running_bw(dl_se, &rq->dl);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1357	dl_se->dl_non_contending = 0;
				1358	unlock:
				1359	task_rq_unlock(rq, p, &rf);
				1360	put_task_struct(p);
				1361
				1362	return HRTIMER_NORESTART;
				1363	}
				1364
				1365	void init_dl_inactive_task_timer(struct sched_dl_entity *dl_se)
				1366	{
				1367	struct hrtimer *timer = &dl_se->inactive_timer;
				1368
Juri Lelli	850377a	2019-07-31 12:37:15 +0200	[diff] [blame]	1369	hrtimer_init(timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL_HARD);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1370	timer->function = inactive_task_timer;
				1371	}
				1372
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1373	#ifdef CONFIG_SMP
				1374
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1375	static void inc_dl_deadline(struct dl_rq *dl_rq, u64 deadline)
				1376	{
				1377	struct rq *rq = rq_of_dl_rq(dl_rq);
				1378
				1379	if (dl_rq->earliest_dl.curr == 0 \|\|
				1380	dl_time_before(deadline, dl_rq->earliest_dl.curr)) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1381	dl_rq->earliest_dl.curr = deadline;
Tommaso Cucinotta	d8206bb	2016-08-14 16:27:08 +0200	[diff] [blame]	1382	cpudl_set(&rq->rd->cpudl, rq->cpu, deadline);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1383	}
				1384	}
				1385
				1386	static void dec_dl_deadline(struct dl_rq *dl_rq, u64 deadline)
				1387	{
				1388	struct rq *rq = rq_of_dl_rq(dl_rq);
				1389
				1390	/*
				1391	* Since we may have removed our earliest (and/or next earliest)
				1392	* task we must recompute them.
				1393	*/
				1394	if (!dl_rq->dl_nr_running) {
				1395	dl_rq->earliest_dl.curr = 0;
				1396	dl_rq->earliest_dl.next = 0;
Tommaso Cucinotta	d8206bb	2016-08-14 16:27:08 +0200	[diff] [blame]	1397	cpudl_clear(&rq->rd->cpudl, rq->cpu);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1398	} else {
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	1399	struct rb_node *leftmost = dl_rq->root.rb_leftmost;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1400	struct sched_dl_entity *entry;
				1401
				1402	entry = rb_entry(leftmost, struct sched_dl_entity, rb_node);
				1403	dl_rq->earliest_dl.curr = entry->deadline;
Tommaso Cucinotta	d8206bb	2016-08-14 16:27:08 +0200	[diff] [blame]	1404	cpudl_set(&rq->rd->cpudl, rq->cpu, entry->deadline);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1405	}
				1406	}
				1407
				1408	#else
				1409
				1410	static inline void inc_dl_deadline(struct dl_rq *dl_rq, u64 deadline) {}
				1411	static inline void dec_dl_deadline(struct dl_rq *dl_rq, u64 deadline) {}
				1412
				1413	#endif /* CONFIG_SMP */
				1414
				1415	static inline
				1416	void inc_dl_tasks(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				1417	{
				1418	int prio = dl_task_of(dl_se)->prio;
				1419	u64 deadline = dl_se->deadline;
				1420
				1421	WARN_ON(!dl_prio(prio));
				1422	dl_rq->dl_nr_running++;
Kirill Tkhai	7246544	2014-05-09 03:00:14 +0400	[diff] [blame]	1423	add_nr_running(rq_of_dl_rq(dl_rq), 1);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1424
				1425	inc_dl_deadline(dl_rq, deadline);
				1426	inc_dl_migration(dl_se, dl_rq);
				1427	}
				1428
				1429	static inline
				1430	void dec_dl_tasks(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				1431	{
				1432	int prio = dl_task_of(dl_se)->prio;
				1433
				1434	WARN_ON(!dl_prio(prio));
				1435	WARN_ON(!dl_rq->dl_nr_running);
				1436	dl_rq->dl_nr_running--;
Kirill Tkhai	7246544	2014-05-09 03:00:14 +0400	[diff] [blame]	1437	sub_nr_running(rq_of_dl_rq(dl_rq), 1);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1438
				1439	dec_dl_deadline(dl_rq, dl_se->deadline);
				1440	dec_dl_migration(dl_se, dl_rq);
				1441	}
				1442
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1443	static void __enqueue_dl_entity(struct sched_dl_entity *dl_se)
				1444	{
				1445	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	1446	struct rb_node **link = &dl_rq->root.rb_root.rb_node;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1447	struct rb_node *parent = NULL;
				1448	struct sched_dl_entity *entry;
				1449	int leftmost = 1;
				1450
				1451	BUG_ON(!RB_EMPTY_NODE(&dl_se->rb_node));
				1452
				1453	while (*link) {
				1454	parent = *link;
				1455	entry = rb_entry(parent, struct sched_dl_entity, rb_node);
				1456	if (dl_time_before(dl_se->deadline, entry->deadline))
				1457	link = &parent->rb_left;
				1458	else {
				1459	link = &parent->rb_right;
				1460	leftmost = 0;
				1461	}
				1462	}
				1463
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1464	rb_link_node(&dl_se->rb_node, parent, link);
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	1465	rb_insert_color_cached(&dl_se->rb_node, &dl_rq->root, leftmost);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1466
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1467	inc_dl_tasks(dl_se, dl_rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1468	}
				1469
				1470	static void __dequeue_dl_entity(struct sched_dl_entity *dl_se)
				1471	{
				1472	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				1473
				1474	if (RB_EMPTY_NODE(&dl_se->rb_node))
				1475	return;
				1476
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	1477	rb_erase_cached(&dl_se->rb_node, &dl_rq->root);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1478	RB_CLEAR_NODE(&dl_se->rb_node);
				1479
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1480	dec_dl_tasks(dl_se, dl_rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1481	}
				1482
				1483	static void
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1484	enqueue_dl_entity(struct sched_dl_entity *dl_se,
				1485	struct sched_dl_entity *pi_se, int flags)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1486	{
				1487	BUG_ON(on_dl_rq(dl_se));
				1488
				1489	/*
				1490	* If this is a wakeup or a new instance, the scheduling
				1491	* parameters of the task might need updating. Otherwise,
				1492	* we want a replenishment of its runtime.
				1493	*/
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1494	if (flags & ENQUEUE_WAKEUP) {
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1495	task_contending(dl_se, flags);
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1496	update_dl_entity(dl_se, pi_se);
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1497	} else if (flags & ENQUEUE_REPLENISH) {
Luca Abeni	6a503c3	2014-12-17 11:50:31 +0100	[diff] [blame]	1498	replenish_dl_entity(dl_se, pi_se);
Luca Abeni	295d6d5	2017-09-07 12:09:29 +0200	[diff] [blame]	1499	} else if ((flags & ENQUEUE_RESTORE) &&
				1500	dl_time_before(dl_se->deadline,
				1501	rq_clock(rq_of_dl_rq(dl_rq_of_se(dl_se))))) {
				1502	setup_new_dl_entity(dl_se);
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1503	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1504
				1505	__enqueue_dl_entity(dl_se);
				1506	}
				1507
				1508	static void dequeue_dl_entity(struct sched_dl_entity *dl_se)
				1509	{
				1510	__dequeue_dl_entity(dl_se);
				1511	}
				1512
				1513	static void enqueue_task_dl(struct rq rq, struct task_struct p, int flags)
				1514	{
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1515	struct task_struct *pi_task = rt_mutex_get_top_task(p);
				1516	struct sched_dl_entity *pi_se = &p->dl;
				1517
				1518	/*
Joel Fernandes	193be41	2017-07-12 19:24:29 -0700	[diff] [blame]	1519	* Use the scheduling parameters of the top pi-waiter task if:
				1520	* - we have a top pi-waiter which is a SCHED_DEADLINE task AND
				1521	* - our dl_boosted is set (i.e. the pi-waiter's (absolute) deadline is
				1522	* smaller than our deadline OR we are a !SCHED_DEADLINE task getting
				1523	* boosted due to a SCHED_DEADLINE pi-waiter).
				1524	* Otherwise we keep our runtime and deadline.
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1525	*/
Joel Fernandes	193be41	2017-07-12 19:24:29 -0700	[diff] [blame]	1526	if (pi_task && dl_prio(pi_task->normal_prio) && p->dl.dl_boosted) {
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1527	pi_se = &pi_task->dl;
Daniel Bristot de Oliveira	feff2e6	2020-09-16 09:06:39 +0200	[diff] [blame]	1528	/*
				1529	* Because of delays in the detection of the overrun of a
				1530	* thread's runtime, it might be the case that a thread
				1531	* goes to sleep in a rt mutex with negative runtime. As
				1532	* a consequence, the thread will be throttled.
				1533	*
				1534	* While waiting for the mutex, this thread can also be
				1535	* boosted via PI, resulting in a thread that is throttled
				1536	* and boosted at the same time.
				1537	*
				1538	* In this case, the boost overrides the throttle.
				1539	*/
				1540	if (p->dl.dl_throttled) {
				1541	/*
				1542	* The replenish timer needs to be canceled. No
				1543	* problem if it fires concurrently: boosted threads
				1544	* are ignored in dl_task_timer().
				1545	*/
				1546	hrtimer_try_to_cancel(&p->dl.dl_timer);
				1547	p->dl.dl_throttled = 0;
				1548	}
Juri Lelli	64be6f1	2014-10-24 10:16:37 +0100	[diff] [blame]	1549	} else if (!dl_prio(p->normal_prio)) {
				1550	/*
Lucas Stach	46fcc4b	2020-08-31 13:07:19 +0200	[diff] [blame]	1551	* Special case in which we have a !SCHED_DEADLINE task that is going
				1552	* to be deboosted, but exceeds its runtime while doing so. No point in
				1553	* replenishing it, as it's going to return back to its original
				1554	* scheduling class after this. If it has been throttled, we need to
				1555	* clear the flag, otherwise the task may wake up as throttled after
				1556	* being boosted again with no means to replenish the runtime and clear
				1557	* the throttle.
Juri Lelli	64be6f1	2014-10-24 10:16:37 +0100	[diff] [blame]	1558	*/
Lucas Stach	46fcc4b	2020-08-31 13:07:19 +0200	[diff] [blame]	1559	p->dl.dl_throttled = 0;
Juri Lelli	64be6f1	2014-10-24 10:16:37 +0100	[diff] [blame]	1560	BUG_ON(!p->dl.dl_boosted \|\| flags != ENQUEUE_REPLENISH);
				1561	return;
				1562	}
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1563
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1564	/*
Daniel Bristot de Oliveira	df8eac8	2017-03-02 15:10:58 +0100	[diff] [blame]	1565	* Check if a constrained deadline task was activated
				1566	* after the deadline but before the next period.
				1567	* If that is the case, the task will be throttled and
				1568	* the replenishment timer will be set to the next period.
				1569	*/
Daniel Bristot de Oliveira	3effcb4	2017-05-29 16:24:03 +0200	[diff] [blame]	1570	if (!p->dl.dl_throttled && !dl_is_implicit(&p->dl))
Daniel Bristot de Oliveira	df8eac8	2017-03-02 15:10:58 +0100	[diff] [blame]	1571	dl_check_constrained_dl(&p->dl);
				1572
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1573	if (p->on_rq == TASK_ON_RQ_MIGRATING \|\| flags & ENQUEUE_RESTORE) {
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1574	add_rq_bw(&p->dl, &rq->dl);
				1575	add_running_bw(&p->dl, &rq->dl);
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1576	}
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1577
Daniel Bristot de Oliveira	df8eac8	2017-03-02 15:10:58 +0100	[diff] [blame]	1578	/*
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1579	* If p is throttled, we do not enqueue it. In fact, if it exhausted
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1580	* its budget it needs a replenishment and, since it now is on
				1581	* its rq, the bandwidth timer callback (which clearly has not
				1582	* run yet) will take care of this.
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1583	* However, the active utilization does not depend on the fact
				1584	* that the task is on the runqueue or not (but depends on the
				1585	* task's state - in GRUB parlance, "inactive" vs "active contending").
				1586	* In other words, even if a task is throttled its utilization must
				1587	* be counted in the active utilization; hence, we need to call
				1588	* add_running_bw().
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1589	*/
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1590	if (p->dl.dl_throttled && !(flags & ENQUEUE_REPLENISH)) {
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1591	if (flags & ENQUEUE_WAKEUP)
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1592	task_contending(&p->dl, flags);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1593
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1594	return;
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1595	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1596
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1597	enqueue_dl_entity(&p->dl, pi_se, flags);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1598
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	1599	if (!task_current(rq, p) && p->nr_cpus_allowed > 1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1600	enqueue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1601	}
				1602
				1603	static void __dequeue_task_dl(struct rq rq, struct task_struct p, int flags)
				1604	{
				1605	dequeue_dl_entity(&p->dl);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1606	dequeue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1607	}
				1608
				1609	static void dequeue_task_dl(struct rq rq, struct task_struct p, int flags)
				1610	{
				1611	update_curr_dl(rq);
				1612	__dequeue_task_dl(rq, p, flags);
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1613
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1614	if (p->on_rq == TASK_ON_RQ_MIGRATING \|\| flags & DEQUEUE_SAVE) {
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1615	sub_running_bw(&p->dl, &rq->dl);
				1616	sub_rq_bw(&p->dl, &rq->dl);
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1617	}
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1618
				1619	/*
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1620	* This check allows to start the inactive timer (or to immediately
				1621	* decrease the active utilization, if needed) in two cases:
Luca Abeni	e36d867	2017-05-18 22:13:28 +0200	[diff] [blame]	1622	* when the task blocks and when it is terminating
				1623	* (p->state == TASK_DEAD). We can handle the two cases in the same
				1624	* way, because from GRUB's point of view the same thing is happening
				1625	* (the task moves from "active contending" to "active non contending"
				1626	* or "inactive")
				1627	*/
				1628	if (flags & DEQUEUE_SLEEP)
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1629	task_non_contending(p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1630	}
				1631
				1632	/*
				1633	* Yield task semantic for -deadline tasks is:
				1634	*
				1635	* get off from the CPU until our next instance, with
				1636	* a new runtime. This is of little use now, since we
				1637	* don't have a bandwidth reclaiming mechanism. Anyway,
				1638	* bandwidth reclaiming is planned for the future, and
				1639	* yield_task_dl will indicate that some spare budget
				1640	* is available for other task instances to use it.
				1641	*/
				1642	static void yield_task_dl(struct rq *rq)
				1643	{
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1644	/*
				1645	* We make the task go to sleep until its current deadline by
				1646	* forcing its runtime to zero. This way, update_curr_dl() stops
				1647	* it and the bandwidth timer will wake it up and will give it
Juri Lelli	5bfd126	2014-04-15 13:49:04 +0200	[diff] [blame]	1648	* new scheduling parameters (thanks to dl_yielded=1).
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1649	*/
Peter Zijlstra	48be3a6	2016-02-23 13:28:22 +0100	[diff] [blame]	1650	rq->curr->dl.dl_yielded = 1;
				1651
Kirill Tkhai	6f1607f	2015-02-04 12:09:32 +0300	[diff] [blame]	1652	update_rq_clock(rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1653	update_curr_dl(rq);
Wanpeng Li	44fb085	2015-03-10 12:20:00 +0800	[diff] [blame]	1654	/*
				1655	* Tell update_rq_clock() that we've just updated,
				1656	* so we don't do microscopic update in schedule()
				1657	* and double the fastpath cost.
				1658	*/
Davidlohr Bueso	adcc8da	2018-04-04 09:15:39 -0700	[diff] [blame]	1659	rq_clock_skip_update(rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1660	}
				1661
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1662	#ifdef CONFIG_SMP
				1663
				1664	static int find_later_rq(struct task_struct *task);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1665
				1666	static int
				1667	select_task_rq_dl(struct task_struct *p, int cpu, int sd_flag, int flags)
				1668	{
				1669	struct task_struct *curr;
Luca Abeni	b411898	2020-05-20 15:42:42 +0200	[diff] [blame]	1670	bool select_rq;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1671	struct rq *rq;
				1672
Wanpeng Li	1d7e974	2014-10-14 10:22:39 +0800	[diff] [blame]	1673	if (sd_flag != SD_BALANCE_WAKE)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1674	goto out;
				1675
				1676	rq = cpu_rq(cpu);
				1677
				1678	rcu_read_lock();
Jason Low	316c1608d	2015-04-28 13:00:20 -0700	[diff] [blame]	1679	curr = READ_ONCE(rq->curr); /* unlocked access */
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1680
				1681	/*
				1682	* If we are dealing with a -deadline task, we must
				1683	* decide where to wake it up.
				1684	* If it has a later deadline and the current task
				1685	* on this rq can't move (provided the waking task
				1686	* can!) we prefer to send it somewhere else. On the
				1687	* other hand, if it has a shorter deadline, we
				1688	* try to make it stay here, it might be important.
				1689	*/
Luca Abeni	b411898	2020-05-20 15:42:42 +0200	[diff] [blame]	1690	select_rq = unlikely(dl_task(curr)) &&
				1691	(curr->nr_cpus_allowed < 2 \|\|
				1692	!dl_entity_preempt(&p->dl, &curr->dl)) &&
				1693	p->nr_cpus_allowed > 1;
				1694
				1695	/*
				1696	* Take the capacity of the CPU into account to
				1697	* ensure it fits the requirement of the task.
				1698	*/
				1699	if (static_branch_unlikely(&sched_asym_cpucapacity))
				1700	select_rq \|= !dl_task_fits_capacity(p, cpu);
				1701
				1702	if (select_rq) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1703	int target = find_later_rq(p);
				1704
Wanpeng Li	9d51426	2015-05-13 14:01:03 +0800	[diff] [blame]	1705	if (target != -1 &&
Luca Abeni	5aa5050	2015-10-16 10:06:21 +0200	[diff] [blame]	1706	(dl_time_before(p->dl.deadline,
				1707	cpu_rq(target)->dl.earliest_dl.curr) \|\|
				1708	(cpu_rq(target)->dl.dl_nr_running == 0)))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1709	cpu = target;
				1710	}
				1711	rcu_read_unlock();
				1712
				1713	out:
				1714	return cpu;
				1715	}
				1716
Srikar Dronamraju	1327237a5	2018-09-21 23:18:57 +0530	[diff] [blame]	1717	static void migrate_task_rq_dl(struct task_struct *p, int new_cpu __maybe_unused)
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1718	{
				1719	struct rq *rq;
				1720
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1721	if (p->state != TASK_WAKING)
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1722	return;
				1723
				1724	rq = task_rq(p);
				1725	/*
				1726	* Since p->state == TASK_WAKING, set_task_cpu() has been called
				1727	* from try_to_wake_up(). Hence, p->pi_lock is locked, but
				1728	* rq->lock is not... So, lock it
				1729	*/
				1730	raw_spin_lock(&rq->lock);
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1731	if (p->dl.dl_non_contending) {
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1732	sub_running_bw(&p->dl, &rq->dl);
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	1733	p->dl.dl_non_contending = 0;
				1734	/*
				1735	* If the timer handler is currently running and the
				1736	* timer cannot be cancelled, inactive_task_timer()
				1737	* will see that dl_not_contending is not set, and
				1738	* will not touch the rq's active utilization,
				1739	* so we are still safe.
				1740	*/
				1741	if (hrtimer_try_to_cancel(&p->dl.inactive_timer) == 1)
				1742	put_task_struct(p);
				1743	}
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	1744	sub_rq_bw(&p->dl, &rq->dl);
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	1745	raw_spin_unlock(&rq->lock);
				1746	}
				1747
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1748	static void check_preempt_equal_dl(struct rq rq, struct task_struct p)
				1749	{
				1750	/*
				1751	* Current can't be migrated, useless to reschedule,
				1752	* let's hope p can move out.
				1753	*/
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	1754	if (rq->curr->nr_cpus_allowed == 1 \|\|
Byungchul Park	3261ed0	2017-05-23 11:00:57 +0900	[diff] [blame]	1755	!cpudl_find(&rq->rd->cpudl, rq->curr, NULL))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1756	return;
				1757
				1758	/*
				1759	* p is migratable, so let's not schedule it and
				1760	* see if it is pushed or pulled somewhere else.
				1761	*/
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	1762	if (p->nr_cpus_allowed != 1 &&
Byungchul Park	3261ed0	2017-05-23 11:00:57 +0900	[diff] [blame]	1763	cpudl_find(&rq->rd->cpudl, p, NULL))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1764	return;
				1765
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	1766	resched_curr(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1767	}
				1768
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	1769	static int balance_dl(struct rq rq, struct task_struct p, struct rq_flags *rf)
				1770	{
				1771	if (!on_dl_rq(&p->dl) && need_pull_dl_task(rq, p)) {
				1772	/*
				1773	* This is OK, because current is on_cpu, which avoids it being
				1774	* picked for load-balance and preemption/IRQs are still
				1775	* disabled avoiding further scheduler activity on it and we've
				1776	* not yet started the picking loop.
				1777	*/
				1778	rq_unpin_lock(rq, rf);
				1779	pull_dl_task(rq);
				1780	rq_repin_lock(rq, rf);
				1781	}
				1782
				1783	return sched_stop_runnable(rq) \|\| sched_dl_runnable(rq);
				1784	}
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1785	#endif /* CONFIG_SMP */
				1786
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1787	/*
				1788	* Only called when both the current and waking task are -deadline
				1789	* tasks.
				1790	*/
				1791	static void check_preempt_curr_dl(struct rq rq, struct task_struct p,
				1792	int flags)
				1793	{
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1794	if (dl_entity_preempt(&p->dl, &rq->curr->dl)) {
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	1795	resched_curr(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1796	return;
				1797	}
				1798
				1799	#ifdef CONFIG_SMP
				1800	/*
				1801	* In the unlikely case current and p have the same deadline
				1802	* let us try to decide what's the best thing to do...
				1803	*/
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	1804	if ((p->dl.deadline == rq->curr->dl.deadline) &&
				1805	!test_tsk_need_resched(rq->curr))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1806	check_preempt_equal_dl(rq, p);
				1807	#endif /* CONFIG_SMP */
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1808	}
				1809
				1810	#ifdef CONFIG_SCHED_HRTICK
				1811	static void start_hrtick_dl(struct rq rq, struct task_struct p)
				1812	{
xiaofeng.yan	177ef2a	2014-08-26 03:15:41 +0000	[diff] [blame]	1813	hrtick_start(rq, p->dl.runtime);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1814	}
Wanpeng Li	36ce988	2014-11-11 09:52:26 +0800	[diff] [blame]	1815	#else /* !CONFIG_SCHED_HRTICK */
				1816	static void start_hrtick_dl(struct rq rq, struct task_struct p)
				1817	{
				1818	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1819	#endif
				1820
Peter Zijlstra	a0e813f	2019-11-08 14:16:00 +0100	[diff] [blame]	1821	static void set_next_task_dl(struct rq rq, struct task_struct p, bool first)
Muchun Song	ff1cdc9	2018-10-26 21:17:43 +0800	[diff] [blame]	1822	{
				1823	p->se.exec_start = rq_clock_task(rq);
				1824
				1825	/* You can't push away the running task */
				1826	dequeue_pushable_dl_task(rq, p);
Peter Zijlstra	f95d4ea	2019-05-29 20:36:40 +0000	[diff] [blame]	1827
Peter Zijlstra	a0e813f	2019-11-08 14:16:00 +0100	[diff] [blame]	1828	if (!first)
				1829	return;
				1830
Peter Zijlstra	f95d4ea	2019-05-29 20:36:40 +0000	[diff] [blame]	1831	if (hrtick_enabled(rq))
				1832	start_hrtick_dl(rq, p);
				1833
				1834	if (rq->curr->sched_class != &dl_sched_class)
				1835	update_dl_rq_load_avg(rq_clock_pelt(rq), rq, 0);
				1836
				1837	deadline_queue_push_tasks(rq);
Muchun Song	ff1cdc9	2018-10-26 21:17:43 +0800	[diff] [blame]	1838	}
				1839
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1840	static struct sched_dl_entity pick_next_dl_entity(struct rq rq,
				1841	struct dl_rq *dl_rq)
				1842	{
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	1843	struct rb_node *left = rb_first_cached(&dl_rq->root);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1844
				1845	if (!left)
				1846	return NULL;
				1847
				1848	return rb_entry(left, struct sched_dl_entity, rb_node);
				1849	}
				1850
Peter Zijlstra	98c2f70	2019-11-08 14:15:58 +0100	[diff] [blame]	1851	static struct task_struct pick_next_task_dl(struct rq rq)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1852	{
				1853	struct sched_dl_entity *dl_se;
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	1854	struct dl_rq *dl_rq = &rq->dl;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1855	struct task_struct *p;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1856
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	1857	if (!sched_dl_runnable(rq))
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1858	return NULL;
				1859
				1860	dl_se = pick_next_dl_entity(rq, dl_rq);
				1861	BUG_ON(!dl_se);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1862	p = dl_task_of(dl_se);
Peter Zijlstra	a0e813f	2019-11-08 14:16:00 +0100	[diff] [blame]	1863	set_next_task_dl(rq, p, true);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1864	return p;
				1865	}
				1866
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	1867	static void put_prev_task_dl(struct rq rq, struct task_struct p)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1868	{
				1869	update_curr_dl(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1870
Vincent Guittot	2312729	2019-01-23 16:26:53 +0100	[diff] [blame]	1871	update_dl_rq_load_avg(rq_clock_pelt(rq), rq, 1);
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	1872	if (on_dl_rq(&p->dl) && p->nr_cpus_allowed > 1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1873	enqueue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1874	}
				1875
Frederic Weisbecker	d84b313	2018-02-21 05:17:27 +0100	[diff] [blame]	1876	/*
				1877	* scheduler tick hitting a task of our scheduling class.
				1878	*
				1879	* NOTE: This function can be called remotely by the tick offload that
				1880	* goes along full dynticks. Therefore no local assumption can be made
				1881	* and everything must be accessed through the @rq and @curr passed in
				1882	* parameters.
				1883	*/
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1884	static void task_tick_dl(struct rq rq, struct task_struct p, int queued)
				1885	{
				1886	update_curr_dl(rq);
				1887
Vincent Guittot	2312729	2019-01-23 16:26:53 +0100	[diff] [blame]	1888	update_dl_rq_load_avg(rq_clock_pelt(rq), rq, 1);
Wanpeng Li	a7bebf4	2014-11-26 08:44:01 +0800	[diff] [blame]	1889	/*
				1890	* Even when we have runtime, update_curr_dl() might have resulted in us
				1891	* not being the leftmost task anymore. In that case NEED_RESCHED will
				1892	* be set and schedule() will start a new hrtick for the next task.
				1893	*/
				1894	if (hrtick_enabled(rq) && queued && p->dl.runtime > 0 &&
				1895	is_leftmost(p, &rq->dl))
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1896	start_hrtick_dl(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1897	}
				1898
				1899	static void task_fork_dl(struct task_struct *p)
				1900	{
				1901	/*
				1902	* SCHED_DEADLINE tasks cannot fork and this is achieved through
				1903	* sched_fork()
				1904	*/
				1905	}
				1906
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1907	#ifdef CONFIG_SMP
				1908
				1909	/* Only try algorithms three times */
				1910	#define DL_MAX_TRIES 3
				1911
				1912	static int pick_dl_task(struct rq rq, struct task_struct p, int cpu)
				1913	{
				1914	if (!task_running(rq, p) &&
Peter Zijlstra	95158a8	2020-10-01 16:05:39 +0200	[diff] [blame]	1915	cpumask_test_cpu(cpu, &p->cpus_mask))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1916	return 1;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1917	return 0;
				1918	}
				1919
Wanpeng Li	8b5e770	2015-05-13 14:01:01 +0800	[diff] [blame]	1920	/*
				1921	* Return the earliest pushable rq's task, which is suitable to be executed
				1922	* on the CPU, NULL otherwise:
				1923	*/
				1924	static struct task_struct pick_earliest_pushable_dl_task(struct rq rq, int cpu)
				1925	{
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	1926	struct rb_node *next_node = rq->dl.pushable_dl_tasks_root.rb_leftmost;
Wanpeng Li	8b5e770	2015-05-13 14:01:01 +0800	[diff] [blame]	1927	struct task_struct *p = NULL;
				1928
				1929	if (!has_pushable_dl_tasks(rq))
				1930	return NULL;
				1931
				1932	next_node:
				1933	if (next_node) {
				1934	p = rb_entry(next_node, struct task_struct, pushable_dl_tasks);
				1935
				1936	if (pick_dl_task(rq, p, cpu))
				1937	return p;
				1938
				1939	next_node = rb_next(next_node);
				1940	goto next_node;
				1941	}
				1942
				1943	return NULL;
				1944	}
				1945
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1946	static DEFINE_PER_CPU(cpumask_var_t, local_cpu_mask_dl);
				1947
				1948	static int find_later_rq(struct task_struct *task)
				1949	{
				1950	struct sched_domain *sd;
Christoph Lameter	4ba2968	2014-08-26 19:12:21 -0500	[diff] [blame]	1951	struct cpumask *later_mask = this_cpu_cpumask_var_ptr(local_cpu_mask_dl);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1952	int this_cpu = smp_processor_id();
Byungchul Park	b18c3ca	2017-05-23 11:00:56 +0900	[diff] [blame]	1953	int cpu = task_cpu(task);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1954
				1955	/* Make sure the mask is initialized first */
				1956	if (unlikely(!later_mask))
				1957	return -1;
				1958
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	1959	if (task->nr_cpus_allowed == 1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1960	return -1;
				1961
Juri Lelli	91ec677	2014-09-19 10:22:41 +0100	[diff] [blame]	1962	/*
				1963	* We have to consider system topology and task affinity
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1964	* first, then we can look for a suitable CPU.
Juri Lelli	91ec677	2014-09-19 10:22:41 +0100	[diff] [blame]	1965	*/
Byungchul Park	3261ed0	2017-05-23 11:00:57 +0900	[diff] [blame]	1966	if (!cpudl_find(&task_rq(task)->rd->cpudl, task, later_mask))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1967	return -1;
				1968
				1969	/*
Byungchul Park	b18c3ca	2017-05-23 11:00:56 +0900	[diff] [blame]	1970	* If we are here, some targets have been found, including
				1971	* the most suitable which is, among the runqueues where the
				1972	* current tasks have later deadlines than the task's one, the
				1973	* rq with the latest possible one.
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1974	*
				1975	* Now we check how well this matches with task's
				1976	* affinity and system topology.
				1977	*
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	1978	* The last CPU where the task run is our first
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1979	* guess, since it is most likely cache-hot there.
				1980	*/
				1981	if (cpumask_test_cpu(cpu, later_mask))
				1982	return cpu;
				1983	/*
				1984	* Check if this_cpu is to be skipped (i.e., it is
				1985	* not in the mask) or not.
				1986	*/
				1987	if (!cpumask_test_cpu(this_cpu, later_mask))
				1988	this_cpu = -1;
				1989
				1990	rcu_read_lock();
				1991	for_each_domain(cpu, sd) {
				1992	if (sd->flags & SD_WAKE_AFFINE) {
Byungchul Park	b18c3ca	2017-05-23 11:00:56 +0900	[diff] [blame]	1993	int best_cpu;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1994
				1995	/*
				1996	* If possible, preempting this_cpu is
				1997	* cheaper than migrating.
				1998	*/
				1999	if (this_cpu != -1 &&
				2000	cpumask_test_cpu(this_cpu, sched_domain_span(sd))) {
				2001	rcu_read_unlock();
				2002	return this_cpu;
				2003	}
				2004
Peter Zijlstra	14e292f8	2020-10-01 15:54:14 +0200	[diff] [blame]	2005	best_cpu = cpumask_any_and_distribute(later_mask,
				2006	sched_domain_span(sd));
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2007	/*
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2008	* Last chance: if a CPU being in both later_mask
Byungchul Park	b18c3ca	2017-05-23 11:00:56 +0900	[diff] [blame]	2009	* and current sd span is valid, that becomes our
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2010	* choice. Of course, the latest possible CPU is
Byungchul Park	b18c3ca	2017-05-23 11:00:56 +0900	[diff] [blame]	2011	* already under consideration through later_mask.
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2012	*/
Byungchul Park	b18c3ca	2017-05-23 11:00:56 +0900	[diff] [blame]	2013	if (best_cpu < nr_cpu_ids) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2014	rcu_read_unlock();
				2015	return best_cpu;
				2016	}
				2017	}
				2018	}
				2019	rcu_read_unlock();
				2020
				2021	/*
				2022	* At this point, all our guesses failed, we just return
				2023	* 'something', and let the caller sort the things out.
				2024	*/
				2025	if (this_cpu != -1)
				2026	return this_cpu;
				2027
Peter Zijlstra	14e292f8	2020-10-01 15:54:14 +0200	[diff] [blame]	2028	cpu = cpumask_any_distribute(later_mask);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2029	if (cpu < nr_cpu_ids)
				2030	return cpu;
				2031
				2032	return -1;
				2033	}
				2034
				2035	/* Locks the rq it finds */
				2036	static struct rq find_lock_later_rq(struct task_struct task, struct rq *rq)
				2037	{
				2038	struct rq *later_rq = NULL;
				2039	int tries;
				2040	int cpu;
				2041
				2042	for (tries = 0; tries < DL_MAX_TRIES; tries++) {
				2043	cpu = find_later_rq(task);
				2044
				2045	if ((cpu == -1) \|\| (cpu == rq->cpu))
				2046	break;
				2047
				2048	later_rq = cpu_rq(cpu);
				2049
Luca Abeni	5aa5050	2015-10-16 10:06:21 +0200	[diff] [blame]	2050	if (later_rq->dl.dl_nr_running &&
				2051	!dl_time_before(task->dl.deadline,
Wanpeng Li	9d51426	2015-05-13 14:01:03 +0800	[diff] [blame]	2052	later_rq->dl.earliest_dl.curr)) {
				2053	/*
				2054	* Target rq has tasks of equal or earlier deadline,
				2055	* retrying does not release any lock and is unlikely
				2056	* to yield a different result.
				2057	*/
				2058	later_rq = NULL;
				2059	break;
				2060	}
				2061
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2062	/* Retry if something changed. */
				2063	if (double_lock_balance(rq, later_rq)) {
				2064	if (unlikely(task_rq(task) != rq \|\|
Peter Zijlstra	95158a8	2020-10-01 16:05:39 +0200	[diff] [blame]	2065	!cpumask_test_cpu(later_rq->cpu, &task->cpus_mask) \|\|
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	2066	task_running(rq, task) \|\|
Xunlei Pang	13b5ab0	2016-05-09 12:11:31 +0800	[diff] [blame]	2067	!dl_task(task) \|\|
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	2068	!task_on_rq_queued(task))) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2069	double_unlock_balance(rq, later_rq);
				2070	later_rq = NULL;
				2071	break;
				2072	}
				2073	}
				2074
				2075	/*
				2076	* If the rq we found has no -deadline task, or
				2077	* its earliest one has a later deadline than our
				2078	* task, the rq is a good one.
				2079	*/
				2080	if (!later_rq->dl.dl_nr_running \|\|
				2081	dl_time_before(task->dl.deadline,
				2082	later_rq->dl.earliest_dl.curr))
				2083	break;
				2084
				2085	/* Otherwise we try again. */
				2086	double_unlock_balance(rq, later_rq);
				2087	later_rq = NULL;
				2088	}
				2089
				2090	return later_rq;
				2091	}
				2092
				2093	static struct task_struct pick_next_pushable_dl_task(struct rq rq)
				2094	{
				2095	struct task_struct *p;
				2096
				2097	if (!has_pushable_dl_tasks(rq))
				2098	return NULL;
				2099
Davidlohr Bueso	2161573	2017-09-08 16:14:58 -0700	[diff] [blame]	2100	p = rb_entry(rq->dl.pushable_dl_tasks_root.rb_leftmost,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2101	struct task_struct, pushable_dl_tasks);
				2102
				2103	BUG_ON(rq->cpu != task_cpu(p));
				2104	BUG_ON(task_current(rq, p));
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	2105	BUG_ON(p->nr_cpus_allowed <= 1);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2106
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	2107	BUG_ON(!task_on_rq_queued(p));
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2108	BUG_ON(!dl_task(p));
				2109
				2110	return p;
				2111	}
				2112
				2113	/*
				2114	* See if the non running -deadline tasks on this rq
				2115	* can be sent to some other CPU where they can preempt
				2116	* and start executing.
				2117	*/
				2118	static int push_dl_task(struct rq *rq)
				2119	{
				2120	struct task_struct *next_task;
				2121	struct rq *later_rq;
Wanpeng Li	c51b8ab	2014-11-06 15:22:44 +0800	[diff] [blame]	2122	int ret = 0;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2123
				2124	if (!rq->dl.overloaded)
				2125	return 0;
				2126
				2127	next_task = pick_next_pushable_dl_task(rq);
				2128	if (!next_task)
				2129	return 0;
				2130
				2131	retry:
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame^]	2132	if (is_migration_disabled(next_task))
				2133	return 0;
				2134
Yangtao Li	9ebc605	2018-11-03 13:26:02 -0400	[diff] [blame]	2135	if (WARN_ON(next_task == rq->curr))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2136	return 0;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2137
				2138	/*
				2139	* If next_task preempts rq->curr, and rq->curr
				2140	* can move away, it makes sense to just reschedule
				2141	* without going further in pushing next_task.
				2142	*/
				2143	if (dl_task(rq->curr) &&
				2144	dl_time_before(next_task->dl.deadline, rq->curr->dl.deadline) &&
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	2145	rq->curr->nr_cpus_allowed > 1) {
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	2146	resched_curr(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2147	return 0;
				2148	}
				2149
				2150	/* We might release rq lock */
				2151	get_task_struct(next_task);
				2152
				2153	/* Will lock the rq it'll find */
				2154	later_rq = find_lock_later_rq(next_task, rq);
				2155	if (!later_rq) {
				2156	struct task_struct *task;
				2157
				2158	/*
				2159	* We must check all this again, since
				2160	* find_lock_later_rq releases rq->lock and it is
				2161	* then possible that next_task has migrated.
				2162	*/
				2163	task = pick_next_pushable_dl_task(rq);
Byungchul Park	a776b96	2017-05-12 10:05:59 +0900	[diff] [blame]	2164	if (task == next_task) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2165	/*
				2166	* The task is still there. We don't try
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2167	* again, some other CPU will pull it when ready.
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2168	*/
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2169	goto out;
				2170	}
				2171
				2172	if (!task)
				2173	/* No more tasks */
				2174	goto out;
				2175
				2176	put_task_struct(next_task);
				2177	next_task = task;
				2178	goto retry;
				2179	}
				2180
				2181	deactivate_task(rq, next_task, 0);
				2182	set_task_cpu(next_task, later_rq->cpu);
Daniel Bristot de Oliveira	840d719	2018-07-20 11:16:30 +0200	[diff] [blame]	2183
				2184	/*
				2185	* Update the later_rq clock here, because the clock is used
				2186	* by the cpufreq_update_util() inside __add_running_bw().
				2187	*/
				2188	update_rq_clock(later_rq);
Daniel Bristot de Oliveira	840d719	2018-07-20 11:16:30 +0200	[diff] [blame]	2189	activate_task(later_rq, next_task, ENQUEUE_NOCLOCK);
Wanpeng Li	c51b8ab	2014-11-06 15:22:44 +0800	[diff] [blame]	2190	ret = 1;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2191
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	2192	resched_curr(later_rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2193
				2194	double_unlock_balance(rq, later_rq);
				2195
				2196	out:
				2197	put_task_struct(next_task);
				2198
Wanpeng Li	c51b8ab	2014-11-06 15:22:44 +0800	[diff] [blame]	2199	return ret;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2200	}
				2201
				2202	static void push_dl_tasks(struct rq *rq)
				2203	{
Andrea Parri	4ffa08e	2015-08-05 15:56:18 +0200	[diff] [blame]	2204	/* push_dl_task() will return true if it moved a -deadline task */
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2205	while (push_dl_task(rq))
				2206	;
				2207	}
				2208
Peter Zijlstra	0ea60c2	2015-06-11 14:46:42 +0200	[diff] [blame]	2209	static void pull_dl_task(struct rq *this_rq)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2210	{
Peter Zijlstra	0ea60c2	2015-06-11 14:46:42 +0200	[diff] [blame]	2211	int this_cpu = this_rq->cpu, cpu;
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame^]	2212	struct task_struct p, push_task;
Peter Zijlstra	0ea60c2	2015-06-11 14:46:42 +0200	[diff] [blame]	2213	bool resched = false;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2214	struct rq *src_rq;
				2215	u64 dmin = LONG_MAX;
				2216
				2217	if (likely(!dl_overloaded(this_rq)))
Peter Zijlstra	0ea60c2	2015-06-11 14:46:42 +0200	[diff] [blame]	2218	return;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2219
				2220	/*
				2221	* Match the barrier from dl_set_overloaded; this guarantees that if we
				2222	* see overloaded we must also see the dlo_mask bit.
				2223	*/
				2224	smp_rmb();
				2225
				2226	for_each_cpu(cpu, this_rq->rd->dlo_mask) {
				2227	if (this_cpu == cpu)
				2228	continue;
				2229
				2230	src_rq = cpu_rq(cpu);
				2231
				2232	/*
				2233	* It looks racy, abd it is! However, as in sched_rt.c,
				2234	* we are fine with this.
				2235	*/
				2236	if (this_rq->dl.dl_nr_running &&
				2237	dl_time_before(this_rq->dl.earliest_dl.curr,
				2238	src_rq->dl.earliest_dl.next))
				2239	continue;
				2240
				2241	/* Might drop this_rq->lock */
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame^]	2242	push_task = NULL;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2243	double_lock_balance(this_rq, src_rq);
				2244
				2245	/*
				2246	* If there are no more pullable tasks on the
				2247	* rq, we're done with it.
				2248	*/
				2249	if (src_rq->dl.dl_nr_running <= 1)
				2250	goto skip;
				2251
Wanpeng Li	8b5e770	2015-05-13 14:01:01 +0800	[diff] [blame]	2252	p = pick_earliest_pushable_dl_task(src_rq, this_cpu);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2253
				2254	/*
				2255	* We found a task to be pulled if:
				2256	* - it preempts our current (if there's one),
				2257	* - it will preempt the last one we pulled (if any).
				2258	*/
				2259	if (p && dl_time_before(p->dl.deadline, dmin) &&
				2260	(!this_rq->dl.dl_nr_running \|\|
				2261	dl_time_before(p->dl.deadline,
				2262	this_rq->dl.earliest_dl.curr))) {
				2263	WARN_ON(p == src_rq->curr);
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	2264	WARN_ON(!task_on_rq_queued(p));
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2265
				2266	/*
				2267	* Then we pull iff p has actually an earlier
				2268	* deadline than the current task of its runqueue.
				2269	*/
				2270	if (dl_time_before(p->dl.deadline,
				2271	src_rq->curr->dl.deadline))
				2272	goto skip;
				2273
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame^]	2274	if (is_migration_disabled(p)) {
				2275	push_task = get_push_task(src_rq);
				2276	} else {
				2277	deactivate_task(src_rq, p, 0);
				2278	set_task_cpu(p, this_cpu);
				2279	activate_task(this_rq, p, 0);
				2280	dmin = p->dl.deadline;
				2281	resched = true;
				2282	}
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2283
				2284	/* Is there any other task even earlier? */
				2285	}
				2286	skip:
				2287	double_unlock_balance(this_rq, src_rq);
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame^]	2288
				2289	if (push_task) {
				2290	raw_spin_unlock(&this_rq->lock);
				2291	stop_one_cpu_nowait(src_rq->cpu, push_cpu_stop,
				2292	push_task, &src_rq->push_work);
				2293	raw_spin_lock(&this_rq->lock);
				2294	}
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2295	}
				2296
Peter Zijlstra	0ea60c2	2015-06-11 14:46:42 +0200	[diff] [blame]	2297	if (resched)
				2298	resched_curr(this_rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2299	}
				2300
				2301	/*
				2302	* Since the task is not running and a reschedule is not going to happen
				2303	* anytime soon on its runqueue, we try pushing it away now.
				2304	*/
				2305	static void task_woken_dl(struct rq rq, struct task_struct p)
				2306	{
				2307	if (!task_running(rq, p) &&
				2308	!test_tsk_need_resched(rq->curr) &&
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	2309	p->nr_cpus_allowed > 1 &&
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2310	dl_task(rq->curr) &&
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	2311	(rq->curr->nr_cpus_allowed < 2 \|\|
Wanpeng Li	6b0a563	2014-10-31 06:39:34 +0800	[diff] [blame]	2312	!dl_entity_preempt(&p->dl, &rq->curr->dl))) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2313	push_dl_tasks(rq);
				2314	}
				2315	}
				2316
				2317	static void set_cpus_allowed_dl(struct task_struct *p,
Peter Zijlstra	9cfc3e1	2020-09-16 14:59:08 +0200	[diff] [blame]	2318	const struct cpumask *new_mask,
				2319	u32 flags)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2320	{
Juri Lelli	7f51412	2014-09-19 10:22:40 +0100	[diff] [blame]	2321	struct root_domain *src_rd;
Peter Zijlstra	6c37067	2015-05-15 17:43:36 +0200	[diff] [blame]	2322	struct rq *rq;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2323
				2324	BUG_ON(!dl_task(p));
				2325
Juri Lelli	7f51412	2014-09-19 10:22:40 +0100	[diff] [blame]	2326	rq = task_rq(p);
				2327	src_rd = rq->rd;
				2328	/*
				2329	* Migrating a SCHED_DEADLINE task between exclusive
				2330	* cpusets (different root_domains) entails a bandwidth
				2331	* update. We already made space for us in the destination
				2332	* domain (see cpuset_can_attach()).
				2333	*/
				2334	if (!cpumask_intersects(src_rd->span, new_mask)) {
				2335	struct dl_bw *src_dl_b;
				2336
				2337	src_dl_b = dl_bw_of(cpu_of(rq));
				2338	/*
				2339	* We now free resources of the root_domain we are migrating
				2340	* off. In the worst case, sched_setattr() may temporary fail
				2341	* until we complete the update.
				2342	*/
				2343	raw_spin_lock(&src_dl_b->lock);
Peter Zijlstra	8c0944ce	2017-09-07 12:09:30 +0200	[diff] [blame]	2344	__dl_sub(src_dl_b, p->dl.dl_bw, dl_bw_cpus(task_cpu(p)));
Juri Lelli	7f51412	2014-09-19 10:22:40 +0100	[diff] [blame]	2345	raw_spin_unlock(&src_dl_b->lock);
				2346	}
				2347
Peter Zijlstra	9cfc3e1	2020-09-16 14:59:08 +0200	[diff] [blame]	2348	set_cpus_allowed_common(p, new_mask, flags);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2349	}
				2350
				2351	/* Assumes rq->lock is held */
				2352	static void rq_online_dl(struct rq *rq)
				2353	{
				2354	if (rq->dl.overloaded)
				2355	dl_set_overload(rq);
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	2356
Xunlei Pang	16b2694	2015-01-19 04:49:36 +0000	[diff] [blame]	2357	cpudl_set_freecpu(&rq->rd->cpudl, rq->cpu);
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	2358	if (rq->dl.dl_nr_running > 0)
Tommaso Cucinotta	d8206bb	2016-08-14 16:27:08 +0200	[diff] [blame]	2359	cpudl_set(&rq->rd->cpudl, rq->cpu, rq->dl.earliest_dl.curr);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2360	}
				2361
				2362	/* Assumes rq->lock is held */
				2363	static void rq_offline_dl(struct rq *rq)
				2364	{
				2365	if (rq->dl.overloaded)
				2366	dl_clear_overload(rq);
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	2367
Tommaso Cucinotta	d8206bb	2016-08-14 16:27:08 +0200	[diff] [blame]	2368	cpudl_clear(&rq->rd->cpudl, rq->cpu);
Xunlei Pang	16b2694	2015-01-19 04:49:36 +0000	[diff] [blame]	2369	cpudl_clear_freecpu(&rq->rd->cpudl, rq->cpu);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2370	}
				2371
Wanpeng Li	a6c0e74	2015-05-13 14:01:02 +0800	[diff] [blame]	2372	void __init init_sched_dl_class(void)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2373	{
				2374	unsigned int i;
				2375
				2376	for_each_possible_cpu(i)
				2377	zalloc_cpumask_var_node(&per_cpu(local_cpu_mask_dl, i),
				2378	GFP_KERNEL, cpu_to_node(i));
				2379	}
				2380
Mathieu Poirier	f9a25f7	2019-07-19 15:59:55 +0200	[diff] [blame]	2381	void dl_add_task_root_domain(struct task_struct *p)
				2382	{
				2383	struct rq_flags rf;
				2384	struct rq *rq;
				2385	struct dl_bw *dl_b;
				2386
				2387	rq = task_rq_lock(p, &rf);
				2388	if (!dl_task(p))
				2389	goto unlock;
				2390
				2391	dl_b = &rq->rd->dl_bw;
				2392	raw_spin_lock(&dl_b->lock);
				2393
				2394	__dl_add(dl_b, p->dl.dl_bw, cpumask_weight(rq->rd->span));
				2395
				2396	raw_spin_unlock(&dl_b->lock);
				2397
				2398	unlock:
				2399	task_rq_unlock(rq, p, &rf);
				2400	}
				2401
				2402	void dl_clear_root_domain(struct root_domain *rd)
				2403	{
				2404	unsigned long flags;
				2405
				2406	raw_spin_lock_irqsave(&rd->dl_bw.lock, flags);
				2407	rd->dl_bw.total_bw = 0;
				2408	raw_spin_unlock_irqrestore(&rd->dl_bw.lock, flags);
				2409	}
				2410
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2411	#endif /* CONFIG_SMP */
				2412
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2413	static void switched_from_dl(struct rq rq, struct task_struct p)
				2414	{
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	2415	/*
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	2416	* task_non_contending() can start the "inactive timer" (if the 0-lag
				2417	* time is in the future). If the task switches back to dl before
				2418	* the "inactive timer" fires, it can continue to consume its current
				2419	* runtime using its current deadline. If it stays outside of
				2420	* SCHED_DEADLINE until the 0-lag time passes, inactive_task_timer()
				2421	* will reset the task parameters.
Peter Zijlstra	a649f23	2015-06-11 14:46:49 +0200	[diff] [blame]	2422	*/
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	2423	if (task_on_rq_queued(p) && p->dl.dl_runtime)
				2424	task_non_contending(p);
				2425
Juri Lelli	e117cb5	2018-07-11 09:29:48 +0200	[diff] [blame]	2426	if (!task_on_rq_queued(p)) {
				2427	/*
				2428	* Inactive timer is armed. However, p is leaving DEADLINE and
				2429	* might migrate away from this rq while continuing to run on
				2430	* some other class. We need to remove its contribution from
				2431	* this rq running_bw now, or sub_rq_bw (below) will complain.
				2432	*/
				2433	if (p->dl.dl_non_contending)
				2434	sub_running_bw(&p->dl, &rq->dl);
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	2435	sub_rq_bw(&p->dl, &rq->dl);
Juri Lelli	e117cb5	2018-07-11 09:29:48 +0200	[diff] [blame]	2436	}
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	2437
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	2438	/*
				2439	* We cannot use inactive_task_timer() to invoke sub_running_bw()
				2440	* at the 0-lag time, because the task could have been migrated
				2441	* while SCHED_OTHER in the meanwhile.
				2442	*/
				2443	if (p->dl.dl_non_contending)
				2444	p->dl.dl_non_contending = 0;
Juri Lelli	a5e7be3	2014-09-19 10:22:39 +0100	[diff] [blame]	2445
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2446	/*
				2447	* Since this might be the only -deadline task on the rq,
				2448	* this is the right place to try to pull some other one
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2449	* from an overloaded CPU, if any.
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2450	*/
Wanpeng Li	cd66091	2014-10-31 06:39:35 +0800	[diff] [blame]	2451	if (!task_on_rq_queued(p) \|\| rq->dl.dl_nr_running)
				2452	return;
				2453
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	2454	deadline_queue_pull_task(rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2455	}
				2456
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2457	/*
				2458	* When switching to -deadline, we may overload the rq, then
				2459	* we try to push someone off, if possible.
				2460	*/
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2461	static void switched_to_dl(struct rq rq, struct task_struct p)
				2462	{
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	2463	if (hrtimer_try_to_cancel(&p->dl.inactive_timer) == 1)
				2464	put_task_struct(p);
Luca Abeni	72f9f3f	2016-03-07 12:27:04 +0100	[diff] [blame]	2465
Juri Lelli	98b0a85	2016-08-05 16:07:55 +0100	[diff] [blame]	2466	/* If p is not queued we will update its parameters at next wakeup. */
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	2467	if (!task_on_rq_queued(p)) {
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	2468	add_rq_bw(&p->dl, &rq->dl);
Juri Lelli	98b0a85	2016-08-05 16:07:55 +0100	[diff] [blame]	2469
Luca Abeni	8fd2723	2017-05-18 22:13:34 +0200	[diff] [blame]	2470	return;
				2471	}
Juri Lelli	98b0a85	2016-08-05 16:07:55 +0100	[diff] [blame]	2472
				2473	if (rq->curr != p) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2474	#ifdef CONFIG_SMP
Ingo Molnar	4b53a34	2017-02-05 15:41:03 +0100	[diff] [blame]	2475	if (p->nr_cpus_allowed > 1 && rq->dl.overloaded)
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	2476	deadline_queue_push_tasks(rq);
Sebastian Andrzej Siewior	619bd4a	2017-01-24 15:40:06 +0100	[diff] [blame]	2477	#endif
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	2478	if (dl_task(rq->curr))
				2479	check_preempt_curr_dl(rq, p, 0);
				2480	else
				2481	resched_curr(rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2482	}
				2483	}
				2484
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2485	/*
				2486	* If the scheduling parameters of a -deadline task changed,
				2487	* a push or pull operation might be needed.
				2488	*/
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2489	static void prio_changed_dl(struct rq rq, struct task_struct p,
				2490	int oldprio)
				2491	{
Kirill Tkhai	da0c1e6	2014-08-20 13:47:32 +0400	[diff] [blame]	2492	if (task_on_rq_queued(p) \|\| rq->curr == p) {
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2493	#ifdef CONFIG_SMP
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2494	/*
				2495	* This might be too much, but unfortunately
				2496	* we don't have the old deadline value, and
				2497	* we can't argue if the task is increasing
				2498	* or lowering its prio, so...
				2499	*/
				2500	if (!rq->dl.overloaded)
Ingo Molnar	02d8ec9	2018-03-03 16:27:54 +0100	[diff] [blame]	2501	deadline_queue_pull_task(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2502
				2503	/*
				2504	* If we now have a earlier deadline task than p,
				2505	* then reschedule, provided p is still on this
				2506	* runqueue.
				2507	*/
Peter Zijlstra	9916e21	2015-06-11 14:46:43 +0200	[diff] [blame]	2508	if (dl_time_before(rq->dl.earliest_dl.curr, p->dl.deadline))
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	2509	resched_curr(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2510	#else
				2511	/*
				2512	* Again, we don't know if p has a earlier
				2513	* or later deadline, so let's blindly set a
				2514	* (maybe not needed) rescheduling point.
				2515	*/
Kirill Tkhai	8875125	2014-06-29 00:03:57 +0400	[diff] [blame]	2516	resched_curr(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2517	#endif /* CONFIG_SMP */
Peter Zijlstra	801ccdb	2016-02-25 15:01:49 +0100	[diff] [blame]	2518	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2519	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2520
Steven Rostedt (VMware)	590d697	2019-12-19 16:44:52 -0500	[diff] [blame]	2521	const struct sched_class dl_sched_class
Joe Perches	33def84	2020-10-21 19:36:07 -0700	[diff] [blame]	2522	__section("__dl_sched_class") = {
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2523	.enqueue_task = enqueue_task_dl,
				2524	.dequeue_task = dequeue_task_dl,
				2525	.yield_task = yield_task_dl,
				2526
				2527	.check_preempt_curr = check_preempt_curr_dl,
				2528
				2529	.pick_next_task = pick_next_task_dl,
				2530	.put_prev_task = put_prev_task_dl,
Peter Zijlstra	03b7fad	2019-05-29 20:36:41 +0000	[diff] [blame]	2531	.set_next_task = set_next_task_dl,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2532
				2533	#ifdef CONFIG_SMP
Peter Zijlstra	6e2df05	2019-11-08 11:11:52 +0100	[diff] [blame]	2534	.balance = balance_dl,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2535	.select_task_rq = select_task_rq_dl,
Luca Abeni	209a0cb	2017-05-18 22:13:29 +0200	[diff] [blame]	2536	.migrate_task_rq = migrate_task_rq_dl,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2537	.set_cpus_allowed = set_cpus_allowed_dl,
				2538	.rq_online = rq_online_dl,
				2539	.rq_offline = rq_offline_dl,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	2540	.task_woken = task_woken_dl,
Peter Zijlstra	a7c8155	2020-09-28 17:06:07 +0200	[diff] [blame^]	2541	.find_lock_rq = find_lock_later_rq,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2542	#endif
				2543
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2544	.task_tick = task_tick_dl,
				2545	.task_fork = task_fork_dl,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2546
				2547	.prio_changed = prio_changed_dl,
				2548	.switched_from = switched_from_dl,
				2549	.switched_to = switched_to_dl,
Stanislaw Gruszka	6e99891	2014-11-12 16:58:44 +0100	[diff] [blame]	2550
				2551	.update_curr = update_curr_dl,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	2552	};
Wanpeng Li	acb3213	2014-10-31 06:39:33 +0800	[diff] [blame]	2553
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2554	int sched_dl_global_validate(void)
				2555	{
				2556	u64 runtime = global_rt_runtime();
				2557	u64 period = global_rt_period();
				2558	u64 new_bw = to_ratio(period, runtime);
				2559	struct dl_bw *dl_b;
				2560	int cpu, ret = 0;
				2561	unsigned long flags;
				2562
				2563	/*
				2564	* Here we want to check the bandwidth not being set to some
				2565	* value smaller than the currently allocated bandwidth in
				2566	* any of the root_domains.
				2567	*
				2568	* FIXME: Cycling on all the CPUs is overdoing, but simpler than
				2569	* cycling on root_domains... Discussion on different/better
				2570	* solutions is welcome!
				2571	*/
				2572	for_each_possible_cpu(cpu) {
				2573	rcu_read_lock_sched();
				2574	dl_b = dl_bw_of(cpu);
				2575
				2576	raw_spin_lock_irqsave(&dl_b->lock, flags);
				2577	if (new_bw < dl_b->total_bw)
				2578	ret = -EBUSY;
				2579	raw_spin_unlock_irqrestore(&dl_b->lock, flags);
				2580
				2581	rcu_read_unlock_sched();
				2582
				2583	if (ret)
				2584	break;
				2585	}
				2586
				2587	return ret;
				2588	}
				2589
Yu Chen	ba4f7bc	2020-02-28 18:03:29 +0800	[diff] [blame]	2590	static void init_dl_rq_bw_ratio(struct dl_rq *dl_rq)
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2591	{
				2592	if (global_rt_runtime() == RUNTIME_INF) {
				2593	dl_rq->bw_ratio = 1 << RATIO_SHIFT;
				2594	dl_rq->extra_bw = 1 << BW_SHIFT;
				2595	} else {
				2596	dl_rq->bw_ratio = to_ratio(global_rt_runtime(),
				2597	global_rt_period()) >> (BW_SHIFT - RATIO_SHIFT);
				2598	dl_rq->extra_bw = to_ratio(global_rt_period(),
				2599	global_rt_runtime());
				2600	}
				2601	}
				2602
				2603	void sched_dl_do_global(void)
				2604	{
				2605	u64 new_bw = -1;
				2606	struct dl_bw *dl_b;
				2607	int cpu;
				2608	unsigned long flags;
				2609
				2610	def_dl_bandwidth.dl_period = global_rt_period();
				2611	def_dl_bandwidth.dl_runtime = global_rt_runtime();
				2612
				2613	if (global_rt_runtime() != RUNTIME_INF)
				2614	new_bw = to_ratio(global_rt_period(), global_rt_runtime());
				2615
				2616	/*
				2617	* FIXME: As above...
				2618	*/
				2619	for_each_possible_cpu(cpu) {
				2620	rcu_read_lock_sched();
				2621	dl_b = dl_bw_of(cpu);
				2622
				2623	raw_spin_lock_irqsave(&dl_b->lock, flags);
				2624	dl_b->bw = new_bw;
				2625	raw_spin_unlock_irqrestore(&dl_b->lock, flags);
				2626
				2627	rcu_read_unlock_sched();
				2628	init_dl_rq_bw_ratio(&cpu_rq(cpu)->dl);
				2629	}
				2630	}
				2631
				2632	/*
				2633	* We must be sure that accepting a new task (or allowing changing the
				2634	* parameters of an existing one) is consistent with the bandwidth
				2635	* constraints. If yes, this function also accordingly updates the currently
				2636	* allocated bandwidth to reflect the new situation.
				2637	*
				2638	* This function is called while holding p's rq->lock.
				2639	*/
				2640	int sched_dl_overflow(struct task_struct *p, int policy,
				2641	const struct sched_attr *attr)
				2642	{
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2643	u64 period = attr->sched_period ?: attr->sched_deadline;
				2644	u64 runtime = attr->sched_runtime;
				2645	u64 new_bw = dl_policy(policy) ? to_ratio(period, runtime) : 0;
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2646	int cpus, err = -1, cpu = task_cpu(p);
				2647	struct dl_bw *dl_b = dl_bw_of(cpu);
				2648	unsigned long cap;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2649
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	2650	if (attr->sched_flags & SCHED_FLAG_SUGOV)
				2651	return 0;
				2652
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2653	/* !deadline task may carry old deadline bandwidth */
				2654	if (new_bw == p->dl.dl_bw && task_has_dl_policy(p))
				2655	return 0;
				2656
				2657	/*
				2658	* Either if a task, enters, leave, or stays -deadline but changes
				2659	* its parameters, we may need to update accordingly the total
				2660	* allocated bandwidth of the container.
				2661	*/
				2662	raw_spin_lock(&dl_b->lock);
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2663	cpus = dl_bw_cpus(cpu);
				2664	cap = dl_bw_capacity(cpu);
				2665
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2666	if (dl_policy(policy) && !task_has_dl_policy(p) &&
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2667	!__dl_overflow(dl_b, cap, 0, new_bw)) {
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2668	if (hrtimer_active(&p->dl.inactive_timer))
Peter Zijlstra	8c0944ce	2017-09-07 12:09:30 +0200	[diff] [blame]	2669	__dl_sub(dl_b, p->dl.dl_bw, cpus);
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2670	__dl_add(dl_b, new_bw, cpus);
				2671	err = 0;
				2672	} else if (dl_policy(policy) && task_has_dl_policy(p) &&
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2673	!__dl_overflow(dl_b, cap, p->dl.dl_bw, new_bw)) {
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2674	/*
				2675	* XXX this is slightly incorrect: when the task
				2676	* utilization decreases, we should delay the total
				2677	* utilization change until the task's 0-lag point.
				2678	* But this would require to set the task's "inactive
				2679	* timer" when the task is not inactive.
				2680	*/
Peter Zijlstra	8c0944ce	2017-09-07 12:09:30 +0200	[diff] [blame]	2681	__dl_sub(dl_b, p->dl.dl_bw, cpus);
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2682	__dl_add(dl_b, new_bw, cpus);
				2683	dl_change_utilization(p, new_bw);
				2684	err = 0;
				2685	} else if (!dl_policy(policy) && task_has_dl_policy(p)) {
				2686	/*
				2687	* Do not decrease the total deadline utilization here,
				2688	* switched_from_dl() will take care to do it at the correct
				2689	* (0-lag) time.
				2690	*/
				2691	err = 0;
				2692	}
				2693	raw_spin_unlock(&dl_b->lock);
				2694
				2695	return err;
				2696	}
				2697
				2698	/*
				2699	* This function initializes the sched_dl_entity of a newly becoming
				2700	* SCHED_DEADLINE task.
				2701	*
				2702	* Only the static values are considered here, the actual runtime and the
				2703	* absolute deadline will be properly calculated when the task is enqueued
				2704	* for the first time with its new policy.
				2705	*/
				2706	void __setparam_dl(struct task_struct p, const struct sched_attr attr)
				2707	{
				2708	struct sched_dl_entity *dl_se = &p->dl;
				2709
				2710	dl_se->dl_runtime = attr->sched_runtime;
				2711	dl_se->dl_deadline = attr->sched_deadline;
				2712	dl_se->dl_period = attr->sched_period ?: dl_se->dl_deadline;
				2713	dl_se->flags = attr->sched_flags;
				2714	dl_se->dl_bw = to_ratio(dl_se->dl_period, dl_se->dl_runtime);
				2715	dl_se->dl_density = to_ratio(dl_se->dl_deadline, dl_se->dl_runtime);
				2716	}
				2717
				2718	void __getparam_dl(struct task_struct p, struct sched_attr attr)
				2719	{
				2720	struct sched_dl_entity *dl_se = &p->dl;
				2721
				2722	attr->sched_priority = p->rt_priority;
				2723	attr->sched_runtime = dl_se->dl_runtime;
				2724	attr->sched_deadline = dl_se->dl_deadline;
				2725	attr->sched_period = dl_se->dl_period;
				2726	attr->sched_flags = dl_se->flags;
				2727	}
				2728
				2729	/*
Peter Zijlstra	b4098bf	2019-07-26 16:54:10 +0200	[diff] [blame]	2730	* Default limits for DL period; on the top end we guard against small util
				2731	* tasks still getting rediculous long effective runtimes, on the bottom end we
				2732	* guard against timer DoS.
				2733	*/
				2734	unsigned int sysctl_sched_dl_period_max = 1 << 22; /* ~4 seconds */
				2735	unsigned int sysctl_sched_dl_period_min = 100; /* 100 us */
				2736
				2737	/*
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2738	* This function validates the new parameters of a -deadline task.
				2739	* We ask for the deadline not being zero, and greater or equal
				2740	* than the runtime, as well as the period of being zero or
				2741	* greater than deadline. Furthermore, we have to be sure that
				2742	* user parameters are above the internal resolution of 1us (we
				2743	* check sched_runtime only since it is always the smaller one) and
				2744	* below 2^63 ns (we have to check both sched_deadline and
				2745	* sched_period, as the latter can be zero).
				2746	*/
				2747	bool __checkparam_dl(const struct sched_attr *attr)
				2748	{
Peter Zijlstra	b4098bf	2019-07-26 16:54:10 +0200	[diff] [blame]	2749	u64 period, max, min;
				2750
Juri Lelli	794a56e	2017-12-04 11:23:20 +0100	[diff] [blame]	2751	/* special dl tasks don't actually use any parameter */
				2752	if (attr->sched_flags & SCHED_FLAG_SUGOV)
				2753	return true;
				2754
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2755	/* deadline != 0 */
				2756	if (attr->sched_deadline == 0)
				2757	return false;
				2758
				2759	/*
				2760	* Since we truncate DL_SCALE bits, make sure we're at least
				2761	* that big.
				2762	*/
				2763	if (attr->sched_runtime < (1ULL << DL_SCALE))
				2764	return false;
				2765
				2766	/*
				2767	* Since we use the MSB for wrap-around and sign issues, make
				2768	* sure it's not set (mind that period can be equal to zero).
				2769	*/
				2770	if (attr->sched_deadline & (1ULL << 63) \|\|
				2771	attr->sched_period & (1ULL << 63))
				2772	return false;
				2773
Peter Zijlstra	b4098bf	2019-07-26 16:54:10 +0200	[diff] [blame]	2774	period = attr->sched_period;
				2775	if (!period)
				2776	period = attr->sched_deadline;
				2777
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2778	/* runtime <= deadline <= period (if period != 0) */
Peter Zijlstra	b4098bf	2019-07-26 16:54:10 +0200	[diff] [blame]	2779	if (period < attr->sched_deadline \|\|
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2780	attr->sched_deadline < attr->sched_runtime)
				2781	return false;
				2782
Peter Zijlstra	b4098bf	2019-07-26 16:54:10 +0200	[diff] [blame]	2783	max = (u64)READ_ONCE(sysctl_sched_dl_period_max) * NSEC_PER_USEC;
				2784	min = (u64)READ_ONCE(sysctl_sched_dl_period_min) * NSEC_PER_USEC;
				2785
				2786	if (period < min \|\| period > max)
				2787	return false;
				2788
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2789	return true;
				2790	}
				2791
				2792	/*
				2793	* This function clears the sched_dl_entity static params.
				2794	*/
				2795	void __dl_clear_params(struct task_struct *p)
				2796	{
				2797	struct sched_dl_entity *dl_se = &p->dl;
				2798
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2799	dl_se->dl_runtime = 0;
				2800	dl_se->dl_deadline = 0;
				2801	dl_se->dl_period = 0;
				2802	dl_se->flags = 0;
				2803	dl_se->dl_bw = 0;
				2804	dl_se->dl_density = 0;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2805
Juri Lelli	ce9bc3b	2020-06-17 09:29:19 +0200	[diff] [blame]	2806	dl_se->dl_boosted = 0;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2807	dl_se->dl_throttled = 0;
				2808	dl_se->dl_yielded = 0;
				2809	dl_se->dl_non_contending = 0;
				2810	dl_se->dl_overrun = 0;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2811	}
				2812
				2813	bool dl_param_changed(struct task_struct p, const struct sched_attr attr)
				2814	{
				2815	struct sched_dl_entity *dl_se = &p->dl;
				2816
				2817	if (dl_se->dl_runtime != attr->sched_runtime \|\|
				2818	dl_se->dl_deadline != attr->sched_deadline \|\|
				2819	dl_se->dl_period != attr->sched_period \|\|
				2820	dl_se->flags != attr->sched_flags)
				2821	return true;
				2822
				2823	return false;
				2824	}
				2825
				2826	#ifdef CONFIG_SMP
				2827	int dl_task_can_attach(struct task_struct p, const struct cpumask cs_cpus_allowed)
				2828	{
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2829	unsigned long flags, cap;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2830	unsigned int dest_cpu;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2831	struct dl_bw *dl_b;
				2832	bool overflow;
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2833	int ret;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2834
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2835	dest_cpu = cpumask_any_and(cpu_active_mask, cs_cpus_allowed);
				2836
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2837	rcu_read_lock_sched();
				2838	dl_b = dl_bw_of(dest_cpu);
				2839	raw_spin_lock_irqsave(&dl_b->lock, flags);
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2840	cap = dl_bw_capacity(dest_cpu);
				2841	overflow = __dl_overflow(dl_b, cap, 0, p->dl.dl_bw);
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2842	if (overflow) {
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2843	ret = -EBUSY;
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2844	} else {
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2845	/*
				2846	* We reserve space for this task in the destination
				2847	* root_domain, as we can't fail after this point.
				2848	* We will free resources in the source root_domain
				2849	* later on (see set_cpus_allowed_dl()).
				2850	*/
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2851	int cpus = dl_bw_cpus(dest_cpu);
				2852
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2853	__dl_add(dl_b, p->dl.dl_bw, cpus);
				2854	ret = 0;
				2855	}
				2856	raw_spin_unlock_irqrestore(&dl_b->lock, flags);
				2857	rcu_read_unlock_sched();
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2858
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2859	return ret;
				2860	}
				2861
				2862	int dl_cpuset_cpumask_can_shrink(const struct cpumask *cur,
				2863	const struct cpumask *trial)
				2864	{
				2865	int ret = 1, trial_cpus;
				2866	struct dl_bw *cur_dl_b;
				2867	unsigned long flags;
				2868
				2869	rcu_read_lock_sched();
				2870	cur_dl_b = dl_bw_of(cpumask_any(cur));
				2871	trial_cpus = cpumask_weight(trial);
				2872
				2873	raw_spin_lock_irqsave(&cur_dl_b->lock, flags);
				2874	if (cur_dl_b->bw != -1 &&
				2875	cur_dl_b->bw * trial_cpus < cur_dl_b->total_bw)
				2876	ret = 0;
				2877	raw_spin_unlock_irqrestore(&cur_dl_b->lock, flags);
				2878	rcu_read_unlock_sched();
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2879
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2880	return ret;
				2881	}
				2882
				2883	bool dl_cpu_busy(unsigned int cpu)
				2884	{
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2885	unsigned long flags, cap;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2886	struct dl_bw *dl_b;
				2887	bool overflow;
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2888
				2889	rcu_read_lock_sched();
				2890	dl_b = dl_bw_of(cpu);
				2891	raw_spin_lock_irqsave(&dl_b->lock, flags);
Luca Abeni	60ffd5e	2020-05-20 15:42:41 +0200	[diff] [blame]	2892	cap = dl_bw_capacity(cpu);
				2893	overflow = __dl_overflow(dl_b, cap, 0, 0);
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2894	raw_spin_unlock_irqrestore(&dl_b->lock, flags);
				2895	rcu_read_unlock_sched();
Ingo Molnar	97fb7a0	2018-03-03 14:01:12 +0100	[diff] [blame]	2896
Nicolas Pitre	06a76fe	2017-06-21 14:22:01 -0400	[diff] [blame]	2897	return overflow;
				2898	}
				2899	#endif
				2900
Wanpeng Li	acb3213	2014-10-31 06:39:33 +0800	[diff] [blame]	2901	#ifdef CONFIG_SCHED_DEBUG
Wanpeng Li	acb3213	2014-10-31 06:39:33 +0800	[diff] [blame]	2902	void print_dl_stats(struct seq_file *m, int cpu)
				2903	{
				2904	print_dl_rq(m, cpu, &cpu_rq(cpu)->dl);
				2905	}
				2906	#endif /* CONFIG_SCHED_DEBUG */