Blame - kernel/sched/deadline.c - SHIFTPHONES/android_kernel_shift_sdm845

blob: 14bc348ba3b4658466e24d427a34fdbea62e6d64 [file] [log] [blame]

Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1	/*
				2	* Deadline Scheduling Class (SCHED_DEADLINE)
				3	*
				4	* Earliest Deadline First (EDF) + Constant Bandwidth Server (CBS).
				5	*
				6	* Tasks that periodically execute their instances for less than their
				7	* runtime won't miss any of their deadlines.
				8	* Tasks that are not periodic or sporadic or that try to execute more
				9	* than their reserved bandwidth will be slowed down (and may potentially
				10	* miss some of their deadlines), and won't affect any other task.
				11	*
				12	* Copyright (C) 2012 Dario Faggioli <raistlin@linux.it>,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	13	* Juri Lelli <juri.lelli@gmail.com>,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	14	* Michael Trimarchi <michael@amarulasolutions.com>,
				15	* Fabio Checconi <fchecconi@gmail.com>
				16	*/
				17	#include "sched.h"
				18
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	19	#include <linux/slab.h>
				20
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	21	struct dl_bandwidth def_dl_bandwidth;
				22
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	23	static inline struct task_struct dl_task_of(struct sched_dl_entity dl_se)
				24	{
				25	return container_of(dl_se, struct task_struct, dl);
				26	}
				27
				28	static inline struct rq rq_of_dl_rq(struct dl_rq dl_rq)
				29	{
				30	return container_of(dl_rq, struct rq, dl);
				31	}
				32
				33	static inline struct dl_rq dl_rq_of_se(struct sched_dl_entity dl_se)
				34	{
				35	struct task_struct *p = dl_task_of(dl_se);
				36	struct rq *rq = task_rq(p);
				37
				38	return &rq->dl;
				39	}
				40
				41	static inline int on_dl_rq(struct sched_dl_entity *dl_se)
				42	{
				43	return !RB_EMPTY_NODE(&dl_se->rb_node);
				44	}
				45
				46	static inline int is_leftmost(struct task_struct p, struct dl_rq dl_rq)
				47	{
				48	struct sched_dl_entity *dl_se = &p->dl;
				49
				50	return dl_rq->rb_leftmost == &dl_se->rb_node;
				51	}
				52
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	53	void init_dl_bandwidth(struct dl_bandwidth *dl_b, u64 period, u64 runtime)
				54	{
				55	raw_spin_lock_init(&dl_b->dl_runtime_lock);
				56	dl_b->dl_period = period;
				57	dl_b->dl_runtime = runtime;
				58	}
				59
				60	extern unsigned long to_ratio(u64 period, u64 runtime);
				61
				62	void init_dl_bw(struct dl_bw *dl_b)
				63	{
				64	raw_spin_lock_init(&dl_b->lock);
				65	raw_spin_lock(&def_dl_bandwidth.dl_runtime_lock);
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	66	if (global_rt_runtime() == RUNTIME_INF)
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	67	dl_b->bw = -1;
				68	else
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	69	dl_b->bw = to_ratio(global_rt_period(), global_rt_runtime());
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	70	raw_spin_unlock(&def_dl_bandwidth.dl_runtime_lock);
				71	dl_b->total_bw = 0;
				72	}
				73
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	74	void init_dl_rq(struct dl_rq dl_rq, struct rq rq)
				75	{
				76	dl_rq->rb_root = RB_ROOT;
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	77
				78	#ifdef CONFIG_SMP
				79	/* zero means no -deadline tasks */
				80	dl_rq->earliest_dl.curr = dl_rq->earliest_dl.next = 0;
				81
				82	dl_rq->dl_nr_migratory = 0;
				83	dl_rq->overloaded = 0;
				84	dl_rq->pushable_dl_tasks_root = RB_ROOT;
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	85	#else
				86	init_dl_bw(&dl_rq->dl_bw);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	87	#endif
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	88	}
				89
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	90	#ifdef CONFIG_SMP
				91
				92	static inline int dl_overloaded(struct rq *rq)
				93	{
				94	return atomic_read(&rq->rd->dlo_count);
				95	}
				96
				97	static inline void dl_set_overload(struct rq *rq)
				98	{
				99	if (!rq->online)
				100	return;
				101
				102	cpumask_set_cpu(rq->cpu, rq->rd->dlo_mask);
				103	/*
				104	* Must be visible before the overload count is
				105	* set (as in sched_rt.c).
				106	*
				107	* Matched by the barrier in pull_dl_task().
				108	*/
				109	smp_wmb();
				110	atomic_inc(&rq->rd->dlo_count);
				111	}
				112
				113	static inline void dl_clear_overload(struct rq *rq)
				114	{
				115	if (!rq->online)
				116	return;
				117
				118	atomic_dec(&rq->rd->dlo_count);
				119	cpumask_clear_cpu(rq->cpu, rq->rd->dlo_mask);
				120	}
				121
				122	static void update_dl_migration(struct dl_rq *dl_rq)
				123	{
Kirill Tkhai	995b9ea	2014-02-18 02:24:13 +0400	[diff] [blame]	124	if (dl_rq->dl_nr_migratory && dl_rq->dl_nr_running > 1) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	125	if (!dl_rq->overloaded) {
				126	dl_set_overload(rq_of_dl_rq(dl_rq));
				127	dl_rq->overloaded = 1;
				128	}
				129	} else if (dl_rq->overloaded) {
				130	dl_clear_overload(rq_of_dl_rq(dl_rq));
				131	dl_rq->overloaded = 0;
				132	}
				133	}
				134
				135	static void inc_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				136	{
				137	struct task_struct *p = dl_task_of(dl_se);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	138
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	139	if (p->nr_cpus_allowed > 1)
				140	dl_rq->dl_nr_migratory++;
				141
				142	update_dl_migration(dl_rq);
				143	}
				144
				145	static void dec_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				146	{
				147	struct task_struct *p = dl_task_of(dl_se);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	148
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	149	if (p->nr_cpus_allowed > 1)
				150	dl_rq->dl_nr_migratory--;
				151
				152	update_dl_migration(dl_rq);
				153	}
				154
				155	/*
				156	* The list of pushable -deadline task is not a plist, like in
				157	* sched_rt.c, it is an rb-tree with tasks ordered by deadline.
				158	*/
				159	static void enqueue_pushable_dl_task(struct rq rq, struct task_struct p)
				160	{
				161	struct dl_rq *dl_rq = &rq->dl;
				162	struct rb_node **link = &dl_rq->pushable_dl_tasks_root.rb_node;
				163	struct rb_node *parent = NULL;
				164	struct task_struct *entry;
				165	int leftmost = 1;
				166
				167	BUG_ON(!RB_EMPTY_NODE(&p->pushable_dl_tasks));
				168
				169	while (*link) {
				170	parent = *link;
				171	entry = rb_entry(parent, struct task_struct,
				172	pushable_dl_tasks);
				173	if (dl_entity_preempt(&p->dl, &entry->dl))
				174	link = &parent->rb_left;
				175	else {
				176	link = &parent->rb_right;
				177	leftmost = 0;
				178	}
				179	}
				180
				181	if (leftmost)
				182	dl_rq->pushable_dl_tasks_leftmost = &p->pushable_dl_tasks;
				183
				184	rb_link_node(&p->pushable_dl_tasks, parent, link);
				185	rb_insert_color(&p->pushable_dl_tasks, &dl_rq->pushable_dl_tasks_root);
				186	}
				187
				188	static void dequeue_pushable_dl_task(struct rq rq, struct task_struct p)
				189	{
				190	struct dl_rq *dl_rq = &rq->dl;
				191
				192	if (RB_EMPTY_NODE(&p->pushable_dl_tasks))
				193	return;
				194
				195	if (dl_rq->pushable_dl_tasks_leftmost == &p->pushable_dl_tasks) {
				196	struct rb_node *next_node;
				197
				198	next_node = rb_next(&p->pushable_dl_tasks);
				199	dl_rq->pushable_dl_tasks_leftmost = next_node;
				200	}
				201
				202	rb_erase(&p->pushable_dl_tasks, &dl_rq->pushable_dl_tasks_root);
				203	RB_CLEAR_NODE(&p->pushable_dl_tasks);
				204	}
				205
				206	static inline int has_pushable_dl_tasks(struct rq *rq)
				207	{
				208	return !RB_EMPTY_ROOT(&rq->dl.pushable_dl_tasks_root);
				209	}
				210
				211	static int push_dl_task(struct rq *rq);
				212
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	213	static inline bool need_pull_dl_task(struct rq rq, struct task_struct prev)
				214	{
				215	return dl_task(prev);
				216	}
				217
				218	static inline void set_post_schedule(struct rq *rq)
				219	{
				220	rq->post_schedule = has_pushable_dl_tasks(rq);
				221	}
				222
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	223	#else
				224
				225	static inline
				226	void enqueue_pushable_dl_task(struct rq rq, struct task_struct p)
				227	{
				228	}
				229
				230	static inline
				231	void dequeue_pushable_dl_task(struct rq rq, struct task_struct p)
				232	{
				233	}
				234
				235	static inline
				236	void inc_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				237	{
				238	}
				239
				240	static inline
				241	void dec_dl_migration(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				242	{
				243	}
				244
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	245	static inline bool need_pull_dl_task(struct rq rq, struct task_struct prev)
				246	{
				247	return false;
				248	}
				249
				250	static inline int pull_dl_task(struct rq *rq)
				251	{
				252	return 0;
				253	}
				254
				255	static inline void set_post_schedule(struct rq *rq)
				256	{
				257	}
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	258	#endif /* CONFIG_SMP */
				259
/*
 * Forward declarations of static helpers that are used below before
 * their definitions. @rq and @p are pointers.
 */
static void enqueue_task_dl(struct rq *rq, struct task_struct *p, int flags);
static void __dequeue_task_dl(struct rq *rq, struct task_struct *p, int flags);
static void check_preempt_curr_dl(struct rq *rq, struct task_struct *p,
				  int flags);
				264
				265	/*
				266	* We are being explicitly informed that a new instance is starting,
				267	* and this means that:
				268	* - the absolute deadline of the entity has to be placed at
				269	* current time + relative deadline;
				270	* - the runtime of the entity has to be set to the maximum value.
				271	*
				272	* The capability of specifying such event is useful whenever a -deadline
				273	* entity wants to (try to!) synchronize its behaviour with the scheduler's
				274	* one, and to (try to!) reconcile itself with its own scheduling
				275	* parameters.
				276	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	277	static inline void setup_new_dl_entity(struct sched_dl_entity *dl_se,
				278	struct sched_dl_entity *pi_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	279	{
				280	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				281	struct rq *rq = rq_of_dl_rq(dl_rq);
				282
				283	WARN_ON(!dl_se->dl_new \|\| dl_se->dl_throttled);
				284
				285	/*
				286	* We use the regular wall clock time to set deadlines in the
				287	* future; in fact, we must consider execution overheads (time
				288	* spent on hardirq context, etc.).
				289	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	290	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				291	dl_se->runtime = pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	292	dl_se->dl_new = 0;
				293	}
				294
				295	/*
				296	* Pure Earliest Deadline First (EDF) scheduling does not deal with the
				297	* possibility of a entity lasting more than what it declared, and thus
				298	* exhausting its runtime.
				299	*
				300	* Here we are interested in making runtime overrun possible, but we do
				301	* not want a entity which is misbehaving to affect the scheduling of all
				302	* other entities.
				303	* Therefore, a budgeting strategy called Constant Bandwidth Server (CBS)
				304	* is used, in order to confine each entity within its own bandwidth.
				305	*
				306	* This function deals exactly with that, and ensures that when the runtime
				307	* of a entity is replenished, its deadline is also postponed. That ensures
				308	* the overrunning entity can't interfere with other entity in the system and
				309	* can't make them miss their deadlines. Reasons why this kind of overruns
				310	* could happen are, typically, a entity voluntarily trying to overcome its
				311	* runtime, or it just underestimated it during sched_setscheduler_ex().
				312	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	313	static void replenish_dl_entity(struct sched_dl_entity *dl_se,
				314	struct sched_dl_entity *pi_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	315	{
				316	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				317	struct rq *rq = rq_of_dl_rq(dl_rq);
				318
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	319	BUG_ON(pi_se->dl_runtime <= 0);
				320
				321	/*
				322	* This could be the case for a !-dl task that is boosted.
				323	* Just go with full inherited parameters.
				324	*/
				325	if (dl_se->dl_deadline == 0) {
				326	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				327	dl_se->runtime = pi_se->dl_runtime;
				328	}
				329
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	330	/*
				331	* We keep moving the deadline away until we get some
				332	* available runtime for the entity. This ensures correct
				333	* handling of situations where the runtime overrun is
				334	* arbitrary large.
				335	*/
				336	while (dl_se->runtime <= 0) {
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	337	dl_se->deadline += pi_se->dl_period;
				338	dl_se->runtime += pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	339	}
				340
				341	/*
				342	* At this point, the deadline really should be "in
				343	* the future" with respect to rq->clock. If it's
				344	* not, we are, for some reason, lagging too much!
				345	* Anyway, after having warn userspace abut that,
				346	* we still try to keep the things running by
				347	* resetting the deadline and the budget of the
				348	* entity.
				349	*/
				350	if (dl_time_before(dl_se->deadline, rq_clock(rq))) {
				351	static bool lag_once = false;
				352
				353	if (!lag_once) {
				354	lag_once = true;
				355	printk_sched("sched: DL replenish lagged to much\n");
				356	}
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	357	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				358	dl_se->runtime = pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	359	}
				360	}
				361
				362	/*
				363	* Here we check if --at time t-- an entity (which is probably being
				364	* [re]activated or, in general, enqueued) can use its remaining runtime
				365	* and its current deadline _without_ exceeding the bandwidth it is
				366	* assigned (function returns true if it can't). We are in fact applying
				367	* one of the CBS rules: when a task wakes up, if the residual runtime
				368	* over residual deadline fits within the allocated bandwidth, then we
				369	* can keep the current (absolute) deadline and residual budget without
				370	* disrupting the schedulability of the system. Otherwise, we should
				371	* refill the runtime and set the deadline a period in the future,
				372	* because keeping the current (absolute) deadline of the task would
Dario Faggioli	712e5e3	2014-01-27 12:20:15 +0100	[diff] [blame]	373	* result in breaking guarantees promised to other tasks (refer to
				374	* Documentation/scheduler/sched-deadline.txt for more informations).
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	375	*
				376	* This function returns true if:
				377	*
Harald Gustafsson	755378a	2013-11-07 14:43:40 +0100	[diff] [blame]	378	* runtime / (deadline - t) > dl_runtime / dl_period ,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	379	*
				380	* IOW we can't recycle current parameters.
Harald Gustafsson	755378a	2013-11-07 14:43:40 +0100	[diff] [blame]	381	*
				382	* Notice that the bandwidth check is done against the period. For
				383	* task with deadline equal to period this is the same of using
				384	* dl_deadline instead of dl_period in the equation above.
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	385	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	386	static bool dl_entity_overflow(struct sched_dl_entity *dl_se,
				387	struct sched_dl_entity *pi_se, u64 t)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	388	{
				389	u64 left, right;
				390
				391	/*
				392	* left and right are the two sides of the equation above,
				393	* after a bit of shuffling to use multiplications instead
				394	* of divisions.
				395	*
				396	* Note that none of the time values involved in the two
				397	* multiplications are absolute: dl_deadline and dl_runtime
				398	* are the relative deadline and the maximum runtime of each
				399	* instance, runtime is the runtime left for the last instance
				400	* and (deadline - t), since t is rq->clock, is the time left
				401	* to the (absolute) deadline. Even if overflowing the u64 type
				402	* is very unlikely to occur in both cases, here we scale down
				403	* as we want to avoid that risk at all. Scaling down by 10
				404	* means that we reduce granularity to 1us. We are fine with it,
				405	* since this is only a true/false check and, anyway, thinking
				406	* of anything below microseconds resolution is actually fiction
				407	* (but still we want to give the user that illusion >;).
				408	*/
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	409	left = (pi_se->dl_period >> DL_SCALE) * (dl_se->runtime >> DL_SCALE);
				410	right = ((dl_se->deadline - t) >> DL_SCALE) *
				411	(pi_se->dl_runtime >> DL_SCALE);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	412
				413	return dl_time_before(right, left);
				414	}
				415
				416	/*
				417	* When a -deadline entity is queued back on the runqueue, its runtime and
				418	* deadline might need updating.
				419	*
				420	* The policy here is that we update the deadline of the entity only if:
				421	* - the current deadline is in the past,
				422	* - using the remaining runtime with the current deadline would make
				423	* the entity exceed its bandwidth.
				424	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	425	static void update_dl_entity(struct sched_dl_entity *dl_se,
				426	struct sched_dl_entity *pi_se)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	427	{
				428	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				429	struct rq *rq = rq_of_dl_rq(dl_rq);
				430
				431	/*
				432	* The arrival of a new instance needs special treatment, i.e.,
				433	* the actual scheduling parameters have to be "renewed".
				434	*/
				435	if (dl_se->dl_new) {
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	436	setup_new_dl_entity(dl_se, pi_se);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	437	return;
				438	}
				439
				440	if (dl_time_before(dl_se->deadline, rq_clock(rq)) \|\|
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	441	dl_entity_overflow(dl_se, pi_se, rq_clock(rq))) {
				442	dl_se->deadline = rq_clock(rq) + pi_se->dl_deadline;
				443	dl_se->runtime = pi_se->dl_runtime;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	444	}
				445	}
				446
				447	/*
				448	* If the entity depleted all its runtime, and if we want it to sleep
				449	* while waiting for some new execution time to become available, we
				450	* set the bandwidth enforcement timer to the replenishment instant
				451	* and try to activate it.
				452	*
				453	* Notice that it is important for the caller to know if the timer
				454	* actually started or not (i.e., the replenishment instant is in
				455	* the future or in the past).
				456	*/
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	457	static int start_dl_timer(struct sched_dl_entity *dl_se, bool boosted)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	458	{
				459	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				460	struct rq *rq = rq_of_dl_rq(dl_rq);
				461	ktime_t now, act;
				462	ktime_t soft, hard;
				463	unsigned long range;
				464	s64 delta;
				465
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	466	if (boosted)
				467	return 0;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	468	/*
				469	* We want the timer to fire at the deadline, but considering
				470	* that it is actually coming from rq->clock and not from
				471	* hrtimer's time base reading.
				472	*/
				473	act = ns_to_ktime(dl_se->deadline);
				474	now = hrtimer_cb_get_time(&dl_se->dl_timer);
				475	delta = ktime_to_ns(now) - rq_clock(rq);
				476	act = ktime_add_ns(act, delta);
				477
				478	/*
				479	* If the expiry time already passed, e.g., because the value
				480	* chosen as the deadline is too small, don't even try to
				481	* start the timer in the past!
				482	*/
				483	if (ktime_us_delta(act, now) < 0)
				484	return 0;
				485
				486	hrtimer_set_expires(&dl_se->dl_timer, act);
				487
				488	soft = hrtimer_get_softexpires(&dl_se->dl_timer);
				489	hard = hrtimer_get_expires(&dl_se->dl_timer);
				490	range = ktime_to_ns(ktime_sub(hard, soft));
				491	__hrtimer_start_range_ns(&dl_se->dl_timer, soft,
				492	range, HRTIMER_MODE_ABS, 0);
				493
				494	return hrtimer_active(&dl_se->dl_timer);
				495	}
				496
				497	/*
				498	* This is the bandwidth enforcement timer callback. If here, we know
				499	* a task is not on its dl_rq, since the fact that the timer was running
				500	* means the task is throttled and needs a runtime replenishment.
				501	*
				502	* However, what we actually do depends on the fact the task is active,
				503	* (it is on its rq) or has been removed from there by a call to
				504	* dequeue_task_dl(). In the former case we must issue the runtime
				505	* replenishment and add the task back to the dl_rq; in the latter, we just
				506	* do nothing but clearing dl_throttled, so that runtime and deadline
				507	* updating (and the queueing back to dl_rq) will be done by the
				508	* next call to enqueue_task_dl().
				509	*/
				510	static enum hrtimer_restart dl_task_timer(struct hrtimer *timer)
				511	{
				512	struct sched_dl_entity *dl_se = container_of(timer,
				513	struct sched_dl_entity,
				514	dl_timer);
				515	struct task_struct *p = dl_task_of(dl_se);
Kirill Tkhai	0f397f2	2014-05-20 13:33:42 +0400	[diff] [blame^]	516	struct rq *rq;
				517	again:
				518	rq = task_rq(p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	519	raw_spin_lock(&rq->lock);
				520
Kirill Tkhai	0f397f2	2014-05-20 13:33:42 +0400	[diff] [blame^]	521	if (rq != task_rq(p)) {
				522	/* Task was moved, retrying. */
				523	raw_spin_unlock(&rq->lock);
				524	goto again;
				525	}
				526
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	527	/*
				528	* We need to take care of a possible races here. In fact, the
				529	* task might have changed its scheduling policy to something
				530	* different from SCHED_DEADLINE or changed its reservation
				531	* parameters (through sched_setscheduler()).
				532	*/
				533	if (!dl_task(p) \|\| dl_se->dl_new)
				534	goto unlock;
				535
				536	sched_clock_tick();
				537	update_rq_clock(rq);
				538	dl_se->dl_throttled = 0;
Juri Lelli	5bfd126	2014-04-15 13:49:04 +0200	[diff] [blame]	539	dl_se->dl_yielded = 0;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	540	if (p->on_rq) {
				541	enqueue_task_dl(rq, p, ENQUEUE_REPLENISH);
				542	if (task_has_dl_policy(rq->curr))
				543	check_preempt_curr_dl(rq, p, 0);
				544	else
				545	resched_task(rq->curr);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	546	#ifdef CONFIG_SMP
				547	/*
				548	* Queueing this task back might have overloaded rq,
				549	* check if we need to kick someone away.
				550	*/
				551	if (has_pushable_dl_tasks(rq))
				552	push_dl_task(rq);
				553	#endif
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	554	}
				555	unlock:
				556	raw_spin_unlock(&rq->lock);
				557
				558	return HRTIMER_NORESTART;
				559	}
				560
				561	void init_dl_task_timer(struct sched_dl_entity *dl_se)
				562	{
				563	struct hrtimer *timer = &dl_se->dl_timer;
				564
				565	if (hrtimer_active(timer)) {
				566	hrtimer_try_to_cancel(timer);
				567	return;
				568	}
				569
				570	hrtimer_init(timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
				571	timer->function = dl_task_timer;
				572	}
				573
				574	static
				575	int dl_runtime_exceeded(struct rq rq, struct sched_dl_entity dl_se)
				576	{
				577	int dmiss = dl_time_before(dl_se->deadline, rq_clock(rq));
				578	int rorun = dl_se->runtime <= 0;
				579
				580	if (!rorun && !dmiss)
				581	return 0;
				582
				583	/*
				584	* If we are beyond our current deadline and we are still
				585	* executing, then we have already used some of the runtime of
				586	* the next instance. Thus, if we do not account that, we are
				587	* stealing bandwidth from the system at each deadline miss!
				588	*/
				589	if (dmiss) {
				590	dl_se->runtime = rorun ? dl_se->runtime : 0;
				591	dl_se->runtime -= rq_clock(rq) - dl_se->deadline;
				592	}
				593
				594	return 1;
				595	}
				596
Juri Lelli	faa5993	2014-02-21 11:37:15 +0100	[diff] [blame]	597	extern bool sched_rt_bandwidth_account(struct rt_rq *rt_rq);
				598
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	599	/*
				600	* Update the current task's runtime statistics (provided it is still
				601	* a -deadline task and has not been removed from the dl_rq).
				602	*/
				603	static void update_curr_dl(struct rq *rq)
				604	{
				605	struct task_struct *curr = rq->curr;
				606	struct sched_dl_entity *dl_se = &curr->dl;
				607	u64 delta_exec;
				608
				609	if (!dl_task(curr) \|\| !on_dl_rq(dl_se))
				610	return;
				611
				612	/*
				613	* Consumed budget is computed considering the time as
				614	* observed by schedulable tasks (excluding time spent
				615	* in hardirq context, etc.). Deadlines are instead
				616	* computed using hard walltime. This seems to be the more
				617	* natural solution, but the full ramifications of this
				618	* approach need further study.
				619	*/
				620	delta_exec = rq_clock_task(rq) - curr->se.exec_start;
Kirill Tkhai	734ff2a	2014-03-04 19:25:46 +0400	[diff] [blame]	621	if (unlikely((s64)delta_exec <= 0))
				622	return;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	623
				624	schedstat_set(curr->se.statistics.exec_max,
				625	max(curr->se.statistics.exec_max, delta_exec));
				626
				627	curr->se.sum_exec_runtime += delta_exec;
				628	account_group_exec_runtime(curr, delta_exec);
				629
				630	curr->se.exec_start = rq_clock_task(rq);
				631	cpuacct_charge(curr, delta_exec);
				632
Dario Faggioli	239be4a	2013-11-07 14:43:39 +0100	[diff] [blame]	633	sched_rt_avg_update(rq, delta_exec);
				634
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	635	dl_se->runtime -= delta_exec;
				636	if (dl_runtime_exceeded(rq, dl_se)) {
				637	__dequeue_task_dl(rq, curr, 0);
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	638	if (likely(start_dl_timer(dl_se, curr->dl.dl_boosted)))
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	639	dl_se->dl_throttled = 1;
				640	else
				641	enqueue_task_dl(rq, curr, ENQUEUE_REPLENISH);
				642
				643	if (!is_leftmost(curr, &rq->dl))
				644	resched_task(curr);
				645	}
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	646
				647	/*
				648	* Because -- for now -- we share the rt bandwidth, we need to
				649	* account our runtime there too, otherwise actual rt tasks
				650	* would be able to exceed the shared quota.
				651	*
				652	* Account to the root rt group for now.
				653	*
				654	* The solution we're working towards is having the RT groups scheduled
				655	* using deadline servers -- however there's a few nasties to figure
				656	* out before that can happen.
				657	*/
				658	if (rt_bandwidth_enabled()) {
				659	struct rt_rq *rt_rq = &rq->rt;
				660
				661	raw_spin_lock(&rt_rq->rt_runtime_lock);
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	662	/*
				663	* We'll let actual RT tasks worry about the overflow here, we
Juri Lelli	faa5993	2014-02-21 11:37:15 +0100	[diff] [blame]	664	* have our own CBS to keep us inline; only account when RT
				665	* bandwidth is relevant.
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	666	*/
Juri Lelli	faa5993	2014-02-21 11:37:15 +0100	[diff] [blame]	667	if (sched_rt_bandwidth_account(rt_rq))
				668	rt_rq->rt_time += delta_exec;
Peter Zijlstra	1724813	2013-12-17 12:44:49 +0100	[diff] [blame]	669	raw_spin_unlock(&rt_rq->rt_runtime_lock);
				670	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	671	}
				672
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	673	#ifdef CONFIG_SMP
				674
				675	static struct task_struct pick_next_earliest_dl_task(struct rq rq, int cpu);
				676
				677	static inline u64 next_deadline(struct rq *rq)
				678	{
				679	struct task_struct *next = pick_next_earliest_dl_task(rq, rq->cpu);
				680
				681	if (next && dl_prio(next->prio))
				682	return next->dl.deadline;
				683	else
				684	return 0;
				685	}
				686
				687	static void inc_dl_deadline(struct dl_rq *dl_rq, u64 deadline)
				688	{
				689	struct rq *rq = rq_of_dl_rq(dl_rq);
				690
				691	if (dl_rq->earliest_dl.curr == 0 \|\|
				692	dl_time_before(deadline, dl_rq->earliest_dl.curr)) {
				693	/*
				694	* If the dl_rq had no -deadline tasks, or if the new task
				695	* has shorter deadline than the current one on dl_rq, we
				696	* know that the previous earliest becomes our next earliest,
				697	* as the new task becomes the earliest itself.
				698	*/
				699	dl_rq->earliest_dl.next = dl_rq->earliest_dl.curr;
				700	dl_rq->earliest_dl.curr = deadline;
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	701	cpudl_set(&rq->rd->cpudl, rq->cpu, deadline, 1);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	702	} else if (dl_rq->earliest_dl.next == 0 \|\|
				703	dl_time_before(deadline, dl_rq->earliest_dl.next)) {
				704	/*
				705	* On the other hand, if the new -deadline task has a
				706	* a later deadline than the earliest one on dl_rq, but
				707	* it is earlier than the next (if any), we must
				708	* recompute the next-earliest.
				709	*/
				710	dl_rq->earliest_dl.next = next_deadline(rq);
				711	}
				712	}
				713
				714	static void dec_dl_deadline(struct dl_rq *dl_rq, u64 deadline)
				715	{
				716	struct rq *rq = rq_of_dl_rq(dl_rq);
				717
				718	/*
				719	* Since we may have removed our earliest (and/or next earliest)
				720	* task we must recompute them.
				721	*/
				722	if (!dl_rq->dl_nr_running) {
				723	dl_rq->earliest_dl.curr = 0;
				724	dl_rq->earliest_dl.next = 0;
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	725	cpudl_set(&rq->rd->cpudl, rq->cpu, 0, 0);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	726	} else {
				727	struct rb_node *leftmost = dl_rq->rb_leftmost;
				728	struct sched_dl_entity *entry;
				729
				730	entry = rb_entry(leftmost, struct sched_dl_entity, rb_node);
				731	dl_rq->earliest_dl.curr = entry->deadline;
				732	dl_rq->earliest_dl.next = next_deadline(rq);
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	733	cpudl_set(&rq->rd->cpudl, rq->cpu, entry->deadline, 1);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	734	}
				735	}
				736
				737	#else
				738
				739	static inline void inc_dl_deadline(struct dl_rq *dl_rq, u64 deadline) {}
				740	static inline void dec_dl_deadline(struct dl_rq *dl_rq, u64 deadline) {}
				741
				742	#endif /* CONFIG_SMP */
				743
				744	static inline
				745	void inc_dl_tasks(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				746	{
				747	int prio = dl_task_of(dl_se)->prio;
				748	u64 deadline = dl_se->deadline;
				749
				750	WARN_ON(!dl_prio(prio));
				751	dl_rq->dl_nr_running++;
Juri Lelli	3d5f35b	2014-02-20 09:19:39 +0100	[diff] [blame]	752	inc_nr_running(rq_of_dl_rq(dl_rq));
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	753
				754	inc_dl_deadline(dl_rq, deadline);
				755	inc_dl_migration(dl_se, dl_rq);
				756	}
				757
				758	static inline
				759	void dec_dl_tasks(struct sched_dl_entity dl_se, struct dl_rq dl_rq)
				760	{
				761	int prio = dl_task_of(dl_se)->prio;
				762
				763	WARN_ON(!dl_prio(prio));
				764	WARN_ON(!dl_rq->dl_nr_running);
				765	dl_rq->dl_nr_running--;
Juri Lelli	3d5f35b	2014-02-20 09:19:39 +0100	[diff] [blame]	766	dec_nr_running(rq_of_dl_rq(dl_rq));
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	767
				768	dec_dl_deadline(dl_rq, dl_se->deadline);
				769	dec_dl_migration(dl_se, dl_rq);
				770	}
				771
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	772	static void __enqueue_dl_entity(struct sched_dl_entity *dl_se)
				773	{
				774	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				775	struct rb_node **link = &dl_rq->rb_root.rb_node;
				776	struct rb_node *parent = NULL;
				777	struct sched_dl_entity *entry;
				778	int leftmost = 1;
				779
				780	BUG_ON(!RB_EMPTY_NODE(&dl_se->rb_node));
				781
				782	while (*link) {
				783	parent = *link;
				784	entry = rb_entry(parent, struct sched_dl_entity, rb_node);
				785	if (dl_time_before(dl_se->deadline, entry->deadline))
				786	link = &parent->rb_left;
				787	else {
				788	link = &parent->rb_right;
				789	leftmost = 0;
				790	}
				791	}
				792
				793	if (leftmost)
				794	dl_rq->rb_leftmost = &dl_se->rb_node;
				795
				796	rb_link_node(&dl_se->rb_node, parent, link);
				797	rb_insert_color(&dl_se->rb_node, &dl_rq->rb_root);
				798
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	799	inc_dl_tasks(dl_se, dl_rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	800	}
				801
				802	static void __dequeue_dl_entity(struct sched_dl_entity *dl_se)
				803	{
				804	struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
				805
				806	if (RB_EMPTY_NODE(&dl_se->rb_node))
				807	return;
				808
				809	if (dl_rq->rb_leftmost == &dl_se->rb_node) {
				810	struct rb_node *next_node;
				811
				812	next_node = rb_next(&dl_se->rb_node);
				813	dl_rq->rb_leftmost = next_node;
				814	}
				815
				816	rb_erase(&dl_se->rb_node, &dl_rq->rb_root);
				817	RB_CLEAR_NODE(&dl_se->rb_node);
				818
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	819	dec_dl_tasks(dl_se, dl_rq);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	820	}
				821
				822	static void
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	823	enqueue_dl_entity(struct sched_dl_entity *dl_se,
				824	struct sched_dl_entity *pi_se, int flags)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	825	{
				826	BUG_ON(on_dl_rq(dl_se));
				827
				828	/*
				829	* If this is a wakeup or a new instance, the scheduling
				830	* parameters of the task might need updating. Otherwise,
				831	* we want a replenishment of its runtime.
				832	*/
				833	if (!dl_se->dl_new && flags & ENQUEUE_REPLENISH)
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	834	replenish_dl_entity(dl_se, pi_se);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	835	else
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	836	update_dl_entity(dl_se, pi_se);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	837
				838	__enqueue_dl_entity(dl_se);
				839	}
				840
				841	static void dequeue_dl_entity(struct sched_dl_entity *dl_se)
				842	{
				843	__dequeue_dl_entity(dl_se);
				844	}
				845
				846	static void enqueue_task_dl(struct rq rq, struct task_struct p, int flags)
				847	{
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	848	struct task_struct *pi_task = rt_mutex_get_top_task(p);
				849	struct sched_dl_entity *pi_se = &p->dl;
				850
				851	/*
				852	* Use the scheduling parameters of the top pi-waiter
				853	* task if we have one and its (relative) deadline is
				854	* smaller than our one... OTW we keep our runtime and
				855	* deadline.
				856	*/
				857	if (pi_task && p->dl.dl_boosted && dl_prio(pi_task->normal_prio))
				858	pi_se = &pi_task->dl;
				859
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	860	/*
				861	* If p is throttled, we do nothing. In fact, if it exhausted
				862	* its budget it needs a replenishment and, since it now is on
				863	* its rq, the bandwidth timer callback (which clearly has not
				864	* run yet) will take care of this.
				865	*/
				866	if (p->dl.dl_throttled)
				867	return;
				868
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	869	enqueue_dl_entity(&p->dl, pi_se, flags);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	870
				871	if (!task_current(rq, p) && p->nr_cpus_allowed > 1)
				872	enqueue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	873	}
				874
				875	static void __dequeue_task_dl(struct rq rq, struct task_struct p, int flags)
				876	{
				877	dequeue_dl_entity(&p->dl);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	878	dequeue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	879	}
				880
				881	static void dequeue_task_dl(struct rq rq, struct task_struct p, int flags)
				882	{
				883	update_curr_dl(rq);
				884	__dequeue_task_dl(rq, p, flags);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	885	}
				886
				887	/*
				888	* Yield task semantic for -deadline tasks is:
				889	*
				890	* get off from the CPU until our next instance, with
				891	* a new runtime. This is of little use now, since we
				892	* don't have a bandwidth reclaiming mechanism. Anyway,
				893	* bandwidth reclaiming is planned for the future, and
				894	* yield_task_dl will indicate that some spare budget
				895	* is available for other task instances to use it.
				896	*/
				897	static void yield_task_dl(struct rq *rq)
				898	{
				899	struct task_struct *p = rq->curr;
				900
				901	/*
				902	* We make the task go to sleep until its current deadline by
				903	* forcing its runtime to zero. This way, update_curr_dl() stops
				904	* it and the bandwidth timer will wake it up and will give it
Juri Lelli	5bfd126	2014-04-15 13:49:04 +0200	[diff] [blame]	905	* new scheduling parameters (thanks to dl_yielded=1).
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	906	*/
				907	if (p->dl.runtime > 0) {
Juri Lelli	5bfd126	2014-04-15 13:49:04 +0200	[diff] [blame]	908	rq->curr->dl.dl_yielded = 1;
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	909	p->dl.runtime = 0;
				910	}
				911	update_curr_dl(rq);
				912	}
				913
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	914	#ifdef CONFIG_SMP
				915
				916	static int find_later_rq(struct task_struct *task);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	917
				918	static int
				919	select_task_rq_dl(struct task_struct *p, int cpu, int sd_flag, int flags)
				920	{
				921	struct task_struct *curr;
				922	struct rq *rq;
				923
				924	if (sd_flag != SD_BALANCE_WAKE && sd_flag != SD_BALANCE_FORK)
				925	goto out;
				926
				927	rq = cpu_rq(cpu);
				928
				929	rcu_read_lock();
				930	curr = ACCESS_ONCE(rq->curr); /* unlocked access */
				931
				932	/*
				933	* If we are dealing with a -deadline task, we must
				934	* decide where to wake it up.
				935	* If it has a later deadline and the current task
				936	* on this rq can't move (provided the waking task
				937	* can!) we prefer to send it somewhere else. On the
				938	* other hand, if it has a shorter deadline, we
				939	* try to make it stay here, it might be important.
				940	*/
				941	if (unlikely(dl_task(curr)) &&
				942	(curr->nr_cpus_allowed < 2 \|\|
				943	!dl_entity_preempt(&p->dl, &curr->dl)) &&
				944	(p->nr_cpus_allowed > 1)) {
				945	int target = find_later_rq(p);
				946
				947	if (target != -1)
				948	cpu = target;
				949	}
				950	rcu_read_unlock();
				951
				952	out:
				953	return cpu;
				954	}
				955
				956	static void check_preempt_equal_dl(struct rq rq, struct task_struct p)
				957	{
				958	/*
				959	* Current can't be migrated, useless to reschedule,
				960	* let's hope p can move out.
				961	*/
				962	if (rq->curr->nr_cpus_allowed == 1 \|\|
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	963	cpudl_find(&rq->rd->cpudl, rq->curr, NULL) == -1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	964	return;
				965
				966	/*
				967	* p is migratable, so let's not schedule it and
				968	* see if it is pushed or pulled somewhere else.
				969	*/
				970	if (p->nr_cpus_allowed != 1 &&
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	971	cpudl_find(&rq->rd->cpudl, p, NULL) != -1)
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	972	return;
				973
				974	resched_task(rq->curr);
				975	}
				976
Peter Zijlstra	38033c3	2014-01-23 20:32:21 +0100	[diff] [blame]	977	static int pull_dl_task(struct rq *this_rq);
				978
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	979	#endif /* CONFIG_SMP */
				980
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	981	/*
				982	* Only called when both the current and waking task are -deadline
				983	* tasks.
				984	*/
				985	static void check_preempt_curr_dl(struct rq rq, struct task_struct p,
				986	int flags)
				987	{
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	988	if (dl_entity_preempt(&p->dl, &rq->curr->dl)) {
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	989	resched_task(rq->curr);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	990	return;
				991	}
				992
				993	#ifdef CONFIG_SMP
				994	/*
				995	* In the unlikely case current and p have the same deadline
				996	* let us try to decide what's the best thing to do...
				997	*/
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	998	if ((p->dl.deadline == rq->curr->dl.deadline) &&
				999	!test_tsk_need_resched(rq->curr))
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1000	check_preempt_equal_dl(rq, p);
				1001	#endif /* CONFIG_SMP */
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1002	}
				1003
				1004	#ifdef CONFIG_SCHED_HRTICK
				1005	static void start_hrtick_dl(struct rq rq, struct task_struct p)
				1006	{
				1007	s64 delta = p->dl.dl_runtime - p->dl.runtime;
				1008
				1009	if (delta > 10000)
				1010	hrtick_start(rq, p->dl.runtime);
				1011	}
				1012	#endif
				1013
				1014	static struct sched_dl_entity pick_next_dl_entity(struct rq rq,
				1015	struct dl_rq *dl_rq)
				1016	{
				1017	struct rb_node *left = dl_rq->rb_leftmost;
				1018
				1019	if (!left)
				1020	return NULL;
				1021
				1022	return rb_entry(left, struct sched_dl_entity, rb_node);
				1023	}
				1024
Peter Zijlstra	606dba2	2012-02-11 06:05:00 +0100	[diff] [blame]	1025	struct task_struct pick_next_task_dl(struct rq rq, struct task_struct *prev)
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1026	{
				1027	struct sched_dl_entity *dl_se;
				1028	struct task_struct *p;
				1029	struct dl_rq *dl_rq;
				1030
				1031	dl_rq = &rq->dl;
				1032
Kirill Tkhai	a1d9a32	2014-04-10 17:38:36 +0400	[diff] [blame]	1033	if (need_pull_dl_task(rq, prev)) {
Peter Zijlstra	38033c3	2014-01-23 20:32:21 +0100	[diff] [blame]	1034	pull_dl_task(rq);
Kirill Tkhai	a1d9a32	2014-04-10 17:38:36 +0400	[diff] [blame]	1035	/*
				1036	* pull_rt_task() can drop (and re-acquire) rq->lock; this
				1037	* means a stop task can slip in, in which case we need to
				1038	* re-start task selection.
				1039	*/
				1040	if (rq->stop && rq->stop->on_rq)
				1041	return RETRY_TASK;
				1042	}
				1043
Kirill Tkhai	734ff2a	2014-03-04 19:25:46 +0400	[diff] [blame]	1044	/*
				1045	* When prev is DL, we may throttle it in put_prev_task().
				1046	* So, we update time before we check for dl_nr_running.
				1047	*/
				1048	if (prev->sched_class == &dl_sched_class)
				1049	update_curr_dl(rq);
Peter Zijlstra	38033c3	2014-01-23 20:32:21 +0100	[diff] [blame]	1050
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1051	if (unlikely(!dl_rq->dl_nr_running))
				1052	return NULL;
				1053
Peter Zijlstra	3f1d2a3	2014-02-12 10:49:30 +0100	[diff] [blame]	1054	put_prev_task(rq, prev);
Peter Zijlstra	606dba2	2012-02-11 06:05:00 +0100	[diff] [blame]	1055
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1056	dl_se = pick_next_dl_entity(rq, dl_rq);
				1057	BUG_ON(!dl_se);
				1058
				1059	p = dl_task_of(dl_se);
				1060	p->se.exec_start = rq_clock_task(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1061
				1062	/* Running task will never be pushed. */
Juri Lelli	7136265	2014-01-14 12:03:51 +0100	[diff] [blame]	1063	dequeue_pushable_dl_task(rq, p);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1064
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1065	#ifdef CONFIG_SCHED_HRTICK
				1066	if (hrtick_enabled(rq))
				1067	start_hrtick_dl(rq, p);
				1068	#endif
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1069
Peter Zijlstra	dc87734	2014-02-12 15:47:29 +0100	[diff] [blame]	1070	set_post_schedule(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1071
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1072	return p;
				1073	}
				1074
				1075	static void put_prev_task_dl(struct rq rq, struct task_struct p)
				1076	{
				1077	update_curr_dl(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1078
				1079	if (on_dl_rq(&p->dl) && p->nr_cpus_allowed > 1)
				1080	enqueue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1081	}
				1082
				1083	static void task_tick_dl(struct rq rq, struct task_struct p, int queued)
				1084	{
				1085	update_curr_dl(rq);
				1086
				1087	#ifdef CONFIG_SCHED_HRTICK
				1088	if (hrtick_enabled(rq) && queued && p->dl.runtime > 0)
				1089	start_hrtick_dl(rq, p);
				1090	#endif
				1091	}
				1092
				1093	static void task_fork_dl(struct task_struct *p)
				1094	{
				1095	/*
				1096	* SCHED_DEADLINE tasks cannot fork and this is achieved through
				1097	* sched_fork()
				1098	*/
				1099	}
				1100
				1101	static void task_dead_dl(struct task_struct *p)
				1102	{
				1103	struct hrtimer *timer = &p->dl.dl_timer;
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	1104	struct dl_bw *dl_b = dl_bw_of(task_cpu(p));
				1105
				1106	/*
				1107	* Since we are TASK_DEAD we won't slip out of the domain!
				1108	*/
				1109	raw_spin_lock_irq(&dl_b->lock);
				1110	dl_b->total_bw -= p->dl.dl_bw;
				1111	raw_spin_unlock_irq(&dl_b->lock);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1112
Dario Faggioli	2d3d891	2013-11-07 14:43:44 +0100	[diff] [blame]	1113	hrtimer_cancel(timer);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1114	}
				1115
				1116	static void set_curr_task_dl(struct rq *rq)
				1117	{
				1118	struct task_struct *p = rq->curr;
				1119
				1120	p->se.exec_start = rq_clock_task(rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1121
				1122	/* You can't push away the running task */
				1123	dequeue_pushable_dl_task(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1124	}
				1125
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1126	#ifdef CONFIG_SMP
				1127
				1128	/* Only try algorithms three times */
				1129	#define DL_MAX_TRIES 3
				1130
				1131	static int pick_dl_task(struct rq rq, struct task_struct p, int cpu)
				1132	{
				1133	if (!task_running(rq, p) &&
				1134	(cpu < 0 \|\| cpumask_test_cpu(cpu, &p->cpus_allowed)) &&
				1135	(p->nr_cpus_allowed > 1))
				1136	return 1;
				1137
				1138	return 0;
				1139	}
				1140
				1141	/* Returns the second earliest -deadline task, NULL otherwise */
				1142	static struct task_struct pick_next_earliest_dl_task(struct rq rq, int cpu)
				1143	{
				1144	struct rb_node *next_node = rq->dl.rb_leftmost;
				1145	struct sched_dl_entity *dl_se;
				1146	struct task_struct *p = NULL;
				1147
				1148	next_node:
				1149	next_node = rb_next(next_node);
				1150	if (next_node) {
				1151	dl_se = rb_entry(next_node, struct sched_dl_entity, rb_node);
				1152	p = dl_task_of(dl_se);
				1153
				1154	if (pick_dl_task(rq, p, cpu))
				1155	return p;
				1156
				1157	goto next_node;
				1158	}
				1159
				1160	return NULL;
				1161	}
				1162
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1163	static DEFINE_PER_CPU(cpumask_var_t, local_cpu_mask_dl);
				1164
				1165	static int find_later_rq(struct task_struct *task)
				1166	{
				1167	struct sched_domain *sd;
				1168	struct cpumask *later_mask = __get_cpu_var(local_cpu_mask_dl);
				1169	int this_cpu = smp_processor_id();
				1170	int best_cpu, cpu = task_cpu(task);
				1171
				1172	/* Make sure the mask is initialized first */
				1173	if (unlikely(!later_mask))
				1174	return -1;
				1175
				1176	if (task->nr_cpus_allowed == 1)
				1177	return -1;
				1178
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	1179	best_cpu = cpudl_find(&task_rq(task)->rd->cpudl,
				1180	task, later_mask);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1181	if (best_cpu == -1)
				1182	return -1;
				1183
				1184	/*
				1185	* If we are here, some target has been found,
				1186	* the most suitable of which is cached in best_cpu.
				1187	* This is, among the runqueues where the current tasks
				1188	* have later deadlines than the task's one, the rq
				1189	* with the latest possible one.
				1190	*
				1191	* Now we check how well this matches with task's
				1192	* affinity and system topology.
				1193	*
				1194	* The last cpu where the task run is our first
				1195	* guess, since it is most likely cache-hot there.
				1196	*/
				1197	if (cpumask_test_cpu(cpu, later_mask))
				1198	return cpu;
				1199	/*
				1200	* Check if this_cpu is to be skipped (i.e., it is
				1201	* not in the mask) or not.
				1202	*/
				1203	if (!cpumask_test_cpu(this_cpu, later_mask))
				1204	this_cpu = -1;
				1205
				1206	rcu_read_lock();
				1207	for_each_domain(cpu, sd) {
				1208	if (sd->flags & SD_WAKE_AFFINE) {
				1209
				1210	/*
				1211	* If possible, preempting this_cpu is
				1212	* cheaper than migrating.
				1213	*/
				1214	if (this_cpu != -1 &&
				1215	cpumask_test_cpu(this_cpu, sched_domain_span(sd))) {
				1216	rcu_read_unlock();
				1217	return this_cpu;
				1218	}
				1219
				1220	/*
				1221	* Last chance: if best_cpu is valid and is
				1222	* in the mask, that becomes our choice.
				1223	*/
				1224	if (best_cpu < nr_cpu_ids &&
				1225	cpumask_test_cpu(best_cpu, sched_domain_span(sd))) {
				1226	rcu_read_unlock();
				1227	return best_cpu;
				1228	}
				1229	}
				1230	}
				1231	rcu_read_unlock();
				1232
				1233	/*
				1234	* At this point, all our guesses failed, we just return
				1235	* 'something', and let the caller sort the things out.
				1236	*/
				1237	if (this_cpu != -1)
				1238	return this_cpu;
				1239
				1240	cpu = cpumask_any(later_mask);
				1241	if (cpu < nr_cpu_ids)
				1242	return cpu;
				1243
				1244	return -1;
				1245	}
				1246
				1247	/* Locks the rq it finds */
				1248	static struct rq find_lock_later_rq(struct task_struct task, struct rq *rq)
				1249	{
				1250	struct rq *later_rq = NULL;
				1251	int tries;
				1252	int cpu;
				1253
				1254	for (tries = 0; tries < DL_MAX_TRIES; tries++) {
				1255	cpu = find_later_rq(task);
				1256
				1257	if ((cpu == -1) \|\| (cpu == rq->cpu))
				1258	break;
				1259
				1260	later_rq = cpu_rq(cpu);
				1261
				1262	/* Retry if something changed. */
				1263	if (double_lock_balance(rq, later_rq)) {
				1264	if (unlikely(task_rq(task) != rq \|\|
				1265	!cpumask_test_cpu(later_rq->cpu,
				1266	&task->cpus_allowed) \|\|
				1267	task_running(rq, task) \|\| !task->on_rq)) {
				1268	double_unlock_balance(rq, later_rq);
				1269	later_rq = NULL;
				1270	break;
				1271	}
				1272	}
				1273
				1274	/*
				1275	* If the rq we found has no -deadline task, or
				1276	* its earliest one has a later deadline than our
				1277	* task, the rq is a good one.
				1278	*/
				1279	if (!later_rq->dl.dl_nr_running \|\|
				1280	dl_time_before(task->dl.deadline,
				1281	later_rq->dl.earliest_dl.curr))
				1282	break;
				1283
				1284	/* Otherwise we try again. */
				1285	double_unlock_balance(rq, later_rq);
				1286	later_rq = NULL;
				1287	}
				1288
				1289	return later_rq;
				1290	}
				1291
				1292	static struct task_struct pick_next_pushable_dl_task(struct rq rq)
				1293	{
				1294	struct task_struct *p;
				1295
				1296	if (!has_pushable_dl_tasks(rq))
				1297	return NULL;
				1298
				1299	p = rb_entry(rq->dl.pushable_dl_tasks_leftmost,
				1300	struct task_struct, pushable_dl_tasks);
				1301
				1302	BUG_ON(rq->cpu != task_cpu(p));
				1303	BUG_ON(task_current(rq, p));
				1304	BUG_ON(p->nr_cpus_allowed <= 1);
				1305
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	1306	BUG_ON(!p->on_rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1307	BUG_ON(!dl_task(p));
				1308
				1309	return p;
				1310	}
				1311
				1312	/*
				1313	* See if the non running -deadline tasks on this rq
				1314	* can be sent to some other CPU where they can preempt
				1315	* and start executing.
				1316	*/
				1317	static int push_dl_task(struct rq *rq)
				1318	{
				1319	struct task_struct *next_task;
				1320	struct rq *later_rq;
				1321
				1322	if (!rq->dl.overloaded)
				1323	return 0;
				1324
				1325	next_task = pick_next_pushable_dl_task(rq);
				1326	if (!next_task)
				1327	return 0;
				1328
				1329	retry:
				1330	if (unlikely(next_task == rq->curr)) {
				1331	WARN_ON(1);
				1332	return 0;
				1333	}
				1334
				1335	/*
				1336	* If next_task preempts rq->curr, and rq->curr
				1337	* can move away, it makes sense to just reschedule
				1338	* without going further in pushing next_task.
				1339	*/
				1340	if (dl_task(rq->curr) &&
				1341	dl_time_before(next_task->dl.deadline, rq->curr->dl.deadline) &&
				1342	rq->curr->nr_cpus_allowed > 1) {
				1343	resched_task(rq->curr);
				1344	return 0;
				1345	}
				1346
				1347	/* We might release rq lock */
				1348	get_task_struct(next_task);
				1349
				1350	/* Will lock the rq it'll find */
				1351	later_rq = find_lock_later_rq(next_task, rq);
				1352	if (!later_rq) {
				1353	struct task_struct *task;
				1354
				1355	/*
				1356	* We must check all this again, since
				1357	* find_lock_later_rq releases rq->lock and it is
				1358	* then possible that next_task has migrated.
				1359	*/
				1360	task = pick_next_pushable_dl_task(rq);
				1361	if (task_cpu(next_task) == rq->cpu && task == next_task) {
				1362	/*
				1363	* The task is still there. We don't try
				1364	* again, some other cpu will pull it when ready.
				1365	*/
				1366	dequeue_pushable_dl_task(rq, next_task);
				1367	goto out;
				1368	}
				1369
				1370	if (!task)
				1371	/* No more tasks */
				1372	goto out;
				1373
				1374	put_task_struct(next_task);
				1375	next_task = task;
				1376	goto retry;
				1377	}
				1378
				1379	deactivate_task(rq, next_task, 0);
				1380	set_task_cpu(next_task, later_rq->cpu);
				1381	activate_task(later_rq, next_task, 0);
				1382
				1383	resched_task(later_rq->curr);
				1384
				1385	double_unlock_balance(rq, later_rq);
				1386
				1387	out:
				1388	put_task_struct(next_task);
				1389
				1390	return 1;
				1391	}
				1392
				1393	static void push_dl_tasks(struct rq *rq)
				1394	{
				1395	/* Terminates as it moves a -deadline task */
				1396	while (push_dl_task(rq))
				1397	;
				1398	}
				1399
				1400	static int pull_dl_task(struct rq *this_rq)
				1401	{
				1402	int this_cpu = this_rq->cpu, ret = 0, cpu;
				1403	struct task_struct *p;
				1404	struct rq *src_rq;
				1405	u64 dmin = LONG_MAX;
				1406
				1407	if (likely(!dl_overloaded(this_rq)))
				1408	return 0;
				1409
				1410	/*
				1411	* Match the barrier from dl_set_overloaded; this guarantees that if we
				1412	* see overloaded we must also see the dlo_mask bit.
				1413	*/
				1414	smp_rmb();
				1415
				1416	for_each_cpu(cpu, this_rq->rd->dlo_mask) {
				1417	if (this_cpu == cpu)
				1418	continue;
				1419
				1420	src_rq = cpu_rq(cpu);
				1421
				1422	/*
				1423	* It looks racy, abd it is! However, as in sched_rt.c,
				1424	* we are fine with this.
				1425	*/
				1426	if (this_rq->dl.dl_nr_running &&
				1427	dl_time_before(this_rq->dl.earliest_dl.curr,
				1428	src_rq->dl.earliest_dl.next))
				1429	continue;
				1430
				1431	/* Might drop this_rq->lock */
				1432	double_lock_balance(this_rq, src_rq);
				1433
				1434	/*
				1435	* If there are no more pullable tasks on the
				1436	* rq, we're done with it.
				1437	*/
				1438	if (src_rq->dl.dl_nr_running <= 1)
				1439	goto skip;
				1440
				1441	p = pick_next_earliest_dl_task(src_rq, this_cpu);
				1442
				1443	/*
				1444	* We found a task to be pulled if:
				1445	* - it preempts our current (if there's one),
				1446	* - it will preempt the last one we pulled (if any).
				1447	*/
				1448	if (p && dl_time_before(p->dl.deadline, dmin) &&
				1449	(!this_rq->dl.dl_nr_running \|\|
				1450	dl_time_before(p->dl.deadline,
				1451	this_rq->dl.earliest_dl.curr))) {
				1452	WARN_ON(p == src_rq->curr);
Dario Faggioli	332ac17	2013-11-07 14:43:45 +0100	[diff] [blame]	1453	WARN_ON(!p->on_rq);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1454
				1455	/*
				1456	* Then we pull iff p has actually an earlier
				1457	* deadline than the current task of its runqueue.
				1458	*/
				1459	if (dl_time_before(p->dl.deadline,
				1460	src_rq->curr->dl.deadline))
				1461	goto skip;
				1462
				1463	ret = 1;
				1464
				1465	deactivate_task(src_rq, p, 0);
				1466	set_task_cpu(p, this_cpu);
				1467	activate_task(this_rq, p, 0);
				1468	dmin = p->dl.deadline;
				1469
				1470	/* Is there any other task even earlier? */
				1471	}
				1472	skip:
				1473	double_unlock_balance(this_rq, src_rq);
				1474	}
				1475
				1476	return ret;
				1477	}
				1478
/* Post-schedule hook of the -deadline class: try to push tasks away from @rq. */
static void post_schedule_dl(struct rq *rq)
{
	push_dl_tasks(rq);
}
				1483
				1484	/*
				1485	* Since the task is not running and a reschedule is not going to happen
				1486	* anytime soon on its runqueue, we try pushing it away now.
				1487	*/
				1488	static void task_woken_dl(struct rq rq, struct task_struct p)
				1489	{
				1490	if (!task_running(rq, p) &&
				1491	!test_tsk_need_resched(rq->curr) &&
				1492	has_pushable_dl_tasks(rq) &&
				1493	p->nr_cpus_allowed > 1 &&
				1494	dl_task(rq->curr) &&
				1495	(rq->curr->nr_cpus_allowed < 2 \|\|
				1496	dl_entity_preempt(&rq->curr->dl, &p->dl))) {
				1497	push_dl_tasks(rq);
				1498	}
				1499	}
				1500
				1501	static void set_cpus_allowed_dl(struct task_struct *p,
				1502	const struct cpumask *new_mask)
				1503	{
				1504	struct rq *rq;
				1505	int weight;
				1506
				1507	BUG_ON(!dl_task(p));
				1508
				1509	/*
				1510	* Update only if the task is actually running (i.e.,
				1511	* it is on the rq AND it is not throttled).
				1512	*/
				1513	if (!on_dl_rq(&p->dl))
				1514	return;
				1515
				1516	weight = cpumask_weight(new_mask);
				1517
				1518	/*
				1519	* Only update if the process changes its state from whether it
				1520	* can migrate or not.
				1521	*/
				1522	if ((p->nr_cpus_allowed > 1) == (weight > 1))
				1523	return;
				1524
				1525	rq = task_rq(p);
				1526
				1527	/*
				1528	* The process used to be able to migrate OR it can now migrate
				1529	*/
				1530	if (weight <= 1) {
				1531	if (!task_current(rq, p))
				1532	dequeue_pushable_dl_task(rq, p);
				1533	BUG_ON(!rq->dl.dl_nr_migratory);
				1534	rq->dl.dl_nr_migratory--;
				1535	} else {
				1536	if (!task_current(rq, p))
				1537	enqueue_pushable_dl_task(rq, p);
				1538	rq->dl.dl_nr_migratory++;
				1539	}
				1540
				1541	update_dl_migration(&rq->dl);
				1542	}
				1543
				1544	/* Assumes rq->lock is held */
				1545	static void rq_online_dl(struct rq *rq)
				1546	{
				1547	if (rq->dl.overloaded)
				1548	dl_set_overload(rq);
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	1549
				1550	if (rq->dl.dl_nr_running > 0)
				1551	cpudl_set(&rq->rd->cpudl, rq->cpu, rq->dl.earliest_dl.curr, 1);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1552	}
				1553
				1554	/* Assumes rq->lock is held */
				1555	static void rq_offline_dl(struct rq *rq)
				1556	{
				1557	if (rq->dl.overloaded)
				1558	dl_clear_overload(rq);
Juri Lelli	6bfd6d7	2013-11-07 14:43:47 +0100	[diff] [blame]	1559
				1560	cpudl_set(&rq->rd->cpudl, rq->cpu, 0, 0);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1561	}
				1562
				1563	void init_sched_dl_class(void)
				1564	{
				1565	unsigned int i;
				1566
				1567	for_each_possible_cpu(i)
				1568	zalloc_cpumask_var_node(&per_cpu(local_cpu_mask_dl, i),
				1569	GFP_KERNEL, cpu_to_node(i));
				1570	}
				1571
				1572	#endif /* CONFIG_SMP */
				1573
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1574	static void switched_from_dl(struct rq rq, struct task_struct p)
				1575	{
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1576	if (hrtimer_active(&p->dl.dl_timer) && !dl_policy(p->policy))
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1577	hrtimer_try_to_cancel(&p->dl.dl_timer);
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1578
				1579	#ifdef CONFIG_SMP
				1580	/*
				1581	* Since this might be the only -deadline task on the rq,
				1582	* this is the right place to try to pull some other one
				1583	* from an overloaded cpu, if any.
				1584	*/
				1585	if (!rq->dl.dl_nr_running)
				1586	pull_dl_task(rq);
				1587	#endif
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1588	}
				1589
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1590	/*
				1591	* When switching to -deadline, we may overload the rq, then
				1592	* we try to push someone off, if possible.
				1593	*/
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1594	static void switched_to_dl(struct rq rq, struct task_struct p)
				1595	{
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1596	int check_resched = 1;
				1597
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1598	/*
				1599	* If p is throttled, don't consider the possibility
				1600	* of preempting rq->curr, the check will be done right
				1601	* after its runtime will get replenished.
				1602	*/
				1603	if (unlikely(p->dl.dl_throttled))
				1604	return;
				1605
Kirill Tkhai	390f325	2014-01-28 11:26:14 +0400	[diff] [blame]	1606	if (p->on_rq && rq->curr != p) {
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1607	#ifdef CONFIG_SMP
				1608	if (rq->dl.overloaded && push_dl_task(rq) && rq != task_rq(p))
				1609	/* Only reschedule if pushing failed */
				1610	check_resched = 0;
				1611	#endif /* CONFIG_SMP */
				1612	if (check_resched && task_has_dl_policy(rq->curr))
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1613	check_preempt_curr_dl(rq, p, 0);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1614	}
				1615	}
				1616
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1617	/*
				1618	* If the scheduling parameters of a -deadline task changed,
				1619	* a push or pull operation might be needed.
				1620	*/
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1621	static void prio_changed_dl(struct rq rq, struct task_struct p,
				1622	int oldprio)
				1623	{
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1624	if (p->on_rq \|\| rq->curr == p) {
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1625	#ifdef CONFIG_SMP
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1626	/*
				1627	* This might be too much, but unfortunately
				1628	* we don't have the old deadline value, and
				1629	* we can't argue if the task is increasing
				1630	* or lowering its prio, so...
				1631	*/
				1632	if (!rq->dl.overloaded)
				1633	pull_dl_task(rq);
				1634
				1635	/*
				1636	* If we now have a earlier deadline task than p,
				1637	* then reschedule, provided p is still on this
				1638	* runqueue.
				1639	*/
				1640	if (dl_time_before(rq->dl.earliest_dl.curr, p->dl.deadline) &&
				1641	rq->curr == p)
				1642	resched_task(p);
				1643	#else
				1644	/*
				1645	* Again, we don't know if p has a earlier
				1646	* or later deadline, so let's blindly set a
				1647	* (maybe not needed) rescheduling point.
				1648	*/
				1649	resched_task(p);
				1650	#endif /* CONFIG_SMP */
				1651	} else
				1652	switched_to_dl(rq, p);
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1653	}
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1654
				1655	const struct sched_class dl_sched_class = {
				1656	.next = &rt_sched_class,
				1657	.enqueue_task = enqueue_task_dl,
				1658	.dequeue_task = dequeue_task_dl,
				1659	.yield_task = yield_task_dl,
				1660
				1661	.check_preempt_curr = check_preempt_curr_dl,
				1662
				1663	.pick_next_task = pick_next_task_dl,
				1664	.put_prev_task = put_prev_task_dl,
				1665
				1666	#ifdef CONFIG_SMP
				1667	.select_task_rq = select_task_rq_dl,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1668	.set_cpus_allowed = set_cpus_allowed_dl,
				1669	.rq_online = rq_online_dl,
				1670	.rq_offline = rq_offline_dl,
Juri Lelli	1baca4c	2013-11-07 14:43:38 +0100	[diff] [blame]	1671	.post_schedule = post_schedule_dl,
				1672	.task_woken = task_woken_dl,
Dario Faggioli	aab03e0	2013-11-28 11:14:43 +0100	[diff] [blame]	1673	#endif
				1674
				1675	.set_curr_task = set_curr_task_dl,
				1676	.task_tick = task_tick_dl,
				1677	.task_fork = task_fork_dl,
				1678	.task_dead = task_dead_dl,
				1679
				1680	.prio_changed = prio_changed_dl,
				1681	.switched_from = switched_from_dl,
				1682	.switched_to = switched_to_dl,
				1683	};