These changes are the raw update to linux-4.4.6-rt14. Kernel sources

[kvmfornfv.git] / kernel / kernel / sched / deadline.c
diff --git a/kernel/kernel/sched/deadline.c b/kernel/kernel/sched/deadline.c

index 0c261c5..7a72e69 100644 (file)
--- a/kernel/kernel/sched/deadline.c
+++ b/kernel/kernel/sched/deadline.c
@@ -134,7 +134,7 @@ static void inc_dl_migration(struct sched_dl_entity *dl_se, struct dl_rq *dl_rq)
  {
         struct task_struct *p = dl_task_of(dl_se);
  
-       if (p->nr_cpus_allowed > 1)
+       if (tsk_nr_cpus_allowed(p) > 1)
                 dl_rq->dl_nr_migratory++;
  
         update_dl_migration(dl_rq);
@@ -144,7 +144,7 @@ static void dec_dl_migration(struct sched_dl_entity *dl_se, struct dl_rq *dl_rq)
  {
         struct task_struct *p = dl_task_of(dl_se);
  
-       if (p->nr_cpus_allowed > 1)
+       if (tsk_nr_cpus_allowed(p) > 1)
                 dl_rq->dl_nr_migratory--;
  
         update_dl_migration(dl_rq);
@@ -213,14 +213,28 @@ static inline bool need_pull_dl_task(struct rq *rq, struct task_struct *prev)
         return dl_task(prev);
  }
  
-static inline void set_post_schedule(struct rq *rq)
+static DEFINE_PER_CPU(struct callback_head, dl_push_head);
+static DEFINE_PER_CPU(struct callback_head, dl_pull_head);
+
+static void push_dl_tasks(struct rq *);
+static void pull_dl_task(struct rq *);
+
+static inline void queue_push_tasks(struct rq *rq)
  {
-       rq->post_schedule = has_pushable_dl_tasks(rq);
+       if (!has_pushable_dl_tasks(rq))
+               return;
+
+       queue_balance_callback(rq, &per_cpu(dl_push_head, rq->cpu), push_dl_tasks);
+}
+
+static inline void queue_pull_task(struct rq *rq)
+{
+       queue_balance_callback(rq, &per_cpu(dl_pull_head, rq->cpu), pull_dl_task);
  }
  
  static struct rq *find_lock_later_rq(struct task_struct *task, struct rq *rq);
  
-static void dl_task_offline_migration(struct rq *rq, struct task_struct *p)
+static struct rq *dl_task_offline_migration(struct rq *rq, struct task_struct *p)
  {
         struct rq *later_rq = NULL;
         bool fallback = false;
@@ -254,14 +268,19 @@ static void dl_task_offline_migration(struct rq *rq, struct task_struct *p)
                 double_lock_balance(rq, later_rq);
         }
  
+       /*
+        * By now the task is replenished and enqueued; migrate it.
+        */
         deactivate_task(rq, p, 0);
         set_task_cpu(p, later_rq->cpu);
-       activate_task(later_rq, p, ENQUEUE_REPLENISH);
+       activate_task(later_rq, p, 0);
  
         if (!fallback)
                 resched_curr(later_rq);
  
-       double_unlock_balance(rq, later_rq);
+       double_unlock_balance(later_rq, rq);
+
+       return later_rq;
  }
  
  #else
@@ -291,12 +310,15 @@ static inline bool need_pull_dl_task(struct rq *rq, struct task_struct *prev)
         return false;
  }
  
-static inline int pull_dl_task(struct rq *rq)
+static inline void pull_dl_task(struct rq *rq)
+{
+}
+
+static inline void queue_push_tasks(struct rq *rq)
  {
-       return 0;
  }
  
-static inline void set_post_schedule(struct rq *rq)
+static inline void queue_pull_task(struct rq *rq)
  {
  }
  #endif /* CONFIG_SMP */
@@ -498,24 +520,23 @@ static void update_dl_entity(struct sched_dl_entity *dl_se,
   * actually started or not (i.e., the replenishment instant is in
   * the future or in the past).
   */
-static int start_dl_timer(struct sched_dl_entity *dl_se, bool boosted)
+static int start_dl_timer(struct task_struct *p)
  {
-       struct dl_rq *dl_rq = dl_rq_of_se(dl_se);
-       struct rq *rq = rq_of_dl_rq(dl_rq);
+       struct sched_dl_entity *dl_se = &p->dl;
+       struct hrtimer *timer = &dl_se->dl_timer;
+       struct rq *rq = task_rq(p);
         ktime_t now, act;
-       ktime_t soft, hard;
-       unsigned long range;
         s64 delta;
  
-       if (boosted)
-               return 0;
+       lockdep_assert_held(&rq->lock);
+
         /*
          * We want the timer to fire at the deadline, but considering
          * that it is actually coming from rq->clock and not from
          * hrtimer's time base reading.
          */
         act = ns_to_ktime(dl_se->deadline);
-       now = hrtimer_cb_get_time(&dl_se->dl_timer);
+       now = hrtimer_cb_get_time(timer);
         delta = ktime_to_ns(now) - rq_clock(rq);
         act = ktime_add_ns(act, delta);
  
@@ -527,15 +548,21 @@ static int start_dl_timer(struct sched_dl_entity *dl_se, bool boosted)
         if (ktime_us_delta(act, now) < 0)
                 return 0;
  
-       hrtimer_set_expires(&dl_se->dl_timer, act);
-
-       soft = hrtimer_get_softexpires(&dl_se->dl_timer);
-       hard = hrtimer_get_expires(&dl_se->dl_timer);
-       range = ktime_to_ns(ktime_sub(hard, soft));
-       __hrtimer_start_range_ns(&dl_se->dl_timer, soft,
-                                range, HRTIMER_MODE_ABS, 0);
+       /*
+        * !enqueued will guarantee another callback; even if one is already in
+        * progress. This ensures a balanced {get,put}_task_struct().
+        *
+        * The race against __run_hrtimer() clearing the enqueued state is
+        * harmless because we're holding task_rq()->lock, therefore the timer
+        * expiring after we've done the check will wait on its task_rq_lock()
+        * and observe our state.
+        */
+       if (!hrtimer_is_queued(timer)) {
+               get_task_struct(p);
+               hrtimer_start(timer, act, HRTIMER_MODE_ABS);
+       }
  
-       return hrtimer_active(&dl_se->dl_timer);
+       return 1;
  }
  
  /*
@@ -563,35 +590,40 @@ static enum hrtimer_restart dl_task_timer(struct hrtimer *timer)
         rq = task_rq_lock(p, &flags);
  
         /*
-        * We need to take care of several possible races here:
-        *
-        *   - the task might have changed its scheduling policy
-        *     to something different than SCHED_DEADLINE
-        *   - the task might have changed its reservation parameters
-        *     (through sched_setattr())
-        *   - the task might have been boosted by someone else and
-        *     might be in the boosting/deboosting path
+        * The task might have changed its scheduling policy to something
+        * different than SCHED_DEADLINE (through switched_from_dl()).
+        */
+       if (!dl_task(p)) {
+               __dl_clear_params(p);
+               goto unlock;
+       }
+
+       /*
+        * This is possible if switched_from_dl() raced against a running
+        * callback that took the above !dl_task() path and we've since then
+        * switched back into SCHED_DEADLINE.
          *
-        * In all this cases we bail out, as the task is already
-        * in the runqueue or is going to be enqueued back anyway.
+        * There's nothing to do except drop our task reference.
          */
-       if (!dl_task(p) || dl_se->dl_new ||
-           dl_se->dl_boosted || !dl_se->dl_throttled)
+       if (dl_se->dl_new)
                 goto unlock;
  
-       sched_clock_tick();
-       update_rq_clock(rq);
+       /*
+        * The task might have been boosted by someone else and might be in the
+        * boosting/deboosting path; it's not throttled.
+        */
+       if (dl_se->dl_boosted)
+               goto unlock;
  
-#ifdef CONFIG_SMP
         /*
-        * If we find that the rq the task was on is no longer
-        * available, we need to select a new rq.
+        * Spurious timer due to start_dl_timer() race; or we already received
+        * a replenishment from rt_mutex_setprio().
          */
-       if (unlikely(!rq->online)) {
-               dl_task_offline_migration(rq, p);
+       if (!dl_se->dl_throttled)
                 goto unlock;
-       }
-#endif
+
+       sched_clock_tick();
+       update_rq_clock(rq);
  
         /*
          * If the throttle happened during sched-out; like:
@@ -617,17 +649,45 @@ static enum hrtimer_restart dl_task_timer(struct hrtimer *timer)
                 check_preempt_curr_dl(rq, p, 0);
         else
                 resched_curr(rq);
+
  #ifdef CONFIG_SMP
         /*
-        * Queueing this task back might have overloaded rq,
-        * check if we need to kick someone away.
+        * Perform balancing operations here; after the replenishments.  We
+        * cannot drop rq->lock before this, otherwise the assertion in
+        * start_dl_timer() about not missing updates is not true.
+        *
+        * If we find that the rq the task was on is no longer available, we
+        * need to select a new rq.
+        *
+        * XXX figure out if select_task_rq_dl() deals with offline cpus.
          */
-       if (has_pushable_dl_tasks(rq))
+       if (unlikely(!rq->online))
+               rq = dl_task_offline_migration(rq, p);
+
+       /*
+        * Queueing this task back might have overloaded rq, check if we need
+        * to kick someone away.
+        */
+       if (has_pushable_dl_tasks(rq)) {
+               /*
+                * Nothing relies on rq->lock after this, so it's safe to drop
+                * rq->lock.
+                */
+               lockdep_unpin_lock(&rq->lock);
                 push_dl_task(rq);
+               lockdep_pin_lock(&rq->lock);
+       }
  #endif
+
  unlock:
         task_rq_unlock(rq, p, &flags);
  
+       /*
+        * This can free the task_struct, including this hrtimer, do not touch
+        * anything related to that after this.
+        */
+       put_task_struct(p);
+
         return HRTIMER_NORESTART;
  }
  
@@ -641,7 +701,7 @@ void init_dl_task_timer(struct sched_dl_entity *dl_se)
  }
  
  static
-int dl_runtime_exceeded(struct rq *rq, struct sched_dl_entity *dl_se)
+int dl_runtime_exceeded(struct sched_dl_entity *dl_se)
  {
         return (dl_se->runtime <= 0);
  }
@@ -685,10 +745,10 @@ static void update_curr_dl(struct rq *rq)
         sched_rt_avg_update(rq, delta_exec);
  
         dl_se->runtime -= dl_se->dl_yielded ? 0 : delta_exec;
-       if (dl_runtime_exceeded(rq, dl_se)) {
+       if (dl_runtime_exceeded(dl_se)) {
                 dl_se->dl_throttled = 1;
                 __dequeue_task_dl(rq, curr, 0);
-               if (unlikely(!start_dl_timer(dl_se, curr->dl.dl_boosted)))
+               if (unlikely(dl_se->dl_boosted || !start_dl_timer(curr)))
                         enqueue_task_dl(rq, curr, ENQUEUE_REPLENISH);
  
                 if (!is_leftmost(curr, &rq->dl))
@@ -901,7 +961,7 @@ static void enqueue_task_dl(struct rq *rq, struct task_struct *p, int flags)
  
         /*
          * Use the scheduling parameters of the top pi-waiter
-        * task if we have one and its (relative) deadline is
+        * task if we have one and its (absolute) deadline is
          * smaller than our one... OTW we keep our runtime and
          * deadline.
          */
@@ -930,7 +990,7 @@ static void enqueue_task_dl(struct rq *rq, struct task_struct *p, int flags)
  
         enqueue_dl_entity(&p->dl, pi_se, flags);
  
-       if (!task_current(rq, p) && p->nr_cpus_allowed > 1)
+       if (!task_current(rq, p) && tsk_nr_cpus_allowed(p) > 1)
                 enqueue_pushable_dl_task(rq, p);
  }
  
@@ -996,7 +1056,7 @@ select_task_rq_dl(struct task_struct *p, int cpu, int sd_flag, int flags)
         rq = cpu_rq(cpu);
  
         rcu_read_lock();
-       curr = ACCESS_ONCE(rq->curr); /* unlocked access */
+       curr = READ_ONCE(rq->curr); /* unlocked access */
  
         /*
          * If we are dealing with a -deadline task, we must
@@ -1008,12 +1068,15 @@ select_task_rq_dl(struct task_struct *p, int cpu, int sd_flag, int flags)
          * try to make it stay here, it might be important.
          */
         if (unlikely(dl_task(curr)) &&
-           (curr->nr_cpus_allowed < 2 ||
+           (tsk_nr_cpus_allowed(curr) < 2 ||
              !dl_entity_preempt(&p->dl, &curr->dl)) &&
-           (p->nr_cpus_allowed > 1)) {
+           (tsk_nr_cpus_allowed(p) > 1)) {
                 int target = find_later_rq(p);
  
-               if (target != -1)
+               if (target != -1 &&
+                               (dl_time_before(p->dl.deadline,
+                                       cpu_rq(target)->dl.earliest_dl.curr) ||
+                               (cpu_rq(target)->dl.dl_nr_running == 0)))
                         cpu = target;
         }
         rcu_read_unlock();
@@ -1028,7 +1091,7 @@ static void check_preempt_equal_dl(struct rq *rq, struct task_struct *p)
          * Current can't be migrated, useless to reschedule,
          * let's hope p can move out.
          */
-       if (rq->curr->nr_cpus_allowed == 1 ||
+       if (tsk_nr_cpus_allowed(rq->curr) == 1 ||
             cpudl_find(&rq->rd->cpudl, rq->curr, NULL) == -1)
                 return;
  
@@ -1036,15 +1099,13 @@ static void check_preempt_equal_dl(struct rq *rq, struct task_struct *p)
          * p is migratable, so let's not schedule it and
          * see if it is pushed or pulled somewhere else.
          */
-       if (p->nr_cpus_allowed != 1 &&
+       if (tsk_nr_cpus_allowed(p) != 1 &&
             cpudl_find(&rq->rd->cpudl, p, NULL) != -1)
                 return;
  
         resched_curr(rq);
  }
  
-static int pull_dl_task(struct rq *this_rq);
-
  #endif /* CONFIG_SMP */
  
  /*
@@ -1101,7 +1162,15 @@ struct task_struct *pick_next_task_dl(struct rq *rq, struct task_struct *prev)
         dl_rq = &rq->dl;
  
         if (need_pull_dl_task(rq, prev)) {
+               /*
+                * This is OK, because current is on_cpu, which avoids it being
+                * picked for load-balance and preemption/IRQs are still
+                * disabled avoiding further scheduler activity on it and we're
+                * being very careful to re-start the picking loop.
+                */
+               lockdep_unpin_lock(&rq->lock);
                 pull_dl_task(rq);
+               lockdep_pin_lock(&rq->lock);
                 /*
                  * pull_rt_task() can drop (and re-acquire) rq->lock; this
                  * means a stop task can slip in, in which case we need to
@@ -1135,7 +1204,7 @@ struct task_struct *pick_next_task_dl(struct rq *rq, struct task_struct *prev)
         if (hrtick_enabled(rq))
                 start_hrtick_dl(rq, p);
  
-       set_post_schedule(rq);
+       queue_push_tasks(rq);
  
         return p;
  }
@@ -1144,7 +1213,7 @@ static void put_prev_task_dl(struct rq *rq, struct task_struct *p)
  {
         update_curr_dl(rq);
  
-       if (on_dl_rq(&p->dl) && p->nr_cpus_allowed > 1)
+       if (on_dl_rq(&p->dl) && tsk_nr_cpus_allowed(p) > 1)
                 enqueue_pushable_dl_task(rq, p);
  }
  
@@ -1172,7 +1241,6 @@ static void task_fork_dl(struct task_struct *p)
  
  static void task_dead_dl(struct task_struct *p)
  {
-       struct hrtimer *timer = &p->dl.dl_timer;
         struct dl_bw *dl_b = dl_bw_of(task_cpu(p));
  
         /*
@@ -1182,8 +1250,6 @@ static void task_dead_dl(struct task_struct *p)
         /* XXX we should retain the bw until 0-lag */
         dl_b->total_bw -= p->dl.dl_bw;
         raw_spin_unlock_irq(&dl_b->lock);
-
-       hrtimer_cancel(timer);
  }
  
  static void set_curr_task_dl(struct rq *rq)
@@ -1231,6 +1297,32 @@ next_node:
         return NULL;
  }
  
+/*
+ * Return rq's earliest pushable task that is suitable to be executed on the
+ * given CPU, or NULL if there is none.
+ */
+static struct task_struct *pick_earliest_pushable_dl_task(struct rq *rq, int cpu)
+{
+       struct rb_node *next_node = rq->dl.pushable_dl_tasks_leftmost;
+       struct task_struct *p = NULL;
+
+       if (!has_pushable_dl_tasks(rq))
+               return NULL;
+
+next_node:
+       if (next_node) {
+               p = rb_entry(next_node, struct task_struct, pushable_dl_tasks);
+
+               if (pick_dl_task(rq, p, cpu))
+                       return p;
+
+               next_node = rb_next(next_node);
+               goto next_node;
+       }
+
+       return NULL;
+}
+
  static DEFINE_PER_CPU(cpumask_var_t, local_cpu_mask_dl);
  
  static int find_later_rq(struct task_struct *task)
@@ -1244,7 +1336,7 @@ static int find_later_rq(struct task_struct *task)
         if (unlikely(!later_mask))
                 return -1;
  
-       if (task->nr_cpus_allowed == 1)
+       if (tsk_nr_cpus_allowed(task) == 1)
                 return -1;
  
         /*
@@ -1334,11 +1426,23 @@ static struct rq *find_lock_later_rq(struct task_struct *task, struct rq *rq)
  
                 later_rq = cpu_rq(cpu);
  
+               if (later_rq->dl.dl_nr_running &&
+                   !dl_time_before(task->dl.deadline,
+                                       later_rq->dl.earliest_dl.curr)) {
+                       /*
+                        * Target rq has tasks of equal or earlier deadline,
+                        * retrying does not release any lock and is unlikely
+                        * to yield a different result.
+                        */
+                       later_rq = NULL;
+                       break;
+               }
+
                 /* Retry if something changed. */
                 if (double_lock_balance(rq, later_rq)) {
                         if (unlikely(task_rq(task) != rq ||
                                      !cpumask_test_cpu(later_rq->cpu,
-                                                      &task->cpus_allowed) ||
+                                                      tsk_cpus_allowed(task)) ||
                                      task_running(rq, task) ||
                                      !task_on_rq_queued(task))) {
                                 double_unlock_balance(rq, later_rq);
@@ -1377,7 +1481,7 @@ static struct task_struct *pick_next_pushable_dl_task(struct rq *rq)
  
         BUG_ON(rq->cpu != task_cpu(p));
         BUG_ON(task_current(rq, p));
-       BUG_ON(p->nr_cpus_allowed <= 1);
+       BUG_ON(tsk_nr_cpus_allowed(p) <= 1);
  
         BUG_ON(!task_on_rq_queued(p));
         BUG_ON(!dl_task(p));
@@ -1416,7 +1520,7 @@ retry:
          */
         if (dl_task(rq->curr) &&
             dl_time_before(next_task->dl.deadline, rq->curr->dl.deadline) &&
-           rq->curr->nr_cpus_allowed > 1) {
+           tsk_nr_cpus_allowed(rq->curr) > 1) {
                 resched_curr(rq);
                 return 0;
         }
@@ -1469,20 +1573,21 @@ out:
  
  static void push_dl_tasks(struct rq *rq)
  {
-       /* Terminates as it moves a -deadline task */
+       /* push_dl_task() will return true if it moved a -deadline task */
         while (push_dl_task(rq))
                 ;
  }
  
-static int pull_dl_task(struct rq *this_rq)
+static void pull_dl_task(struct rq *this_rq)
  {
-       int this_cpu = this_rq->cpu, ret = 0, cpu;
+       int this_cpu = this_rq->cpu, cpu;
         struct task_struct *p;
+       bool resched = false;
         struct rq *src_rq;
         u64 dmin = LONG_MAX;
  
         if (likely(!dl_overloaded(this_rq)))
-               return 0;
+               return;
  
         /*
          * Match the barrier from dl_set_overloaded; this guarantees that if we
@@ -1515,7 +1620,7 @@ static int pull_dl_task(struct rq *this_rq)
                 if (src_rq->dl.dl_nr_running <= 1)
                         goto skip;
  
-               p = pick_next_earliest_dl_task(src_rq, this_cpu);
+               p = pick_earliest_pushable_dl_task(src_rq, this_cpu);
  
                 /*
                  * We found a task to be pulled if:
@@ -1537,7 +1642,7 @@ static int pull_dl_task(struct rq *this_rq)
                                            src_rq->curr->dl.deadline))
                                 goto skip;
  
-                       ret = 1;
+                       resched = true;
  
                         deactivate_task(src_rq, p, 0);
                         set_task_cpu(p, this_cpu);
@@ -1550,12 +1655,8 @@ skip:
                 double_unlock_balance(this_rq, src_rq);
         }
  
-       return ret;
-}
-
-static void post_schedule_dl(struct rq *rq)
-{
-       push_dl_tasks(rq);
+       if (resched)
+               resched_curr(this_rq);
  }
  
  /*
@@ -1566,10 +1667,9 @@ static void task_woken_dl(struct rq *rq, struct task_struct *p)
  {
         if (!task_running(rq, p) &&
             !test_tsk_need_resched(rq->curr) &&
-           has_pushable_dl_tasks(rq) &&
-           p->nr_cpus_allowed > 1 &&
+           tsk_nr_cpus_allowed(p) > 1 &&
             dl_task(rq->curr) &&
-           (rq->curr->nr_cpus_allowed < 2 ||
+           (tsk_nr_cpus_allowed(rq->curr) < 2 ||
              !dl_entity_preempt(&p->dl, &rq->curr->dl))) {
                 push_dl_tasks(rq);
         }
@@ -1578,9 +1678,8 @@ static void task_woken_dl(struct rq *rq, struct task_struct *p)
  static void set_cpus_allowed_dl(struct task_struct *p,
                                 const struct cpumask *new_mask)
  {
-       struct rq *rq;
         struct root_domain *src_rd;
-       int weight;
+       struct rq *rq;
  
         BUG_ON(!dl_task(p));
  
@@ -1606,37 +1705,7 @@ static void set_cpus_allowed_dl(struct task_struct *p,
                 raw_spin_unlock(&src_dl_b->lock);
         }
  
-       /*
-        * Update only if the task is actually running (i.e.,
-        * it is on the rq AND it is not throttled).
-        */
-       if (!on_dl_rq(&p->dl))
-               return;
-
-       weight = cpumask_weight(new_mask);
-
-       /*
-        * Only update if the process changes its state from whether it
-        * can migrate or not.
-        */
-       if ((p->nr_cpus_allowed > 1) == (weight > 1))
-               return;
-
-       /*
-        * The process used to be able to migrate OR it can now migrate
-        */
-       if (weight <= 1) {
-               if (!task_current(rq, p))
-                       dequeue_pushable_dl_task(rq, p);
-               BUG_ON(!rq->dl.dl_nr_migratory);
-               rq->dl.dl_nr_migratory--;
-       } else {
-               if (!task_current(rq, p))
-                       enqueue_pushable_dl_task(rq, p);
-               rq->dl.dl_nr_migratory++;
-       }
-
-       update_dl_migration(&rq->dl);
+       set_cpus_allowed_common(p, new_mask);
  }
  
  /* Assumes rq->lock is held */
@@ -1660,7 +1729,7 @@ static void rq_offline_dl(struct rq *rq)
         cpudl_clear_freecpu(&rq->rd->cpudl, rq->cpu);
  }
  
-void init_sched_dl_class(void)
+void __init init_sched_dl_class(void)
  {
         unsigned int i;
  
@@ -1671,37 +1740,16 @@ void init_sched_dl_class(void)
  
  #endif /* CONFIG_SMP */
  
-/*
- *  Ensure p's dl_timer is cancelled. May drop rq->lock for a while.
- */
-static void cancel_dl_timer(struct rq *rq, struct task_struct *p)
-{
-       struct hrtimer *dl_timer = &p->dl.dl_timer;
-
-       /* Nobody will change task's class if pi_lock is held */
-       lockdep_assert_held(&p->pi_lock);
-
-       if (hrtimer_active(dl_timer)) {
-               int ret = hrtimer_try_to_cancel(dl_timer);
-
-               if (unlikely(ret == -1)) {
-                       /*
-                        * Note, p may migrate OR new deadline tasks
-                        * may appear in rq when we are unlocking it.
-                        * A caller of us must be fine with that.
-                        */
-                       raw_spin_unlock(&rq->lock);
-                       hrtimer_cancel(dl_timer);
-                       raw_spin_lock(&rq->lock);
-               }
-       }
-}
-
  static void switched_from_dl(struct rq *rq, struct task_struct *p)
  {
-       /* XXX we should retain the bw until 0-lag */
-       cancel_dl_timer(rq, p);
-       __dl_clear_params(p);
+       /*
+        * Start the deadline timer; if we switch back to dl before this we'll
+        * continue consuming our current CBS slice. If we stay outside of
+        * SCHED_DEADLINE until the deadline passes, the timer will reset the
+        * task.
+        */
+       if (!start_dl_timer(p))
+               __dl_clear_params(p);
  
         /*
          * Since this might be the only -deadline task on the rq,
@@ -1711,8 +1759,7 @@ static void switched_from_dl(struct rq *rq, struct task_struct *p)
         if (!task_on_rq_queued(p) || rq->dl.dl_nr_running)
                 return;
  
-       if (pull_dl_task(rq))
-               resched_curr(rq);
+       queue_pull_task(rq);
  }
  
  /*
@@ -1721,21 +1768,16 @@ static void switched_from_dl(struct rq *rq, struct task_struct *p)
   */
  static void switched_to_dl(struct rq *rq, struct task_struct *p)
  {
-       int check_resched = 1;
-
         if (task_on_rq_queued(p) && rq->curr != p) {
  #ifdef CONFIG_SMP
-               if (p->nr_cpus_allowed > 1 && rq->dl.overloaded &&
-                       push_dl_task(rq) && rq != task_rq(p))
-                       /* Only reschedule if pushing failed */
-                       check_resched = 0;
-#endif /* CONFIG_SMP */
-               if (check_resched) {
-                       if (dl_task(rq->curr))
-                               check_preempt_curr_dl(rq, p, 0);
-                       else
-                               resched_curr(rq);
-               }
+               if (tsk_nr_cpus_allowed(p) > 1 && rq->dl.overloaded)
+                       queue_push_tasks(rq);
+#else
+               if (dl_task(rq->curr))
+                       check_preempt_curr_dl(rq, p, 0);
+               else
+                       resched_curr(rq);
+#endif
         }
  }
  
@@ -1755,15 +1797,14 @@ static void prio_changed_dl(struct rq *rq, struct task_struct *p,
                  * or lowering its prio, so...
                  */
                 if (!rq->dl.overloaded)
-                       pull_dl_task(rq);
+                       queue_pull_task(rq);
  
                 /*
                  * If we now have a earlier deadline task than p,
                  * then reschedule, provided p is still on this
                  * runqueue.
                  */
-               if (dl_time_before(rq->dl.earliest_dl.curr, p->dl.deadline) &&
-                   rq->curr == p)
+               if (dl_time_before(rq->dl.earliest_dl.curr, p->dl.deadline))
                         resched_curr(rq);
  #else
                 /*
@@ -1793,7 +1834,6 @@ const struct sched_class dl_sched_class = {
         .set_cpus_allowed       = set_cpus_allowed_dl,
         .rq_online              = rq_online_dl,
         .rq_offline             = rq_offline_dl,
-       .post_schedule          = post_schedule_dl,
         .task_woken             = task_woken_dl,
  #endif