sched: Fix sleep time double accounting in enqueue entity

[mirror_ubuntu-bionic-kernel.git] / kernel / sched / fair.c
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index 47a30be1fe8335b956763618f4c8dfbbbb93f4ac..9bbc303598ea848453efbb647fffe9ac08ca5029 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -680,6 +680,26 @@ static u64 sched_vslice(struct cfs_rq *cfs_rq, struct sched_entity *se)
         return calc_delta_fair(sched_slice(cfs_rq, se), se);
  }
  
+#ifdef CONFIG_SMP
+static inline void __update_task_entity_contrib(struct sched_entity *se);
+
+/* Give new task start runnable values to heavy its load in infant time */
+void init_task_runnable_average(struct task_struct *p)
+{
+       u32 slice;
+
+       p->se.avg.decay_count = 0;
+       slice = sched_slice(task_cfs_rq(p), &p->se) >> 10;
+       p->se.avg.runnable_avg_sum = slice;
+       p->se.avg.runnable_avg_period = slice;
+       __update_task_entity_contrib(&p->se);
+}
+#else
+void init_task_runnable_average(struct task_struct *p)
+{
+}
+#endif
+
  /*
   * Update the current task's runtime statistics. Skip current tasks that
   * are not in our scheduling class.
@@ -1128,8 +1148,7 @@ static inline void update_cfs_shares(struct cfs_rq *cfs_rq)
  }
  #endif /* CONFIG_FAIR_GROUP_SCHED */
  
-/* Only depends on SMP, FAIR_GROUP_SCHED may be removed when useful in lb */
-#if defined(CONFIG_SMP) && defined(CONFIG_FAIR_GROUP_SCHED)
+#ifdef CONFIG_SMP
  /*
   * We choose a half-life close to 1 scheduling period.
   * Note: The tables below are dependent on this value.
@@ -1528,6 +1547,10 @@ static inline void enqueue_entity_load_avg(struct cfs_rq *cfs_rq,
          * We track migrations using entity decay_count <= 0, on a wake-up
          * migration we use a negative decay count to track the remote decays
          * accumulated while sleeping.
+        *
+        * Newly forked tasks are enqueued with se->avg.decay_count == 0, they
+        * are seen by enqueue_entity_load_avg() as a migration with an already
+        * constructed load_avg_contrib.
          */
         if (unlikely(se->avg.decay_count <= 0)) {
                 se->avg.last_runnable_update = rq_clock_task(rq_of(cfs_rq));
@@ -1548,7 +1571,13 @@ static inline void enqueue_entity_load_avg(struct cfs_rq *cfs_rq,
                 }
                 wakeup = 0;
         } else {
-               __synchronize_entity_decay(se);
+               /*
+                * Task re-woke on same cpu (or else migrate_task_rq_fair()
+                * would have made count negative); we must be careful to avoid
+                * double-accounting blocked time after synchronizing decays.
+                */
+               se->avg.last_runnable_update += __synchronize_entity_decay(se)
+                                                       << 20;
         }
  
         /* migrated tasks did not contribute to our blocked load */
@@ -2618,10 +2647,6 @@ static void check_cfs_rq_runtime(struct cfs_rq *cfs_rq)
         throttle_cfs_rq(cfs_rq);
  }
  
-static inline u64 default_cfs_period(void);
-static int do_sched_cfs_period_timer(struct cfs_bandwidth *cfs_b, int overrun);
-static void do_sched_cfs_slack_timer(struct cfs_bandwidth *cfs_b);
-
  static enum hrtimer_restart sched_cfs_slack_timer(struct hrtimer *timer)
  {
         struct cfs_bandwidth *cfs_b =
@@ -3434,12 +3459,6 @@ unlock:
         return new_cpu;
  }
  
-/*
- * Load-tracking only depends on SMP, FAIR_GROUP_SCHED dependency below may be
- * removed when useful for applications beyond shares distribution (e.g.
- * load-balance).
- */
-#ifdef CONFIG_FAIR_GROUP_SCHED
  /*
   * Called immediately before a task is migrated to a new cpu; task_cpu(p) and
   * cfs_rq_of(p) references at time of call are still valid and identify the
@@ -3463,7 +3482,6 @@ migrate_task_rq_fair(struct task_struct *p, int next_cpu)
                 atomic64_add(se->avg.load_avg_contrib, &cfs_rq->removed_load);
         }
  }
-#endif
  #endif /* CONFIG_SMP */
  
  static unsigned long
@@ -5865,7 +5883,7 @@ static void switched_from_fair(struct rq *rq, struct task_struct *p)
                 se->vruntime -= cfs_rq->min_vruntime;
         }
  
-#if defined(CONFIG_FAIR_GROUP_SCHED) && defined(CONFIG_SMP)
+#ifdef CONFIG_SMP
         /*
         * Remove our load from contribution when we leave sched_fair
         * and ensure we don't carry in an old decay_count if we
@@ -5924,7 +5942,7 @@ void init_cfs_rq(struct cfs_rq *cfs_rq)
  #ifndef CONFIG_64BIT
         cfs_rq->min_vruntime_copy = cfs_rq->min_vruntime;
  #endif
-#if defined(CONFIG_FAIR_GROUP_SCHED) && defined(CONFIG_SMP)
+#ifdef CONFIG_SMP
         atomic64_set(&cfs_rq->decay_counter, 1);
         atomic64_set(&cfs_rq->removed_load, 0);
  #endif
@@ -6166,9 +6184,8 @@ const struct sched_class fair_sched_class = {
  
  #ifdef CONFIG_SMP
         .select_task_rq         = select_task_rq_fair,
-#ifdef CONFIG_FAIR_GROUP_SCHED
         .migrate_task_rq        = migrate_task_rq_fair,
-#endif
+
         .rq_online              = rq_online_fair,
         .rq_offline             = rq_offline_fair,