sched: bias effective_load() error towards failing wake_affine().

author Peter Zijlstra <a.p.zijlstra@chello.nl>

Fri, 27 Jun 2008 11:41:39 +0000 (13:41 +0200)

committer Ingo Molnar <mingo@elte.hu>

Fri, 27 Jun 2008 12:31:47 +0000 (14:31 +0200)
author Peter Zijlstra <a.p.zijlstra@chello.nl>
Fri, 27 Jun 2008 11:41:39 +0000 (13:41 +0200)
committer Ingo Molnar <mingo@elte.hu>
Fri, 27 Jun 2008 12:31:47 +0000 (14:31 +0200)
diff --git a/kernel/sched_fair.c b/kernel/sched_fair.c

index e87f1a52f625ce7304103d3f60e8ee1adc532079..9bcc0030a58bccb9df0555dce052dbb8f21ec8ef 100644 (file)
--- a/kernel/sched_fair.c
+++ b/kernel/sched_fair.c
@@ -1074,6 +1074,27 @@ static inline int wake_idle(int cpu, struct task_struct *p)
  static const struct sched_class fair_sched_class;
  
  #ifdef CONFIG_FAIR_GROUP_SCHED
+/*
+ * effective_load() calculates the load change as seen from the root_task_group
+ *
+ * Adding load to a group doesn't make a group heavier, but can cause movement
+ * of group shares between cpus. Assuming the shares were perfectly aligned one
+ * can calculate the shift in shares.
+ *
+ * The problem is that perfectly aligning the shares is rather expensive, hence
+ * we try to avoid doing that too often - see update_shares(), which ratelimits
+ * this change.
+ *
+ * We compensate for this by not only taking the current delta into account,
+ * but also considering the delta between when the shares were last adjusted
+ * and now.
+ *
+ * We still saw a performance dip; tracing showed that when balancing between
+ * cgroup:/ and cgroup:/foo the number of affine wakeups increased
+ * significantly. Therefore we try to bias the error in the direction of
+ * failing the affine wakeup.
+ *
+ */
  static long effective_load(struct task_group *tg, int cpu,
                 long wl, long wg)
  {
@@ -1083,6 +1104,13 @@ static long effective_load(struct task_group *tg, int cpu,
         if (!tg->parent)
                 return wl;
  
+       /*
+        * By not taking the decrease of shares on the other cpu into
+        * account our error leans towards reducing the affine wakeups.
+        */
+       if (!wl && sched_feat(ASYM_EFF_LOAD))
+               return wl;
+
         /*
          * Instead of using this increment, also add the difference
          * between when the shares were last updated and now.
diff --git a/kernel/sched_features.h b/kernel/sched_features.h

index 7d616d2a2a3fedc5b93ed2f0bfa7150f08085c32..862b06bd560aa58df2c95b0143b7331b8db113e7 100644 (file)
--- a/kernel/sched_features.h
+++ b/kernel/sched_features.h
@@ -10,3 +10,4 @@ SCHED_FEAT(DOUBLE_TICK, 0)
  SCHED_FEAT(ASYM_GRAN, 1)
  SCHED_FEAT(LB_BIAS, 0)
  SCHED_FEAT(LB_WAKEUP_UPDATE, 1)
+SCHED_FEAT(ASYM_EFF_LOAD, 1)
author	Peter Zijlstra <a.p.zijlstra@chello.nl>
	Fri, 27 Jun 2008 11:41:39 +0000 (13:41 +0200)
committer	Ingo Molnar <mingo@elte.hu>
	Fri, 27 Jun 2008 12:31:47 +0000 (14:31 +0200)
kernel/sched_fair.c		patch \| blob \| history
kernel/sched_features.h		patch \| blob \| history