sched/fair: Consider SD_NUMA when selecting the most idle group to schedule on

author Mel Gorman <mgorman@techsingularity.net>
Tue, 13 Feb 2018 13:37:29 +0000 (13:37 +0000)
committer Ingo Molnar <mingo@kernel.org>
Wed, 21 Feb 2018 07:49:43 +0000 (08:49 +0100)

diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c
index 302dda81e19211b53f82a6491efb5a4089eab987..94aea5b91a96a9d231c6992a3f2fb542f16867b0 100644
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -5911,6 +5911,18 @@ skip_spare:
         if (!idlest)
                 return NULL;
  
+       /*
+        * When comparing groups across NUMA domains, it's possible for the
+        * local domain to be very lightly loaded relative to the remote
+        * domains but "imbalance" skews the comparison making remote CPUs
+        * look much more favourable. When considering cross-domain, add
+        * imbalance to the runnable load on the remote node and consider
+        * staying local.
+        */
+       if ((sd->flags & SD_NUMA) &&
+           min_runnable_load + imbalance >= this_runnable_load)
+               return NULL;
+
         if (min_runnable_load > (this_runnable_load + imbalance))
                 return NULL;
author	Mel Gorman <mgorman@techsingularity.net>
	Tue, 13 Feb 2018 13:37:29 +0000 (13:37 +0000)
committer	Ingo Molnar <mingo@kernel.org>
	Wed, 21 Feb 2018 07:49:43 +0000 (08:49 +0100)