sched/numa: Retry migration of tasks to CPU on a preferred node

author Mel Gorman <mgorman@suse.de>

Mon, 7 Oct 2013 10:29:11 +0000 (11:29 +0100)

committer Ingo Molnar <mingo@kernel.org>

Wed, 9 Oct 2013 10:40:40 +0000 (12:40 +0200)
author Mel Gorman <mgorman@suse.de>
Mon, 7 Oct 2013 10:29:11 +0000 (11:29 +0100)
committer Ingo Molnar <mingo@kernel.org>
Wed, 9 Oct 2013 10:40:40 +0000 (12:40 +0200)
diff --git a/include/linux/sched.h b/include/linux/sched.h

index d946195eec105a388fe07e096ed16086e41e39b5..14251a8ff2ea379702648eb1476236c3d114965b 100644 (file)
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -1341,6 +1341,7 @@ struct task_struct {
         int numa_migrate_seq;
         unsigned int numa_scan_period;
         unsigned int numa_scan_period_max;
+       unsigned long numa_migrate_retry;
         u64 node_stamp;                 /* migration stamp  */
         struct callback_head numa_work;
  
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index 51a7600811931ad0a0d9cb58fabf80b41b8a5271..f84ac3fb581bd6d847c7dac34ae7e6d3a7a029e5 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -1011,6 +1011,23 @@ migrate:
         return migrate_task_to(p, env.best_cpu);
  }
  
+/* Attempt to migrate a task to a CPU on the preferred node. */
+static void numa_migrate_preferred(struct task_struct *p)
+{
+       /* Success if task is already running on preferred CPU */
+       p->numa_migrate_retry = 0;
+       if (cpu_to_node(task_cpu(p)) == p->numa_preferred_nid)
+               return;
+
+       /* This task has no NUMA fault statistics yet */
+       if (unlikely(p->numa_preferred_nid == -1))
+               return;
+
+       /* Otherwise, try migrate to a CPU on the preferred node */
+       if (task_numa_migrate(p) != 0)
+               p->numa_migrate_retry = jiffies + HZ*5;
+}
+
  static void task_numa_placement(struct task_struct *p)
  {
         int seq, nid, max_nid = -1;
@@ -1045,17 +1062,12 @@ static void task_numa_placement(struct task_struct *p)
                 }
         }
  
-       /*
-        * Record the preferred node as the node with the most faults,
-        * requeue the task to be running on the idlest CPU on the
-        * preferred node and reset the scanning rate to recheck
-        * the working set placement.
-        */
+       /* Preferred node as the node with the most faults */
         if (max_faults && max_nid != p->numa_preferred_nid) {
                 /* Update the preferred nid and migrate task if possible */
                 p->numa_preferred_nid = max_nid;
                 p->numa_migrate_seq = 1;
-               task_numa_migrate(p);
+               numa_migrate_preferred(p);
         }
  }
  
@@ -1111,6 +1123,10 @@ void task_numa_fault(int last_nidpid, int node, int pages, bool migrated)
  
         task_numa_placement(p);
  
+       /* Retry task to preferred node migration if it previously failed */
+       if (p->numa_migrate_retry && time_after(jiffies, p->numa_migrate_retry))
+               numa_migrate_preferred(p);
+
         p->numa_faults_buffer[task_faults_idx(node, priv)] += pages;
  }
author	Mel Gorman <mgorman@suse.de>
	Mon, 7 Oct 2013 10:29:11 +0000 (11:29 +0100)
committer	Ingo Molnar <mingo@kernel.org>
	Wed, 9 Oct 2013 10:40:40 +0000 (12:40 +0200)
include/linux/sched.h		patch \| blob \| blame \| history
kernel/sched/fair.c		patch \| blob \| blame \| history