Revert "mm: sched: numa: Delay PTE scanning until a task is scheduled on a new node"

author Mel Gorman <mgorman@suse.de>

Mon, 7 Oct 2013 10:28:53 +0000 (11:28 +0100)

committer Ingo Molnar <mingo@kernel.org>

Wed, 9 Oct 2013 10:40:17 +0000 (12:40 +0200)
author Mel Gorman <mgorman@suse.de>
Mon, 7 Oct 2013 10:28:53 +0000 (11:28 +0100)
committer Ingo Molnar <mingo@kernel.org>
Wed, 9 Oct 2013 10:40:17 +0000 (12:40 +0200)
diff --git a/include/linux/mm_types.h b/include/linux/mm_types.h

index d9851ee..b7adf1d 100644 (file)
--- a/include/linux/mm_types.h
+++ b/include/linux/mm_types.h
@@ -428,20 +428,10 @@ struct mm_struct {
  
         /* numa_scan_seq prevents two threads setting pte_numa */
         int numa_scan_seq;
-
-       /*
-        * The first node a task was scheduled on. If a task runs on
-        * a different node than Make PTE Scan Go Now.
-        */
-       int first_nid;
  #endif
         struct uprobes_state uprobes_state;
  };
  
-/* first nid will either be a valid NID or one of these values */
-#define NUMA_PTE_SCAN_INIT     -1
-#define NUMA_PTE_SCAN_ACTIVE   -2
-
  static inline void mm_init_cpumask(struct mm_struct *mm)
  {
  #ifdef CONFIG_CPUMASK_OFFSTACK
diff --git a/kernel/fork.c b/kernel/fork.c

index 086fe73..7192d91 100644 (file)
--- a/kernel/fork.c
+++ b/kernel/fork.c
@@ -816,9 +816,6 @@ struct mm_struct *dup_mm(struct task_struct *tsk)
  
  #ifdef CONFIG_TRANSPARENT_HUGEPAGE
         mm->pmd_huge_pte = NULL;
-#endif
-#ifdef CONFIG_NUMA_BALANCING
-       mm->first_nid = NUMA_PTE_SCAN_INIT;
  #endif
         if (!mm_init(mm, tsk))
                 goto fail_nomem;
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index 464207f..49b11fa 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -900,24 +900,6 @@ void task_numa_work(struct callback_head *work)
         if (p->flags & PF_EXITING)
                 return;
  
-       /*
-        * We do not care about task placement until a task runs on a node
-        * other than the first one used by the address space. This is
-        * largely because migrations are driven by what CPU the task
-        * is running on. If it's never scheduled on another node, it'll
-        * not migrate so why bother trapping the fault.
-        */
-       if (mm->first_nid == NUMA_PTE_SCAN_INIT)
-               mm->first_nid = numa_node_id();
-       if (mm->first_nid != NUMA_PTE_SCAN_ACTIVE) {
-               /* Are we running on a new node yet? */
-               if (numa_node_id() == mm->first_nid &&
-                   !sched_feat_numa(NUMA_FORCE))
-                       return;
-
-               mm->first_nid = NUMA_PTE_SCAN_ACTIVE;
-       }
-
         /*
          * Reset the scan period if enough time has gone by. Objective is that
          * scanning will be reduced if pages are properly placed. As tasks
diff --git a/kernel/sched/features.h b/kernel/sched/features.h

index 99399f8..cba5c61 100644 (file)
--- a/kernel/sched/features.h
+++ b/kernel/sched/features.h
@@ -63,10 +63,8 @@ SCHED_FEAT(LB_MIN, false)
  /*
   * Apply the automatic NUMA scheduling policy. Enabled automatically
   * at runtime if running on a NUMA machine. Can be controlled via
- * numa_balancing=. Allow PTE scanning to be forced on UMA machines
- * for debugging the core machinery.
+ * numa_balancing=
   */
  #ifdef CONFIG_NUMA_BALANCING
  SCHED_FEAT(NUMA,       false)
-SCHED_FEAT(NUMA_FORCE, false)
  #endif
author	Mel Gorman <mgorman@suse.de>
	Mon, 7 Oct 2013 10:28:53 +0000 (11:28 +0100)
committer	Ingo Molnar <mingo@kernel.org>
	Wed, 9 Oct 2013 10:40:17 +0000 (12:40 +0200)
include/linux/mm_types.h		patch | blob | history
kernel/fork.c		patch | blob | history
kernel/sched/fair.c		patch | blob | history
kernel/sched/features.h		patch | blob | history