mm: numa: slow PTE scan rate if migration failures occur

author Mel Gorman <mgorman@suse.de>

Wed, 25 Mar 2015 22:55:42 +0000 (15:55 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Wed, 25 Mar 2015 23:20:31 +0000 (16:20 -0700)
author Mel Gorman <mgorman@suse.de>
Wed, 25 Mar 2015 22:55:42 +0000 (15:55 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Wed, 25 Mar 2015 23:20:31 +0000 (16:20 -0700)
diff --git a/include/linux/sched.h b/include/linux/sched.h

index 6d77432e14ff971bffd4ca211dccb917768b2c8c..a419b65770d669c3a51c88a86a145abbcd3db339 100644 (file)
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -1625,11 +1625,11 @@ struct task_struct {
  
         /*
          * numa_faults_locality tracks if faults recorded during the last
-        * scan window were remote/local. The task scan period is adapted
-        * based on the locality of the faults with different weights
-        * depending on whether they were shared or private faults
+        * scan window were remote/local or failed to migrate. The task scan
+        * period is adapted based on the locality of the faults with different
+        * weights depending on whether they were shared or private faults
          */
-       unsigned long numa_faults_locality[2];
+       unsigned long numa_faults_locality[3];
  
         unsigned long numa_pages_migrated;
  #endif /* CONFIG_NUMA_BALANCING */
@@ -1719,6 +1719,7 @@ struct task_struct {
  #define TNF_NO_GROUP   0x02
  #define TNF_SHARED     0x04
  #define TNF_FAULT_LOCAL        0x08
+#define TNF_MIGRATE_FAIL 0x10
  
  #ifdef CONFIG_NUMA_BALANCING
  extern void task_numa_fault(int last_node, int node, int pages, int flags);
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index 7ce18f3c097ac4779eb4cf6ed0ad14ac1beb3eb5..bcfe32088b3768363c2f37502a953b61a361f7ff 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -1609,9 +1609,11 @@ static void update_task_scan_period(struct task_struct *p,
         /*
          * If there were no record hinting faults then either the task is
          * completely idle or all activity is areas that are not of interest
-        * to automatic numa balancing. Scan slower
+        * to automatic numa balancing. Related to that, if there were failed
+        * migration then it implies we are migrating too quickly or the local
+        * node is overloaded. In either case, scan slower
          */
-       if (local + shared == 0) {
+       if (local + shared == 0 || p->numa_faults_locality[2]) {
                 p->numa_scan_period = min(p->numa_scan_period_max,
                         p->numa_scan_period << 1);
  
@@ -2080,6 +2082,8 @@ void task_numa_fault(int last_cpupid, int mem_node, int pages, int flags)
  
         if (migrated)
                 p->numa_pages_migrated += pages;
+       if (flags & TNF_MIGRATE_FAIL)
+               p->numa_faults_locality[2] += pages;
  
         p->numa_faults[task_faults_idx(NUMA_MEMBUF, mem_node, priv)] += pages;
         p->numa_faults[task_faults_idx(NUMA_CPUBUF, cpu_node, priv)] += pages;
diff --git a/mm/huge_memory.c b/mm/huge_memory.c

index 0a42d1521aa43a0d44e564a2bb0554ec43180bcb..51b3e7c64622a6042cf0fb9828639826871b546b 100644 (file)
--- a/mm/huge_memory.c
+++ b/mm/huge_memory.c
@@ -1350,7 +1350,8 @@ int do_huge_pmd_numa_page(struct mm_struct *mm, struct vm_area_struct *vma,
         if (migrated) {
                 flags |= TNF_MIGRATED;
                 page_nid = target_nid;
-       }
+       } else
+               flags |= TNF_MIGRATE_FAIL;
  
         goto out;
  clear_pmdnuma:
diff --git a/mm/memory.c b/mm/memory.c

index d20e12da3a3cb29bf7fc6bffa2de9fbe89f22e4f..97839f5c8c303df324a1cec1dfacadb1b0bfa04c 100644 (file)
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -3103,7 +3103,8 @@ static int do_numa_page(struct mm_struct *mm, struct vm_area_struct *vma,
         if (migrated) {
                 page_nid = target_nid;
                 flags |= TNF_MIGRATED;
-       }
+       } else
+               flags |= TNF_MIGRATE_FAIL;
  
  out:
         if (page_nid != -1)
author	Mel Gorman <mgorman@suse.de>
	Wed, 25 Mar 2015 22:55:42 +0000 (15:55 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Wed, 25 Mar 2015 23:20:31 +0000 (16:20 -0700)
include/linux/sched.h		patch | blob | history
kernel/sched/fair.c		patch | blob | history
mm/huge_memory.c		patch | blob | history
mm/memory.c		patch | blob | history