diff --git a/mm/swap.c b/mm/swap.c
index 31b844d..dfb48cf 100644
--- a/mm/swap.c
+++ b/mm/swap.c
@@ -36,6 +36,7 @@
 #include <linux/hugetlb.h>
 #include <linux/page_idle.h>
 #include <linux/local_lock.h>
+#include <linux/buffer_head.h>
 
 #include "internal.h"
 
@@ -235,6 +236,18 @@ static void pagevec_move_tail_fn(struct page *page, struct lruvec *lruvec)
        }
 }
 
+/* return true if the pagevec needs to be drained */
+static bool pagevec_add_and_need_flush(struct pagevec *pvec, struct page *page)
+{
+       bool ret = false;
+
+       if (!pagevec_add(pvec, page) || PageCompound(page) ||
+                       lru_cache_disabled())
+               ret = true;
+
+       return ret;
+}
+
 /*
  * Writeback is about to end against a page which has been marked for immediate
  * reclaim.  If it still appears to be reclaimable, move it to the tail of the
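
The drain decision now also depends on lru_cache_disabled(), which this hunk only calls. It is presumably provided as a small inline next to the lru_disable_count counter introduced further down, likely in include/linux/swap.h; a minimal sketch under that assumption:

/*
 * Sketch only: assumed counterpart in include/linux/swap.h, not part of
 * this file. A non-zero lru_disable_count means some caller currently has
 * the LRU pagevecs disabled, so new pages must bypass the per-CPU batches.
 */
extern atomic_t lru_disable_count;

static inline bool lru_cache_disabled(void)
{
	return atomic_read(&lru_disable_count);
}
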
@@ -252,7 +265,7 @@ void rotate_reclaimable_page(struct page *page)
                get_page(page);
                local_lock_irqsave(&lru_rotate.lock, flags);
                pvec = this_cpu_ptr(&lru_rotate.pvec);
-               if (!pagevec_add(pvec, page) || PageCompound(page))
+               if (pagevec_add_and_need_flush(pvec, page))
                        pagevec_lru_move_fn(pvec, pagevec_move_tail_fn);
                local_unlock_irqrestore(&lru_rotate.lock, flags);
        }
@@ -343,7 +356,7 @@ static void activate_page(struct page *page)
                local_lock(&lru_pvecs.lock);
                pvec = this_cpu_ptr(&lru_pvecs.activate_page);
                get_page(page);
-               if (!pagevec_add(pvec, page) || PageCompound(page))
+               if (pagevec_add_and_need_flush(pvec, page))
                        pagevec_lru_move_fn(pvec, __activate_page);
                local_unlock(&lru_pvecs.lock);
        }
@@ -458,7 +471,7 @@ void lru_cache_add(struct page *page)
        get_page(page);
        local_lock(&lru_pvecs.lock);
        pvec = this_cpu_ptr(&lru_pvecs.lru_add);
-       if (!pagevec_add(pvec, page) || PageCompound(page))
+       if (pagevec_add_and_need_flush(pvec, page))
                __pagevec_lru_add(pvec);
        local_unlock(&lru_pvecs.lock);
 }
@@ -483,7 +496,7 @@ void lru_cache_add_inactive_or_unevictable(struct page *page,
        if (unlikely(unevictable) && !TestSetPageMlocked(page)) {
                int nr_pages = thp_nr_pages(page);
                /*
-                * We use the irq-unsafe __mod_zone_page_stat because this
+                * We use the irq-unsafe __mod_zone_page_state because this
                 * counter is not modified from interrupt context, and the pte
                 * lock is held(spinlock), which implies preemption disabled.
                 */
@@ -629,6 +642,7 @@ void lru_add_drain_cpu(int cpu)
                pagevec_lru_move_fn(pvec, lru_lazyfree_fn);
 
        activate_page_drain(cpu);
+       invalidate_bh_lrus_cpu(cpu);
 }
 
 /**
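
The per-CPU drain now also flushes the buffer_head LRU, which is why <linux/buffer_head.h> is added at the top of the file. invalidate_bh_lrus_cpu() itself belongs to the companion fs/buffer.c change rather than to this diff; a rough sketch of the expected shape, reusing the existing bh_lrus machinery:

/*
 * Sketch only: assumed shape of the companion fs/buffer.c helper; not part
 * of this diff. Drops every buffer_head cached in the given CPU's bh_lru.
 */
void invalidate_bh_lrus_cpu(int cpu)
{
	struct bh_lru *b;

	bh_lru_lock();
	b = per_cpu_ptr(&bh_lrus, cpu);
	__invalidate_bh_lrus(b);
	bh_lru_unlock();
}
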
@@ -654,7 +668,7 @@ void deactivate_file_page(struct page *page)
                local_lock(&lru_pvecs.lock);
                pvec = this_cpu_ptr(&lru_pvecs.lru_deactivate_file);
 
-               if (!pagevec_add(pvec, page) || PageCompound(page))
+               if (pagevec_add_and_need_flush(pvec, page))
                        pagevec_lru_move_fn(pvec, lru_deactivate_file_fn);
                local_unlock(&lru_pvecs.lock);
        }
@@ -676,7 +690,7 @@ void deactivate_page(struct page *page)
                local_lock(&lru_pvecs.lock);
                pvec = this_cpu_ptr(&lru_pvecs.lru_deactivate);
                get_page(page);
-               if (!pagevec_add(pvec, page) || PageCompound(page))
+               if (pagevec_add_and_need_flush(pvec, page))
                        pagevec_lru_move_fn(pvec, lru_deactivate_fn);
                local_unlock(&lru_pvecs.lock);
        }
@@ -698,7 +712,7 @@ void mark_page_lazyfree(struct page *page)
                local_lock(&lru_pvecs.lock);
                pvec = this_cpu_ptr(&lru_pvecs.lru_lazyfree);
                get_page(page);
-               if (!pagevec_add(pvec, page) || PageCompound(page))
+               if (pagevec_add_and_need_flush(pvec, page))
                        pagevec_lru_move_fn(pvec, lru_lazyfree_fn);
                local_unlock(&lru_pvecs.lock);
        }
@@ -735,7 +749,7 @@ static void lru_add_drain_per_cpu(struct work_struct *dummy)
  * Calling this function with cpu hotplug locks held can actually lead
  * to obscure indirect dependencies via WQ context.
  */
-void lru_add_drain_all(void)
+inline void __lru_add_drain_all(bool force_all_cpus)
 {
        /*
         * lru_drain_gen - Global pages generation number
@@ -780,7 +794,7 @@ void lru_add_drain_all(void)
         * (C) Exit the draining operation if a newer generation, from another
         * lru_add_drain_all(), was already scheduled for draining. Check (A).
         */
-       if (unlikely(this_gen != lru_drain_gen))
+       if (unlikely(this_gen != lru_drain_gen && !force_all_cpus))
                goto done;
 
        /*
@@ -794,7 +808,7 @@ void lru_add_drain_all(void)
         * below which drains the page vectors.
         *
         * Let x, y, and z represent some system CPU numbers, where x < y < z.
-        * Assume CPU #z is is in the middle of the for_each_online_cpu loop
+        * Assume CPU #z is in the middle of the for_each_online_cpu loop
         * below and has already reached CPU #y's per-cpu data. CPU #x comes
         * along, adds some pages to its per-cpu vectors, then calls
         * lru_add_drain_all().
@@ -810,12 +824,14 @@ void lru_add_drain_all(void)
        for_each_online_cpu(cpu) {
                struct work_struct *work = &per_cpu(lru_add_drain_work, cpu);
 
-               if (pagevec_count(&per_cpu(lru_pvecs.lru_add, cpu)) ||
+               if (force_all_cpus ||
+                   pagevec_count(&per_cpu(lru_pvecs.lru_add, cpu)) ||
                    data_race(pagevec_count(&per_cpu(lru_rotate.pvec, cpu))) ||
                    pagevec_count(&per_cpu(lru_pvecs.lru_deactivate_file, cpu)) ||
                    pagevec_count(&per_cpu(lru_pvecs.lru_deactivate, cpu)) ||
                    pagevec_count(&per_cpu(lru_pvecs.lru_lazyfree, cpu)) ||
-                   need_activate_page_drain(cpu)) {
+                   need_activate_page_drain(cpu) ||
+                   has_bh_in_lru(cpu, NULL)) {
                        INIT_WORK(work, lru_add_drain_per_cpu);
                        queue_work_on(cpu, mm_percpu_wq, work);
                        __cpumask_set_cpu(cpu, &has_work);
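
The extra has_bh_in_lru(cpu, NULL) test avoids queueing drain work on CPUs whose buffer_head LRU is already empty. Like invalidate_bh_lrus_cpu(), it is assumed to live in fs/buffer.c; a plausible sketch that simply scans the per-CPU bh_lrus slots:

/*
 * Sketch only: assumed fs/buffer.c helper matching the call site above.
 * Reports whether this CPU's buffer_head LRU holds anything worth draining.
 */
bool has_bh_in_lru(int cpu, void *dummy)
{
	struct bh_lru *b = per_cpu_ptr(&bh_lrus, cpu);
	int i;

	for (i = 0; i < BH_LRU_SIZE; i++) {
		if (b->bhs[i])
			return true;
	}

	return false;
}
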
@@ -828,6 +844,11 @@ void lru_add_drain_all(void)
 done:
        mutex_unlock(&lock);
 }
+
+void lru_add_drain_all(void)
+{
+       __lru_add_drain_all(false);
+}
 #else
 void lru_add_drain_all(void)
 {
@@ -835,6 +856,34 @@ void lru_add_drain_all(void)
 }
 #endif /* CONFIG_SMP */
 
+atomic_t lru_disable_count = ATOMIC_INIT(0);
+
+/*
+ * lru_cache_disable() needs to be called before we start compiling
+ * a list of pages to be migrated using isolate_lru_page().
+ * It drains pages on the LRU cache and then disables it on all CPUs
+ * until lru_cache_enable() is called.
+ *
+ * Must be paired with a call to lru_cache_enable().
+ */
+void lru_cache_disable(void)
+{
+       atomic_inc(&lru_disable_count);
+#ifdef CONFIG_SMP
+       /*
+        * lru_add_drain_all in the force mode will schedule draining on
+        * all online CPUs so any calls to lru_cache_disabled() wrapped by
+        * local_lock or preemption disabled would be ordered by that.
+        * The atomic operation doesn't need to have stronger ordering
+        * requirements because that is enforced by the scheduling
+        * guarantees.
+        */
+       __lru_add_drain_all(true);
+#else
+       lru_add_drain();
+#endif
+}
+
 /**
  * release_pages - batched put_page()
  * @pages: array of pages to release
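
lru_cache_disable() above must be paired with lru_cache_enable(), which is not shown in this file; presumably it just drops lru_disable_count again, likely as an inline in include/linux/swap.h. Below is a hedged sketch of that counterpart plus a hypothetical caller, example_migrate_range(), illustrating how migration code would bracket its isolate_lru_page() loop:

/*
 * Sketch only: assumed include/linux/swap.h counterpart that re-enables the
 * per-CPU pagevecs once the caller is done isolating pages.
 */
static inline void lru_cache_enable(void)
{
	atomic_dec(&lru_disable_count);
}

/*
 * Hypothetical caller (illustration only): keep pages off the per-CPU
 * pagevecs while a migration list is built with isolate_lru_page(), so a
 * page sitting in a remote CPU's pagevec cannot dodge isolation.
 */
static void example_migrate_range(void)
{
	lru_cache_disable();
	/* ... isolate_lru_page() each page, then migrate_pages() ... */
	lru_cache_enable();
}
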