swap: cull unevictable pages in fault path

author Lee Schermerhorn <lee.schermerhorn@hp.com>

Sun, 19 Oct 2008 03:26:52 +0000 (20:26 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Mon, 20 Oct 2008 15:52:31 +0000 (08:52 -0700)
author Lee Schermerhorn <lee.schermerhorn@hp.com>
Sun, 19 Oct 2008 03:26:52 +0000 (20:26 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Mon, 20 Oct 2008 15:52:31 +0000 (08:52 -0700)
diff --git a/include/linux/swap.h b/include/linux/swap.h

index 7edb4cbc29f9f51f2aaa2cb93d68b1088fc45bf1..07eda69412fbe56e00583be0dc41d037f29000d8 100644 (file)
--- a/include/linux/swap.h
+++ b/include/linux/swap.h
@@ -173,6 +173,8 @@ extern unsigned int nr_free_pagecache_pages(void);
  /* linux/mm/swap.c */
  extern void __lru_cache_add(struct page *, enum lru_list lru);
  extern void lru_cache_add_lru(struct page *, enum lru_list lru);
+extern void lru_cache_add_active_or_unevictable(struct page *,
+                                       struct vm_area_struct *);
  extern void activate_page(struct page *);
  extern void mark_page_accessed(struct page *);
  extern void lru_add_drain(void);
diff --git a/mm/memory.c b/mm/memory.c

index 9fef7272fb9e81324959efeea12e7b74c6ce6262..450127f4c5820a30e694cbd9763aa353a50774a7 100644 (file)
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -1922,12 +1922,13 @@ gotten:
                  * thread doing COW.
                  */
                 ptep_clear_flush_notify(vma, address, page_table);
-               set_pte_at(mm, address, page_table, entry);
-               update_mmu_cache(vma, address, entry);
                 SetPageSwapBacked(new_page);
-               lru_cache_add_active_anon(new_page);
+               lru_cache_add_active_or_unevictable(new_page, vma);
                 page_add_new_anon_rmap(new_page, vma, address);
  
+//TODO:  is this safe?  do_anonymous_page() does it this way.
+               set_pte_at(mm, address, page_table, entry);
+               update_mmu_cache(vma, address, entry);
                 if (old_page) {
                         /*
                          * Only after switching the pte to the new page may
@@ -2420,7 +2421,7 @@ static int do_anonymous_page(struct mm_struct *mm, struct vm_area_struct *vma,
                 goto release;
         inc_mm_counter(mm, anon_rss);
         SetPageSwapBacked(page);
-       lru_cache_add_active_anon(page);
+       lru_cache_add_active_or_unevictable(page, vma);
         page_add_new_anon_rmap(page, vma, address);
         set_pte_at(mm, address, page_table, entry);
  
@@ -2564,12 +2565,11 @@ static int __do_fault(struct mm_struct *mm, struct vm_area_struct *vma,
                 entry = mk_pte(page, vma->vm_page_prot);
                 if (flags & FAULT_FLAG_WRITE)
                         entry = maybe_mkwrite(pte_mkdirty(entry), vma);
-               set_pte_at(mm, address, page_table, entry);
                 if (anon) {
-                        inc_mm_counter(mm, anon_rss);
+                       inc_mm_counter(mm, anon_rss);
                         SetPageSwapBacked(page);
-                        lru_cache_add_active_anon(page);
-                        page_add_new_anon_rmap(page, vma, address);
+                       lru_cache_add_active_or_unevictable(page, vma);
+                       page_add_new_anon_rmap(page, vma, address);
                 } else {
                         inc_mm_counter(mm, file_rss);
                         page_add_file_rmap(page);
@@ -2578,6 +2578,8 @@ static int __do_fault(struct mm_struct *mm, struct vm_area_struct *vma,
                                 get_page(dirty_page);
                         }
                 }
+//TODO:  is this safe?  do_anonymous_page() does it this way.
+               set_pte_at(mm, address, page_table, entry);
  
                 /* no need to invalidate: a not-present page won't be cached */
                 update_mmu_cache(vma, address, entry);
diff --git a/mm/swap.c b/mm/swap.c

index bc58c1369dd6def1add1d55b0b53a605c6308e27..2152e48a7b8f0726f06a88c516d82a0becf3c19d 100644 (file)
--- a/mm/swap.c
+++ b/mm/swap.c
@@ -31,6 +31,8 @@
  #include <linux/backing-dev.h>
  #include <linux/memcontrol.h>
  
+#include "internal.h"
+
  /* How many pages do we try to swap or page in/out together? */
  int page_cluster;
  
@@ -244,6 +246,25 @@ void add_page_to_unevictable_list(struct page *page)
         spin_unlock_irq(&zone->lru_lock);
  }
  
+/**
+ * lru_cache_add_active_or_unevictable
+ * @page:  the page to be added to LRU
+ * @vma:   vma in which page is mapped for determining reclaimability
+ *
+ * Place @page on active or unevictable LRU list, depending on
+ * page_evictable().  Note that if the page is not evictable,
+ * it goes directly back onto its zone's unevictable list.  It does
+ * NOT use a per cpu pagevec.
+ */
+void lru_cache_add_active_or_unevictable(struct page *page,
+                                       struct vm_area_struct *vma)
+{
+       if (page_evictable(page, vma))
+               lru_cache_add_lru(page, LRU_ACTIVE + page_is_file_cache(page));
+       else
+               add_page_to_unevictable_list(page);
+}
+
  /*
   * Drain pages out of the cpu's pagevecs.
   * Either "cpu" is the current CPU, and preemption has already been
author	Lee Schermerhorn <lee.schermerhorn@hp.com>
	Sun, 19 Oct 2008 03:26:52 +0000 (20:26 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Mon, 20 Oct 2008 15:52:31 +0000 (08:52 -0700)
include/linux/swap.h		patch \| blob \| history
mm/memory.c		patch \| blob \| history
mm/swap.c		patch \| blob \| history