mm: compaction: determine if dirty pages can be migrated without blocking within...

author Mel Gorman <mgorman@suse.de>

Fri, 13 Jan 2012 01:19:34 +0000 (17:19 -0800)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 1 Aug 2012 19:27:17 +0000 (12:27 -0700)
author Mel Gorman <mgorman@suse.de>
Fri, 13 Jan 2012 01:19:34 +0000 (17:19 -0800)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 1 Aug 2012 19:27:17 +0000 (12:27 -0700)
diff --git a/fs/btrfs/disk-io.c b/fs/btrfs/disk-io.c

index 1ac8db5dc0a31b9a742099956b121cd75ba0a1a6..522cb2a6cb10cb9ea635e9167ee9ca4926cd598f 100644 (file)
--- a/fs/btrfs/disk-io.c
+++ b/fs/btrfs/disk-io.c
@@ -801,7 +801,7 @@ static int btree_submit_bio_hook(struct inode *inode, int rw, struct bio *bio,
  
  #ifdef CONFIG_MIGRATION
  static int btree_migratepage(struct address_space *mapping,
-                       struct page *newpage, struct page *page)
+                       struct page *newpage, struct page *page, bool sync)
  {
         /*
          * we can't safely write a btree page from here,
@@ -816,7 +816,7 @@ static int btree_migratepage(struct address_space *mapping,
         if (page_has_private(page) &&
             !try_to_release_page(page, GFP_KERNEL))
                 return -EAGAIN;
-       return migrate_page(mapping, newpage, page);
+       return migrate_page(mapping, newpage, page, sync);
  }
  #endif
  
diff --git a/fs/hugetlbfs/inode.c b/fs/hugetlbfs/inode.c

index 8b0c87530b04e810fa36783564713fa149f9a822..6ca608bbc8b6182ee3779fc621b71c0cb8b3fe34 100644 (file)
--- a/fs/hugetlbfs/inode.c
+++ b/fs/hugetlbfs/inode.c
@@ -568,7 +568,8 @@ static int hugetlbfs_set_page_dirty(struct page *page)
  }
  
  static int hugetlbfs_migrate_page(struct address_space *mapping,
-                               struct page *newpage, struct page *page)
+                               struct page *newpage, struct page *page,
+                               bool sync)
  {
         int rc;
  
diff --git a/fs/nfs/internal.h b/fs/nfs/internal.h

index 2a55347a2daa85f66aa24b44d7bb7c93efe1d409..a74442ae688467a0e0121255c96d59d58192f6ef 100644 (file)
--- a/fs/nfs/internal.h
+++ b/fs/nfs/internal.h
@@ -315,7 +315,7 @@ void nfs_commit_release_pages(struct nfs_write_data *data);
  
  #ifdef CONFIG_MIGRATION
  extern int nfs_migrate_page(struct address_space *,
-               struct page *, struct page *);
+               struct page *, struct page *, bool);
  #else
  #define nfs_migrate_page NULL
  #endif
diff --git a/fs/nfs/write.c b/fs/nfs/write.c

index f2f80c005c023d4911490555a874bb872a7dad55..22a48fdee3cf2cd6da473f2ea48eac3a100705c8 100644 (file)
--- a/fs/nfs/write.c
+++ b/fs/nfs/write.c
@@ -1662,7 +1662,7 @@ out_error:
  
  #ifdef CONFIG_MIGRATION
  int nfs_migrate_page(struct address_space *mapping, struct page *newpage,
-               struct page *page)
+               struct page *page, bool sync)
  {
         /*
          * If PagePrivate is set, then the page is currently associated with
@@ -1677,7 +1677,7 @@ int nfs_migrate_page(struct address_space *mapping, struct page *newpage,
  
         nfs_fscache_release_page(page, GFP_KERNEL);
  
-       return migrate_page(mapping, newpage, page);
+       return migrate_page(mapping, newpage, page, sync);
  }
  #endif
  
diff --git a/include/linux/fs.h b/include/linux/fs.h

index 96b10354c741c01306ba608ee0cdfb4e1d71ee98..09ddec9ee5dd4cc010a40e4bb59b7a65eb5ce224 100644 (file)
--- a/include/linux/fs.h
+++ b/include/linux/fs.h
@@ -607,9 +607,12 @@ struct address_space_operations {
                         loff_t offset, unsigned long nr_segs);
         int (*get_xip_mem)(struct address_space *, pgoff_t, int,
                                                 void **, unsigned long *);
-       /* migrate the contents of a page to the specified target */
+       /*
+        * migrate the contents of a page to the specified target. If sync
+        * is false, it must not block.
+        */
         int (*migratepage) (struct address_space *,
-                       struct page *, struct page *);
+                       struct page *, struct page *, bool);
         int (*launder_page) (struct page *);
         int (*is_partially_uptodate) (struct page *, read_descriptor_t *,
                                         unsigned long);
@@ -2478,7 +2481,7 @@ extern int generic_check_addressable(unsigned, u64);
  
  #ifdef CONFIG_MIGRATION
  extern int buffer_migrate_page(struct address_space *,
-                               struct page *, struct page *);
+                               struct page *, struct page *, bool);
  #else
  #define buffer_migrate_page NULL
  #endif
diff --git a/include/linux/migrate.h b/include/linux/migrate.h

index e39aeecfe9a21666a107bf02be780bacca1ba0f5..14e6d2a884752db4d74843d6b171731e76468af9 100644 (file)
--- a/include/linux/migrate.h
+++ b/include/linux/migrate.h
@@ -11,7 +11,7 @@ typedef struct page *new_page_t(struct page *, unsigned long private, int **);
  
  extern void putback_lru_pages(struct list_head *l);
  extern int migrate_page(struct address_space *,
-                       struct page *, struct page *);
+                       struct page *, struct page *, bool);
  extern int migrate_pages(struct list_head *l, new_page_t x,
                         unsigned long private, bool offlining,
                         bool sync);
diff --git a/mm/migrate.c b/mm/migrate.c

index 33358f8781118ae9153ac4eb3e00530ca2f20e93..d43689ad8a5bcbe7e14bd8b0fe6baeefe49915fe 100644 (file)
--- a/mm/migrate.c
+++ b/mm/migrate.c
@@ -220,6 +220,55 @@ out:
         pte_unmap_unlock(ptep, ptl);
  }
  
+#ifdef CONFIG_BLOCK
+/* Returns true if all buffers are successfully locked */
+static bool buffer_migrate_lock_buffers(struct buffer_head *head, bool sync)
+{
+       struct buffer_head *bh = head;
+
+       /* Simple case, sync compaction */
+       if (sync) {
+               do {
+                       get_bh(bh);
+                       lock_buffer(bh);
+                       bh = bh->b_this_page;
+
+               } while (bh != head);
+
+               return true;
+       }
+
+       /* async case, we cannot block on lock_buffer so use trylock_buffer */
+       do {
+               get_bh(bh);
+               if (!trylock_buffer(bh)) {
+                       /*
+                        * We failed to lock the buffer and cannot stall in
+                        * async migration. Release the taken locks
+                        */
+                       struct buffer_head *failed_bh = bh;
+                       put_bh(failed_bh);
+                       bh = head;
+                       while (bh != failed_bh) {
+                               unlock_buffer(bh);
+                               put_bh(bh);
+                               bh = bh->b_this_page;
+                       }
+                       return false;
+               }
+
+               bh = bh->b_this_page;
+       } while (bh != head);
+       return true;
+}
+#else
+static inline bool buffer_migrate_lock_buffers(struct buffer_head *head,
+                                                               bool sync)
+{
+       return true;
+}
+#endif /* CONFIG_BLOCK */
+
  /*
   * Replace the page in the mapping.
   *
@@ -229,7 +278,8 @@ out:
   * 3 for pages with a mapping and PagePrivate/PagePrivate2 set.
   */
  static int migrate_page_move_mapping(struct address_space *mapping,
-               struct page *newpage, struct page *page)
+               struct page *newpage, struct page *page,
+               struct buffer_head *head, bool sync)
  {
         int expected_count;
         void **pslot;
@@ -258,6 +308,19 @@ static int migrate_page_move_mapping(struct address_space *mapping,
                 return -EAGAIN;
         }
  
+       /*
+        * In the async migration case of moving a page with buffers, lock the
+        * buffers using trylock before the mapping is moved. If the mapping
+        * was moved, we later failed to lock the buffers and could not move
+        * the mapping back due to an elevated page count, we would have to
+        * block waiting on other references to be dropped.
+        */
+       if (!sync && head && !buffer_migrate_lock_buffers(head, sync)) {
+               page_unfreeze_refs(page, expected_count);
+               spin_unlock_irq(&mapping->tree_lock);
+               return -EAGAIN;
+       }
+
         /*
          * Now we know that no one else is looking at the page.
          */
@@ -415,13 +478,13 @@ EXPORT_SYMBOL(fail_migrate_page);
   * Pages are locked upon entry and exit.
   */
  int migrate_page(struct address_space *mapping,
-               struct page *newpage, struct page *page)
+               struct page *newpage, struct page *page, bool sync)
  {
         int rc;
  
         BUG_ON(PageWriteback(page));    /* Writeback must be complete */
  
-       rc = migrate_page_move_mapping(mapping, newpage, page);
+       rc = migrate_page_move_mapping(mapping, newpage, page, NULL, sync);
  
         if (rc)
                 return rc;
@@ -438,28 +501,28 @@ EXPORT_SYMBOL(migrate_page);
   * exist.
   */
  int buffer_migrate_page(struct address_space *mapping,
-               struct page *newpage, struct page *page)
+               struct page *newpage, struct page *page, bool sync)
  {
         struct buffer_head *bh, *head;
         int rc;
  
         if (!page_has_buffers(page))
-               return migrate_page(mapping, newpage, page);
+               return migrate_page(mapping, newpage, page, sync);
  
         head = page_buffers(page);
  
-       rc = migrate_page_move_mapping(mapping, newpage, page);
+       rc = migrate_page_move_mapping(mapping, newpage, page, head, sync);
  
         if (rc)
                 return rc;
  
-       bh = head;
-       do {
-               get_bh(bh);
-               lock_buffer(bh);
-               bh = bh->b_this_page;
-
-       } while (bh != head);
+       /*
+        * In the async case, migrate_page_move_mapping locked the buffers
+        * with an IRQ-safe spinlock held. In the sync case, the buffers
+        * need to be locked now
+        */
+       if (sync)
+               BUG_ON(!buffer_migrate_lock_buffers(head, sync));
  
         ClearPagePrivate(page);
         set_page_private(newpage, page_private(page));
@@ -536,10 +599,13 @@ static int writeout(struct address_space *mapping, struct page *page)
   * Default handling if a filesystem does not provide a migration function.
   */
  static int fallback_migrate_page(struct address_space *mapping,
-       struct page *newpage, struct page *page)
+       struct page *newpage, struct page *page, bool sync)
  {
-       if (PageDirty(page))
+       if (PageDirty(page)) {
+               if (!sync)
+                       return -EBUSY;
                 return writeout(mapping, page);
+       }
  
         /*
          * Buffers may be managed in a filesystem specific way.
@@ -549,7 +615,7 @@ static int fallback_migrate_page(struct address_space *mapping,
             !try_to_release_page(page, GFP_KERNEL))
                 return -EAGAIN;
  
-       return migrate_page(mapping, newpage, page);
+       return migrate_page(mapping, newpage, page, sync);
  }
  
  /*
@@ -585,29 +651,18 @@ static int move_to_new_page(struct page *newpage, struct page *page,
  
         mapping = page_mapping(page);
         if (!mapping)
-               rc = migrate_page(mapping, newpage, page);
-       else {
+               rc = migrate_page(mapping, newpage, page, sync);
+       else if (mapping->a_ops->migratepage)
                 /*
-                * Do not writeback pages if !sync and migratepage is
-                * not pointing to migrate_page() which is nonblocking
-                * (swapcache/tmpfs uses migratepage = migrate_page).
+                * Most pages have a mapping and most filesystems provide a
+                * migratepage callback. Anonymous pages are part of swap
+                * space which also has its own migratepage callback. This
+                * is the most common path for page migration.
                  */
-               if (PageDirty(page) && !sync &&
-                   mapping->a_ops->migratepage != migrate_page)
-                       rc = -EBUSY;
-               else if (mapping->a_ops->migratepage)
-                       /*
-                        * Most pages have a mapping and most filesystems
-                        * should provide a migration function. Anonymous
-                        * pages are part of swap space which also has its
-                        * own migration function. This is the most common
-                        * path for page migration.
-                        */
-                       rc = mapping->a_ops->migratepage(mapping,
-                                                       newpage, page);
-               else
-                       rc = fallback_migrate_page(mapping, newpage, page);
-       }
+               rc = mapping->a_ops->migratepage(mapping,
+                                               newpage, page, sync);
+       else
+               rc = fallback_migrate_page(mapping, newpage, page, sync);
  
         if (rc) {
                 newpage->mapping = NULL;
author	Mel Gorman <mgorman@suse.de>
	Fri, 13 Jan 2012 01:19:34 +0000 (17:19 -0800)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 1 Aug 2012 19:27:17 +0000 (12:27 -0700)
fs/btrfs/disk-io.c		patch \| blob \| history
fs/hugetlbfs/inode.c		patch \| blob \| history
fs/nfs/internal.h		patch \| blob \| history
fs/nfs/write.c		patch \| blob \| history
include/linux/fs.h		patch \| blob \| history
include/linux/migrate.h		patch \| blob \| history
mm/migrate.c		patch \| blob \| history