]> git.baikalelectronics.ru Git - kernel.git/commitdiff
mm/hugetlb: grab head page refcount once for group of subpages
authorJoao Martins <joao.m.martins@oracle.com>
Wed, 24 Feb 2021 20:07:12 +0000 (12:07 -0800)
committerLinus Torvalds <torvalds@linux-foundation.org>
Wed, 24 Feb 2021 21:38:32 +0000 (13:38 -0800)
Patch series "mm/hugetlb: follow_hugetlb_page() improvements", v2.

While looking at ZONE_DEVICE struct page reuse particularly the last
patch[0], I found two possible improvements for follow_hugetlb_page()
which is solely used for get_user_pages()/pin_user_pages().

The first patch batches page refcount updates while the second tidies up
storing the subpages/vmas.  Both together bring the cost of slow variant
of gup() cost from ~87.6k usecs to ~5.8k usecs.

libhugetlbfs tests seem to pass as well gup_test benchmarks with hugetlbfs
vmas.

This patch (of 2):

follow_hugetlb_page() once it locks the pmd/pud, checks all its N subpages
in a huge page and grabs a reference for each one.  Similar to gup-fast,
have follow_hugetlb_page() grab the head page refcount only after counting
all its subpages that are part of the just faulted huge page.

Consequently we reduce the number of atomics necessary to pin said huge
page, which improves non-fast gup() considerably:

  - 16G with 1G huge page size
  gup_test -f /mnt/huge/file -m 16384 -r 10 -L -S -n 512 -w

PIN_LONGTERM_BENCHMARK: ~87.6k us -> ~12.8k us

Link: https://lkml.kernel.org/r/20210128182632.24562-1-joao.m.martins@oracle.com
Link: https://lkml.kernel.org/r/20210128182632.24562-2-joao.m.martins@oracle.com
Signed-off-by: Joao Martins <joao.m.martins@oracle.com>
Reviewed-by: Mike Kravetz <mike.kravetz@oracle.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
include/linux/mm.h
mm/gup.c
mm/hugetlb.c

index 76cab132c2954ee0700594397aaa2f03714ae162..77e64e3eac80bd756021c8d8a158b4faae694dcf 100644 (file)
@@ -1187,6 +1187,9 @@ static inline void get_page(struct page *page)
 }
 
 bool __must_check try_grab_page(struct page *page, unsigned int flags);
+__maybe_unused struct page *try_grab_compound_head(struct page *page, int refs,
+                                                  unsigned int flags);
+
 
 static inline __must_check bool try_get_page(struct page *page)
 {
index e4c224cd9661f9c4d1d8372a37a19684cca3e3d0..e40579624f107811b3755851c3d9d66cc35dcc4d 100644 (file)
--- a/mm/gup.c
+++ b/mm/gup.c
@@ -78,9 +78,8 @@ static inline struct page *try_get_compound_head(struct page *page, int refs)
  * considered failure, and furthermore, a likely bug in the caller, so a warning
  * is also emitted.
  */
-static __maybe_unused struct page *try_grab_compound_head(struct page *page,
-                                                         int refs,
-                                                         unsigned int flags)
+__maybe_unused struct page *try_grab_compound_head(struct page *page,
+                                                  int refs, unsigned int flags)
 {
        if (flags & FOLL_GET)
                return try_get_compound_head(page, refs);
index 6920c71d7e0de6d4d982f20058b367776da42919..d4fc5db6bc3224814db47ff4e39c723b1966f37c 100644 (file)
@@ -4796,7 +4796,7 @@ long follow_hugetlb_page(struct mm_struct *mm, struct vm_area_struct *vma,
        unsigned long vaddr = *position;
        unsigned long remainder = *nr_pages;
        struct hstate *h = hstate_vma(vma);
-       int err = -EFAULT;
+       int err = -EFAULT, refs;
 
        while (vaddr < vma->vm_end && remainder) {
                pte_t *pte;
@@ -4916,26 +4916,11 @@ long follow_hugetlb_page(struct mm_struct *mm, struct vm_area_struct *vma,
                        continue;
                }
 
+               refs = 0;
+
 same_page:
-               if (pages) {
+               if (pages)
                        pages[i] = mem_map_offset(page, pfn_offset);
-                       /*
-                        * try_grab_page() should always succeed here, because:
-                        * a) we hold the ptl lock, and b) we've just checked
-                        * that the huge page is present in the page tables. If
-                        * the huge page is present, then the tail pages must
-                        * also be present. The ptl prevents the head page and
-                        * tail pages from being rearranged in any way. So this
-                        * page must be available at this point, unless the page
-                        * refcount overflowed:
-                        */
-                       if (WARN_ON_ONCE(!try_grab_page(pages[i], flags))) {
-                               spin_unlock(ptl);
-                               remainder = 0;
-                               err = -ENOMEM;
-                               break;
-                       }
-               }
 
                if (vmas)
                        vmas[i] = vma;
@@ -4944,6 +4929,7 @@ same_page:
                ++pfn_offset;
                --remainder;
                ++i;
+               ++refs;
                if (vaddr < vma->vm_end && remainder &&
                                pfn_offset < pages_per_huge_page(h)) {
                        /*
@@ -4951,6 +4937,25 @@ same_page:
                         * of this compound page.
                         */
                        goto same_page;
+               } else if (pages) {
+                       /*
+                        * try_grab_compound_head() should always succeed here,
+                        * because: a) we hold the ptl lock, and b) we've just
+                        * checked that the huge page is present in the page
+                        * tables. If the huge page is present, then the tail
+                        * pages must also be present. The ptl prevents the
+                        * head page and tail pages from being rearranged in
+                        * any way. So this page must be available at this
+                        * point, unless the page refcount overflowed:
+                        */
+                       if (WARN_ON_ONCE(!try_grab_compound_head(pages[i-1],
+                                                                refs,
+                                                                flags))) {
+                               spin_unlock(ptl);
+                               remainder = 0;
+                               err = -ENOMEM;
+                               break;
+                       }
                }
                spin_unlock(ptl);
        }