net: fix sk_page_frag() recursion from memory reclaim

author Tejun Heo <tj@kernel.org>

Thu, 24 Oct 2019 20:50:27 +0000 (13:50 -0700)

committer David S. Miller <davem@davemloft.net>

Mon, 28 Oct 2019 23:17:31 +0000 (16:17 -0700)
author Tejun Heo <tj@kernel.org>
Thu, 24 Oct 2019 20:50:27 +0000 (13:50 -0700)
committer David S. Miller <davem@davemloft.net>
Mon, 28 Oct 2019 23:17:31 +0000 (16:17 -0700)
diff --git a/include/linux/gfp.h b/include/linux/gfp.h

index fb07b503dc453ddfe16c5f0f959d46be01ad55ba..61f2f6ff94673b0a74d2d7705d87373bfba74fe5 100644 (file)
--- a/include/linux/gfp.h
+++ b/include/linux/gfp.h
@@ -325,6 +325,29 @@ static inline bool gfpflags_allow_blocking(const gfp_t gfp_flags)
         return !!(gfp_flags & __GFP_DIRECT_RECLAIM);
  }
  
+/**
+ * gfpflags_normal_context - is gfp_flags a normal sleepable context?
+ * @gfp_flags: gfp_flags to test
+ *
+ * Test whether @gfp_flags indicates that the allocation is from the
+ * %current context and allowed to sleep.
+ *
+ * An allocation being allowed to block doesn't mean it owns the %current
+ * context.  When the direct reclaim path tries to allocate memory, the
+ * allocation context is nested inside whatever %current was doing at the
+ * time of the original allocation.  The nested allocation may be allowed
+ * to block but modifying anything %current owns can corrupt the outer
+ * context's expectations.
+ *
+ * A %true result from this function indicates that the allocation context
+ * can sleep and use anything that's associated with %current.
+ */
+static inline bool gfpflags_normal_context(const gfp_t gfp_flags)
+{
+       return (gfp_flags & (__GFP_DIRECT_RECLAIM | __GFP_MEMALLOC)) ==
+               __GFP_DIRECT_RECLAIM;
+}
+
  #ifdef CONFIG_HIGHMEM
  #define OPT_ZONE_HIGHMEM ZONE_HIGHMEM
  #else
diff --git a/include/net/sock.h b/include/net/sock.h

index f69b58bff7e5c69537444d99d68db5afc3abfa27..c31a9ed86d5a58be7f1ca9933c48c40f12d0e57f 100644 (file)
--- a/include/net/sock.h
+++ b/include/net/sock.h
@@ -2242,12 +2242,17 @@ struct sk_buff *sk_stream_alloc_skb(struct sock *sk, int size, gfp_t gfp,
   * sk_page_frag - return an appropriate page_frag
   * @sk: socket
   *
- * If socket allocation mode allows current thread to sleep, it means its
- * safe to use the per task page_frag instead of the per socket one.
+ * Use the per task page_frag instead of the per socket one for
+ * optimization when we know that we're in the normal context and own
+ * everything that's associated with %current.
+ *
+ * gfpflags_allow_blocking() isn't enough here as direct reclaim may nest
+ * inside other socket operations and end up recursing into sk_page_frag()
+ * while it's already in use.
   */
  static inline struct page_frag *sk_page_frag(struct sock *sk)
  {
-       if (gfpflags_allow_blocking(sk->sk_allocation))
+       if (gfpflags_normal_context(sk->sk_allocation))
                 return &current->task_frag;
  
         return &sk->sk_frag;
author	Tejun Heo <tj@kernel.org>
	Thu, 24 Oct 2019 20:50:27 +0000 (13:50 -0700)
committer	David S. Miller <davem@davemloft.net>
	Mon, 28 Oct 2019 23:17:31 +0000 (16:17 -0700)
include/linux/gfp.h		patch \| blob \| history
include/net/sock.h		patch \| blob \| history