KVM: x86/mmu: Zap only the target TDP MMU shadow page in NX recovery

author Sean Christopherson <seanjc@google.com>

Sat, 26 Feb 2022 00:15:31 +0000 (00:15 +0000)

committer Paolo Bonzini <pbonzini@redhat.com>

Tue, 8 Mar 2022 14:31:54 +0000 (09:31 -0500)
author Sean Christopherson <seanjc@google.com>
Sat, 26 Feb 2022 00:15:31 +0000 (00:15 +0000)
committer Paolo Bonzini <pbonzini@redhat.com>
Tue, 8 Mar 2022 14:31:54 +0000 (09:31 -0500)
diff --git a/arch/x86/kvm/mmu/mmu_internal.h b/arch/x86/kvm/mmu/mmu_internal.h

index da6166b5c37704f5c254839f923f52048445766f..be063b6c91b7d517c2b0f7241c6eb59be5db1ffb 100644 (file)
--- a/arch/x86/kvm/mmu/mmu_internal.h
+++ b/arch/x86/kvm/mmu/mmu_internal.h
@@ -30,6 +30,8 @@ extern bool dbg;
  #define INVALID_PAE_ROOT       0
  #define IS_VALID_PAE_ROOT(x)   (!!(x))
  
+typedef u64 __rcu *tdp_ptep_t;
+
  struct kvm_mmu_page {
         /*
          * Note, "link" through "spt" fit in a single 64 byte cache line on
@@ -59,7 +61,10 @@ struct kvm_mmu_page {
                 refcount_t tdp_mmu_root_count;
         };
         unsigned int unsync_children;
-       struct kvm_rmap_head parent_ptes; /* rmap pointers to parent sptes */
+       union {
+               struct kvm_rmap_head parent_ptes; /* rmap pointers to parent sptes */
+               tdp_ptep_t ptep;
+       };
         DECLARE_BITMAP(unsync_child_bitmap, 512);
  
         struct list_head lpage_disallowed_link;
diff --git a/arch/x86/kvm/mmu/tdp_iter.h b/arch/x86/kvm/mmu/tdp_iter.h

index bb9b581f1ee4e6b44500e40f11bfe9e56553ecef..e2a7e267a77dbada903bfbae7f2e7ead1c9cdb1c 100644 (file)
--- a/arch/x86/kvm/mmu/tdp_iter.h
+++ b/arch/x86/kvm/mmu/tdp_iter.h
@@ -7,8 +7,6 @@
  
  #include "mmu.h"
  
-typedef u64 __rcu *tdp_ptep_t;
-
  /*
   * TDP MMU SPTEs are RCU protected to allow paging structures (non-leaf SPTEs)
   * to be zapped while holding mmu_lock for read.  Holding RCU isn't required for
diff --git a/arch/x86/kvm/mmu/tdp_mmu.c b/arch/x86/kvm/mmu/tdp_mmu.c

index 0ffa62abde2d016c14b0b57a60392954d3e131a5..dc9db5057f3bb4db441ac4b9dbff0f241f5ef2ab 100644 (file)
--- a/arch/x86/kvm/mmu/tdp_mmu.c
+++ b/arch/x86/kvm/mmu/tdp_mmu.c
@@ -199,13 +199,14 @@ static struct kvm_mmu_page *tdp_mmu_alloc_sp(struct kvm_vcpu *vcpu)
         return sp;
  }
  
-static void tdp_mmu_init_sp(struct kvm_mmu_page *sp, gfn_t gfn,
-                             union kvm_mmu_page_role role)
+static void tdp_mmu_init_sp(struct kvm_mmu_page *sp, tdp_ptep_t sptep,
+                           gfn_t gfn, union kvm_mmu_page_role role)
  {
         set_page_private(virt_to_page(sp->spt), (unsigned long)sp);
  
         sp->role = role;
         sp->gfn = gfn;
+       sp->ptep = sptep;
         sp->tdp_mmu_page = true;
  
         trace_kvm_mmu_get_page(sp, true);
@@ -222,7 +223,7 @@ static void tdp_mmu_init_child_sp(struct kvm_mmu_page *child_sp,
         role = parent_sp->role;
         role.level--;
  
-       tdp_mmu_init_sp(child_sp, iter->gfn, role);
+       tdp_mmu_init_sp(child_sp, iter->sptep, iter->gfn, role);
  }
  
  hpa_t kvm_tdp_mmu_get_vcpu_root_hpa(struct kvm_vcpu *vcpu)
@@ -244,7 +245,7 @@ hpa_t kvm_tdp_mmu_get_vcpu_root_hpa(struct kvm_vcpu *vcpu)
         }
  
         root = tdp_mmu_alloc_sp(vcpu);
-       tdp_mmu_init_sp(root, 0, role);
+       tdp_mmu_init_sp(root, NULL, 0, role);
  
         refcount_set(&root->tdp_mmu_root_count, 1);
  
@@ -736,6 +737,33 @@ static inline bool __must_check tdp_mmu_iter_cond_resched(struct kvm *kvm,
         return iter->yielded;
  }
  
+bool kvm_tdp_mmu_zap_sp(struct kvm *kvm, struct kvm_mmu_page *sp)
+{
+       u64 old_spte;
+
+       /*
+        * This helper intentionally doesn't allow zapping a root shadow page,
+        * which doesn't have a parent page table and thus no associated entry.
+        */
+       if (WARN_ON_ONCE(!sp->ptep))
+               return false;
+
+       rcu_read_lock();
+
+       old_spte = kvm_tdp_mmu_read_spte(sp->ptep);
+       if (WARN_ON_ONCE(!is_shadow_present_pte(old_spte))) {
+               rcu_read_unlock();
+               return false;
+       }
+
+       __tdp_mmu_set_spte(kvm, kvm_mmu_page_as_id(sp), sp->ptep, old_spte, 0,
+                          sp->gfn, sp->role.level + 1, true, true);
+
+       rcu_read_unlock();
+
+       return true;
+}
+
  /*
   * Tears down the mappings for the range of gfns, [start, end), and frees the
   * non-root pages mapping GFNs strictly within that range. Returns true if
diff --git a/arch/x86/kvm/mmu/tdp_mmu.h b/arch/x86/kvm/mmu/tdp_mmu.h

index 57c73d8f76ceb14337ddec2ca9a06bbcd51539c5..5e5ef2576c811a91492477b0e6dde3785fccbb8b 100644 (file)
--- a/arch/x86/kvm/mmu/tdp_mmu.h
+++ b/arch/x86/kvm/mmu/tdp_mmu.h
@@ -22,24 +22,8 @@ static inline bool kvm_tdp_mmu_zap_gfn_range(struct kvm *kvm, int as_id,
  {
         return __kvm_tdp_mmu_zap_gfn_range(kvm, as_id, start, end, true, flush);
  }
-static inline bool kvm_tdp_mmu_zap_sp(struct kvm *kvm, struct kvm_mmu_page *sp)
-{
-       gfn_t end = sp->gfn + KVM_PAGES_PER_HPAGE(sp->role.level + 1);
-
-       /*
-        * Don't allow yielding, as the caller may have a flush pending.  Note,
-        * if mmu_lock is held for write, zapping will never yield in this case,
-        * but explicitly disallow it for safety.  The TDP MMU does not yield
-        * until it has made forward progress (steps sideways), and when zapping
-        * a single shadow page that it's guaranteed to see (thus the mmu_lock
-        * requirement), its "step sideways" will always step beyond the bounds
-        * of the shadow page's gfn range and stop iterating before yielding.
-        */
-       lockdep_assert_held_write(&kvm->mmu_lock);
-       return __kvm_tdp_mmu_zap_gfn_range(kvm, kvm_mmu_page_as_id(sp),
-                                          sp->gfn, end, false, false);
-}
  
+bool kvm_tdp_mmu_zap_sp(struct kvm *kvm, struct kvm_mmu_page *sp);
  void kvm_tdp_mmu_zap_all(struct kvm *kvm);
  void kvm_tdp_mmu_invalidate_all_roots(struct kvm *kvm);
  void kvm_tdp_mmu_zap_invalidated_roots(struct kvm *kvm);
author	Sean Christopherson <seanjc@google.com>
	Sat, 26 Feb 2022 00:15:31 +0000 (00:15 +0000)
committer	Paolo Bonzini <pbonzini@redhat.com>
	Tue, 8 Mar 2022 14:31:54 +0000 (09:31 -0500)
arch/x86/kvm/mmu/mmu_internal.h		patch \| blob \| history
arch/x86/kvm/mmu/tdp_iter.h		patch \| blob \| history
arch/x86/kvm/mmu/tdp_mmu.c		patch \| blob \| history
arch/x86/kvm/mmu/tdp_mmu.h		patch \| blob \| history