KVM: x86/mmu: Don't leak non-leaf SPTEs when zapping all SPTEs

author Sean Christopherson <seanjc@google.com>
Thu, 12 Aug 2021 18:14:13 +0000 (11:14 -0700)
committer Paolo Bonzini <pbonzini@redhat.com>
Fri, 13 Aug 2021 07:31:46 +0000 (03:31 -0400)
diff --git a/arch/x86/kvm/mmu/tdp_mmu.c b/arch/x86/kvm/mmu/tdp_mmu.c
index 0853370..8783b9e 100644
--- a/arch/x86/kvm/mmu/tdp_mmu.c
+++ b/arch/x86/kvm/mmu/tdp_mmu.c
@@ -43,6 +43,7 @@ void kvm_mmu_uninit_tdp_mmu(struct kvm *kvm)
         if (!kvm->arch.tdp_mmu_enabled)
                 return;
  
+       WARN_ON(!list_empty(&kvm->arch.tdp_mmu_pages));
         WARN_ON(!list_empty(&kvm->arch.tdp_mmu_roots));
  
         /*
@@ -81,8 +82,6 @@ static void tdp_mmu_free_sp_rcu_callback(struct rcu_head *head)
  void kvm_tdp_mmu_put_root(struct kvm *kvm, struct kvm_mmu_page *root,
                           bool shared)
  {
-       gfn_t max_gfn = 1ULL << (shadow_phys_bits - PAGE_SHIFT);
-
         kvm_lockdep_assert_mmu_lock_held(kvm, shared);
  
         if (!refcount_dec_and_test(&root->tdp_mmu_root_count))
@@ -94,7 +93,7 @@ void kvm_tdp_mmu_put_root(struct kvm *kvm, struct kvm_mmu_page *root,
         list_del_rcu(&root->link);
         spin_unlock(&kvm->arch.tdp_mmu_pages_lock);
  
-       zap_gfn_range(kvm, root, 0, max_gfn, false, false, shared);
+       zap_gfn_range(kvm, root, 0, -1ull, false, false, shared);
  
         call_rcu(&root->rcu_head, tdp_mmu_free_sp_rcu_callback);
  }
@@ -724,8 +723,17 @@ static bool zap_gfn_range(struct kvm *kvm, struct kvm_mmu_page *root,
                           gfn_t start, gfn_t end, bool can_yield, bool flush,
                           bool shared)
  {
+       gfn_t max_gfn_host = 1ULL << (shadow_phys_bits - PAGE_SHIFT);
+       bool zap_all = (start == 0 && end >= max_gfn_host);
         struct tdp_iter iter;
  
+       /*
+        * Bound the walk at host.MAXPHYADDR, guest accesses beyond that will
+        * hit a #PF(RSVD) and never get to an EPT Violation/Misconfig / #NPF,
+        * and so KVM will never install a SPTE for such addresses.
+        */
+       end = min(end, max_gfn_host);
+
         kvm_lockdep_assert_mmu_lock_held(kvm, shared);
  
         rcu_read_lock();
@@ -744,9 +752,10 @@ retry:
                 /*
                  * If this is a non-last-level SPTE that covers a larger range
                  * than should be zapped, continue, and zap the mappings at a
-                * lower level.
+                * lower level, except when zapping all SPTEs.
                  */
-               if ((iter.gfn < start ||
+               if (!zap_all &&
+                   (iter.gfn < start ||
                      iter.gfn + KVM_PAGES_PER_HPAGE(iter.level) > end) &&
                     !is_last_spte(iter.old_spte, iter.level))
                         continue;
@@ -794,12 +803,11 @@ bool __kvm_tdp_mmu_zap_gfn_range(struct kvm *kvm, int as_id, gfn_t start,
  
  void kvm_tdp_mmu_zap_all(struct kvm *kvm)
  {
-       gfn_t max_gfn = 1ULL << (shadow_phys_bits - PAGE_SHIFT);
         bool flush = false;
         int i;
  
         for (i = 0; i < KVM_ADDRESS_SPACE_NUM; i++)
-               flush = kvm_tdp_mmu_zap_gfn_range(kvm, i, 0, max_gfn,
+               flush = kvm_tdp_mmu_zap_gfn_range(kvm, i, 0, -1ull,
                                                   flush, false);
  
         if (flush)
@@ -838,7 +846,6 @@ static struct kvm_mmu_page *next_invalidated_root(struct kvm *kvm,
   */
  void kvm_tdp_mmu_zap_invalidated_roots(struct kvm *kvm)
  {
-       gfn_t max_gfn = 1ULL << (shadow_phys_bits - PAGE_SHIFT);
         struct kvm_mmu_page *next_root;
         struct kvm_mmu_page *root;
         bool flush = false;
@@ -854,8 +861,7 @@ void kvm_tdp_mmu_zap_invalidated_roots(struct kvm *kvm)
  
                 rcu_read_unlock();
  
-               flush = zap_gfn_range(kvm, root, 0, max_gfn, true, flush,
-                                     true);
+               flush = zap_gfn_range(kvm, root, 0, -1ull, true, flush, true);
  
                 /*
                  * Put the reference acquired in
author	Sean Christopherson <seanjc@google.com>
	Thu, 12 Aug 2021 18:14:13 +0000 (11:14 -0700)
committer	Paolo Bonzini <pbonzini@redhat.com>
	Fri, 13 Aug 2021 07:31:46 +0000 (03:31 -0400)