KVM: x86/mmu: Tag disallowed NX huge pages even if they're not tracked
authorSean Christopherson <seanjc@google.com>
Wed, 19 Oct 2022 16:56:11 +0000 (16:56 +0000)
committerPaolo Bonzini <pbonzini@redhat.com>
Wed, 9 Nov 2022 17:31:31 +0000 (12:31 -0500)
Tag shadow pages that cannot be replaced with an NX huge page regardless
of whether or not zapping the page would allow KVM to immediately create
a huge page, e.g. because something else prevents creating a huge page.

I.e. track pages that are disallowed from being NX huge pages regardless
of whether or not the page could have been huge at the time of fault.
KVM currently tracks pages that were disallowed from being huge due to
the NX workaround if and only if the page could otherwise be huge.  But
that fails to handle the scenario where whatever restriction prevented
KVM from installing a huge page goes away, e.g. if dirty logging is
disabled, the host mapping level changes, etc...

Failure to tag shadow pages appropriately could theoretically lead to
false negatives, e.g. if a fetch fault requests a small page and thus
isn't tracked, and a read/write fault later requests a huge page, KVM
will not reject the huge page as it should.

To avoid yet another flag, initialize the list_head and use list_empty()
to determine whether or not a page is on the list of NX huge pages that
should be recovered.

Note, the TDP MMU accounting is still flawed as fixing the TDP MMU is
more involved due to mmu_lock being held for read.  This will be
addressed in a future commit.

Fixes: 5bcaf3e1715f ("KVM: x86/mmu: Account NX huge page disallowed iff huge page was requested")
Signed-off-by: Sean Christopherson <seanjc@google.com>
Message-Id: <20221019165618.927057-2-seanjc@google.com>
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
arch/x86/kvm/mmu/mmu.c
arch/x86/kvm/mmu/mmu_internal.h
arch/x86/kvm/mmu/paging_tmpl.h
arch/x86/kvm/mmu/tdp_mmu.c

index 5d662b43a63efa50901578e6dfb97eaaed744c60..989586e7dd86e01cdc510ae51ae30e346c75ceb1 100644 (file)
@@ -803,15 +803,25 @@ static void account_shadowed(struct kvm *kvm, struct kvm_mmu_page *sp)
                kvm_flush_remote_tlbs_with_address(kvm, gfn, 1);
 }
 
-void account_huge_nx_page(struct kvm *kvm, struct kvm_mmu_page *sp)
+void account_huge_nx_page(struct kvm *kvm, struct kvm_mmu_page *sp,
+                         bool nx_huge_page_possible)
 {
-       if (sp->lpage_disallowed)
+       sp->lpage_disallowed = true;
+
+       /*
+        * If it's possible to replace the shadow page with an NX huge page,
+        * i.e. if the shadow page is the only thing currently preventing KVM
+        * from using a huge page, add the shadow page to the list of "to be
+        * zapped for NX recovery" pages.  Note, the shadow page can already be
+        * on the list if KVM is reusing an existing shadow page, i.e. if KVM
+        * links a shadow page at multiple points.
+        */
+       if (!nx_huge_page_possible || !list_empty(&sp->lpage_disallowed_link))
                return;
 
        ++kvm->stat.nx_lpage_splits;
        list_add_tail(&sp->lpage_disallowed_link,
                      &kvm->arch.lpage_disallowed_mmu_pages);
-       sp->lpage_disallowed = true;
 }
 
 static void unaccount_shadowed(struct kvm *kvm, struct kvm_mmu_page *sp)
@@ -833,9 +843,13 @@ static void unaccount_shadowed(struct kvm *kvm, struct kvm_mmu_page *sp)
 
 void unaccount_huge_nx_page(struct kvm *kvm, struct kvm_mmu_page *sp)
 {
-       --kvm->stat.nx_lpage_splits;
        sp->lpage_disallowed = false;
-       list_del(&sp->lpage_disallowed_link);
+
+       if (list_empty(&sp->lpage_disallowed_link))
+               return;
+
+       --kvm->stat.nx_lpage_splits;
+       list_del_init(&sp->lpage_disallowed_link);
 }
 
 static struct kvm_memory_slot *
@@ -2130,6 +2144,8 @@ static struct kvm_mmu_page *kvm_mmu_alloc_shadow_page(struct kvm *kvm,
 
        set_page_private(virt_to_page(sp->spt), (unsigned long)sp);
 
+       INIT_LIST_HEAD(&sp->lpage_disallowed_link);
+
        /*
         * active_mmu_pages must be a FIFO list, as kvm_zap_obsolete_pages()
         * depends on valid pages being added to the head of the list.  See
@@ -3127,9 +3143,9 @@ static int __direct_map(struct kvm_vcpu *vcpu, struct kvm_page_fault *fault)
                        continue;
 
                link_shadow_page(vcpu, it.sptep, sp);
-               if (fault->is_tdp && fault->huge_page_disallowed &&
-                   fault->req_level >= it.level)
-                       account_huge_nx_page(vcpu->kvm, sp);
+               if (fault->is_tdp && fault->huge_page_disallowed)
+                       account_huge_nx_page(vcpu->kvm, sp,
+                                            fault->req_level >= it.level);
        }
 
        if (WARN_ON_ONCE(it.level != fault->goal_level))
index 582def531d4d9e12d2c281973d63f034a7f0f222..cca1ad75d09611050b62bc18bd1239b7bf38d646 100644 (file)
@@ -100,6 +100,13 @@ struct kvm_mmu_page {
                };
        };
 
+       /*
+        * Tracks shadow pages that, if zapped, would allow KVM to create an NX
+        * huge page.  A shadow page will have lpage_disallowed set but not be
+        * on the list if a huge page is disallowed for other reasons, e.g.
+        * because KVM is shadowing a PTE at the same gfn, the memslot isn't
+        * properly aligned, etc...
+        */
        struct list_head lpage_disallowed_link;
 #ifdef CONFIG_X86_32
        /*
@@ -315,7 +322,8 @@ void disallowed_hugepage_adjust(struct kvm_page_fault *fault, u64 spte, int cur_
 
 void *mmu_memory_cache_alloc(struct kvm_mmu_memory_cache *mc);
 
-void account_huge_nx_page(struct kvm *kvm, struct kvm_mmu_page *sp);
+void account_huge_nx_page(struct kvm *kvm, struct kvm_mmu_page *sp,
+                         bool nx_huge_page_possible);
 void unaccount_huge_nx_page(struct kvm *kvm, struct kvm_mmu_page *sp);
 
 #endif /* __KVM_X86_MMU_INTERNAL_H */
index 5ab5f94dcb6fdb3c95140dbc31bee11595665832..8fd0c4e1e5750197b343f76025bd0f310caa718b 100644 (file)
@@ -713,9 +713,9 @@ static int FNAME(fetch)(struct kvm_vcpu *vcpu, struct kvm_page_fault *fault,
                        continue;
 
                link_shadow_page(vcpu, it.sptep, sp);
-               if (fault->huge_page_disallowed &&
-                   fault->req_level >= it.level)
-                       account_huge_nx_page(vcpu->kvm, sp);
+               if (fault->huge_page_disallowed)
+                       account_huge_nx_page(vcpu->kvm, sp,
+                                            fault->req_level >= it.level);
        }
 
        if (WARN_ON_ONCE(it.level != fault->goal_level))
index 672f0432d7777fca9414da2bb6fc6cc13d28220b..80a4a1a09131081f7b0ed4ddd254693ec1adffd1 100644 (file)
@@ -284,6 +284,8 @@ static struct kvm_mmu_page *tdp_mmu_alloc_sp(struct kvm_vcpu *vcpu)
 static void tdp_mmu_init_sp(struct kvm_mmu_page *sp, tdp_ptep_t sptep,
                            gfn_t gfn, union kvm_mmu_page_role role)
 {
+       INIT_LIST_HEAD(&sp->lpage_disallowed_link);
+
        set_page_private(virt_to_page(sp->spt), (unsigned long)sp);
 
        sp->role = role;
@@ -1141,7 +1143,7 @@ static int tdp_mmu_link_sp(struct kvm *kvm, struct tdp_iter *iter,
        spin_lock(&kvm->arch.tdp_mmu_pages_lock);
        list_add(&sp->link, &kvm->arch.tdp_mmu_pages);
        if (account_nx)
-               account_huge_nx_page(kvm, sp);
+               account_huge_nx_page(kvm, sp, true);
        spin_unlock(&kvm->arch.tdp_mmu_pages_lock);
        tdp_account_mmu_page(kvm, sp);