KVM: SEV: Support SEV-SNP AP Creation NAE event

author Tom Lendacky <thomas.lendacky@amd.com>

Wed, 1 May 2024 08:52:02 +0000 (03:52 -0500)

committer Paolo Bonzini <pbonzini@redhat.com>

Sun, 12 May 2024 08:09:32 +0000 (04:09 -0400)
author Tom Lendacky <thomas.lendacky@amd.com>
Wed, 1 May 2024 08:52:02 +0000 (03:52 -0500)
committer Paolo Bonzini <pbonzini@redhat.com>
Sun, 12 May 2024 08:09:32 +0000 (04:09 -0400)
diff --git a/arch/x86/include/asm/kvm_host.h b/arch/x86/include/asm/kvm_host.h

index 80dfcdab87eb882f18debc522a92bdf22cea415b..aabf1648a56a9a6f2df7358e0d6a74f8da4ece45 100644 (file)
--- a/arch/x86/include/asm/kvm_host.h
+++ b/arch/x86/include/asm/kvm_host.h
@@ -121,6 +121,7 @@
         KVM_ARCH_REQ_FLAGS(31, KVM_REQUEST_WAIT | KVM_REQUEST_NO_WAKEUP)
  #define KVM_REQ_HV_TLB_FLUSH \
         KVM_ARCH_REQ_FLAGS(32, KVM_REQUEST_WAIT | KVM_REQUEST_NO_WAKEUP)
+#define KVM_REQ_UPDATE_PROTECTED_GUEST_STATE   KVM_ARCH_REQ(34)
  
  #define CR0_RESERVED_BITS                                               \
         (~(unsigned long)(X86_CR0_PE | X86_CR0_MP | X86_CR0_EM | X86_CR0_TS \
diff --git a/arch/x86/include/asm/svm.h b/arch/x86/include/asm/svm.h

index 544a43c1cf1123e163a550d0371be6a20035300e..f0dea3750ca9f0e59c69f51541ba058686314339 100644 (file)
--- a/arch/x86/include/asm/svm.h
+++ b/arch/x86/include/asm/svm.h
@@ -286,8 +286,14 @@ static_assert((X2AVIC_MAX_PHYSICAL_ID & AVIC_PHYSICAL_MAX_INDEX_MASK) == X2AVIC_
  #define AVIC_HPA_MASK  ~((0xFFFULL << 52) | 0xFFF)
  
  #define SVM_SEV_FEAT_SNP_ACTIVE                                BIT(0)
+#define SVM_SEV_FEAT_RESTRICTED_INJECTION              BIT(3)
+#define SVM_SEV_FEAT_ALTERNATE_INJECTION               BIT(4)
  #define SVM_SEV_FEAT_DEBUG_SWAP                                BIT(5)
  
+#define SVM_SEV_FEAT_INT_INJ_MODES             \
+       (SVM_SEV_FEAT_RESTRICTED_INJECTION |    \
+        SVM_SEV_FEAT_ALTERNATE_INJECTION)
+
  struct vmcb_seg {
         u16 selector;
         u16 attrib;
diff --git a/arch/x86/kvm/svm/sev.c b/arch/x86/kvm/svm/sev.c

index f01cee8278ab2bd764a61eeda622a0a66e219c0c..0c1108ffc4ae72a3dbf1ddd03e707483907a92f1 100644 (file)
--- a/arch/x86/kvm/svm/sev.c
+++ b/arch/x86/kvm/svm/sev.c
@@ -38,7 +38,7 @@
  #define GHCB_VERSION_DEFAULT   2ULL
  #define GHCB_VERSION_MIN       1ULL
  
-#define GHCB_HV_FT_SUPPORTED   GHCB_HV_FT_SNP
+#define GHCB_HV_FT_SUPPORTED   (GHCB_HV_FT_SNP | GHCB_HV_FT_SNP_AP_CREATION)
  
  /* enable/disable SEV support */
  static bool sev_enabled = true;
@@ -3267,6 +3267,13 @@ static int sev_es_validate_vmgexit(struct vcpu_svm *svm)
                 if (!kvm_ghcb_sw_scratch_is_valid(svm))
                         goto vmgexit_err;
                 break;
+       case SVM_VMGEXIT_AP_CREATION:
+               if (!sev_snp_guest(vcpu->kvm))
+                       goto vmgexit_err;
+               if (lower_32_bits(control->exit_info_1) != SVM_VMGEXIT_AP_DESTROY)
+                       if (!kvm_ghcb_rax_is_valid(svm))
+                               goto vmgexit_err;
+               break;
         case SVM_VMGEXIT_NMI_COMPLETE:
         case SVM_VMGEXIT_AP_HLT_LOOP:
         case SVM_VMGEXIT_AP_JUMP_TABLE:
@@ -3701,6 +3708,205 @@ next_range:
         unreachable();
  }
  
+static int __sev_snp_update_protected_guest_state(struct kvm_vcpu *vcpu)
+{
+       struct vcpu_svm *svm = to_svm(vcpu);
+
+       WARN_ON(!mutex_is_locked(&svm->sev_es.snp_vmsa_mutex));
+
+       /* Mark the vCPU as offline and not runnable */
+       vcpu->arch.pv.pv_unhalted = false;
+       vcpu->arch.mp_state = KVM_MP_STATE_HALTED;
+
+       /* Clear use of the VMSA */
+       svm->vmcb->control.vmsa_pa = INVALID_PAGE;
+
+       if (VALID_PAGE(svm->sev_es.snp_vmsa_gpa)) {
+               gfn_t gfn = gpa_to_gfn(svm->sev_es.snp_vmsa_gpa);
+               struct kvm_memory_slot *slot;
+               kvm_pfn_t pfn;
+
+               slot = gfn_to_memslot(vcpu->kvm, gfn);
+               if (!slot)
+                       return -EINVAL;
+
+               /*
+                * The new VMSA will be private memory guest memory, so
+                * retrieve the PFN from the gmem backend.
+                */
+               if (kvm_gmem_get_pfn(vcpu->kvm, slot, gfn, &pfn, NULL))
+                       return -EINVAL;
+
+               /*
+                * From this point forward, the VMSA will always be a
+                * guest-mapped page rather than the initial one allocated
+                * by KVM in svm->sev_es.vmsa. In theory, svm->sev_es.vmsa
+                * could be free'd and cleaned up here, but that involves
+                * cleanups like wbinvd_on_all_cpus() which would ideally
+                * be handled during teardown rather than guest boot.
+                * Deferring that also allows the existing logic for SEV-ES
+                * VMSAs to be re-used with minimal SNP-specific changes.
+                */
+               svm->sev_es.snp_has_guest_vmsa = true;
+
+               /* Use the new VMSA */
+               svm->vmcb->control.vmsa_pa = pfn_to_hpa(pfn);
+
+               /* Mark the vCPU as runnable */
+               vcpu->arch.pv.pv_unhalted = false;
+               vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE;
+
+               svm->sev_es.snp_vmsa_gpa = INVALID_PAGE;
+
+               /*
+                * gmem pages aren't currently migratable, but if this ever
+                * changes then care should be taken to ensure
+                * svm->sev_es.vmsa is pinned through some other means.
+                */
+               kvm_release_pfn_clean(pfn);
+       }
+
+       /*
+        * When replacing the VMSA during SEV-SNP AP creation,
+        * mark the VMCB dirty so that full state is always reloaded.
+        */
+       vmcb_mark_all_dirty(svm->vmcb);
+
+       return 0;
+}
+
+/*
+ * Invoked as part of svm_vcpu_reset() processing of an init event.
+ */
+void sev_snp_init_protected_guest_state(struct kvm_vcpu *vcpu)
+{
+       struct vcpu_svm *svm = to_svm(vcpu);
+       int ret;
+
+       if (!sev_snp_guest(vcpu->kvm))
+               return;
+
+       mutex_lock(&svm->sev_es.snp_vmsa_mutex);
+
+       if (!svm->sev_es.snp_ap_waiting_for_reset)
+               goto unlock;
+
+       svm->sev_es.snp_ap_waiting_for_reset = false;
+
+       ret = __sev_snp_update_protected_guest_state(vcpu);
+       if (ret)
+               vcpu_unimpl(vcpu, "snp: AP state update on init failed\n");
+
+unlock:
+       mutex_unlock(&svm->sev_es.snp_vmsa_mutex);
+}
+
+static int sev_snp_ap_creation(struct vcpu_svm *svm)
+{
+       struct kvm_sev_info *sev = &to_kvm_svm(svm->vcpu.kvm)->sev_info;
+       struct kvm_vcpu *vcpu = &svm->vcpu;
+       struct kvm_vcpu *target_vcpu;
+       struct vcpu_svm *target_svm;
+       unsigned int request;
+       unsigned int apic_id;
+       bool kick;
+       int ret;
+
+       request = lower_32_bits(svm->vmcb->control.exit_info_1);
+       apic_id = upper_32_bits(svm->vmcb->control.exit_info_1);
+
+       /* Validate the APIC ID */
+       target_vcpu = kvm_get_vcpu_by_id(vcpu->kvm, apic_id);
+       if (!target_vcpu) {
+               vcpu_unimpl(vcpu, "vmgexit: invalid AP APIC ID [%#x] from guest\n",
+                           apic_id);
+               return -EINVAL;
+       }
+
+       ret = 0;
+
+       target_svm = to_svm(target_vcpu);
+
+       /*
+        * The target vCPU is valid, so the vCPU will be kicked unless the
+        * request is for CREATE_ON_INIT. For any errors at this stage, the
+        * kick will place the vCPU in an non-runnable state.
+        */
+       kick = true;
+
+       mutex_lock(&target_svm->sev_es.snp_vmsa_mutex);
+
+       target_svm->sev_es.snp_vmsa_gpa = INVALID_PAGE;
+       target_svm->sev_es.snp_ap_waiting_for_reset = true;
+
+       /* Interrupt injection mode shouldn't change for AP creation */
+       if (request < SVM_VMGEXIT_AP_DESTROY) {
+               u64 sev_features;
+
+               sev_features = vcpu->arch.regs[VCPU_REGS_RAX];
+               sev_features ^= sev->vmsa_features;
+
+               if (sev_features & SVM_SEV_FEAT_INT_INJ_MODES) {
+                       vcpu_unimpl(vcpu, "vmgexit: invalid AP injection mode [%#lx] from guest\n",
+                                   vcpu->arch.regs[VCPU_REGS_RAX]);
+                       ret = -EINVAL;
+                       goto out;
+               }
+       }
+
+       switch (request) {
+       case SVM_VMGEXIT_AP_CREATE_ON_INIT:
+               kick = false;
+               fallthrough;
+       case SVM_VMGEXIT_AP_CREATE:
+               if (!page_address_valid(vcpu, svm->vmcb->control.exit_info_2)) {
+                       vcpu_unimpl(vcpu, "vmgexit: invalid AP VMSA address [%#llx] from guest\n",
+                                   svm->vmcb->control.exit_info_2);
+                       ret = -EINVAL;
+                       goto out;
+               }
+
+               /*
+                * Malicious guest can RMPADJUST a large page into VMSA which
+                * will hit the SNP erratum where the CPU will incorrectly signal
+                * an RMP violation #PF if a hugepage collides with the RMP entry
+                * of VMSA page, reject the AP CREATE request if VMSA address from
+                * guest is 2M aligned.
+                */
+               if (IS_ALIGNED(svm->vmcb->control.exit_info_2, PMD_SIZE)) {
+                       vcpu_unimpl(vcpu,
+                                   "vmgexit: AP VMSA address [%llx] from guest is unsafe as it is 2M aligned\n",
+                                   svm->vmcb->control.exit_info_2);
+                       ret = -EINVAL;
+                       goto out;
+               }
+
+               target_svm->sev_es.snp_vmsa_gpa = svm->vmcb->control.exit_info_2;
+               break;
+       case SVM_VMGEXIT_AP_DESTROY:
+               break;
+       default:
+               vcpu_unimpl(vcpu, "vmgexit: invalid AP creation request [%#x] from guest\n",
+                           request);
+               ret = -EINVAL;
+               break;
+       }
+
+out:
+       if (kick) {
+               kvm_make_request(KVM_REQ_UPDATE_PROTECTED_GUEST_STATE, target_vcpu);
+
+               if (target_vcpu->arch.mp_state == KVM_MP_STATE_UNINITIALIZED)
+                       kvm_make_request(KVM_REQ_UNBLOCK, target_vcpu);
+
+               kvm_vcpu_kick(target_vcpu);
+       }
+
+       mutex_unlock(&target_svm->sev_es.snp_vmsa_mutex);
+
+       return ret;
+}
+
  static int sev_handle_vmgexit_msr_protocol(struct vcpu_svm *svm)
  {
         struct vmcb_control_area *control = &svm->vmcb->control;
@@ -3966,6 +4172,15 @@ int sev_handle_vmgexit(struct kvm_vcpu *vcpu)
  
                 ret = snp_begin_psc(svm, svm->sev_es.ghcb_sa);
                 break;
+       case SVM_VMGEXIT_AP_CREATION:
+               ret = sev_snp_ap_creation(svm);
+               if (ret) {
+                       ghcb_set_sw_exit_info_1(svm->sev_es.ghcb, 2);
+                       ghcb_set_sw_exit_info_2(svm->sev_es.ghcb, GHCB_ERR_INVALID_INPUT);
+               }
+
+               ret = 1;
+               break;
         case SVM_VMGEXIT_UNSUPPORTED_EVENT:
                 vcpu_unimpl(vcpu,
                             "vmgexit: unsupported event - exit_info_1=%#llx, exit_info_2=%#llx\n",
@@ -4060,7 +4275,7 @@ static void sev_es_init_vmcb(struct vcpu_svm *svm)
          * the VMSA will be NULL if this vCPU is the destination for intrahost
          * migration, and will be copied later.
          */
-       if (svm->sev_es.vmsa)
+       if (svm->sev_es.vmsa && !svm->sev_es.snp_has_guest_vmsa)
                 svm->vmcb->control.vmsa_pa = __pa(svm->sev_es.vmsa);
  
         /* Can't intercept CR register access, HV can't modify CR registers */
@@ -4136,6 +4351,8 @@ void sev_es_vcpu_reset(struct vcpu_svm *svm)
         set_ghcb_msr(svm, GHCB_MSR_SEV_INFO((__u64)sev->ghcb_version,
                                             GHCB_VERSION_MIN,
                                             sev_enc_bit));
+
+       mutex_init(&svm->sev_es.snp_vmsa_mutex);
  }
  
  void sev_es_prepare_switch_to_guest(struct vcpu_svm *svm, struct sev_es_save_area *hostsa)
@@ -4247,6 +4464,16 @@ struct page *snp_safe_alloc_page(struct kvm_vcpu *vcpu)
         return p;
  }
  
+void sev_vcpu_unblocking(struct kvm_vcpu *vcpu)
+{
+       if (!sev_snp_guest(vcpu->kvm))
+               return;
+
+       if (kvm_test_request(KVM_REQ_UPDATE_PROTECTED_GUEST_STATE, vcpu) &&
+           vcpu->arch.mp_state == KVM_MP_STATE_UNINITIALIZED)
+               vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE;
+}
+
  void sev_handle_rmp_fault(struct kvm_vcpu *vcpu, gpa_t gpa, u64 error_code)
  {
         struct kvm_memory_slot *slot;
diff --git a/arch/x86/kvm/svm/svm.c b/arch/x86/kvm/svm/svm.c

index bdaf3957181767c1f99433861b1e3037a7336e50..546656606b44410c7e5305fc9025ae69274a773e 100644 (file)
--- a/arch/x86/kvm/svm/svm.c
+++ b/arch/x86/kvm/svm/svm.c
@@ -1398,6 +1398,9 @@ static void svm_vcpu_reset(struct kvm_vcpu *vcpu, bool init_event)
         svm->spec_ctrl = 0;
         svm->virt_spec_ctrl = 0;
  
+       if (init_event)
+               sev_snp_init_protected_guest_state(vcpu);
+
         init_vmcb(vcpu);
  
         if (!init_event)
@@ -4940,6 +4943,12 @@ static void *svm_alloc_apic_backing_page(struct kvm_vcpu *vcpu)
         return page_address(page);
  }
  
+static void svm_vcpu_unblocking(struct kvm_vcpu *vcpu)
+{
+       sev_vcpu_unblocking(vcpu);
+       avic_vcpu_unblocking(vcpu);
+}
+
  static struct kvm_x86_ops svm_x86_ops __initdata = {
         .name = KBUILD_MODNAME,
  
@@ -4962,7 +4971,7 @@ static struct kvm_x86_ops svm_x86_ops __initdata = {
         .vcpu_load = svm_vcpu_load,
         .vcpu_put = svm_vcpu_put,
         .vcpu_blocking = avic_vcpu_blocking,
-       .vcpu_unblocking = avic_vcpu_unblocking,
+       .vcpu_unblocking = svm_vcpu_unblocking,
  
         .update_exception_bitmap = svm_update_exception_bitmap,
         .get_msr_feature = svm_get_msr_feature,
diff --git a/arch/x86/kvm/svm/svm.h b/arch/x86/kvm/svm/svm.h

index 36b573427b8506da81473dd916b8631a499f0b7a..926bfce571a6e10822e95bf695b7ba600ad31204 100644 (file)
--- a/arch/x86/kvm/svm/svm.h
+++ b/arch/x86/kvm/svm/svm.h
@@ -216,6 +216,11 @@ struct vcpu_sev_es_state {
         bool psc_2m;
  
         u64 ghcb_registered_gpa;
+
+       struct mutex snp_vmsa_mutex; /* Used to handle concurrent updates of VMSA. */
+       gpa_t snp_vmsa_gpa;
+       bool snp_ap_waiting_for_reset;
+       bool snp_has_guest_vmsa;
  };
  
  struct vcpu_svm {
@@ -729,6 +734,8 @@ int sev_cpu_init(struct svm_cpu_data *sd);
  int sev_dev_get_attr(u32 group, u64 attr, u64 *val);
  extern unsigned int max_sev_asid;
  void sev_handle_rmp_fault(struct kvm_vcpu *vcpu, gpa_t gpa, u64 error_code);
+void sev_vcpu_unblocking(struct kvm_vcpu *vcpu);
+void sev_snp_init_protected_guest_state(struct kvm_vcpu *vcpu);
  #else
  static inline struct page *snp_safe_alloc_page(struct kvm_vcpu *vcpu) {
         return alloc_page(GFP_KERNEL_ACCOUNT | __GFP_ZERO);
@@ -743,6 +750,8 @@ static inline int sev_cpu_init(struct svm_cpu_data *sd) { return 0; }
  static inline int sev_dev_get_attr(u32 group, u64 attr, u64 *val) { return -ENXIO; }
  #define max_sev_asid 0
  static inline void sev_handle_rmp_fault(struct kvm_vcpu *vcpu, gpa_t gpa, u64 error_code) {}
+static inline void sev_vcpu_unblocking(struct kvm_vcpu *vcpu) {}
+static inline void sev_snp_init_protected_guest_state(struct kvm_vcpu *vcpu) {}
  
  #endif
  
diff --git a/arch/x86/kvm/x86.c b/arch/x86/kvm/x86.c

index a143c26a92214769f56ffa9227815f3bd0df6a17..d29477910ffa17d3169979a4a53bf3f43ba111a1 100644 (file)
--- a/arch/x86/kvm/x86.c
+++ b/arch/x86/kvm/x86.c
@@ -10939,6 +10939,14 @@ static int vcpu_enter_guest(struct kvm_vcpu *vcpu)
  
                 if (kvm_check_request(KVM_REQ_UPDATE_CPU_DIRTY_LOGGING, vcpu))
                         static_call(kvm_x86_update_cpu_dirty_logging)(vcpu);
+
+               if (kvm_check_request(KVM_REQ_UPDATE_PROTECTED_GUEST_STATE, vcpu)) {
+                       kvm_vcpu_reset(vcpu, true);
+                       if (vcpu->arch.mp_state != KVM_MP_STATE_RUNNABLE) {
+                               r = 1;
+                               goto out;
+                       }
+               }
         }
  
         if (kvm_check_request(KVM_REQ_EVENT, vcpu) || req_int_win ||
@@ -13146,6 +13154,9 @@ static inline bool kvm_vcpu_has_events(struct kvm_vcpu *vcpu)
         if (kvm_test_request(KVM_REQ_PMI, vcpu))
                 return true;
  
+       if (kvm_test_request(KVM_REQ_UPDATE_PROTECTED_GUEST_STATE, vcpu))
+               return true;
+
         if (kvm_arch_interrupt_allowed(vcpu) &&
             (kvm_cpu_has_interrupt(vcpu) ||
             kvm_guest_apic_has_interrupt(vcpu)))
author	Tom Lendacky <thomas.lendacky@amd.com>
	Wed, 1 May 2024 08:52:02 +0000 (03:52 -0500)
committer	Paolo Bonzini <pbonzini@redhat.com>
	Sun, 12 May 2024 08:09:32 +0000 (04:09 -0400)
arch/x86/include/asm/kvm_host.h		patch \| blob \| history
arch/x86/include/asm/svm.h		patch \| blob \| history
arch/x86/kvm/svm/sev.c		patch \| blob \| history
arch/x86/kvm/svm/svm.c		patch \| blob \| history
arch/x86/kvm/svm/svm.h		patch \| blob \| history
arch/x86/kvm/x86.c		patch \| blob \| history