x86/KVM/VMX: Add L1D flush logic

author Paolo Bonzini <pbonzini@redhat.com>

Mon, 2 Jul 2018 11:07:14 +0000 (13:07 +0200)

committer Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>

Sat, 11 Aug 2018 00:44:39 +0000 (20:44 -0400)
author Paolo Bonzini <pbonzini@redhat.com>
Mon, 2 Jul 2018 11:07:14 +0000 (13:07 +0200)
committer Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Sat, 11 Aug 2018 00:44:39 +0000 (20:44 -0400)
diff --git a/arch/x86/include/asm/kvm_host.h b/arch/x86/include/asm/kvm_host.h

index 10dd34d36ccd3909793f670103ef1887a7fec286..004c70549d48507c6b58812bc4540a7f473f64d7 100644 (file)
--- a/arch/x86/include/asm/kvm_host.h
+++ b/arch/x86/include/asm/kvm_host.h
@@ -542,6 +542,9 @@ struct kvm_vcpu_arch {
         struct {
                 bool pv_unhalted;
         } pv;
+
+       /* Flush the L1 Data cache for L1TF mitigation on VMENTER */
+       bool l1tf_flush_l1d;
  };
  
  struct kvm_lpage_info {
@@ -666,6 +669,7 @@ struct kvm_vcpu_stat {
         u32 signal_exits;
         u32 irq_window_exits;
         u32 nmi_window_exits;
+       u64 l1d_flush;
         u32 halt_exits;
         u32 halt_successful_poll;
         u32 halt_wakeup;
diff --git a/arch/x86/kvm/vmx.c b/arch/x86/kvm/vmx.c

index 4f80c38f37b4d4cb1f5f55eb7be4bd89f9d739f1..6e21980f559e04d8af97a975268341705fff9b36 100644 (file)
--- a/arch/x86/kvm/vmx.c
+++ b/arch/x86/kvm/vmx.c
@@ -5238,6 +5238,7 @@ static int handle_exception(struct kvm_vcpu *vcpu)
  
                 if (kvm_event_needs_reinjection(vcpu))
                         kvm_mmu_unprotect_page_virt(vcpu, cr2);
+               vcpu->arch.l1tf_flush_l1d = true;
                 return kvm_mmu_page_fault(vcpu, cr2, error_code, NULL, 0);
         }
  
@@ -7923,9 +7924,20 @@ static int vmx_handle_exit(struct kvm_vcpu *vcpu)
  #define L1D_CACHE_ORDER 4
  static void *vmx_l1d_flush_pages;
  
-static void __maybe_unused vmx_l1d_flush(void)
+static void vmx_l1d_flush(struct kvm_vcpu *vcpu)
  {
         int size = PAGE_SIZE << L1D_CACHE_ORDER;
+       bool always;
+
+       /*
+        * If the mitigation mode is 'flush always', keep the flush bit
+        * set, otherwise clear it. It gets set again either from
+        * vcpu_run() or from one of the unsafe VMEXIT handlers.
+        */
+       always = vmentry_l1d_flush == VMENTER_L1D_FLUSH_ALWAYS;
+       vcpu->arch.l1tf_flush_l1d = always;
+
+       vcpu->stat.l1d_flush++;
  
         if (static_cpu_has(X86_FEATURE_FLUSH_L1D)) {
                 wrmsrl(MSR_IA32_FLUSH_CMD, L1D_FLUSH);
@@ -8161,6 +8173,7 @@ static void vmx_handle_external_intr(struct kvm_vcpu *vcpu)
                         [ss]"i"(__KERNEL_DS),
                         [cs]"i"(__KERNEL_CS)
                         );
+               vcpu->arch.l1tf_flush_l1d = true;
         } else
                 local_irq_enable();
  }
@@ -8371,6 +8384,11 @@ static void __noclone vmx_vcpu_run(struct kvm_vcpu *vcpu)
  
         x86_spec_ctrl_set_guest(vmx->spec_ctrl, 0);
  
+       if (unlikely(static_key_enabled(&vmx_l1d_should_flush))) {
+               if (vcpu->arch.l1tf_flush_l1d)
+                       vmx_l1d_flush(vcpu);
+       }
+
         asm(
                 /* Store host registers */
                 "push %%" _ASM_DX "; push %%" _ASM_BP ";"
@@ -9821,6 +9839,9 @@ static int nested_vmx_run(struct kvm_vcpu *vcpu, bool launch)
  
         vmcs12->launch_state = 1;
  
+       /* Hide L1D cache contents from the nested guest.  */
+       vmx->vcpu.arch.l1tf_flush_l1d = true;
+
         if (vmcs12->guest_activity_state == GUEST_ACTIVITY_HLT)
                 return kvm_vcpu_halt(vcpu);
  
diff --git a/arch/x86/kvm/x86.c b/arch/x86/kvm/x86.c

index d128875fd642db962396d921981ca99dbe9a382c..b05535b2871c0e998c4eea0b47e3832141d12b27 100644 (file)
--- a/arch/x86/kvm/x86.c
+++ b/arch/x86/kvm/x86.c
@@ -157,6 +157,7 @@ struct kvm_stats_debugfs_item debugfs_entries[] = {
         { "insn_emulation_fail", VCPU_STAT(insn_emulation_fail) },
         { "irq_injections", VCPU_STAT(irq_injections) },
         { "nmi_injections", VCPU_STAT(nmi_injections) },
+       { "l1d_flush", VCPU_STAT(l1d_flush) },
         { "mmu_shadow_zapped", VM_STAT(mmu_shadow_zapped) },
         { "mmu_pte_write", VM_STAT(mmu_pte_write) },
         { "mmu_pte_updated", VM_STAT(mmu_pte_updated) },
@@ -4355,6 +4356,9 @@ int kvm_write_guest_virt_system(struct x86_emulate_ctxt *ctxt,
         void *data = val;
         int r = X86EMUL_CONTINUE;
  
+       /* kvm_write_guest_virt_system can pull in tons of pages. */
+       vcpu->arch.l1tf_flush_l1d = true;
+
         while (bytes) {
                 gpa_t gpa =  vcpu->arch.walk_mmu->gva_to_gpa(vcpu, addr,
                                                              PFERR_WRITE_MASK,
@@ -4378,6 +4382,7 @@ int kvm_write_guest_virt_system(struct x86_emulate_ctxt *ctxt,
  out:
         return r;
  }
+
  EXPORT_SYMBOL_GPL(kvm_write_guest_virt_system);
  
  static int vcpu_mmio_gva_to_gpa(struct kvm_vcpu *vcpu, unsigned long gva,
@@ -5395,6 +5400,8 @@ int x86_emulate_instruction(struct kvm_vcpu *vcpu,
         bool writeback = true;
         bool write_fault_to_spt = vcpu->arch.write_fault_to_shadow_pgtable;
  
+       vcpu->arch.l1tf_flush_l1d = true;
+
         /*
          * Clear write_fault_to_shadow_pgtable here to ensure it is
          * never reused.
@@ -6494,6 +6501,7 @@ static int vcpu_run(struct kvm_vcpu *vcpu)
         struct kvm *kvm = vcpu->kvm;
  
         vcpu->srcu_idx = srcu_read_lock(&kvm->srcu);
+       vcpu->arch.l1tf_flush_l1d = true;
  
         for (;;) {
                 if (vcpu->arch.mp_state == KVM_MP_STATE_RUNNABLE &&
@@ -7427,6 +7435,7 @@ void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu)
  
  void kvm_arch_sched_in(struct kvm_vcpu *vcpu, int cpu)
  {
+       vcpu->arch.l1tf_flush_l1d = true;
         kvm_x86_ops->sched_in(vcpu, cpu);
  }
author	Paolo Bonzini <pbonzini@redhat.com>
	Mon, 2 Jul 2018 11:07:14 +0000 (13:07 +0200)
committer	Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
	Sat, 11 Aug 2018 00:44:39 +0000 (20:44 -0400)
arch/x86/include/asm/kvm_host.h		patch \| blob \| history
arch/x86/kvm/vmx.c		patch \| blob \| history
arch/x86/kvm/x86.c		patch \| blob \| history