x86: perf: prevent spurious PMU NMIs on Haswell systems

author Dan Duval <dan.duval@oracle.com>

Fri, 24 Oct 2014 19:14:14 +0000 (15:14 -0400)

committer Santosh Shilimkar <santosh.shilimkar@oracle.com>

Mon, 29 Jun 2015 15:36:56 +0000 (08:36 -0700)
author Dan Duval <dan.duval@oracle.com>
Fri, 24 Oct 2014 19:14:14 +0000 (15:14 -0400)
committer Santosh Shilimkar <santosh.shilimkar@oracle.com>
Mon, 29 Jun 2015 15:36:56 +0000 (08:36 -0700)
diff --git a/arch/x86/kernel/cpu/perf_event_intel.c b/arch/x86/kernel/cpu/perf_event_intel.c

index a1e35c9f06b9522af32b79cd4837f3a93a083f6b..2e06274924612cf12b79b87fe957565243f191fa 100644 (file)
--- a/arch/x86/kernel/cpu/perf_event_intel.c
+++ b/arch/x86/kernel/cpu/perf_event_intel.c
@@ -1576,6 +1576,7 @@ static int intel_pmu_handle_irq(struct pt_regs *regs)
         int bit, loops;
         u64 status;
         int handled;
+       u32 lvtpc;
  
         cpuc = this_cpu_ptr(&cpu_hw_events);
  
@@ -1586,6 +1587,7 @@ static int intel_pmu_handle_irq(struct pt_regs *regs)
         if (!x86_pmu.late_ack)
                 apic_write(APIC_LVTPC, APIC_DM_NMI);
         __intel_pmu_disable_all();
+
         handled = intel_pmu_drain_bts_buffer();
         handled += intel_bts_interrupt();
         status = intel_pmu_get_status();
@@ -1670,6 +1672,25 @@ again:
                 goto again;
  
  done:
+       lvtpc = apic_read(APIC_LVTPC);
+
+       /*
+        * Haswell processors sometimes generate PMIs that no other code in
+        * this handler accounts for.  The local APIC sets the LVTPC mask bit
+        * when it delivers a PMI, so a still-masked LVTPC means this NMI
+        * came from the PMU: "claim" it here rather than letting it show up
+        * as an unknown NMI and possibly causing a crash.
+        */
+       if(handled == 0 && (lvtpc & APIC_LVT_MASKED))
+               handled = 1;
+
+       /*
+        * Only unmask the NMI after the overflow counters
+        * have been reset. This avoids spurious NMIs on
+        * Haswell CPUs.
+        */
+       apic_write(APIC_LVTPC, APIC_DM_NMI);
+
         __intel_pmu_enable_all(0, true);
         /*
          * Only unmask the NMI after the overflow counters
author	Dan Duval <dan.duval@oracle.com>
	Fri, 24 Oct 2014 19:14:14 +0000 (15:14 -0400)
committer	Santosh Shilimkar <santosh.shilimkar@oracle.com>
	Mon, 29 Jun 2015 15:36:56 +0000 (08:36 -0700)