x86/microcode: Synchronize late microcode loading

author Borislav Petkov <bp@suse.de>

Wed, 8 May 2019 15:10:41 +0000 (11:10 -0400)

committer Boris Ostrovsky <boris.ostrovsky@oracle.com>

Wed, 8 May 2019 21:33:34 +0000 (17:33 -0400)
author Borislav Petkov <bp@suse.de>
Wed, 8 May 2019 15:10:41 +0000 (11:10 -0400)
committer Boris Ostrovsky <boris.ostrovsky@oracle.com>
Wed, 8 May 2019 21:33:34 +0000 (17:33 -0400)
diff --git a/arch/x86/kernel/cpu/microcode/core.c b/arch/x86/kernel/cpu/microcode/core.c

index 7ffbd73d3e4d1896133478d9498bb913f72673ce..08d23b12b6e44ff253810358c7b0807433ad39d4 100644 (file)
--- a/arch/x86/kernel/cpu/microcode/core.c
+++ b/arch/x86/kernel/cpu/microcode/core.c
@@ -74,12 +74,15 @@
  #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  
  #include <linux/platform_device.h>
+#include <linux/stop_machine.h>
  #include <linux/miscdevice.h>
  #include <linux/capability.h>
  #include <linux/kernel.h>
+#include <linux/delay.h>
  #include <linux/module.h>
  #include <linux/mutex.h>
  #include <linux/cpu.h>
+#include <linux/nmi.h>
  #include <linux/fs.h>
  #include <linux/mm.h>
  #include <linux/syscore_ops.h>
@@ -116,6 +119,11 @@ module_param(dis_ucode_ldr, bool, 0);
   */
  static DEFINE_MUTEX(microcode_mutex);
  
+/*
+ * Taken around the per-CPU update so late loading goes one CPU at a time.
+ */
+static DEFINE_SPINLOCK(update_lock);
+
  struct ucode_cpu_info          ucode_cpu_info[NR_CPUS];
  EXPORT_SYMBOL_GPL(ucode_cpu_info);
  
@@ -326,6 +334,19 @@ MODULE_ALIAS("devname:cpu/microcode");
  /* fake device for request_firmware */
  static struct platform_device  *microcode_pdev;
  
+/*
+ * Late loading dance. Why the heavy-handed stomp_machine effort?
+ *
+ * - HT siblings must be idle and not execute other code while the other sibling
+ *   is loading microcode in order to avoid any negative interactions caused by
+ *   the loading.
+ *
+ * - In addition, microcode update on the cores must be serialized until this
+ *   requirement can be relaxed in the future. Right now, this is conservative
+ *   and good.
+ */
+#define SPINUNIT 100 /* 100 nsec */
+
  static int check_online_cpus(void)
  {
         unsigned int cpu;
@@ -344,31 +365,81 @@ static int check_online_cpus(void)
         return 0;
  }
  
-static int reload_for_cpu(int cpu)
+static atomic_t late_cpus;
+
+/*
+ * stop_machine() callback for late loading; runs on each online CPU.
+ * Returns:
+ *  -1 - rendezvous timed out or the local update reported an error
+ *   1 - the local update ran without reporting an error
+ */
+static int __reload_late(void *info)
  {
-       struct ucode_cpu_info *uci = ucode_cpu_info + cpu;
-       enum ucode_state ustate;
-       int err = 0;
+       unsigned int timeout = NSEC_PER_SEC;
+       int all_cpus = num_online_cpus();
+       int cpu = smp_processor_id();
+       enum ucode_state err;
+       int ret = 0;
  
-       if (!uci->valid)
-               return err;
+       /* Announce arrival: late_cpus reaches 0 once every CPU is here. */
+       atomic_dec(&late_cpus);
+
+       /* Wait for the rest; no load is attempted unless all CPUs show up. */
+       while (atomic_read(&late_cpus)) {
+               if (timeout < SPINUNIT) {
+                       pr_err("Timeout while waiting for CPUs rendezvous, remaining: %d\n",
+                               atomic_read(&late_cpus));
+                       return -1;
+               }
  
-       ustate = microcode_ops->request_microcode_fw(cpu, &microcode_pdev->dev, true);
-       if (ustate == UCODE_OK)
-               apply_microcode_on_target(cpu);
-       else
-               if (ustate == UCODE_ERROR)
-                       err = -EINVAL;
-       return err;
+               ndelay(SPINUNIT);
+               timeout -= SPINUNIT;
+               touch_nmi_watchdog();
+       }
+
+       spin_lock(&update_lock);
+       apply_microcode_local(&err);
+       spin_unlock(&update_lock);
+
+       /* Compare as int: an enum with no negative members may be unsigned. */
+       if ((int)err < 0) {
+               pr_warn("Error reloading microcode on CPU %d\n", cpu);
+               ret = -1;
+       } else {
+               ret = 1;
+       }
+
+       /* Exit barrier: count back up and leave only when all CPUs are done. */
+       atomic_inc(&late_cpus);
+       while (atomic_read(&late_cpus) != all_cpus)
+               cpu_relax();
+
+       return ret;
  }
  
+/*
+ * Late-reload entry point. Arms the rendezvous counter with the number of
+ * online CPUs and then runs __reload_late() on all of them through
+ * stop_machine(), handing its result back to the caller unchanged.
+ */
+static int microcode_reload_late(void)
+{
+       /* __reload_late() polls this counter while the CPUs gather. */
+       atomic_set(&late_cpus, num_online_cpus());
+
+       /* Every online CPU executes the callback; pass its verdict along. */
+       return stop_machine(__reload_late, NULL, cpu_online_mask);
+}
+
+
+
  static ssize_t reload_store(struct device *dev,
                             struct device_attribute *attr,
                             const char *buf, size_t size)
  {
         unsigned long val;
+       ssize_t ret;
         int cpu;
-       ssize_t ret = 0, tmp_ret;
  
         ret = kstrtoul(buf, 0, &val);
         if (ret)
@@ -384,27 +455,30 @@ static ssize_t reload_store(struct device *dev,
                 goto put;
  
         mutex_lock(&microcode_mutex);
-       for_each_online_cpu(cpu) {
-               tmp_ret = reload_for_cpu(cpu);
-               if (tmp_ret != 0)
-                       pr_warn("Error reloading microcode on CPU %d\n", cpu);
  
-               /* save retval of the first encountered reload error */
-               if (!ret)
-                       ret = tmp_ret;
+       for_each_online_cpu(cpu) {
+               ret = microcode_ops->request_microcode_fw(cpu, &microcode_pdev->dev, true);
+               if (ret != UCODE_OK) {
+                       ret = -EINVAL;
+                       goto out;
+               }
         }
-       if (!ret) {
+
+       ret = microcode_reload_late();
+
+       if (ret >= 0) {
                 perf_check_microcode();
                 microcode_late_eval_cpuid_all();
                 microcode_late_select_mitigation();
         }
  
+out:
         mutex_unlock(&microcode_mutex);
  
  put:
         put_online_cpus();
  
-       if (!ret)
+       if (ret >= 0)
                 ret = size;
  
         return ret;
author	Borislav Petkov <bp@suse.de>
	Wed, 8 May 2019 15:10:41 +0000 (11:10 -0400)
committer	Boris Ostrovsky <boris.ostrovsky@oracle.com>
	Wed, 8 May 2019 21:33:34 +0000 (17:33 -0400)