On multi-processor NUMA systems, an I/O driver looks for CPU cores to
which its IRQs can be bound. When the cores in the local NUMA node have
all been used up, it is better for performance to pick cores from the
node closest to the local node, instead of immediately falling back to
any online CPU.
On an arm64 or x86 platform with 2 sockets and 4 NUMA nodes, consider a
network card located in node2 of socket1 whose number of queues exceeds
the number of cores in node2. Once all cores of node2 have been bound to
queues, the remaining queues are bound to the cores of node0, which is
farther away than NUMA node3. That is bad for performance, and also for
Intel's DDIO (Data Direct I/O Technology) when the user enables SNC
(sub-NUMA clustering). Improve this by walking the non-local NUMA nodes
in order of NUMA distance and picking the nearest unused node each time
(a worked example follows the distance table below).
On a Huawei Kunpeng 920 server, there are 4 NUMA nodes (0-3) in the
2-socket system (cpu0 - cpu1). The topology of this server is as follows:
available: 4 nodes (0-3)
node 0 cpus: 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
node 0 size: 63379 MB
node 0 free: 61899 MB
node 1 cpus: 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
node 1 size: 64509 MB
node 1 free: 63942 MB
node 2 cpus: 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71
node 2 size: 64509 MB
node 2 free: 63056 MB
node 3 cpus: 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
node 3 size: 63997 MB
node 3 free: 63420 MB
node distances:
node   0   1   2   3
  0:  10  16  32  33
  1:  16  10  25  32
  2:  32  25  10  16
  3:  33  32  16  10
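To make the selection order concrete, below is a small userspace sketch
(not part of the patch; the program and its names are purely
illustrative) that applies the same greedy nearest-unused-node walk to
the distance matrix above:

#include <stdio.h>
#include <stdbool.h>

#define NR_NODES 4

/* NUMA distance matrix copied from the numactl output above */
static const int dist[NR_NODES][NR_NODES] = {
	{ 10, 16, 32, 33 },
	{ 16, 10, 25, 32 },
	{ 32, 25, 10, 16 },
	{ 33, 32, 16, 10 },
};

/* Greedy policy of the patch: repeatedly pick the nearest unused node */
int main(void)
{
	bool used[NR_NODES] = { false };
	int local = 2;	/* the NIC sits in node2 */
	int step, i;

	printf("spill-over order from node%d:", local);
	for (step = 0; step < NR_NODES; step++) {
		int best = -1;

		for (i = 0; i < NR_NODES; i++)
			if (!used[i] && (best < 0 ||
					 dist[local][i] < dist[local][best]))
				best = i;
		used[best] = true;
		printf(" node%d(%d)", best, dist[local][best]);
	}
	printf("\n");
	return 0;
}

For a NIC in node2 this prints node2(10) node3(16) node1(25) node0(32):
spill-over queues land on node3 first, not on node0 as before.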
We ran a PS (parameter server) workload test: the client initiates a
request through the network card, and the server responds to it after
some computation. When two PS processes run on node2 and node3
respectively, and the network card is located on node2 (which belongs to
cpu1), the performance of node2 (260,000 QPS) and node3 (220,000 QPS)
differs.
It would be better if the NIC queues were bound to the cpu1 cores in
turn, so that XPS is also initialized properly. However,
cpumask_local_spread() only considers the local node: when the number of
NIC queues exceeds the number of cores in the local node, it falls back
to any online core directly. So when the PS process on node3 sends a
computed response, its performance is not as good as node2's.
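For context, the driver-side set-up that relies on this behaviour
typically looks like the sketch below. The foo_* structure and function
are hypothetical, but cpumask_local_spread() and irq_set_affinity_hint()
are the existing kernel APIs such a driver would use:

#include <linux/cpumask.h>
#include <linux/interrupt.h>

/* Hypothetical per-device state, for illustration only */
struct foo_priv {
	int num_queues;
	int numa_node;		/* node the NIC is attached to */
	unsigned int *irqs;	/* one IRQ per queue */
};

/*
 * Spread the per-queue IRQ affinity hints: queue q is given the q'th
 * CPU that cpumask_local_spread() hands out for the NIC's node, so the
 * quality of that spreading is exactly what this patch improves.
 */
static void foo_set_irq_affinity(struct foo_priv *priv)
{
	int q;

	for (q = 0; q < priv->num_queues; q++) {
		unsigned int cpu = cpumask_local_spread(q, priv->numa_node);

		irq_set_affinity_hint(priv->irqs[q], cpumask_of(cpu));
	}
}

Because the queue index is passed straight through as i, whatever CPU
order cpumask_local_spread() enumerates becomes the IRQ spreading order
shown in the smp_affinity_list output below.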
With this patch, IRQs 369-392 are bound to the cores of NUMA node3
instead of NUMA node0. Before the patch:
Euler:/sys/bus/pci # cat /proc/irq/369/smp_affinity_list
0
Euler:/sys/bus/pci # cat /proc/irq/370/smp_affinity_list
1
...
Euler:/sys/bus/pci # cat /proc/irq/391/smp_affinity_list
22
Euler:/sys/bus/pci # cat /proc/irq/392/smp_affinity_list
23
After the patch:
Euler:/sys/bus/pci # cat /proc/irq/369/smp_affinity_list
72
Euler:/sys/bus/pci # cat /proc/irq/370/smp_affinity_list
73
...
Euler:/sys/bus/pci # cat /proc/irq/391/smp_affinity_list
94
Euler:/sys/bus/pci # cat /proc/irq/392/smp_affinity_list
95
With the patch, while the network card is still in node2, node3 reaches
the same performance as node2, i.e. 260,000 QPS.
Link: https://lkml.kernel.org/r/1605668072-44780-1-git-send-email-zhangshaokun@hisilicon.com
Signed-off-by: Yuqi Jin <jinyuqi@huawei.com>
Signed-off-by: Shaokun Zhang <zhangshaokun@hisilicon.com>
Cc: Dave Hansen <dave.hansen@intel.com>
Cc: Rusty Russell <rusty@rustcorp.com.au>
Cc: Juergen Gross <jgross@suse.com>
Cc: Paul Burton <paul.burton@mips.com>
Cc: Michal Hocko <mhocko@suse.com>
Cc: Michael Ellerman <mpe@ellerman.id.au>
Cc: Mike Rapoport <rppt@linux.ibm.com>
Cc: Anshuman Khandual <anshuman.khandual@arm.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
}
#endif
+static int find_nearest_node(int node, bool *used)
+{
+	int i, min_dist, node_id = -1;
+
+	/* Choose the first unused node as the starting candidate */
+	for (i = 0; i < nr_node_ids; i++) {
+		if (!used[i]) {
+			min_dist = node_distance(node, i);
+			node_id = i;
+			break;
+		}
+	}
+	/* All nodes have already been used */
+	if (node_id < 0)
+		return -1;
+
+	/* Keep the nearest of the remaining unused nodes */
+	for (i = 0; i < nr_node_ids; i++) {
+		if (!used[i] && node_distance(node, i) < min_dist) {
+			min_dist = node_distance(node, i);
+			node_id = i;
+		}
+	}
+
+	return node_id;
+}
+
/**
* cpumask_local_spread - select the i'th cpu with local numa cpu's first
* @i: index number
* @node: local numa_node
*
* This function selects an online CPU according to a numa aware policy;
- * local cpus are returned first, followed by non-local ones, then it
- * wraps around.
+ * local cpus are returned first, followed by cpus from the nearest unused
+ * NUMA node based on NUMA distance, then it wraps around.
*
* It's not very efficient, but useful for setup.
*/
unsigned int cpumask_local_spread(unsigned int i, int node)
{
-	int cpu, hk_flags;
+	static DEFINE_SPINLOCK(spread_lock);
+	static bool used[MAX_NUMNODES];
+	unsigned long flags;
+	int cpu, hk_flags, j, id;
 	const struct cpumask *mask;
hk_flags = HK_FLAG_DOMAIN | HK_FLAG_MANAGED_IRQ;
return cpu;
}
 	} else {
-		/* NUMA first. */
-		for_each_cpu_and(cpu, cpumask_of_node(node), mask) {
-			if (i-- == 0)
-				return cpu;
+		spin_lock_irqsave(&spread_lock, flags);
+		memset(used, 0, nr_node_ids * sizeof(bool));
+		/* Visit nodes in order of increasing distance from @node */
+		for (j = 0; j < nr_node_ids; j++) {
+			id = find_nearest_node(node, used);
+			if (id < 0)
+				break;
+
+			for_each_cpu_and(cpu, cpumask_of_node(id), mask)
+				if (i-- == 0) {
+					spin_unlock_irqrestore(&spread_lock,
+							       flags);
+					return cpu;
+				}
+			used[id] = true;
 		}
+		spin_unlock_irqrestore(&spread_lock, flags);

-		for_each_cpu(cpu, mask) {
-			/* Skip NUMA nodes, done above. */
-			if (cpumask_test_cpu(cpu, cpumask_of_node(node)))
-				continue;
-
+		for_each_cpu(cpu, mask)
 			if (i-- == 0)
 				return cpu;
-		}
 	}
BUG();
}