mm, slub: sheaf prefilling for guaranteed allocations

author Vlastimil Babka <vbabka@suse.cz>

Tue, 5 Nov 2024 16:00:08 +0000 (17:00 +0100)

committer Vlastimil Babka <vbabka@suse.cz>

Fri, 17 Jan 2025 18:33:39 +0000 (19:33 +0100)
author Vlastimil Babka <vbabka@suse.cz>
Tue, 5 Nov 2024 16:00:08 +0000 (17:00 +0100)
committer Vlastimil Babka <vbabka@suse.cz>
Fri, 17 Jan 2025 18:33:39 +0000 (19:33 +0100)
diff --git a/include/linux/slab.h b/include/linux/slab.h

index 55e0e4f16ede1394bda1f9efe9eb7e512fef5af5..7e7efb5da3edbcb5a75b561d1d3b9752a367862d 100644 (file)
--- a/include/linux/slab.h
+++ b/include/linux/slab.h
@@ -843,6 +843,22 @@ void *kmem_cache_alloc_node_noprof(struct kmem_cache *s, gfp_t flags,
                                    int node) __assume_slab_alignment __malloc;
  #define kmem_cache_alloc_node(...)     alloc_hooks(kmem_cache_alloc_node_noprof(__VA_ARGS__))
  
+struct slab_sheaf *
+kmem_cache_prefill_sheaf(struct kmem_cache *s, gfp_t gfp, unsigned int count);
+
+int kmem_cache_refill_sheaf(struct kmem_cache *s, gfp_t gfp,
+               struct slab_sheaf *sheaf);
+
+void kmem_cache_return_sheaf(struct kmem_cache *s, gfp_t gfp,
+                                      struct slab_sheaf *sheaf);
+
+void *kmem_cache_alloc_from_sheaf_noprof(struct kmem_cache *cachep, gfp_t gfp,
+                       struct slab_sheaf *sheaf) __assume_slab_alignment __malloc;
+#define kmem_cache_alloc_from_sheaf(...)       \
+                       alloc_hooks(kmem_cache_alloc_from_sheaf_noprof(__VA_ARGS__))
+
+unsigned int kmem_cache_sheaf_count(struct slab_sheaf *sheaf);
+
  /*
   * These macros allow declaring a kmem_buckets * parameter alongside size, which
   * can be compiled out with CONFIG_SLAB_BUCKETS=n so that a large number of call
diff --git a/mm/slub.c b/mm/slub.c

index b71e560e818e8a423111d6ded004fcf07d52ed86..a03cf92718d1625c61e85032142f6e86fb19e209 100644 (file)
--- a/mm/slub.c
+++ b/mm/slub.c
@@ -442,6 +442,7 @@ struct slab_sheaf {
         union {
                 struct rcu_head rcu_head;
                 struct list_head barn_list;
+               bool oversize;
         };
         struct kmem_cache *cache;
         unsigned int size;
@@ -2830,6 +2831,30 @@ static int barn_put_full_sheaf(struct node_barn *barn, struct slab_sheaf *sheaf,
         return ret;
  }
  
+static struct slab_sheaf *barn_get_full_or_empty_sheaf(struct node_barn *barn)
+{
+       struct slab_sheaf *sheaf = NULL;
+       unsigned long flags;
+
+       spin_lock_irqsave(&barn->lock, flags);
+
+       if (barn->nr_full) {
+               sheaf = list_first_entry(&barn->sheaves_full, struct slab_sheaf,
+                                       barn_list);
+               list_del(&sheaf->barn_list);
+               barn->nr_full--;
+       } else if (barn->nr_empty) {
+               sheaf = list_first_entry(&barn->sheaves_empty,
+                                        struct slab_sheaf, barn_list);
+               list_del(&sheaf->barn_list);
+               barn->nr_empty--;
+       }
+
+       spin_unlock_irqrestore(&barn->lock, flags);
+
+       return sheaf;
+}
+
  /*
   * If a full sheaf is available, return it and put the supplied empty one to
   * barn. We ignore the limit on empty sheaves as the number of sheaves doesn't
@@ -4927,6 +4952,145 @@ void *kmem_cache_alloc_node_noprof(struct kmem_cache *s, gfp_t gfpflags, int nod
  }
  EXPORT_SYMBOL(kmem_cache_alloc_node_noprof);
  
+
+/*
+ * returns a sheaf that has least the given count of objects
+ * when prefilling is needed, do so with given gfp flags
+ *
+ * return NULL if prefilling failed, or when the requested count is
+ * above cache's sheaf_capacity (TODO: lift this limitation)
+ */
+struct slab_sheaf *
+kmem_cache_prefill_sheaf(struct kmem_cache *s, gfp_t gfp, unsigned int count)
+{
+       struct slub_percpu_sheaves *pcs;
+       struct slab_sheaf *sheaf = NULL;
+
+       //TODO: handle via oversize sheaf
+       if (count > s->sheaf_capacity)
+               return NULL;
+
+       pcs = cpu_sheaves_lock(s->cpu_sheaves);
+
+       if (pcs->spare) {
+               sheaf = pcs->spare;
+               pcs->spare = NULL;
+       }
+
+       if (!sheaf)
+               sheaf = barn_get_full_or_empty_sheaf(pcs->barn);
+
+       cpu_sheaves_unlock(s->cpu_sheaves);
+
+       if (!sheaf) {
+               sheaf = alloc_empty_sheaf(s, gfp);
+       }
+
+       if (sheaf && sheaf->size < count) {
+               if (refill_sheaf(s, sheaf, gfp)) {
+                       sheaf_flush(s, sheaf);
+                       free_empty_sheaf(s, sheaf);
+                       sheaf = NULL;
+               }
+       }
+
+       return sheaf;
+}
+
+int kmem_cache_refill_sheaf(struct kmem_cache *s, gfp_t gfp,
+                struct slab_sheaf *sheaf)
+{
+       if (!sheaf)
+               return -EINVAL;
+
+       //TODO: handle via oversize sheaf
+       //TODO: handle failures
+       refill_sheaf(s, sheaf, gfp);
+       return 0;
+}
+
+/*
+ * Use this to return a sheaf obtained by kmem_cache_prefill_sheaf()
+ * It tries to refill the sheaf back to the cache's sheaf_capacity
+ * to avoid handling partially full sheaves.
+ *
+ * If the refill fails because gfp is e.g. GFP_NOWAIT, the sheaf is
+ * instead dissolved
+ */
+void kmem_cache_return_sheaf(struct kmem_cache *s, gfp_t gfp,
+                            struct slab_sheaf *sheaf)
+{
+       struct slub_percpu_sheaves *pcs;
+       bool refill = false;
+       struct node_barn *barn;
+
+       //TODO: handle oversize sheaf
+
+       pcs = cpu_sheaves_lock(s->cpu_sheaves);
+
+       if (!pcs->spare) {
+               pcs->spare = sheaf;
+               sheaf = NULL;
+       } else if (pcs->barn->nr_full >= MAX_FULL_SHEAVES) {
+               /* racy check */
+               barn = pcs->barn;
+               refill = true;
+       }
+
+       cpu_sheaves_unlock(s->cpu_sheaves);
+
+       if (!sheaf)
+               return;
+
+       /*
+        * if the barn is full of full sheaves or we fail to refill the sheaf,
+        * simply flush and free it
+        */
+       if (!refill || refill_sheaf(s, sheaf, gfp)) {
+               sheaf_flush(s, sheaf);
+               free_empty_sheaf(s, sheaf);
+               return;
+       }
+
+       /* we racily determined the sheaf would fit, so now force it */
+       barn_put_full_sheaf(barn, sheaf, true);
+}
+
+/*
+ * Allocate from a sheaf obtained by kmem_cache_prefill_sheaf()
+ *
+ * Guaranteed not to fail as many allocations as was the requested count.
+ * After the sheaf is emptied, it fails - no fallback to the slab cache itself.
+ *
+ * The gfp parameter is meant only to specify __GFP_ZERO or __GFP_ACCOUNT
+ * memcg charging is forced over limit if necessary, to avoid failure.
+ */
+void *
+kmem_cache_alloc_from_sheaf_noprof(struct kmem_cache *s, gfp_t gfp,
+                                  struct slab_sheaf *sheaf)
+{
+       void *ret = NULL;
+       bool init;
+
+       if (sheaf->size == 0)
+               goto out;
+
+       ret = sheaf->objects[--sheaf->size];
+
+       init = slab_want_init_on_alloc(gfp, s);
+
+       /* add __GFP_NOFAIL to force successful memcg charging */
+       slab_post_alloc_hook(s, NULL, gfp | __GFP_NOFAIL, 1, &ret, init, s->object_size);
+out:
+       trace_kmem_cache_alloc(_RET_IP_, ret, s, gfp, NUMA_NO_NODE);
+
+       return ret;
+}
+
+unsigned int kmem_cache_sheaf_count(struct slab_sheaf *sheaf)
+{
+       return sheaf->size;
+}
  /*
   * To avoid unnecessary overhead, we pass through large allocation requests
   * directly to the page allocator. We use __GFP_COMP, because we will need to
author	Vlastimil Babka <vbabka@suse.cz>
	Tue, 5 Nov 2024 16:00:08 +0000 (17:00 +0100)
committer	Vlastimil Babka <vbabka@suse.cz>
	Fri, 17 Jan 2025 18:33:39 +0000 (19:33 +0100)
include/linux/slab.h		patch \| blob \| history
mm/slub.c		patch \| blob \| history