percpu: implement [__]alloc_percpu_gfp()

author Tejun Heo <tj@kernel.org>

Tue, 2 Sep 2014 18:46:04 +0000 (14:46 -0400)

committer Tejun Heo <tj@kernel.org>

Tue, 2 Sep 2014 18:46:04 +0000 (14:46 -0400)
author Tejun Heo <tj@kernel.org>
Tue, 2 Sep 2014 18:46:04 +0000 (14:46 -0400)
committer Tejun Heo <tj@kernel.org>
Tue, 2 Sep 2014 18:46:04 +0000 (14:46 -0400)
diff --git a/include/linux/percpu.h b/include/linux/percpu.h

index 6f61b61b7996a8f248af9eb64139a5f9bfc52c7c..d1b416da25ed40029fdbcc85a81375a96ab01d81 100644 (file)
--- a/include/linux/percpu.h
+++ b/include/linux/percpu.h
@@ -122,11 +122,16 @@ extern void __init setup_per_cpu_areas(void);
  #endif
  extern void __init percpu_init_late(void);
  
+extern void __percpu *__alloc_percpu_gfp(size_t size, size_t align, gfp_t gfp);
  extern void __percpu *__alloc_percpu(size_t size, size_t align);
  extern void free_percpu(void __percpu *__pdata);
  extern phys_addr_t per_cpu_ptr_to_phys(void *addr);
  
-#define alloc_percpu(type)     \
-       (typeof(type) __percpu *)__alloc_percpu(sizeof(type), __alignof__(type))
+#define alloc_percpu_gfp(type, gfp)                                    \
+       (typeof(type) __percpu *)__alloc_percpu_gfp(sizeof(type),       \
+                                               __alignof__(type), gfp)
+#define alloc_percpu(type)                                             \
+       (typeof(type) __percpu *)__alloc_percpu(sizeof(type),           \
+                                               __alignof__(type))
  
  #endif /* __LINUX_PERCPU_H */
diff --git a/mm/percpu.c b/mm/percpu.c

index 577d84fb30023b33972b1a01b593a7c541038a4e..c52b93117dc20a0a28d545c633e90dc538a57f4c 100644 (file)
--- a/mm/percpu.c
+++ b/mm/percpu.c
@@ -151,11 +151,6 @@ static struct pcpu_chunk *pcpu_first_chunk;
  static struct pcpu_chunk *pcpu_reserved_chunk;
  static int pcpu_reserved_chunk_limit;
  
-/*
- * Free path accesses and alters only the index data structures and can be
- * safely called from atomic context.  When memory needs to be returned to
- * the system, free path schedules reclaim_work.
- */
  static DEFINE_SPINLOCK(pcpu_lock);     /* all internal data structures */
  static DEFINE_MUTEX(pcpu_alloc_mutex); /* chunk create/destroy, [de]pop */
  
@@ -727,20 +722,21 @@ static struct pcpu_chunk *pcpu_chunk_addr_search(void *addr)
   * @size: size of area to allocate in bytes
   * @align: alignment of area (max PAGE_SIZE)
   * @reserved: allocate from the reserved chunk if available
+ * @gfp: allocation flags
   *
- * Allocate percpu area of @size bytes aligned at @align.
- *
- * CONTEXT:
- * Does GFP_KERNEL allocation.
+ * Allocate percpu area of @size bytes aligned at @align.  If @gfp doesn't
+ * contain %GFP_KERNEL, the allocation is atomic.
   *
   * RETURNS:
   * Percpu pointer to the allocated area on success, NULL on failure.
   */
-static void __percpu *pcpu_alloc(size_t size, size_t align, bool reserved)
+static void __percpu *pcpu_alloc(size_t size, size_t align, bool reserved,
+                                gfp_t gfp)
  {
         static int warn_limit = 10;
         struct pcpu_chunk *chunk;
         const char *err;
+       bool is_atomic = !(gfp & GFP_KERNEL);
         int slot, off, new_alloc, cpu, ret;
         unsigned long flags;
         void __percpu *ptr;
@@ -773,14 +769,15 @@ static void __percpu *pcpu_alloc(size_t size, size_t align, bool reserved)
  
                 while ((new_alloc = pcpu_need_to_extend(chunk))) {
                         spin_unlock_irqrestore(&pcpu_lock, flags);
-                       if (pcpu_extend_area_map(chunk, new_alloc) < 0) {
+                       if (is_atomic ||
+                           pcpu_extend_area_map(chunk, new_alloc) < 0) {
                                 err = "failed to extend area map of reserved chunk";
                                 goto fail;
                         }
                         spin_lock_irqsave(&pcpu_lock, flags);
                 }
  
-               off = pcpu_alloc_area(chunk, size, align, false);
+               off = pcpu_alloc_area(chunk, size, align, is_atomic);
                 if (off >= 0)
                         goto area_found;
  
@@ -797,6 +794,8 @@ restart:
  
                         new_alloc = pcpu_need_to_extend(chunk);
                         if (new_alloc) {
+                               if (is_atomic)
+                                       continue;
                                 spin_unlock_irqrestore(&pcpu_lock, flags);
                                 if (pcpu_extend_area_map(chunk,
                                                          new_alloc) < 0) {
@@ -811,7 +810,7 @@ restart:
                                 goto restart;
                         }
  
-                       off = pcpu_alloc_area(chunk, size, align, false);
+                       off = pcpu_alloc_area(chunk, size, align, is_atomic);
                         if (off >= 0)
                                 goto area_found;
                 }
@@ -824,6 +823,9 @@ restart:
          * tasks to create chunks simultaneously.  Serialize and create iff
          * there's still no empty chunk after grabbing the mutex.
          */
+       if (is_atomic)
+               goto fail;
+
         mutex_lock(&pcpu_alloc_mutex);
  
         if (list_empty(&pcpu_slot[pcpu_nr_slots - 1])) {
@@ -846,7 +848,7 @@ area_found:
         spin_unlock_irqrestore(&pcpu_lock, flags);
  
         /* populate if not all pages are already there */
-       if (true) {
+       if (!is_atomic) {
                 int page_start, page_end, rs, re;
  
                 mutex_lock(&pcpu_alloc_mutex);
@@ -884,9 +886,9 @@ area_found:
  fail_unlock:
         spin_unlock_irqrestore(&pcpu_lock, flags);
  fail:
-       if (warn_limit) {
-               pr_warning("PERCPU: allocation failed, size=%zu align=%zu, "
-                          "%s\n", size, align, err);
+       if (!is_atomic && warn_limit) {
+               pr_warning("PERCPU: allocation failed, size=%zu align=%zu atomic=%d, %s\n",
+                          size, align, is_atomic, err);
                 dump_stack();
                 if (!--warn_limit)
                         pr_info("PERCPU: limit reached, disable warning\n");
@@ -895,22 +897,34 @@ fail:
  }
  
  /**
- * __alloc_percpu - allocate dynamic percpu area
+ * __alloc_percpu_gfp - allocate dynamic percpu area
   * @size: size of area to allocate in bytes
   * @align: alignment of area (max PAGE_SIZE)
+ * @gfp: allocation flags
   *
- * Allocate zero-filled percpu area of @size bytes aligned at @align.
- * Might sleep.  Might trigger writeouts.
- *
- * CONTEXT:
- * Does GFP_KERNEL allocation.
+ * Allocate zero-filled percpu area of @size bytes aligned at @align.  If
+ * @gfp doesn't contain %GFP_KERNEL, the allocation doesn't block and can
+ * be called from any context but is a lot more likely to fail.
   *
   * RETURNS:
   * Percpu pointer to the allocated area on success, NULL on failure.
   */
+void __percpu *__alloc_percpu_gfp(size_t size, size_t align, gfp_t gfp)
+{
+       return pcpu_alloc(size, align, false, gfp);
+}
+EXPORT_SYMBOL_GPL(__alloc_percpu_gfp);
+
+/**
+ * __alloc_percpu - allocate dynamic percpu area
+ * @size: size of area to allocate in bytes
+ * @align: alignment of area (max PAGE_SIZE)
+ *
+ * Equivalent to __alloc_percpu_gfp(size, align, %GFP_KERNEL).
+ */
  void __percpu *__alloc_percpu(size_t size, size_t align)
  {
-       return pcpu_alloc(size, align, false);
+       return pcpu_alloc(size, align, false, GFP_KERNEL);
  }
  EXPORT_SYMBOL_GPL(__alloc_percpu);
  
@@ -932,7 +946,7 @@ EXPORT_SYMBOL_GPL(__alloc_percpu);
   */
  void __percpu *__alloc_reserved_percpu(size_t size, size_t align)
  {
-       return pcpu_alloc(size, align, true);
+       return pcpu_alloc(size, align, true, GFP_KERNEL);
  }
  
  /**
author	Tejun Heo <tj@kernel.org>
	Tue, 2 Sep 2014 18:46:04 +0000 (14:46 -0400)
committer	Tejun Heo <tj@kernel.org>
	Tue, 2 Sep 2014 18:46:04 +0000 (14:46 -0400)
include/linux/percpu.h		patch | blob | history
mm/percpu.c		patch | blob | history