mm, swap: do not perform synchronous discard during allocation

author Kairui Song <kasong@tencent.com>

Mon, 6 Oct 2025 20:02:33 +0000 (04:02 +0800)

committer Andrew Morton <akpm@linux-foundation.org>

Wed, 15 Oct 2025 04:28:31 +0000 (21:28 -0700)
author Kairui Song <kasong@tencent.com>
Mon, 6 Oct 2025 20:02:33 +0000 (04:02 +0800)
committer Andrew Morton <akpm@linux-foundation.org>
Wed, 15 Oct 2025 04:28:31 +0000 (21:28 -0700)
diff --git a/mm/swapfile.c b/mm/swapfile.c

index cb2392ed8e0ebe83808a54510f434e3801716407..0d1924f6f49584268416cddd01a5430739e5d62c 100644 (file)
--- a/mm/swapfile.c
+++ b/mm/swapfile.c
@@ -1101,13 +1101,6 @@ new_cluster:
                         goto done;
         }
  
-       /*
-        * We don't have free cluster but have some clusters in discarding,
-        * do discard now and reclaim them.
-        */
-       if ((si->flags & SWP_PAGE_DISCARD) && swap_do_scheduled_discard(si))
-               goto new_cluster;
-
         if (order)
                 goto done;
  
@@ -1394,6 +1387,33 @@ start_over:
         return false;
  }
  
+/*
+ * Synchronously discard pending clusters; used when under high pressure.
+ *
+ * Walks the swap devices on the current NUMA node's available list and, for
+ * each one that has SWP_PAGE_DISCARD set, calls swap_do_scheduled_discard().
+ * The walk stops at the first device for which that call returns true.
+ *
+ * swap_avail_lock is dropped around the per-device work and retaken before
+ * advancing to the next list entry.
+ *
+ * Return: true if any cluster is discarded.
+ */
+static bool swap_sync_discard(void)
+{
+       bool ret = false;
+       int nid = numa_node_id();
+       struct swap_info_struct *si, *next;
+
+       spin_lock(&swap_avail_lock);
+       plist_for_each_entry_safe(si, next, &swap_avail_heads[nid], avail_lists[nid]) {
+               spin_unlock(&swap_avail_lock);
+               if (get_swap_device_info(si)) {
+                       if (si->flags & SWP_PAGE_DISCARD)
+                               ret = swap_do_scheduled_discard(si);
+                       put_swap_device(si);
+               }
+               if (ret) {
+                       /*
+                        * swap_avail_lock was dropped at the top of this
+                        * iteration and is not held here, so return directly
+                        * instead of falling through to the unlock below.
+                        */
+                       return true;
+               }
+               spin_lock(&swap_avail_lock);
+       }
+       /* Normal loop exit: the lock is held, either from before the loop
+        * or from the end of the last iteration. */
+       spin_unlock(&swap_avail_lock);
+
+       return false;
+}
+
+
  /**
   * folio_alloc_swap - allocate swap space for a folio
   * @folio: folio we want to move to swap
@@ -1432,11 +1452,17 @@ int folio_alloc_swap(struct folio *folio, gfp_t gfp)
                 }
         }
  
+again:
         local_lock(&percpu_swap_cluster.lock);
         if (!swap_alloc_fast(&entry, order))
                 swap_alloc_slow(&entry, order);
         local_unlock(&percpu_swap_cluster.lock);
  
+       if (unlikely(!order && !entry.val)) {
+               if (swap_sync_discard())
+                       goto again;
+       }
+
         /* Need to call this even if allocation failed, for MEMCG_SWAP_FAIL. */
         if (mem_cgroup_try_charge_swap(folio, entry))
                 goto out_free;
author	Kairui Song <kasong@tencent.com>
	Mon, 6 Oct 2025 20:02:33 +0000 (04:02 +0800)
committer	Andrew Morton <akpm@linux-foundation.org>
	Wed, 15 Oct 2025 04:28:31 +0000 (21:28 -0700)