mm, swap: prefer nonfull over free clusters
Author:     Kairui Song <kasong@tencent.com>
AuthorDate: Wed, 6 Aug 2025 16:17:48 +0000 (00:17 +0800)
Commit:     Andrew Morton <akpm@linux-foundation.org>
CommitDate: Fri, 12 Sep 2025 00:24:38 +0000 (17:24 -0700)
We prefer a free cluster over a nonfull cluster whenever the CPU-local
cluster is drained, to respect the SSD discard behavior [1].  That is
not a good strategy for non-discarding devices, and it causes a higher
fragmentation rate.

So, for a non-discarding device, prefer nonfull clusters over free
clusters.  This greatly reduces fragmentation.
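
As a minimal sketch of the resulting preference order (illustrative
only; pick_cluster and the availability flags are hypothetical, not
the kernel's API, and the real code also gates the nonfull/frag scan
on order < PMD_ORDER):

#include <stdbool.h>
#include <stdio.h>

/* Stand-ins for si->free_clusters and si->nonfull_clusters[order] */
enum cluster_list { FREE_LIST, NONFULL_LIST, NONE };

/*
 * A device that discards (SWP_PAGE_DISCARD) takes a free cluster
 * first to spread out writes; a non-discarding device fills nonfull
 * clusters first to reduce fragmentation, and only then takes a
 * free cluster.
 */
static enum cluster_list pick_cluster(bool page_discard,
				      bool free_avail, bool nonfull_avail)
{
	if (page_discard && free_avail)
		return FREE_LIST;
	if (nonfull_avail)
		return NONFULL_LIST;
	if (free_avail)
		return FREE_LIST;
	return NONE;	/* caller falls back to frag list / reclaim */
}

int main(void)
{
	/* discarding SSD picks FREE_LIST (0), ZRAM picks NONFULL_LIST (1) */
	printf("%d %d\n", pick_cluster(true, true, true),
	       pick_cluster(false, true, true));
	return 0;
}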

Testing with make -j96, defconfig, using 64k mTHP, 8G ZRAM:

Before: sys time: 6176.34s  64kB/swpout: 1659757  64kB/swpout_fallback: 139503
After:  sys time: 6194.11s  64kB/swpout: 1689470  64kB/swpout_fallback: 56147

Testing with make -j96, defconfig, using 64k mTHP, 10G ZRAM:

Before: sys time: 5531.49s  64kB/swpout: 1791142  64kB/swpout_fallback: 17676
After:  sys time: 5587.53s  64kB/swpout: 1811598  64kB/swpout_fallback: 0

Performance is basically unchanged, and the large allocation failure
rate is lower. Enabling all mTHP sizes shows an even more significant
improvement.

Using the same test setup with 10G ZRAM and enabling all mTHP sizes:

128kB swap failure rate:
Before: swpout:451599 swpout_fallback:54525
After:  swpout:502710 swpout_fallback:870

256kB swap failure rate:
Before: swpout:63652  swpout_fallback:2708
After:  swpout:65913  swpout_fallback:20

512kB swap failure rate:
Before: swpout:11663  swpout_fallback:1767
After:  swpout:14480  swpout_fallback:6

2M swap failure rate:
Before: swpout:24     swpout_fallback:1442
After:  swpout:1329   swpout_fallback:7

The success rate of large allocations is much higher.
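
For concreteness, a small stand-alone helper (hypothetical, not part
of this patch) that turns the counters above into fallback
percentages:

#include <stdio.h>

/* fallback rate = swpout_fallback / (swpout + swpout_fallback) */
static double fallback_pct(unsigned long swpout, unsigned long fallback)
{
	return 100.0 * fallback / (double)(swpout + fallback);
}

int main(void)
{
	/* 2M counters quoted above: ~98.4% before, ~0.5% after */
	printf("before: %.1f%%\n", fallback_pct(24, 1442));
	printf("after:  %.1f%%\n", fallback_pct(1329, 7));
	return 0;
}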

Link: https://lore.kernel.org/linux-mm/87v8242vng.fsf@yhuang6-desk2.ccr.corp.intel.com/ [1]
Link: https://lkml.kernel.org/r/20250806161748.76651-4-ryncsn@gmail.com
Signed-off-by: Kairui Song <kasong@tencent.com>
Acked-by: Chris Li <chrisl@kernel.org>
Reviewed-by: Nhat Pham <nphamcs@gmail.com>
Cc: Baoquan He <bhe@redhat.com>
Cc: Barry Song <baohua@kernel.org>
Cc: "Huang, Ying" <ying.huang@linux.alibaba.com>
Cc: Kemeng Shi <shikemeng@huaweicloud.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
mm/swapfile.c

index 5fdb3cb2b8b7ab020dbe0a309ff6334146d0b749..4a0cf4fb348df386928be3a9d57be66a85a76267 100644
@@ -908,18 +908,20 @@ static unsigned long cluster_alloc_swap_entry(struct swap_info_struct *si, int o
        }
 
 new_cluster:
-       ci = isolate_lock_cluster(si, &si->free_clusters);
-       if (ci) {
-               found = alloc_swap_scan_cluster(si, ci, cluster_offset(si, ci),
-                                               order, usage);
-               if (found)
-                       goto done;
+       /*
+        * If the device needs discard, prefer a new cluster over nonfull
+        * to spread out the writes.
+        */
+       if (si->flags & SWP_PAGE_DISCARD) {
+               ci = isolate_lock_cluster(si, &si->free_clusters);
+               if (ci) {
+                       found = alloc_swap_scan_cluster(si, ci, cluster_offset(si, ci),
+                                                       order, usage);
+                       if (found)
+                               goto done;
+               }
        }
 
-       /* Try reclaim from full clusters if free clusters list is drained */
-       if (vm_swap_full())
-               swap_reclaim_full_clusters(si, false);
-
        if (order < PMD_ORDER) {
                while ((ci = isolate_lock_cluster(si, &si->nonfull_clusters[order]))) {
                        found = alloc_swap_scan_cluster(si, ci, cluster_offset(si, ci),
@@ -927,7 +929,23 @@ new_cluster:
                        if (found)
                                goto done;
                }
+       }
 
+       if (!(si->flags & SWP_PAGE_DISCARD)) {
+               ci = isolate_lock_cluster(si, &si->free_clusters);
+               if (ci) {
+                       found = alloc_swap_scan_cluster(si, ci, cluster_offset(si, ci),
+                                                       order, usage);
+                       if (found)
+                               goto done;
+               }
+       }
+
+       /* Try reclaiming full clusters if the free and nonfull lists are drained */
+       if (vm_swap_full())
+               swap_reclaim_full_clusters(si, false);
+
+       if (order < PMD_ORDER) {
                /*
                 * Scan only one fragment cluster is good enough. Order 0
                 * allocation will surely success, and large allocation