mm: handle swap page faults under per-VMA lock
author     Suren Baghdasaryan <surenb@google.com>
           Fri, 30 Jun 2023 21:19:56 +0000 (14:19 -0700)
committer  Andrew Morton <akpm@linux-foundation.org>
           Thu, 24 Aug 2023 23:20:17 +0000 (16:20 -0700)
When a page fault is handled under per-VMA lock protection, all swap page
faults are retried with mmap_lock because folio_lock_or_retry has to drop
and reacquire mmap_lock if the folio cannot be locked immediately.  Follow
the same pattern as with mmap_lock: drop the per-VMA lock while waiting
for the folio and retry once the folio is available.
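For context, a minimal sketch of the caller side of this pattern, as seen
from an arch page fault handler (simplified from the shape of
arch/x86/mm/fault.c; error handling and accounting omitted): the fault is
first attempted under the per-VMA read lock, and VM_FAULT_RETRY sends it
down the mmap_lock path.

	/* Try the fault under the per-VMA read lock first. */
	vma = lock_vma_under_rcu(mm, address);
	if (vma) {
		fault = handle_mm_fault(vma, address,
					flags | FAULT_FLAG_VMA_LOCK, regs);
		if (!(fault & (VM_FAULT_RETRY | VM_FAULT_COMPLETED)))
			vma_end_read(vma); /* on retry the handler dropped it */
		if (!(fault & VM_FAULT_RETRY))
			goto done;
	}
	/* Fall back to the traditional mmap_lock-protected path. */
	mmap_read_lock(mm);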

With this obstacle removed, enable do_swap_page to operate under per-VMA
lock protection.  Drivers implementing ops->migrate_to_ram might still
rely on mmap_lock, therefore we have to fall back to mmap_lock in that
particular case.

Note that the only time do_swap_page calls synchronous swap_readpage is
when SWP_SYNCHRONOUS_IO is set, which is only set for
QUEUE_FLAG_SYNCHRONOUS devices: brd, zram and nvdimms (both btt and pmem).
Therefore we don't sleep in this path, and there's no need to drop the
mmap or per-VMA lock.
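For reference, a simplified excerpt of the gate in question in
do_swap_page (swap-cache and allocation details elided; see mm/memory.c
for the real code):

	/*
	 * The swap cache is bypassed only for SWP_SYNCHRONOUS_IO devices
	 * with a single swap reference; the read completes synchronously,
	 * so this path never sleeps on I/O.
	 */
	if (data_race(si->flags & SWP_SYNCHRONOUS_IO) &&
	    __swap_count(entry) == 1) {
		/* skip swapcache */
		...
		swap_readpage(page, true, NULL);
	}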

Link: https://lkml.kernel.org/r/20230630211957.1341547-6-surenb@google.com
Signed-off-by: Suren Baghdasaryan <surenb@google.com>
Tested-by: Alistair Popple <apopple@nvidia.com>
Reviewed-by: Alistair Popple <apopple@nvidia.com>
Acked-by: Peter Xu <peterx@redhat.com>
Cc: Al Viro <viro@zeniv.linux.org.uk>
Cc: Christian Brauner <brauner@kernel.org>
Cc: Christoph Hellwig <hch@lst.de>
Cc: David Hildenbrand <david@redhat.com>
Cc: David Howells <dhowells@redhat.com>
Cc: Davidlohr Bueso <dave@stgolabs.net>
Cc: Hillf Danton <hdanton@sina.com>
Cc: "Huang, Ying" <ying.huang@intel.com>
Cc: Hugh Dickins <hughd@google.com>
Cc: Jan Kara <jack@suse.cz>
Cc: Johannes Weiner <hannes@cmpxchg.org>
Cc: Josef Bacik <josef@toxicpanda.com>
Cc: Laurent Dufour <ldufour@linux.ibm.com>
Cc: Liam R. Howlett <Liam.Howlett@oracle.com>
Cc: Lorenzo Stoakes <lstoakes@gmail.com>
Cc: Matthew Wilcox <willy@infradead.org>
Cc: Michal Hocko <mhocko@suse.com>
Cc: Michel Lespinasse <michel@lespinasse.org>
Cc: Minchan Kim <minchan@google.com>
Cc: Pavel Tatashin <pasha.tatashin@soleen.com>
Cc: Punit Agrawal <punit.agrawal@bytedance.com>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: Yu Zhao <yuzhao@google.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
include/linux/mm.h
mm/filemap.c
mm/memory.c

diff --git a/include/linux/mm.h b/include/linux/mm.h
index 939386e0aedab9f018d8fae4fe8ead037d08f7ec..0d16208178c7b6d18f7cfb14fe23c27a449f5a1e 100644
@@ -729,6 +729,14 @@ static inline void vma_mark_detached(struct vm_area_struct *vma, bool detached)
        vma->detached = detached;
 }
 
+static inline void release_fault_lock(struct vm_fault *vmf)
+{
+       if (vmf->flags & FAULT_FLAG_VMA_LOCK)
+               vma_end_read(vmf->vma);
+       else
+               mmap_read_unlock(vmf->vma->vm_mm);
+}
+
 struct vm_area_struct *lock_vma_under_rcu(struct mm_struct *mm,
                                          unsigned long address);
 
@@ -749,6 +757,11 @@ static inline struct vm_area_struct *lock_vma_under_rcu(struct mm_struct *mm,
        return NULL;
 }
 
+static inline void release_fault_lock(struct vm_fault *vmf)
+{
+       mmap_read_unlock(vmf->vma->vm_mm);
+}
+
 #endif /* CONFIG_PER_VMA_LOCK */
 
 extern const struct vm_operations_struct vma_dummy_vm_ops;
diff --git a/mm/filemap.c b/mm/filemap.c
index 40514493014a15c972708d2ab17fb016d519ade7..8040545954bc4175b26e1efd7331828a774333cd 100644
@@ -1671,27 +1671,26 @@ static int __folio_lock_async(struct folio *folio, struct wait_page_queue *wait)
  * Return values:
  * 0 - folio is locked.
  * non-zero - folio is not locked.
- *     mmap_lock has been released (mmap_read_unlock(), unless flags had both
- *     FAULT_FLAG_ALLOW_RETRY and FAULT_FLAG_RETRY_NOWAIT set, in
- *     which case mmap_lock is still held.
+ *     mmap_lock or per-VMA lock has been released (mmap_read_unlock() or
+ *     vma_end_read()), unless flags had both FAULT_FLAG_ALLOW_RETRY and
+ *     FAULT_FLAG_RETRY_NOWAIT set, in which case the lock is still held.
  *
  * If neither ALLOW_RETRY nor KILLABLE are set, will always return 0
- * with the folio locked and the mmap_lock unperturbed.
+ * with the folio locked and the mmap_lock/per-VMA lock is left unperturbed.
  */
 vm_fault_t __folio_lock_or_retry(struct folio *folio, struct vm_fault *vmf)
 {
-       struct mm_struct *mm = vmf->vma->vm_mm;
        unsigned int flags = vmf->flags;
 
        if (fault_flag_allow_retry_first(flags)) {
                /*
-                * CAUTION! In this case, mmap_lock is not released
-                * even though return VM_FAULT_RETRY.
+                * CAUTION! In this case, mmap_lock/per-VMA lock is not
+                * released even though returning VM_FAULT_RETRY.
                 */
                if (flags & FAULT_FLAG_RETRY_NOWAIT)
                        return VM_FAULT_RETRY;
 
-               mmap_read_unlock(mm);
+               release_fault_lock(vmf);
                if (flags & FAULT_FLAG_KILLABLE)
                        folio_wait_locked_killable(folio);
                else
@@ -1703,7 +1702,7 @@ vm_fault_t __folio_lock_or_retry(struct folio *folio, struct vm_fault *vmf)
 
                ret = __folio_lock_killable(folio);
                if (ret) {
-                       mmap_read_unlock(mm);
+                       release_fault_lock(vmf);
                        return VM_FAULT_RETRY;
                }
        } else {
diff --git a/mm/memory.c b/mm/memory.c
index 080e1d59d752e853aeb16894638a8a13035cec52..5748a41c164c5b553f839e3b176c3e26231e3e39 100644
@@ -3746,12 +3746,6 @@ vm_fault_t do_swap_page(struct vm_fault *vmf)
        if (!pte_unmap_same(vmf))
                goto out;
 
-       if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
-               ret = VM_FAULT_RETRY;
-               vma_end_read(vma);
-               goto out;
-       }
-
        entry = pte_to_swp_entry(vmf->orig_pte);
        if (unlikely(non_swap_entry(entry))) {
                if (is_migration_entry(entry)) {
@@ -3761,6 +3755,16 @@ vm_fault_t do_swap_page(struct vm_fault *vmf)
                        vmf->page = pfn_swap_entry_to_page(entry);
                        ret = remove_device_exclusive_entry(vmf);
                } else if (is_device_private_entry(entry)) {
+                       if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
+                               /*
+                                * migrate_to_ram is not yet ready to operate
+                                * under VMA lock.
+                                */
+                               vma_end_read(vma);
+                               ret = VM_FAULT_RETRY;
+                               goto out;
+                       }
+
                        vmf->page = pfn_swap_entry_to_page(entry);
                        vmf->pte = pte_offset_map_lock(vma->vm_mm, vmf->pmd,
                                        vmf->address, &vmf->ptl);