]> www.infradead.org Git - users/jedix/linux-maple.git/commitdiff
mm: check against orig_pte for finish_fault()
authorPeter Xu <peterx@redhat.com>
Thu, 14 Apr 2022 19:16:48 +0000 (12:16 -0700)
committerLiam R. Howlett <Liam.Howlett@oracle.com>
Thu, 14 Apr 2022 21:49:51 +0000 (17:49 -0400)
We used to check against none pte in finish_fault(), with the assumption
that the orig_pte is always none pte.

This change prepares us to be able to call do_fault() on !none ptes.  For
example, we should allow that to happen for pte marker so that we can
restore information out of the pte markers.

Let's change the "pte_none" check into detecting changes since we fetched
orig_pte.  One trivial thing to take care of here is, when pmd==NULL for
the pgtable we may not initialize orig_pte at all in handle_pte_fault().

By default orig_pte will be all zeros however the problem is not all
architectures are using all-zeros for a none pte.  pte_clear() will be the
right thing to use here so that we'll always have a valid orig_pte value
for the whole handle_pte_fault() call.

Link: https://lkml.kernel.org/r/20220405014836.14077-1-peterx@redhat.com
Signed-off-by: Peter Xu <peterx@redhat.com>
Reviewed-by: Alistair Popple <apopple@nvidia.com>
Cc: Andrea Arcangeli <aarcange@redhat.com>
Cc: Axel Rasmussen <axelrasmussen@google.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: Hugh Dickins <hughd@google.com>
Cc: Jerome Glisse <jglisse@redhat.com>
Cc: "Kirill A . Shutemov" <kirill@shutemov.name>
Cc: Matthew Wilcox <willy@infradead.org>
Cc: Mike Kravetz <mike.kravetz@oracle.com>
Cc: Mike Rapoport <rppt@linux.vnet.ibm.com>
Cc: Nadav Amit <nadav.amit@gmail.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
mm/memory.c

index ec79e7849b047d8918e6f406c9800d189cdbc7fb..3ca1fbf29e4fd976f210f7fbf604ad663f36b8b0 100644 (file)
@@ -4252,7 +4252,7 @@ vm_fault_t finish_fault(struct vm_fault *vmf)
                                      vmf->address, &vmf->ptl);
        ret = 0;
        /* Re-check under ptl */
-       if (likely(pte_none(*vmf->pte)))
+       if (likely(pte_same(*vmf->pte, vmf->orig_pte)))
                do_set_pte(vmf, page, vmf->address);
        else
                ret = VM_FAULT_NOPAGE;
@@ -4720,6 +4720,13 @@ static vm_fault_t handle_pte_fault(struct vm_fault *vmf)
                 * concurrent faults and from rmap lookups.
                 */
                vmf->pte = NULL;
+               /*
+                * Always initialize orig_pte.  This matches with below
+                * code to have orig_pte to be the none pte if pte==NULL.
+                * This makes the rest code to be always safe to reference
+                * it, e.g. in finish_fault() we'll detect pte changes.
+                */
+               pte_clear(vmf->vma->vm_mm, vmf->address, &vmf->orig_pte);
        } else {
                /*
                 * If a huge pmd materialized under us just retry later.  Use