x86/speculation/l1tf: Disallow non privileged high MMIO PROT_NONE mappings

author Andi Kleen <ak@linux.intel.com>

Wed, 13 Jun 2018 22:48:27 +0000 (15:48 -0700)

committer Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>

Fri, 10 Aug 2018 22:56:32 +0000 (18:56 -0400)
author Andi Kleen <ak@linux.intel.com>
Wed, 13 Jun 2018 22:48:27 +0000 (15:48 -0700)
committer Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
Fri, 10 Aug 2018 22:56:32 +0000 (18:56 -0400)
diff --git a/arch/x86/include/asm/pgtable.h b/arch/x86/include/asm/pgtable.h

index f14cf1d69cd0c933b3d007a5e80901e277a3b40b..f08973965079aa4ec58e99169f0c07c6d3b396f9 100644 (file)
--- a/arch/x86/include/asm/pgtable.h
+++ b/arch/x86/include/asm/pgtable.h
@@ -915,6 +915,14 @@ static inline pte_t pte_swp_clear_soft_dirty(pte_t pte)
  }
  #endif
  
+#define __HAVE_ARCH_PFN_MODIFY_ALLOWED 1 /* x86 provides its own versions of the two helpers below */
+extern bool pfn_modify_allowed(unsigned long pfn, pgprot_t prot);
+
+static inline bool arch_has_pfn_modify_check(void)
+{
+       return boot_cpu_has_bug(X86_BUG_L1TF); /* true only when the boot CPU is flagged with the L1TF bug */
+}
+
  #include <asm-generic/pgtable.h>
  #endif /* __ASSEMBLY__ */
  
diff --git a/arch/x86/mm/mmap.c b/arch/x86/mm/mmap.c

index cb87336f44e1dbd2bbcef7cd9acd99f847eb8482..5b726ecb83ddf1bf62069f6303dec08f34772353 100644 (file)
--- a/arch/x86/mm/mmap.c
+++ b/arch/x86/mm/mmap.c
@@ -183,3 +183,24 @@ int valid_mmap_phys_addr_range(unsigned long pfn, size_t count)
  
         return phys_addr_valid(addr + count - 1);
  }
+
+/*
+ * Only allow root to set high MMIO mappings to PROT_NONE.
+ * This prevents an unprivileged user from setting them to PROT_NONE, which
+ * inverts them so they could point to valid memory for L1TF speculation.
+ *
+ * Note: locked down kernels may want to disable the root override.
+ */
+bool pfn_modify_allowed(unsigned long pfn, pgprot_t prot)
+{
+       if (!boot_cpu_has_bug(X86_BUG_L1TF))
+               return true;
+       if (!__pte_needs_invert(pgprot_val(prot)))
+               return true;
+       /* If it's real memory always allow */
+       if (pfn_valid(pfn))
+               return true;
+       if (pfn > l1tf_pfn_limit() && !capable(CAP_SYS_ADMIN)) /* above the L1TF limit: CAP_SYS_ADMIN only */
+               return false;
+       return true;
+}
diff --git a/include/asm-generic/pgtable.h b/include/asm-generic/pgtable.h

index d041167a9b2909542ef39f51c001fd155661945a..42344e002c30d43b7096f5cf83303ed65d2c4f3a 100644 (file)
--- a/include/asm-generic/pgtable.h
+++ b/include/asm-generic/pgtable.h
@@ -801,4 +801,16 @@ static inline int pmd_clear_huge(pmd_t *pmd)
  #define io_remap_pfn_range remap_pfn_range
  #endif
  
+#ifndef __HAVE_ARCH_PFN_MODIFY_ALLOWED
+static inline bool pfn_modify_allowed(unsigned long pfn, pgprot_t prot)
+{
+       return true; /* generic fallback: no PFN/protection combination is refused */
+}
+
+static inline bool arch_has_pfn_modify_check(void)
+{
+       return false; /* generic fallback: no architecture-specific PFN check exists */
+}
+#endif /* __HAVE_ARCH_PFN_MODIFY_ALLOWED */
+
  #endif /* _ASM_GENERIC_PGTABLE_H */
diff --git a/mm/memory.c b/mm/memory.c

index 60549daa68dfc197d1676a4bdf08d00aa164b313..825f39347ab141fd7584eee0e6e7a0b8d3d5831d 100644 (file)
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -1660,6 +1660,8 @@ int vm_insert_pfn(struct vm_area_struct *vma, unsigned long addr,
  
         if (addr < vma->vm_start || addr >= vma->vm_end)
                 return -EFAULT;
+       if (!pfn_modify_allowed(pfn, pgprot))
+               return -EACCES;
         if (track_pfn_insert(vma, &pgprot, pfn))
                 return -EINVAL;
  
@@ -1674,9 +1676,14 @@ int vm_insert_mixed(struct vm_area_struct *vma, unsigned long addr,
  {
         BUG_ON(!(vma->vm_flags & VM_MIXEDMAP));
  
+       pgprot_t pgprot = vma->vm_page_prot;
+
         if (addr < vma->vm_start || addr >= vma->vm_end)
                 return -EFAULT;
  
+       if (!pfn_modify_allowed(pfn, pgprot))
+               return -EACCES;
+
         /*
          * If we don't have pte special, then we have to use the pfn_valid()
          * based VM_MIXEDMAP scheme (see vm_normal_page), and thus we *must*
@@ -1705,6 +1712,7 @@ static int remap_pte_range(struct mm_struct *mm, pmd_t *pmd,
  {
         pte_t *pte;
         spinlock_t *ptl;
+       int err = 0;
  
         pte = pte_alloc_map_lock(mm, pmd, addr, &ptl);
         if (!pte)
@@ -1712,12 +1720,16 @@ static int remap_pte_range(struct mm_struct *mm, pmd_t *pmd,
         arch_enter_lazy_mmu_mode();
         do {
                 BUG_ON(!pte_none(*pte));
+               if (!pfn_modify_allowed(pfn, prot)) {
+                       err = -EACCES;
+                       break;
+               }
                 set_pte_at(mm, addr, pte, pte_mkspecial(pfn_pte(pfn, prot)));
                 pfn++;
         } while (pte++, addr += PAGE_SIZE, addr != end);
         arch_leave_lazy_mmu_mode();
         pte_unmap_unlock(pte - 1, ptl);
-       return 0;
+       return err;
  }
  
  static inline int remap_pmd_range(struct mm_struct *mm, pud_t *pud,
@@ -1726,6 +1738,7 @@ static inline int remap_pmd_range(struct mm_struct *mm, pud_t *pud,
  {
         pmd_t *pmd;
         unsigned long next;
+       int err;
  
         pfn -= addr >> PAGE_SHIFT;
         pmd = pmd_alloc(mm, pud, addr);
@@ -1734,9 +1747,10 @@ static inline int remap_pmd_range(struct mm_struct *mm, pud_t *pud,
         VM_BUG_ON(pmd_trans_huge(*pmd));
         do {
                 next = pmd_addr_end(addr, end);
-               if (remap_pte_range(mm, pmd, addr, next,
-                               pfn + (addr >> PAGE_SHIFT), prot))
-                       return -ENOMEM;
+               err = remap_pte_range(mm, pmd, addr, next,
+                               pfn + (addr >> PAGE_SHIFT), prot);
+               if (err)
+                       return err;
         } while (pmd++, addr = next, addr != end);
         return 0;
  }
@@ -1747,6 +1761,7 @@ static inline int remap_pud_range(struct mm_struct *mm, p4d_t *p4d,
  {
         pud_t *pud;
         unsigned long next;
+       int err;
  
         pfn -= addr >> PAGE_SHIFT;
         pud = pud_alloc(mm, p4d, addr);
@@ -1754,9 +1769,10 @@ static inline int remap_pud_range(struct mm_struct *mm, p4d_t *p4d,
                 return -ENOMEM;
         do {
                 next = pud_addr_end(addr, end);
-               if (remap_pmd_range(mm, pud, addr, next,
-                               pfn + (addr >> PAGE_SHIFT), prot))
-                       return -ENOMEM;
+               err = remap_pmd_range(mm, pud, addr, next,
+                               pfn + (addr >> PAGE_SHIFT), prot);
+               if (err)
+                       return err;
         } while (pud++, addr = next, addr != end);
         return 0;
  }
@@ -1767,6 +1783,7 @@ static inline int remap_p4d_range(struct mm_struct *mm, pgd_t *pgd,
  {
         p4d_t *p4d;
         unsigned long next;
+       int err;
  
         pfn -= addr >> PAGE_SHIFT;
         p4d = p4d_alloc(mm, pgd, addr);
@@ -1774,9 +1791,10 @@ static inline int remap_p4d_range(struct mm_struct *mm, pgd_t *pgd,
                 return -ENOMEM;
         do {
                 next = p4d_addr_end(addr, end);
-               if (remap_pud_range(mm, p4d, addr, next,
-                               pfn + (addr >> PAGE_SHIFT), prot))
-                       return -ENOMEM;
+               err = remap_pud_range(mm, p4d, addr, next,
+                               pfn + (addr >> PAGE_SHIFT), prot);
+               if (err)
+                       return err;
         } while (p4d++, addr = next, addr != end);
         return 0;
  }
diff --git a/mm/mprotect.c b/mm/mprotect.c

index fbdeb814f270f1d39b7f6d1d661a4220531a63b0..85644e33ab548b69d3fada930c31efebf893ee5b 100644 (file)
--- a/mm/mprotect.c
+++ b/mm/mprotect.c
@@ -272,6 +272,42 @@ unsigned long change_protection(struct vm_area_struct *vma, unsigned long start,
         return pages;
  }
  
+static int prot_none_pte_entry(pte_t *pte, unsigned long addr,
+                              unsigned long next, struct mm_walk *walk)
+{
+       return pfn_modify_allowed(pte_pfn(*pte), *(pgprot_t *)(walk->private)) ?
+               0 : -EACCES; /* walk->private points at the new pgprot_t set up by prot_none_walk() */
+}
+
+static int prot_none_hugetlb_entry(pte_t *pte, unsigned long hmask,
+                                  unsigned long addr, unsigned long next,
+                                  struct mm_walk *walk)
+{
+       return pfn_modify_allowed(pte_pfn(*pte), *(pgprot_t *)(walk->private)) ?
+               0 : -EACCES; /* same PFN/protection check as prot_none_pte_entry(); hmask, addr and next are unused */
+}
+
+static int prot_none_test(unsigned long addr, unsigned long next,
+                         struct mm_walk *walk)
+{
+       return 0; /* NOTE(review): presumably 0 tells the walker not to skip this vma; confirm against walk_page_range() */
+}
+
+static int prot_none_walk(struct vm_area_struct *vma, unsigned long start,
+                          unsigned long end, unsigned long newflags)
+{
+       pgprot_t new_pgprot = vm_get_page_prot(newflags); /* page protection derived from the requested vm flags */
+       struct mm_walk prot_none_walk = {
+               .pte_entry = prot_none_pte_entry,
+               .hugetlb_entry = prot_none_hugetlb_entry,
+               .test_walk = prot_none_test,
+               .mm = current->mm, /* NOTE(review): the vma argument is not used anywhere in this function */
+               .private = &new_pgprot, /* read back by the two entry callbacks */
+       };
+
+       return walk_page_range(start, end, &prot_none_walk); /* result is handed straight back to the caller */
+}
+
  int
  mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev,
         unsigned long start, unsigned long end, unsigned long newflags)
@@ -289,6 +325,19 @@ mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev,
                 return 0;
         }
  
+       /*
+        * Do PROT_NONE PFN permission checks here when we can still
+        * bail out without undoing a lot of state. This is a rather
+        * uncommon case, so doesn't need to be very optimized.
+        */
+       if (arch_has_pfn_modify_check() &&
+           (vma->vm_flags & (VM_PFNMAP|VM_MIXEDMAP)) &&
+           (newflags & (VM_READ|VM_WRITE|VM_EXEC)) == 0) {
+               error = prot_none_walk(vma, start, end, newflags);
+               if (error)
+                       return error;
+       }
+
         /*
          * If we make a private mapping writable we increase our commit;
          * but (without finer accounting) cannot reduce our commit if we
author	Andi Kleen <ak@linux.intel.com>
	Wed, 13 Jun 2018 22:48:27 +0000 (15:48 -0700)
committer	Konrad Rzeszutek Wilk <konrad.wilk@oracle.com>
	Fri, 10 Aug 2018 22:56:32 +0000 (18:56 -0400)
arch/x86/include/asm/pgtable.h		patch \| blob \| history
arch/x86/mm/mmap.c		patch \| blob \| history
include/asm-generic/pgtable.h		patch \| blob \| history
mm/memory.c		patch \| blob \| history
mm/mprotect.c		patch \| blob \| history