mm/gup, x86/mm/pkeys: Check VMAs and PTEs for protection keys

author Dave Hansen <dave.hansen@linux.intel.com>

Fri, 12 Feb 2016 21:02:19 +0000 (13:02 -0800)

committer Ingo Molnar <mingo@kernel.org>

Thu, 18 Feb 2016 08:32:44 +0000 (09:32 +0100)
author Dave Hansen <dave.hansen@linux.intel.com>
Fri, 12 Feb 2016 21:02:19 +0000 (13:02 -0800)
committer Ingo Molnar <mingo@kernel.org>
Thu, 18 Feb 2016 08:32:44 +0000 (09:32 +0100)
diff --git a/arch/powerpc/include/asm/mmu_context.h b/arch/powerpc/include/asm/mmu_context.h

index 878c27771717260cb1bc5590ad4c6138b2b096f7..a0f1838c8e78e409f9b5ae04d7bc93b254ef44d6 100644 (file)
--- a/arch/powerpc/include/asm/mmu_context.h
+++ b/arch/powerpc/include/asm/mmu_context.h
@@ -148,5 +148,16 @@ static inline void arch_bprm_mm_init(struct mm_struct *mm,
  {
  }
  
+static inline bool arch_vma_access_permitted(struct vm_area_struct *vma, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
+
+static inline bool arch_pte_access_permitted(pte_t pte, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
  #endif /* __KERNEL__ */
  #endif /* __ASM_POWERPC_MMU_CONTEXT_H */
diff --git a/arch/s390/include/asm/mmu_context.h b/arch/s390/include/asm/mmu_context.h

index fb1b93ea3e3fead0efde9f30e819c55eecb88da9..2627b338382cd448755c107d8d34d1c6dff28ce3 100644 (file)
--- a/arch/s390/include/asm/mmu_context.h
+++ b/arch/s390/include/asm/mmu_context.h
@@ -130,4 +130,15 @@ static inline void arch_bprm_mm_init(struct mm_struct *mm,
  {
  }
  
+static inline bool arch_vma_access_permitted(struct vm_area_struct *vma, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
+
+static inline bool arch_pte_access_permitted(pte_t pte, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
  #endif /* __S390_MMU_CONTEXT_H */
diff --git a/arch/unicore32/include/asm/mmu_context.h b/arch/unicore32/include/asm/mmu_context.h

index 1cb5220afaf9dbdb13c2ad2f250566d2881a1c1e..3133f947ade27338abda2246910fe3458d43bb44 100644 (file)
--- a/arch/unicore32/include/asm/mmu_context.h
+++ b/arch/unicore32/include/asm/mmu_context.h
@@ -97,4 +97,15 @@ static inline void arch_bprm_mm_init(struct mm_struct *mm,
  {
  }
  
+static inline bool arch_vma_access_permitted(struct vm_area_struct *vma, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
+
+static inline bool arch_pte_access_permitted(pte_t pte, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
  #endif
diff --git a/arch/x86/include/asm/mmu_context.h b/arch/x86/include/asm/mmu_context.h

index 94c4c8b5cb8fd1d485164f47f7f1a4a2bd9055b4..19036cdbed8ffbda1141c53d31ef18a47014af8b 100644 (file)
--- a/arch/x86/include/asm/mmu_context.h
+++ b/arch/x86/include/asm/mmu_context.h
@@ -286,4 +286,53 @@ static inline int vma_pkey(struct vm_area_struct *vma)
         return pkey;
  }
  
+static inline bool __pkru_allows_pkey(u16 pkey, bool write)
+{
+       u32 pkru = read_pkru();
+
+       if (!__pkru_allows_read(pkru, pkey))
+               return false;
+       if (write && !__pkru_allows_write(pkru, pkey))
+               return false;
+
+       return true;
+}
+
+/*
+ * We only want to enforce protection keys on the current process
+ * because we effectively have no access to PKRU for other
+ * processes or any way to tell *which* PKRU in a threaded
+ * process we could use.
+ *
+ * So do not enforce things if the VMA is not from the current
+ * mm, or if we are in a kernel thread.
+ */
+static inline bool vma_is_foreign(struct vm_area_struct *vma)
+{
+       if (!current->mm)
+               return true;
+       /*
+        * Should PKRU be enforced on the access to this VMA?  If
+        * the VMA is from another process, then PKRU has no
+        * relevance and should not be enforced.
+        */
+       if (current->mm != vma->vm_mm)
+               return true;
+
+       return false;
+}
+
+static inline bool arch_vma_access_permitted(struct vm_area_struct *vma, bool write)
+{
+       /* allow access if the VMA is not one from this process */
+       if (vma_is_foreign(vma))
+               return true;
+       return __pkru_allows_pkey(vma_pkey(vma), write);
+}
+
+static inline bool arch_pte_access_permitted(pte_t pte, bool write)
+{
+       return __pkru_allows_pkey(pte_flags_pkey(pte_flags(pte)), write);
+}
+
  #endif /* _ASM_X86_MMU_CONTEXT_H */
diff --git a/arch/x86/include/asm/pgtable.h b/arch/x86/include/asm/pgtable.h

index e997dcc6ee2bec19d7918deec02542db68335a4b..3cbfae80abb2ef88ba73b8d92e1b625f2624f04b 100644 (file)
--- a/arch/x86/include/asm/pgtable.h
+++ b/arch/x86/include/asm/pgtable.h
@@ -919,6 +919,35 @@ static inline pte_t pte_swp_clear_soft_dirty(pte_t pte)
  }
  #endif
  
+#define PKRU_AD_BIT 0x1u /* access-disable; unsigned so shifts up to bit 31 are defined */
+#define PKRU_WD_BIT 0x2u /* write-disable; unsigned so shifts up to bit 31 are defined */
+
+static inline bool __pkru_allows_read(u32 pkru, u16 pkey)
+{
+       int pkru_pkey_bits = pkey * 2;
+       return !(pkru & (PKRU_AD_BIT << pkru_pkey_bits));
+}
+
+static inline bool __pkru_allows_write(u32 pkru, u16 pkey)
+{
+       int pkru_pkey_bits = pkey * 2;
+       /*
+        * Access-disable disables writes too so we need to check
+        * both bits here.
+        */
+       return !(pkru & ((PKRU_AD_BIT|PKRU_WD_BIT) << pkru_pkey_bits));
+}
+
+static inline u16 pte_flags_pkey(unsigned long pte_flags)
+{
+#ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS
+       /* ifdef to avoid doing 59-bit shift on 32-bit values */
+       return (pte_flags & _PAGE_PKEY_MASK) >> _PAGE_BIT_PKEY_BIT0;
+#else
+       return 0;
+#endif
+}
+
  #include <asm-generic/pgtable.h>
  #endif /* __ASSEMBLY__ */
  
diff --git a/arch/x86/mm/fault.c b/arch/x86/mm/fault.c

index 6e71dcf699ab59f55288ba0923a155e64982df64..319331afae24ca9fac9d10347a04c3450668d6e8 100644 (file)
--- a/arch/x86/mm/fault.c
+++ b/arch/x86/mm/fault.c
@@ -897,6 +897,16 @@ bad_area(struct pt_regs *regs, unsigned long error_code, unsigned long address)
         __bad_area(regs, error_code, address, NULL, SEGV_MAPERR);
  }
  
+static inline bool bad_area_access_from_pkeys(unsigned long error_code,
+               struct vm_area_struct *vma)
+{
+       if (!boot_cpu_has(X86_FEATURE_OSPKE))
+               return false;
+       if (error_code & PF_PK)
+               return true;
+       return false;
+}
+
  static noinline void
  bad_area_access_error(struct pt_regs *regs, unsigned long error_code,
                       unsigned long address, struct vm_area_struct *vma)
@@ -906,7 +916,7 @@ bad_area_access_error(struct pt_regs *regs, unsigned long error_code,
          * But, doing it this way allows compiler optimizations
          * if pkeys are compiled out.
          */
-       if (boot_cpu_has(X86_FEATURE_OSPKE) && (error_code & PF_PK))
+       if (bad_area_access_from_pkeys(error_code, vma))
                 __bad_area(regs, error_code, address, vma, SEGV_PKUERR);
         else
                 __bad_area(regs, error_code, address, vma, SEGV_ACCERR);
@@ -1081,6 +1091,15 @@ int show_unhandled_signals = 1;
  static inline int
  access_error(unsigned long error_code, struct vm_area_struct *vma)
  {
+       /*
+        * Read or write was blocked by protection keys. We do
+        * this check before any others because we do not want
+        * to, for instance, confuse a protection-key-denied
+        * write with one for which we should do a COW.
+        */
+       if (error_code & PF_PK)
+               return 1;
+
         if (error_code & PF_WRITE) {
                 /* write, present and write, not present: */
                 if (unlikely(!(vma->vm_flags & VM_WRITE)))
diff --git a/arch/x86/mm/gup.c b/arch/x86/mm/gup.c

index 2f0a32945cda32a4c21ce0c13c9c597bfd9ce035..bab259e75984441a5857da5c3029d06d705ad551 100644 (file)
--- a/arch/x86/mm/gup.c
+++ b/arch/x86/mm/gup.c
@@ -11,6 +11,7 @@
  #include <linux/swap.h>
  #include <linux/memremap.h>
  
+#include <asm/mmu_context.h>
  #include <asm/pgtable.h>
  
  static inline pte_t gup_get_pte(pte_t *ptep)
@@ -89,6 +90,10 @@ static inline int pte_allows_gup(unsigned long pteval, int write)
         if ((pteval & need_pte_bits) != need_pte_bits)
                 return 0;
  
+       /* Check memory protection keys permissions. */
+       if (!__pkru_allows_pkey(pte_flags_pkey(pteval), write))
+               return 0;
+
         return 1;
  }
  
diff --git a/include/asm-generic/mm_hooks.h b/include/asm-generic/mm_hooks.h

index 866aa461efa54b92693640038e43097880afaa46..c1fc5af3c3843f24982c7d9913ccdf9da0ba92bb 100644 (file)
--- a/include/asm-generic/mm_hooks.h
+++ b/include/asm-generic/mm_hooks.h
@@ -26,4 +26,15 @@ static inline void arch_bprm_mm_init(struct mm_struct *mm,
  {
  }
  
+static inline bool arch_vma_access_permitted(struct vm_area_struct *vma, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
+
+static inline bool arch_pte_access_permitted(pte_t pte, bool write)
+{
+       /* by default, allow everything */
+       return true;
+}
  #endif /* _ASM_GENERIC_MM_HOOKS_H */
diff --git a/mm/gup.c b/mm/gup.c

index b935c2c71ec93530b4466599bf600e112ab4cfc6..e0f5f3574d16a9749efff3fc53d502e5f1614453 100644 (file)
--- a/mm/gup.c
+++ b/mm/gup.c
@@ -15,6 +15,7 @@
  #include <linux/rwsem.h>
  #include <linux/hugetlb.h>
  
+#include <asm/mmu_context.h>
  #include <asm/pgtable.h>
  #include <asm/tlbflush.h>
  
@@ -444,6 +445,8 @@ static int check_vma_flags(struct vm_area_struct *vma, unsigned long gup_flags)
                 if (!(vm_flags & VM_MAYREAD))
                         return -EFAULT;
         }
+       if (!arch_vma_access_permitted(vma, (gup_flags & FOLL_WRITE)))
+               return -EFAULT;
         return 0;
  }
  
@@ -612,13 +615,19 @@ EXPORT_SYMBOL(__get_user_pages);
  
  bool vma_permits_fault(struct vm_area_struct *vma, unsigned int fault_flags)
  {
-       vm_flags_t vm_flags;
-
-       vm_flags = (fault_flags & FAULT_FLAG_WRITE) ? VM_WRITE : VM_READ;
+       bool write = !!(fault_flags & FAULT_FLAG_WRITE);
+       vm_flags_t vm_flags = write ? VM_WRITE : VM_READ;
  
         if (!(vm_flags & vma->vm_flags))
                 return false;
  
+       /*
+        * The architecture might have a hardware protection
+        * mechanism other than read/write that can deny access.
+        */
+       if (!arch_vma_access_permitted(vma, write))
+               return false;
+
         return true;
  }
  
@@ -1172,6 +1181,9 @@ static int gup_pte_range(pmd_t pmd, unsigned long addr, unsigned long end,
                         pte_protnone(pte) || (write && !pte_write(pte)))
                         goto pte_unmap;
  
+               if (!arch_pte_access_permitted(pte, write))
+                       goto pte_unmap;
+
                 VM_BUG_ON(!pfn_valid(pte_pfn(pte)));
                 page = pte_page(pte);
                 head = compound_head(page);
diff --git a/mm/memory.c b/mm/memory.c

index 8bfbad0cca8ceb77fa206308b709affc4a4c6e25..d7e84fe6504dd622cc87babd30ba27cc3ec712da 100644 (file)
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -65,6 +65,7 @@
  #include <linux/userfaultfd_k.h>
  
  #include <asm/io.h>
+#include <asm/mmu_context.h>
  #include <asm/pgalloc.h>
  #include <asm/uaccess.h>
  #include <asm/tlb.h>
@@ -3378,6 +3379,9 @@ static int __handle_mm_fault(struct mm_struct *mm, struct vm_area_struct *vma,
         pmd_t *pmd;
         pte_t *pte;
  
+       if (!arch_vma_access_permitted(vma, flags & FAULT_FLAG_WRITE))
+               return VM_FAULT_SIGSEGV;
+
         if (unlikely(is_vm_hugetlb_page(vma)))
                 return hugetlb_fault(mm, vma, address, flags);
author	Dave Hansen <dave.hansen@linux.intel.com>
	Fri, 12 Feb 2016 21:02:19 +0000 (13:02 -0800)
committer	Ingo Molnar <mingo@kernel.org>
	Thu, 18 Feb 2016 08:32:44 +0000 (09:32 +0100)
arch/powerpc/include/asm/mmu_context.h		patch \| blob \| history
arch/s390/include/asm/mmu_context.h		patch \| blob \| history
arch/unicore32/include/asm/mmu_context.h		patch \| blob \| history
arch/x86/include/asm/mmu_context.h		patch \| blob \| history
arch/x86/include/asm/pgtable.h		patch \| blob \| history
arch/x86/mm/fault.c		patch \| blob \| history
arch/x86/mm/gup.c		patch \| blob \| history
include/asm-generic/mm_hooks.h		patch \| blob \| history
mm/gup.c		patch \| blob \| history
mm/memory.c		patch \| blob \| history