[RFC 06/12] mm: Add the encrypt_mprotect() system call
Jarkko Sakkinen
jarkko.sakkinen at linux.intel.com
Mon Sep 10 18:02:43 UTC 2018
On Fri, 2018-09-07 at 15:36 -0700, Alison Schofield wrote:
> Implement memory encryption with a new system call that is an
> extension of the legacy mprotect() system call.
>
> In encrypt_mprotect the caller must pass a handle to a previously
> allocated and programmed encryption key. Validate the key and store
> the keyid bits in the vm_page_prot for each VMA in the protection
> range.
>
> Signed-off-by: Alison Schofield <alison.schofield at intel.com>
> ---
> fs/exec.c | 4 ++--
> include/linux/key.h | 2 ++
> include/linux/mm.h | 3 ++-
> mm/mprotect.c | 67 ++++++++++++++++++++++++++++++++++++++++++++++++--
> ---
> 4 files changed, 67 insertions(+), 9 deletions(-)
>
> diff --git a/fs/exec.c b/fs/exec.c
> index a1a246062561..b681a413db9c 100644
> --- a/fs/exec.c
> +++ b/fs/exec.c
> @@ -754,8 +754,8 @@ int setup_arg_pages(struct linux_binprm *bprm,
> vm_flags |= mm->def_flags;
> vm_flags |= VM_STACK_INCOMPLETE_SETUP;
>
> - ret = mprotect_fixup(vma, &prev, vma->vm_start, vma->vm_end,
> - vm_flags);
> + ret = mprotect_fixup(vma, &prev, vma->vm_start, vma->vm_end,
> vm_flags,
> + -1);
Why you pass a magic number here when you went the trouble having
a named constant?
> if (ret)
> goto out_unlock;
> BUG_ON(prev != vma);
> diff --git a/include/linux/key.h b/include/linux/key.h
> index e58ee10f6e58..fb8a7d5f6149 100644
> --- a/include/linux/key.h
> +++ b/include/linux/key.h
> @@ -346,6 +346,8 @@ static inline key_serial_t key_serial(const struct key
> *key)
>
> extern void key_set_timeout(struct key *, unsigned);
>
> +extern key_ref_t lookup_user_key(key_serial_t id, unsigned long lflags,
> + key_perm_t perm);
> /*
> * The permissions required on a key that we're looking up.
> */
> diff --git a/include/linux/mm.h b/include/linux/mm.h
> index ac85c0805761..0f9422c7841e 100644
> --- a/include/linux/mm.h
> +++ b/include/linux/mm.h
> @@ -1579,7 +1579,8 @@ extern unsigned long change_protection(struct
> vm_area_struct *vma, unsigned long
> int dirty_accountable, int prot_numa);
> extern int mprotect_fixup(struct vm_area_struct *vma,
> struct vm_area_struct **pprev, unsigned long start,
> - unsigned long end, unsigned long newflags);
> + unsigned long end, unsigned long newflags,
> + int newkeyid);
>
> /*
> * doesn't attempt to fault and will return short.
> diff --git a/mm/mprotect.c b/mm/mprotect.c
> index 56e64ef7931e..6c2e1106525c 100644
> --- a/mm/mprotect.c
> +++ b/mm/mprotect.c
> @@ -28,14 +28,17 @@
> #include <linux/ksm.h>
> #include <linux/uaccess.h>
> #include <linux/mm_inline.h>
> +#include <linux/key.h>
> #include <asm/pgtable.h>
> #include <asm/cacheflush.h>
> #include <asm/mmu_context.h>
> #include <asm/tlbflush.h>
> +#include <asm/mktme.h>
>
> #include "internal.h"
>
> #define NO_PKEY -1
> +#define NO_KEYID -1
Should have only single named constant IMHO. This ambiguity
is worse than some reasonable constant name for both cases.
Maybe NO_KEYID would be adequate?
>
> static unsigned long change_pte_range(struct vm_area_struct *vma, pmd_t *pmd,
> unsigned long addr, unsigned long end, pgprot_t newprot,
> @@ -310,7 +313,8 @@ unsigned long change_protection(struct vm_area_struct
> *vma, unsigned long start,
>
> int
> mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev,
> - unsigned long start, unsigned long end, unsigned long newflags)
> + unsigned long start, unsigned long end, unsigned long
> newflags,
> + int newkeyid)
> {
> struct mm_struct *mm = vma->vm_mm;
> unsigned long oldflags = vma->vm_flags;
> @@ -320,10 +324,24 @@ mprotect_fixup(struct vm_area_struct *vma, struct
> vm_area_struct **pprev,
> int error;
> int dirty_accountable = 0;
>
> + /*
> + * Flags match and Keyids match or we have NO_KEYID.
> + * This _fixup is usually called from do_mprotect_ext() except
> + * for one special case: caller fs/exec.c/setup_arg_pages()
> + * In that case, newkeyid is passed as -1 (NO_KEYID).
> + */
> + if (newflags == oldflags &&
> + (newkeyid == vma_keyid(vma) || newkeyid == NO_KEYID)) {
> + *pprev = vma;
> + return 0;
> + }
> + /* Flags match and Keyid changes */
> if (newflags == oldflags) {
> + mprotect_set_encrypt(vma, newkeyid);
> *pprev = vma;
> return 0;
> }
> + /* Flags and Keyids both change, continue. */
>
> /*
> * If we make a private mapping writable we increase our commit;
> @@ -373,6 +391,8 @@ mprotect_fixup(struct vm_area_struct *vma, struct
> vm_area_struct **pprev,
> }
>
> success:
> + if (newkeyid != NO_KEYID)
> + mprotect_set_encrypt(vma, newkeyid);
> /*
> * vm_flags and vm_page_prot are protected by the mmap_sem
> * held in write mode.
> @@ -404,10 +424,15 @@ mprotect_fixup(struct vm_area_struct *vma, struct
> vm_area_struct **pprev,
> }
>
> /*
> - * When pkey==NO_PKEY we get legacy mprotect behavior here.
> + * do_mprotect_ext() supports the legacy mprotect behavior plus extensions
> + * for protection keys and memory encryption keys. These extensions are
> + * mutually exclusive and the behavior is:
> + * (pkey==NO_PKEY && keyid==NO_KEYID) ==> legacy mprotect
> + * (pkey is valid) ==> legacy mprotect plus protection key extensions
> + * (keyid is valid) ==> legacy mprotect plus encryption key extensions
> */
The header does not follow
https://www.kernel.org/doc/Documentation/kernel-doc-nano-HOWTO.txt
> static int do_mprotect_ext(unsigned long start, size_t len,
> - unsigned long prot, int pkey)
> + unsigned long prot, int pkey, int keyid)
> {
> unsigned long nstart, end, tmp, reqprot;
> struct vm_area_struct *vma, *prev;
> @@ -505,7 +530,8 @@ static int do_mprotect_ext(unsigned long start, size_t
> len,
> tmp = vma->vm_end;
> if (tmp > end)
> tmp = end;
> - error = mprotect_fixup(vma, &prev, nstart, tmp, newflags);
> + error = mprotect_fixup(vma, &prev, nstart, tmp, newflags,
> + keyid);
> if (error)
> goto out;
> nstart = tmp;
> @@ -530,7 +556,7 @@ static int do_mprotect_ext(unsigned long start, size_t
> len,
> SYSCALL_DEFINE3(mprotect, unsigned long, start, size_t, len,
> unsigned long, prot)
> {
> - return do_mprotect_ext(start, len, prot, NO_PKEY);
> + return do_mprotect_ext(start, len, prot, NO_PKEY, NO_KEYID);
> }
>
> #ifdef CONFIG_ARCH_HAS_PKEYS
> @@ -538,7 +564,7 @@ SYSCALL_DEFINE3(mprotect, unsigned long, start, size_t,
> len,
> SYSCALL_DEFINE4(pkey_mprotect, unsigned long, start, size_t, len,
> unsigned long, prot, int, pkey)
> {
> - return do_mprotect_ext(start, len, prot, pkey);
> + return do_mprotect_ext(start, len, prot, pkey, NO_KEYID);
> }
>
> SYSCALL_DEFINE2(pkey_alloc, unsigned long, flags, unsigned long, init_val)
> @@ -587,3 +613,32 @@ SYSCALL_DEFINE1(pkey_free, int, pkey)
> }
>
> #endif /* CONFIG_ARCH_HAS_PKEYS */
> +
> +#ifdef CONFIG_X86_INTEL_MKTME
> +
> +SYSCALL_DEFINE4(encrypt_mprotect, unsigned long, start, size_t, len,
> + unsigned long, prot, key_serial_t, serial)
> +{
> + key_ref_t key_ref;
> + int ret, keyid;
> +
> + /* TODO MKTME key service must be initialized */
> +
> + key_ref = lookup_user_key(serial, 0, KEY_NEED_VIEW);
> + if (IS_ERR(key_ref))
> + return PTR_ERR(key_ref);
> +
> + mktme_map_lock();
> + keyid = mktme_map_keyid_from_serial(serial);
> + if (!keyid) {
> + mktme_map_unlock();
> + key_ref_put(key_ref);
> + return -EINVAL;
> + }
> + ret = do_mprotect_ext(start, len, prot, NO_PKEY, keyid);
> + mktme_map_unlock();
> + key_ref_put(key_ref);
> + return ret;
> +}
> +
> +#endif /* CONFIG_X86_INTEL_MKTME */
/Jarkko
More information about the Linux-security-module-archive
mailing list