On Wed, Nov 22, 2017 at 04:35:21PM -0800, Dave Hansen wrote: > > From: Dave Hansen <dave.hansen@xxxxxxxxxxxxxxx> > > With KAISER Kernel PGDs that map userspace are "poisoned" with > the NX bit. This ensures that if a kernel->user CR3 switch is > missed, userspace crashes instead of running in an unhardened > state. > > This code will be needed in a moment when KAISER is turned > on and off at runtime. > > Note that an __ASSEMBLY__ #ifdef is now required since kaiser.h > is indirectly included into assembly. > > Signed-off-by: Dave Hansen <dave.hansen@xxxxxxxxxxxxxxx> > Cc: Moritz Lipp <moritz.lipp@xxxxxxxxxxxxxx> > Cc: Daniel Gruss <daniel.gruss@xxxxxxxxxxxxxx> > Cc: Michael Schwarz <michael.schwarz@xxxxxxxxxxxxxx> > Cc: Richard Fellner <richard.fellner@xxxxxxxxxxxxxxxxx> > Cc: Andy Lutomirski <luto@xxxxxxxxxx> > Cc: Linus Torvalds <torvalds@xxxxxxxxxxxxxxxxxxxx> > Cc: Kees Cook <keescook@xxxxxxxxxx> > Cc: Hugh Dickins <hughd@xxxxxxxxxx> > Cc: x86@xxxxxxxxxx > --- > > b/arch/x86/include/asm/pgtable_64.h | 16 ++++++++++++++- > b/arch/x86/mm/kaiser.c | 38 ++++++++++++++++++++++++++++++++++++ > b/include/linux/kaiser.h | 3 +- > 3 files changed, 55 insertions(+), 2 deletions(-) > > diff -puN arch/x86/include/asm/pgtable_64.h~kaiser-dynamic-unpoison-pgd arch/x86/include/asm/pgtable_64.h > --- a/arch/x86/include/asm/pgtable_64.h~kaiser-dynamic-unpoison-pgd 2017-11-22 15:45:55.818619722 -0800 > +++ b/arch/x86/include/asm/pgtable_64.h 2017-11-22 15:45:55.824619722 -0800 > @@ -3,6 +3,7 @@ > #define _ASM_X86_PGTABLE_64_H > > #include <linux/const.h> > +#include <linux/kaiser.h> > #include <asm/pgtable_64_types.h> > > #ifndef __ASSEMBLY__ > @@ -199,6 +200,18 @@ static inline bool pgd_userspace_access( > return pgd.pgd & _PAGE_USER; > } > > +static inline void kaiser_poison_pgd(pgd_t *pgd) > +{ > + if (pgd->pgd & _PAGE_PRESENT) > + pgd->pgd |= _PAGE_NX; > +} > + > +static inline void kaiser_unpoison_pgd(pgd_t *pgd) > +{ > + if (pgd->pgd & _PAGE_PRESENT) > + pgd->pgd &= ~_PAGE_NX; > +} > + > /* > * Take a PGD location (pgdp) and a pgd value that needs > * to be set there. Populates the shadow and returns > @@ -222,7 +235,8 @@ static inline pgd_t kaiser_set_shadow_pg > * wrong CR3 value, userspace will crash > * instead of running. > */ > - pgd.pgd |= _PAGE_NX; > + if (kaiser_active()) > + kaiser_poison_pgd(&pgd); > } > } else if (pgd_userspace_access(*pgdp)) { > /* > diff -puN arch/x86/mm/kaiser.c~kaiser-dynamic-unpoison-pgd arch/x86/mm/kaiser.c > --- a/arch/x86/mm/kaiser.c~kaiser-dynamic-unpoison-pgd 2017-11-22 15:45:55.819619722 -0800 > +++ b/arch/x86/mm/kaiser.c 2017-11-22 15:45:55.825619722 -0800 > @@ -501,6 +501,9 @@ static ssize_t kaiser_enabled_write_file > if (enable > 1) > return -EINVAL; > > + if (kaiser_enabled == enable) > + return count; > + > WRITE_ONCE(kaiser_enabled, enable); > return count; > } Shouldn't the above hunk be part of the patch that adds the debugfs entry? > @@ -518,3 +521,38 @@ static int __init create_kaiser_enabled( > return 0; > } > late_initcall(create_kaiser_enabled); > + > +enum poison { > + KAISER_POISON, > + KAISER_UNPOISON > +}; > +void kaiser_poison_pgd_page(pgd_t *pgd_page, enum poison do_poison) > +{ > + int i = 0; > + > + for (i = 0; i < PTRS_PER_PGD; i++) { > + pgd_t *pgd = &pgd_page[i]; > + > + /* Stop once we hit kernel addresses: */ > + if (!pgdp_maps_userspace(pgd)) > + break; > + > + if (do_poison == KAISER_POISON) > + kaiser_poison_pgd(pgd); > + else > + kaiser_unpoison_pgd(pgd); > + } > + > +} > + > +void kaiser_poison_pgds(enum poison do_poison) > +{ > + struct page *page; > + > + spin_lock(&pgd_lock); > + list_for_each_entry(page, &pgd_list, lru) { > + pgd_t *pgd = (pgd_t *)page_address(page); > + kaiser_poison_pgd_page(pgd, do_poison); > + } > + spin_unlock(&pgd_lock); > +} > diff -puN include/linux/kaiser.h~kaiser-dynamic-unpoison-pgd include/linux/kaiser.h > --- a/include/linux/kaiser.h~kaiser-dynamic-unpoison-pgd 2017-11-22 15:45:55.821619722 -0800 > +++ b/include/linux/kaiser.h 2017-11-22 15:45:55.826619722 -0800 > @@ -4,7 +4,7 @@ > #ifdef CONFIG_KAISER > #include <asm/kaiser.h> > #else > - > +#ifndef __ASSEMBLY__ > /* > * These stubs are used whenever CONFIG_KAISER is off, which > * includes architectures that support KAISER, but have it > @@ -33,5 +33,6 @@ static inline bool kaiser_active(void) > { > return 0; > } > +#endif /* __ASSEMBLY__ */ > #endif /* !CONFIG_KAISER */ > #endif /* _INCLUDE_KAISER_H */ > _ > -- All the best, Eduardo Valentin -- To unsubscribe, send a message with 'unsubscribe linux-mm' in the body to majordomo@xxxxxxxxx. For more info on Linux MM, see: http://www.linux-mm.org/ . Don't email: <a href=mailto:"dont@xxxxxxxxx"> email@xxxxxxxxx </a>