On Thu, Jan 17, 2019 at 01:55:29PM +0000, Zhuangyanying wrote:
> From: Xiao Guangrong <xiaoguangrong@xxxxxxxxxxx>
>
> It is used to track possible writable sptes on the shadow page on
> which the bit is set to 1 for the sptes that are already writable
> or can be locklessly updated to writable on the fast_page_fault
> path, also a counter for the number of possible writable sptes is
> introduced to speed up bitmap walking
>
> Later patch will benefit good performance by using this bitmap and
> counter to fast figure out writable sptes and write protect them
>
> Signed-off-by: Xiao Guangrong <xiaoguangrong@xxxxxxxxxxx>
> ---
>  arch/x86/include/asm/kvm_host.h |  6 ++++-
>  arch/x86/kvm/mmu.c              | 53 ++++++++++++++++++++++++++++++++++++++++-
>  2 files changed, 57 insertions(+), 2 deletions(-)
>
> diff --git a/arch/x86/include/asm/kvm_host.h b/arch/x86/include/asm/kvm_host.h
> index 4660ce9..5c30aa0 100644
> --- a/arch/x86/include/asm/kvm_host.h
> +++ b/arch/x86/include/asm/kvm_host.h
> @@ -128,6 +128,7 @@ static inline gfn_t gfn_to_index(gfn_t gfn, gfn_t base_gfn, int level)
>  #define KVM_MIN_ALLOC_MMU_PAGES 64
>  #define KVM_MMU_HASH_SHIFT 12
>  #define KVM_NUM_MMU_PAGES (1 << KVM_MMU_HASH_SHIFT)
> +#define KVM_MMU_SP_ENTRY_NR 512
>  #define KVM_MIN_FREE_MMU_PAGES 5
>  #define KVM_REFILL_PAGES 25
>  #define KVM_MAX_CPUID_ENTRIES 80
> @@ -331,12 +332,15 @@ struct kvm_mmu_page {
>  	gfn_t *gfns;
>  	int root_count;          /* Currently serving as active root */
>  	unsigned int unsync_children;
> +	unsigned int possiable_writable_sptes;

s/possiable/possible

>  	struct kvm_rmap_head parent_ptes; /* rmap pointers to parent sptes */
>
>  	/* The page is obsolete if mmu_valid_gen != kvm->arch.mmu_valid_gen. */
>  	unsigned long mmu_valid_gen;
>
> -	DECLARE_BITMAP(unsync_child_bitmap, 512);
> +	DECLARE_BITMAP(unsync_child_bitmap, KVM_MMU_SP_ENTRY_NR);
> +
> +	DECLARE_BITMAP(possible_writable_spte_bitmap, KVM_MMU_SP_ENTRY_NR);
>
>  #ifdef CONFIG_X86_32
>  	/*
> diff --git a/arch/x86/kvm/mmu.c b/arch/x86/kvm/mmu.c
> index eeb3bac..9daab00 100644
> --- a/arch/x86/kvm/mmu.c
> +++ b/arch/x86/kvm/mmu.c
> @@ -718,6 +718,49 @@ static bool is_dirty_spte(u64 spte)
>  	return dirty_mask ? spte & dirty_mask : spte & PT_WRITABLE_MASK;
>  }
>
> +static bool is_possible_writable_spte(u64 spte)
> +{
> +	if (!is_shadow_present_pte(spte))
> +		return false;
> +
> +	if (is_writable_pte(spte))
> +		return true;
> +
> +	if (spte_can_locklessly_be_made_writable(spte))
> +		return true;
> +
> +	/*
> +	 * although is_access_track_spte() sptes can be updated out of
> +	 * mmu-lock, we need not take them into account as access_track
> +	 * drops writable bit for them
> +	 */
> +	return false;
> +}
> +
> +static void
> +mmu_log_possible_writable_spte(u64 *sptep, u64 old_spte, u64 new_spte)
> +{
> +	struct kvm_mmu_page *sp = page_header(__pa(sptep));
> +	bool old_state, new_state;
> +
> +	old_state = is_possible_writable_spte(old_spte);
> +	new_state = is_possible_writable_spte(new_spte);
> +
> +	if (old_state == new_state)
> +		return;
> +
> +	/* a possible writable spte is dropped */
> +	if (old_state) {
> +		sp->possiable_writable_sptes--;
> +		__clear_bit(sptep - sp->spt, sp->possible_writable_spte_bitmap);
> +		return;
> +	}
> +
> +	/* a new possible writable spte is set */
> +	sp->possiable_writable_sptes++;
> +	__set_bit(sptep - sp->spt, sp->possible_writable_spte_bitmap);
> +}
> +
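For anyone else following along: the counter gives the consumer an O(1)
bail-out for shadow pages with no possible-writable sptes, and the bitmap
bounds the walk to just the interesting entries. I'd expect the later
patch's consumer to look roughly like the below -- my own untested sketch,
not from this series; sp_write_protect_possible_sptes() is a made-up name,
the field spelling matches the patch as posted, and I'm assuming the
existing spte_write_protect() helper:

	/* Sketch only: write protect every possible-writable spte on @sp. */
	static void sp_write_protect_possible_sptes(struct kvm_mmu_page *sp)
	{
		int i;

		/* The counter gives an O(1) bail-out for clean pages. */
		if (!sp->possiable_writable_sptes)
			return;

		for_each_set_bit(i, sp->possible_writable_spte_bitmap,
				 KVM_MMU_SP_ENTRY_NR)
			spte_write_protect(&sp->spt[i], false);
	}
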
>  /* Rules for using mmu_spte_set:
>   * Set the sptep from nonpresent to present.
>   * Note: the sptep being assigned *must* be either not present
> @@ -728,6 +771,7 @@ static void mmu_spte_set(u64 *sptep, u64 new_spte)
>  {
>  	WARN_ON(is_shadow_present_pte(*sptep));
>  	__set_spte(sptep, new_spte);
> +	mmu_log_possible_writable_spte(sptep, 0ull, new_spte);
>  }
>
>  /*
> @@ -746,6 +790,7 @@ static void mmu_spte_update_no_track(u64 *sptep, u64 new_spte)
>  	}
>
>  	__update_clear_spte_fast(sptep, new_spte);
> +	mmu_log_possible_writable_spte(sptep, old_spte, new_spte);

Hmm, maybe it's just me, but I find the "track vs. no_track" terminology
quite confusing, e.g. the "no_track" functions are now logging sptes.
Track and log aren't exact synonyms, but they're pretty close.

>  }
>
>  /*
> @@ -771,6 +816,7 @@ static u64 mmu_spte_update_track(u64 *sptep, u64 new_spte)
>
>  	WARN_ON(spte_to_pfn(old_spte) != spte_to_pfn(new_spte));
>
> +	mmu_log_possible_writable_spte(sptep, old_spte, new_spte);
>  	return old_spte;
>  }
>
> @@ -836,6 +882,8 @@ static int mmu_spte_clear_track_bits(u64 *sptep)
>  	else
>  		old_spte = __update_clear_spte_slow(sptep, 0ull);
>
> +	mmu_log_possible_writable_spte(sptep, old_spte, 0ull);
> +
>  	if (!is_shadow_present_pte(old_spte))
>  		return 0;
>
> @@ -864,7 +912,10 @@ static int mmu_spte_clear_track_bits(u64 *sptep)
>   */
>  static void mmu_spte_clear_no_track(u64 *sptep)
>  {
> +	u64 old_spte = *sptep;
> +
>  	__update_clear_spte_fast(sptep, 0ull);
> +	mmu_log_possible_writable_spte(sptep, old_spte, 0ull);
>  }
>
>  static u64 mmu_spte_get_lockless(u64 *sptep)
> @@ -2159,7 +2210,7 @@ static int __mmu_unsync_walk(struct kvm_mmu_page *sp,
>  {
>  	int i, ret, nr_unsync_leaf = 0;
>
> -	for_each_set_bit(i, sp->unsync_child_bitmap, 512) {
> +	for_each_set_bit(i, sp->unsync_child_bitmap, KVM_MMU_SP_ENTRY_NR) {
>  		struct kvm_mmu_page *child;
>  		u64 ent = sp->spt[i];
>
> --
> 1.8.3.1
>
>
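One more thought: the counter and bitmap have to stay in lockstep across
five separate update paths (mmu_spte_set, both mmu_spte_update variants,
and both clear paths), so a missed mmu_log_possible_writable_spte() call
would silently skew both. If this series grows a debug knob, a cheap
consistency check might be worth it. Untested sketch of mine, with the
spelling fixed per the comment above, assuming the existing MMU_WARN_ON()
and bitmap_weight() helpers:

	/*
	 * Sketch only: catch a counter/bitmap mismatch early instead of
	 * letting it corrupt the fast write-protect walk later on.
	 */
	static void check_possible_writable_stats(struct kvm_mmu_page *sp)
	{
		MMU_WARN_ON(sp->possible_writable_sptes !=
			    bitmap_weight(sp->possible_writable_spte_bitmap,
					  KVM_MMU_SP_ENTRY_NR));
	}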