Re: [PATCH v6 07/13] KVM: selftests: Change ____vm_create() to take struct kvm_vm_mem_params

Ricardo Koller <ricarkol@xxxxxxxxxx> · Mon, 19 Sep 2022 12:21:19 -0700

On Mon, Sep 19, 2022 at 04:28:26PM +0000, Sean Christopherson wrote:
> On Tue, Sep 06, 2022, Ricardo Koller wrote:
> > @@ -637,19 +658,45 @@ vm_paddr_t vm_phy_pages_alloc(struct kvm_vm *vm, size_t num,
> >  			      vm_paddr_t paddr_min, uint32_t memslot);
> >  vm_paddr_t vm_alloc_page_table(struct kvm_vm *vm);
> >  
> > +struct kvm_vm_mem_params {
> > +	enum vm_guest_mode mode;
> > +
> > +	struct {
> > +		enum vm_mem_backing_src_type src_type;
> > +		uint64_t guest_paddr;
> > +		/*
> > +		 * KVM region slot (same meaning as in struct
> > +		 * kvm_userspace_memory_region).
> > +		 */
> > +		uint32_t slot;
> > +		uint64_t npages;
> > +		uint32_t flags;
> > +		bool enabled;
> 
> "enabled" is unnecessary, just have ____vm_create() skip over regions with npages=0.
> Likely ends up being a moot point though.
> 
> > +	} region[NR_MEM_REGIONS];
> > +
> > +	/* Each region type points to a region in the above array. */
> > +	uint16_t region_idx[NR_MEM_REGIONS];
> 
> Eww.  This is going to be super confusing and it's one more thing for tests to
> screw up.  And open coding the indices for region[] is beyond gross.
> 
> > +};
> > +
> > +extern struct kvm_vm_mem_params kvm_vm_mem_default;
> > +
> >  /*
> >   * ____vm_create() does KVM_CREATE_VM and little else.  __vm_create() also
> >   * loads the test binary into guest memory and creates an IRQ chip (x86 only).
> >   * __vm_create() does NOT create vCPUs, @nr_runnable_vcpus is used purely to
> >   * calculate the amount of memory needed for per-vCPU data, e.g. stacks.
> >   */
> > -struct kvm_vm *____vm_create(enum vm_guest_mode mode, uint64_t nr_pages);
> > +struct kvm_vm *____vm_create(struct kvm_vm_mem_params *mem_params);
> >  struct kvm_vm *__vm_create(enum vm_guest_mode mode, uint32_t nr_runnable_vcpus,
> >  			   uint64_t nr_extra_pages);
> >  
> >  static inline struct kvm_vm *vm_create_barebones(void)
> >  {
> > -	return ____vm_create(VM_MODE_DEFAULT, 0);
> > +	struct kvm_vm_mem_params params_wo_memslots = {
> > +		.mode = kvm_vm_mem_default.mode,
> > +	};
> > +
> > +	return ____vm_create(&params_wo_memslots);
> 
> Very related to the above complaints, this is rather ugly.  I liked the idea of
> passing a struct to __vm_create(), but passing it to ____vm_create() feels extremely
> forced.
> 
> In an ideal world, my preference would still be to modify __vm_create() to take the
> struct so that a test that wants to utilize different memslots doesn't need to
> manually duplicate all the other stuff in __vm_create(), but that might end up
> being too forced as well.  For now, I'm ok punting on that so the page_fault_test
> can get merged.
> 
> Looking at this with fresh eyes, there's simply no reason ____vm_create() should be
> creating memslots.  If this series first moves the memslot creation into __vm_create()
> where it belongs (patch below), then there's no need to force ____vm_create() to take
> a struct.  And if we punt on refactoring __vm_create(), then there's no need to
> add kvm_vm_mem_default and no real need to add struct kvm_vm_mem_params either.

I think I prefer option A below. And I will take the offer of punting on
refactoring __vm_create() for after page_fault_test.

Having a struct would be nice, as that will allow tests to do things
like: run with all these combinations of (backing_src, regions, ...).

Thanks for the review,
Ricardo

> 
> If/when there's a second test that wants fine-grained control over memslots then
> we can figure out a proper API to share between page_fault_test and whatever the
> new test is, but for now if page_fault_test is going to call ____vm_create()
> directly, then I think it's easier to forego the common API and just have page_fault_test
> and __vm_create() open code setting vm->memslots.
> 
> Alternatively, if we really want a common API right away, then we can add a helper
> to populate the memory region + vm->memslots.
> 
> Option A (open code):
> 
> struct kvm_vm *__vm_create(enum vm_guest_mode mode, uint32_t nr_runnable_vcpus,
> 			   uint64_t nr_extra_pages)
> {
> 	uint64_t nr_pages = vm_nr_pages_required(mode, nr_runnable_vcpus,
> 						 nr_extra_pages);
> 	struct kvm_vm *vm;
> 	int i;
> 
> 	vm = ____vm_create(mode);
> 
> 	vm_userspace_mem_region_add(vm, VM_MEM_SRC_ANONYMOUS, 0, 0, nr_pages, 0);
> 
> 	for (i = 0; i < NR_MEM_REGIONS; i++)
> 		vm->memslots[i] = 0;
> 
> 	kvm_vm_elf_load(vm, program_invocation_name);
> 
> #ifdef __x86_64__
> 	vm_create_irqchip(vm);
> #endif
> 	return vm;
> }
> 
> ...
> 
> enum pf_test_memslots {
> 	CODE_MEMSLOT,
> 	PAGE_TABLE_MEMSLOT,
> 	DATA_MEMSLOT,
> }
> 
> /* Create a code memslot at pfn=0, and data and PT ones at max_gfn. */
> static void setup_memslots(struct kvm_vm *vm, struct test_params *p)
> {
> 	uint64_t backing_src_pagesz = get_backing_src_pagesz(p->src_type);
> 	uint64_t guest_page_size = vm_guest_mode_params[mode].page_size;
> 	uint64_t max_gfn = get_max_gfn(mode);
> 	/* Enough for 2M of code when using 4K guest pages. */
> 	uint64_t code_npages = 512;
> 	uint64_t pt_size, data_size, data_gpa;
> 
> 	/*
> 	 * This test requires 1 pgd, 2 pud, 4 pmd, and 6 pte pages when using
> 	 * VM_MODE_P48V48_4K. Note that the .text takes ~1.6MBs.  That's 13
> 	 * pages. VM_MODE_P48V48_4K is the mode with most PT pages; let's use
> 	 * twice that just in case.
> 	 */
> 	pt_size = 26 * guest_page_size;
> 
> 	/* memslot sizes and gpa's must be aligned to the backing page size */
> 	pt_size = align_up(pt_size, backing_src_pagesz);
> 	data_size = align_up(guest_page_size, backing_src_pagesz);
> 	data_gpa = (max_gfn * guest_page_size) - data_size;
> 	data_gpa = align_down(data_gpa, backing_src_pagesz);
> 
> 	vm_userspace_mem_region_add(vm, VM_MEM_SRC_ANONYMOUS, 0, CODE_MEMSLOT,
> 				    code_npages, 0);
> 	vm->memslots[MEM_REGION_CODE] = CODE_MEMSLOT;
> 
> 	vm_userspace_mem_region_add(vm, p->src_type, data_gpa - pt_size,
> 				    PAGE_TABLE_MEMSLOT, pt_size / guest_page_size,
> 				    p->test_desc->pt_memslot_flags);
> 	vm->memslots[MEM_REGION_PT] = PAGE_TABLE_MEMSLOT;
> 
> 	vm_userspace_mem_region_add(vm, p->src_type, data_gpa, DATA_MEMSLOT,
> 				    data_size / guest_page_size,
> 				    p->test_desc->data_memslot_flags);
> 	vm->memslots[MEM_REGION_PT] = DATA_MEMSLOT;
> }
> 
> 
> static void run_test(enum vm_guest_mode mode, void *arg)
> {
> 	struct test_params *p = (struct test_params *)arg;
> 	struct test_desc *test = p->test_desc;
> 	struct kvm_vm *vm;
> 	struct kvm_vcpu *vcpu;
> 	struct uffd_desc *pt_uffd, *data_uffd;
> 
> 	print_test_banner(mode, p);
> 
> 	vm = ____vm_create(mode);
> 	setup_memslots(vm, p);
> 	kvm_vm_elf_load(vm, program_invocation_name);
> 	vcpu = vm_vcpu_add(vm, 0, guest_code);
> 
> 	...
> }
> 
> Option B (helper):
> 
> enum kvm_mem_region_mask {
> 	MEM_REGION_CODE_MASK	= BIT(MEM_REGION_CODE),
> 	MEM_REGION_PT_MASK	= BIT(MEM_REGION_PT),
> 	MEM_REGION_DATA_MASK	= BIT(MEM_REGION_DATA),
> 
> 	MEM_REGION_ALL_MASK	= MEM_REGION_CODE_MASK |
> 				  MEM_REGION_PT_MASK |
> 				  MEM_REGION_DATA_MASK,
> };
> 
> void kvm_vm_add_mem_region(struct kvm_vm *vm, enum kvm_mem_region_mask type_mask,
> 			   enum vm_mem_backing_src_type src_type, uint32_t slot,
> 			   uint64_t guest_paddr, uint64_t nr_pages, uint32_t flags)
> {
> 	int i;
> 
> 	vm_userspace_mem_region_add(vm, src_type, guest_paddr, slot, nr_pages, 0);
> 
> 	for (i = 0; i < NR_MEM_REGIONS; i++) {
> 		if (BIT(i) & type_mask)
> 			vm->memslots[i] = slot;
> 	}
> }
> 
> struct kvm_vm *__vm_create(enum vm_guest_mode mode, uint32_t nr_runnable_vcpus,
> 			   uint64_t nr_extra_pages)
> {
> 	uint64_t nr_pages = vm_nr_pages_required(mode, nr_runnable_vcpus,
> 						 nr_extra_pages);
> 	struct kvm_vm *vm;
> 	int i;
> 
> 	vm = ____vm_create(mode);
> 
> 	kvm_vm_add_mem_region(vm, MEM_REGION_ALL_MASK, VM_MEM_SRC_ANONYMOUS, 0,
> 			      0, nr_pages, 0);
> 
> 	kvm_vm_elf_load(vm, program_invocation_name);
> 
> #ifdef __x86_64__
> 	vm_create_irqchip(vm);
> #endif
> 	return vm;
> }
> 
> static void setup_memslots(struct kvm_vm *vm, struct test_params *p)
> {
> 	...
> 
> 	kvm_vm_add_mem_region(vm, MEM_REGION_CODE_MASK, VM_MEM_SRC_ANONYMOUS,
> 			      CODE_MEMSLOT, 0, code_npages, 0);
> 
> 	kvm_vm_add_mem_region(vm, MEM_REGION_PT_MASK p->src_type,
> 			      PAGE_TABLE_MEMSLOT, data_gpa - pt_size,
> 			      pt_size / guest_page_size,
> 			      p->test_desc->pt_memslot_flags);
> 
> 	kvm_vm_add_mem_region(vm, MEM_REGION_DATA_MASK, p->src_type,
> 			      DATA_MEMSLOT, data_gpa,
> 			      data_size / guest_page_size,
> 			      p->test_desc->data_memslot_flags);
> }
> 
> ---
>  .../testing/selftests/kvm/include/kvm_util_base.h |  4 ++--
>  tools/testing/selftests/kvm/lib/kvm_util.c        | 15 +++++++--------
>  2 files changed, 9 insertions(+), 10 deletions(-)
> 
> diff --git a/tools/testing/selftests/kvm/include/kvm_util_base.h b/tools/testing/selftests/kvm/include/kvm_util_base.h
> index 24fde97f6121..107cb87908f8 100644
> --- a/tools/testing/selftests/kvm/include/kvm_util_base.h
> +++ b/tools/testing/selftests/kvm/include/kvm_util_base.h
> @@ -642,13 +642,13 @@ vm_paddr_t vm_alloc_page_table(struct kvm_vm *vm);
>   * __vm_create() does NOT create vCPUs, @nr_runnable_vcpus is used purely to
>   * calculate the amount of memory needed for per-vCPU data, e.g. stacks.
>   */
> -struct kvm_vm *____vm_create(enum vm_guest_mode mode, uint64_t nr_pages);
> +struct kvm_vm *____vm_create(enum vm_guest_mode mode);
>  struct kvm_vm *__vm_create(enum vm_guest_mode mode, uint32_t nr_runnable_vcpus,
>  			   uint64_t nr_extra_pages);
>  
>  static inline struct kvm_vm *vm_create_barebones(void)
>  {
> -	return ____vm_create(VM_MODE_DEFAULT, 0);
> +	return ____vm_create(VM_MODE_DEFAULT);
>  }
>  
>  static inline struct kvm_vm *vm_create(uint32_t nr_runnable_vcpus)
> diff --git a/tools/testing/selftests/kvm/lib/kvm_util.c b/tools/testing/selftests/kvm/lib/kvm_util.c
> index 9889fe0d8919..c761422faa17 100644
> --- a/tools/testing/selftests/kvm/lib/kvm_util.c
> +++ b/tools/testing/selftests/kvm/lib/kvm_util.c
> @@ -143,13 +143,10 @@ const struct vm_guest_mode_params vm_guest_mode_params[] = {
>  _Static_assert(sizeof(vm_guest_mode_params)/sizeof(struct vm_guest_mode_params) == NUM_VM_MODES,
>  	       "Missing new mode params?");
>  
> -struct kvm_vm *____vm_create(enum vm_guest_mode mode, uint64_t nr_pages)
> +struct kvm_vm *____vm_create(enum vm_guest_mode mode)
>  {
>  	struct kvm_vm *vm;
>  
> -	pr_debug("%s: mode='%s' pages='%ld'\n", __func__,
> -		 vm_guest_mode_string(mode), nr_pages);
> -
>  	vm = calloc(1, sizeof(*vm));
>  	TEST_ASSERT(vm != NULL, "Insufficient Memory");
>  
> @@ -245,9 +242,6 @@ struct kvm_vm *____vm_create(enum vm_guest_mode mode, uint64_t nr_pages)
>  
>  	/* Allocate and setup memory for guest. */
>  	vm->vpages_mapped = sparsebit_alloc();
> -	if (nr_pages != 0)
> -		vm_userspace_mem_region_add(vm, VM_MEM_SRC_ANONYMOUS,
> -					    0, 0, nr_pages, 0);
>  
>  	return vm;
>  }
> @@ -294,7 +288,12 @@ struct kvm_vm *__vm_create(enum vm_guest_mode mode, uint32_t nr_runnable_vcpus,
>  						 nr_extra_pages);
>  	struct kvm_vm *vm;
>  
> -	vm = ____vm_create(mode, nr_pages);
> +	pr_debug("%s: mode='%s' pages='%ld'\n", __func__,
> +		 vm_guest_mode_string(mode), nr_pages);
> +
> +	vm = ____vm_create(mode);
> +
> +	vm_userspace_mem_region_add(vm, VM_MEM_SRC_ANONYMOUS, 0, 0, nr_pages, 0);
>  
>  	kvm_vm_elf_load(vm, program_invocation_name);
>  
> 
> base-commit: 372d07084593dc7a399bf9bee815711b1fb1bcf2
> -- 
> 
_______________________________________________
kvmarm mailing list
kvmarm@xxxxxxxxxxxxxxxxxxxxx
https://lists.cs.columbia.edu/mailman/listinfo/kvmarm