On 12/4/20 1:18 AM, David Woodhouse wrote: > @@ -3742,6 +3716,9 @@ int kvm_vm_ioctl_check_extension(struct kvm *kvm, long ext) > case KVM_CAP_ENFORCE_PV_FEATURE_CPUID: > r = 1; > break; > + case KVM_CAP_XEN_HVM: > + r = 1 | KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL; > + break; Maybe: r = KVM_XEN_HVM_CONFIG_HYPERCALL_MSR | KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL; > case KVM_CAP_SYNC_REGS: > r = KVM_SYNC_X86_VALID_FIELDS; > break; > @@ -5603,7 +5580,15 @@ long kvm_arch_vm_ioctl(struct file *filp, > if (copy_from_user(&xhc, argp, sizeof(xhc))) > goto out; > r = -EINVAL; > - if (xhc.flags) > + if (xhc.flags & ~KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL) > + goto out; > + /* > + * With hypercall interception the kernel generates its own > + * hypercall page so it must not be provided. > + */ > + if ((xhc.flags & KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL) && > + (xhc.blob_addr_32 || xhc.blob_addr_64 || > + xhc.blob_size_32 || xhc.blob_size_64)) > goto out; I suppose it makes sense restricting to INTERCEPT_HCALL to make sure that the kernel only forwards the hcall if it is control off what it put there in the hypercall page (i.e. vmmcall/vmcall). hcall userspace exiting without INTERCEPT_HCALL would break ABI over how this ioctl was used before the new flag... In case kvm_xen_hypercall_enabled() would return true with KVM_XEN_HVM_CONFIG_HYPERCALL_MSR, as now it needs to handle a new userspace exit. If we're are being pedantic, the Xen hypercall MSR is a utility more than a necessity as the OS can always do without the hcall msr IIUC. But it is defacto used by enlightened Xen guests included FreeBSD. If we were to lift the restriction in the conditional above to forward hcall without INTERCEPT_HCALL flag then kvm_xen_hypercall_enabled() would return true with CONFIG_HYPERCALL_MSR and CONFIG_INTERCEPT_HCALL. And on wrmsr time, we would only look at whether we had a blob_size* passed in when handling the msr and initializing the hcall page. The only added gain is that guests which do vmcalls without an hypercall page would still be handled. But I am not sure it's worth the trouble. I feel its good the way this is now, given that this is new behaviour of forward vmmcall/vmcall to userspace. > +#endif /* __ARCH_X86_KVM_XEN_H__ */> diff --git a/include/uapi/linux/kvm.h b/include/uapi/linux/kvm.h > index ca41220b40b8..00221fe56994 100644 > --- a/include/uapi/linux/kvm.h > +++ b/include/uapi/linux/kvm.h > @@ -216,6 +216,20 @@ struct kvm_hyperv_exit { > } u; > }; > > +struct kvm_xen_exit { > +#define KVM_EXIT_XEN_HCALL 1 > + __u32 type; > + union { > + struct { > + __u32 longmode; > + __u32 cpl; > + __u64 input; > + __u64 result; > + __u64 params[6]; > + } hcall; > + } u; > +}; > + > #define KVM_S390_GET_SKEYS_NONE 1 > #define KVM_S390_SKEYS_MAX 1048576 > > @@ -250,6 +264,7 @@ struct kvm_hyperv_exit { > #define KVM_EXIT_ARM_NISV 28 > #define KVM_EXIT_X86_RDMSR 29 > #define KVM_EXIT_X86_WRMSR 30 > +#define KVM_EXIT_XEN 31 > > /* For KVM_EXIT_INTERNAL_ERROR */ > /* Emulate instruction failed. */ > @@ -426,6 +441,8 @@ struct kvm_run { > __u32 index; /* kernel -> user */ > __u64 data; /* kernel <-> user */ > } msr; > + /* KVM_EXIT_XEN */ > + struct kvm_xen_exit xen; > /* Fix the size of the union. */ > char padding[256]; > }; > @@ -1126,6 +1143,8 @@ struct kvm_x86_mce { > #endif > > #ifdef KVM_CAP_XEN_HVM > +#define KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL (1 << 1) > + And adding: #define KVM_XEN_HVM_CONFIG_HYPERCALL_MSR (1 << 0) Of course, this is a nit for readability only, but it aligns with what you write in the docs update you do in the last patch.