Re: [RFC PATCH 3/3] KVM: s390: Hook up ioeventfds.

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Thu, Feb 21, 2013 at 04:21:43PM +0100, Cornelia Huck wrote:
> On Thu, 21 Feb 2013 16:39:05 +0200
> "Michael S. Tsirkin" <mst@xxxxxxxxxx> wrote:
> 
> > On Thu, Feb 21, 2013 at 02:13:00PM +0100, Cornelia Huck wrote:
> > > As s390 doesn't use memory writes for virtio notifcations, create
> > > a special kind of ioeventfd instead that hooks up into diagnose
> > > 0x500 (kvm hypercall) with function code 3 (virtio-ccw notification).
> > > 
> > > Signed-off-by: Cornelia Huck <cornelia.huck@xxxxxxxxxx>
> > 
> > Do we really have to put virtio specific stuff into kvm?
> > How about we add generic functionality to match GPRs
> > on a hypercall and signal an eventfd?
> 
> Worth a try implementing that.
> 
> > 
> > Also, it's a bit unfortunate that this doesn't use
> > the io bus datastructure, long term the linked list handling
> > might become a bottleneck, using shared code this could maybe
> > benefit from performance optimizations there.
> 
> The linked list stuff was more like an initial implementation that
> could be improved later.
> 
> > io bus data structure currently has the ability to match on
> > two 64 bit fields (addr/datamatch) and a signed 32 bit one (length).
> > Isn't this sufficient for your purposes?
> > How about sticking subchannel id in address, vq in data match
> > and using io bus?
> 
> I can give that a try. (I must admit that I didn't look at the iobus
> stuff in detail.)
> 
> > 
> > BTW maybe we could do this for the user interface too,
> > while I'm not 100% sure it's the cleanest thing to do
> > (or will work), it would certainly minimize the patchset.
> 
> You mean integrating with the generic interface and dropping the new
> ARCH flag?

Not sure about the flag but we could use the general structure
without an arch-specific format, if that's a good fit.

> > 
> > > ---
> > >  arch/s390/include/asm/kvm_host.h |  23 ++++++
> > >  arch/s390/kvm/Kconfig            |   1 +
> > >  arch/s390/kvm/Makefile           |   2 +-
> > >  arch/s390/kvm/diag.c             |  23 ++++++
> > >  arch/s390/kvm/kvm-s390.c         | 165 +++++++++++++++++++++++++++++++++++++++
> > >  arch/s390/kvm/kvm-s390.h         |   3 +
> > >  6 files changed, 216 insertions(+), 1 deletion(-)
> > > 
> > > diff --git a/arch/s390/include/asm/kvm_host.h b/arch/s390/include/asm/kvm_host.h
> > > index 16bd5d1..8dad9dc 100644
> > > --- a/arch/s390/include/asm/kvm_host.h
> > > +++ b/arch/s390/include/asm/kvm_host.h
> > > @@ -18,6 +18,7 @@
> > >  #include <linux/kvm_host.h>
> > >  #include <asm/debug.h>
> > >  #include <asm/cpu.h>
> > > +#include <asm/schid.h>
> > >  
> > >  #define KVM_MAX_VCPUS 64
> > >  #define KVM_USER_MEM_SLOTS 32
> > > @@ -262,8 +263,30 @@ struct kvm_arch{
> > >  	debug_info_t *dbf;
> > >  	struct kvm_s390_float_interrupt float_int;
> > >  	struct gmap *gmap;
> > > +	struct list_head sch_fds;
> > > +	struct rw_semaphore sch_fds_sem;
> > 
> > Why sch_? Related to subchannel somehow?
> 
> Yes.
> 
> > Also you mean _ioeventfds really?
> 
> Probably, I don't have the irqfd stuff figured out yet.
> 
> > Might be a good idea to document locking here.
> 
> OK.
> 
> > 
> > >  	int css_support;
> > >  };
> > >  
> > >  extern int sie64a(struct kvm_s390_sie_block *, u64 *);
> > > +#define __KVM_HAVE_ARCH_IOEVENTFD
> > > +
> > > +#define KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY 1
> > > +
> > > +struct kvm_s390_ioeventfd_data {
> > > +	__u8 type;
> > > +	union {
> > > +		/* VIRTIO_CCW_NOTIFY */
> > > +		struct {
> > > +			__u64 vq;
> > > +			struct subchannel_id schid;
> > > +		} virtio_ccw_vq;
> > > +		char padding[35];
> > > +	};
> > > +} __packed;
> > > +
> > 
> > Do you expect userspace to use this structure?
> > If yes this is the wrong header. If not why is it packed?
> 
> Indeed, userspace is supposed to use this.
> 
> > 
> > > +struct kvm_arch_ioeventfd {
> > > +	struct list_head entry;
> > > +	struct kvm_s390_ioeventfd_data data;
> > 
> > Let's not waste memory keeping padding in kernel datastructures.
> > 
> > > +};
> > >  #endif
> > > diff --git a/arch/s390/kvm/Kconfig b/arch/s390/kvm/Kconfig
> > > index b58dd86..3c43e30 100644
> > > --- a/arch/s390/kvm/Kconfig
> > > +++ b/arch/s390/kvm/Kconfig
> > > @@ -22,6 +22,7 @@ config KVM
> > >  	select PREEMPT_NOTIFIERS
> > >  	select ANON_INODES
> > >  	select HAVE_KVM_CPU_RELAX_INTERCEPT
> > > +	select HAVE_KVM_EVENTFD
> > >  	---help---
> > >  	  Support hosting paravirtualized guest machines using the SIE
> > >  	  virtualization capability on the mainframe. This should work
> > > diff --git a/arch/s390/kvm/Makefile b/arch/s390/kvm/Makefile
> > > index 2441ffd..dbd8cc9 100644
> > > --- a/arch/s390/kvm/Makefile
> > > +++ b/arch/s390/kvm/Makefile
> > > @@ -6,7 +6,7 @@
> > >  # it under the terms of the GNU General Public License (version 2 only)
> > >  # as published by the Free Software Foundation.
> > >  
> > > -common-objs = $(addprefix ../../../virt/kvm/, kvm_main.o)
> > > +common-objs = $(addprefix ../../../virt/kvm/, kvm_main.o eventfd.o)
> > >  
> > >  ccflags-y := -Ivirt/kvm -Iarch/s390/kvm
> > >  
> > > diff --git a/arch/s390/kvm/diag.c b/arch/s390/kvm/diag.c
> > > index a390687..51ea66f 100644
> > > --- a/arch/s390/kvm/diag.c
> > > +++ b/arch/s390/kvm/diag.c
> > > @@ -104,6 +104,27 @@ static int __diag_ipl_functions(struct kvm_vcpu *vcpu)
> > >  	return -EREMOTE;
> > >  }
> > >  
> > > +static int __diag_virtio_hypercall(struct kvm_vcpu *vcpu)
> > > +{
> > > +	struct kvm_s390_ioeventfd_data data;
> > > +	u32 tmp;
> > > +
> > > +	/* No channel I/O? Get out quickly. */
> > > +	if (!vcpu->kvm->arch.css_support ||
> > > +	    (vcpu->run->s.regs.gprs[1] != 3))
> > > +		return -EOPNOTSUPP;
> > > +
> > > +	/* subchannel id is in gpr 2, queue in gpr 3 */
> > > +	tmp = vcpu->run->s.regs.gprs[2] & 0xffffffff;
> > > +	memcpy(&data.virtio_ccw_vq.schid, &tmp,
> > > +	       sizeof(data.virtio_ccw_vq.schid));
> > > +	data.virtio_ccw_vq.vq = vcpu->run->s.regs.gprs[3];
> > > +	data.type = KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY;
> > > +
> > > +	/* If signalling via eventfd fails, we want to drop to userspace. */
> > > +	return kvm_s390_ioeventfd_signal(vcpu->kvm, &data) ? -EOPNOTSUPP : 0;
> > > +}
> > > +
> > >  int kvm_s390_handle_diag(struct kvm_vcpu *vcpu)
> > >  {
> > >  	int code = (vcpu->arch.sie_block->ipb & 0xfff0000) >> 16;
> > > @@ -118,6 +139,8 @@ int kvm_s390_handle_diag(struct kvm_vcpu *vcpu)
> > >  		return __diag_time_slice_end_directed(vcpu);
> > >  	case 0x308:
> > >  		return __diag_ipl_functions(vcpu);
> > > +	case 0x500:
> > > +		return __diag_virtio_hypercall(vcpu);
> > >  	default:
> > >  		return -EOPNOTSUPP;
> > >  	}
> > > diff --git a/arch/s390/kvm/kvm-s390.c b/arch/s390/kvm/kvm-s390.c
> > > index 58a5f03..cd9eb0e 100644
> > > --- a/arch/s390/kvm/kvm-s390.c
> > > +++ b/arch/s390/kvm/kvm-s390.c
> > > @@ -15,6 +15,7 @@
> > >  
> > >  #include <linux/compiler.h>
> > >  #include <linux/err.h>
> > > +#include <linux/eventfd.h>
> > >  #include <linux/fs.h>
> > >  #include <linux/hrtimer.h>
> > >  #include <linux/init.h>
> > > @@ -143,6 +144,7 @@ int kvm_dev_ioctl_check_extension(long ext)
> > >  	case KVM_CAP_ONE_REG:
> > >  	case KVM_CAP_ENABLE_CAP:
> > >  	case KVM_CAP_S390_CSS_SUPPORT:
> > > +	case KVM_CAP_IOEVENTFD:
> > >  		r = 1;
> > >  		break;
> > >  	case KVM_CAP_NR_VCPUS:
> > > @@ -237,6 +239,8 @@ int kvm_arch_init_vm(struct kvm *kvm, unsigned long type)
> > >  		if (!kvm->arch.gmap)
> > >  			goto out_nogmap;
> > >  	}
> > > +	INIT_LIST_HEAD(&kvm->arch.sch_fds);
> > > +	init_rwsem(&kvm->arch.sch_fds_sem);
> > >  
> > >  	kvm->arch.css_support = 0;
> > >  
> > > @@ -1028,3 +1032,164 @@ void kvm_arch_flush_shadow_memslot(struct kvm *kvm,
> > >  				   struct kvm_memory_slot *slot)
> > >  {
> > >  }
> > > +static void kvm_s390_ioeventfd_add(struct kvm *kvm,
> > > +				   struct kvm_arch_ioeventfd *arch)
> > > +{
> > > +	switch (arch->data.type) {
> > > +	case KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY:
> > > +		down_write(&kvm->arch.sch_fds_sem);
> > > +		list_add_tail(&arch->entry, &kvm->arch.sch_fds);
> > > +		up_write(&kvm->arch.sch_fds_sem);
> > > +		break;
> > > +	default:
> > > +		pr_warn("Trying to add ioeventfd type %x\n", arch->data.type);
> > > +	}
> > > +}
> > > +
> > > +static void kvm_s390_ioeventfd_remove(struct kvm *kvm,
> > > +				      struct kvm_arch_ioeventfd *arch)
> > > +{
> > > +	switch (arch->data.type) {
> > > +	case KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY:
> > > +		down_write(&kvm->arch.sch_fds_sem);
> > > +		list_del(&arch->entry);
> > > +		up_write(&kvm->arch.sch_fds_sem);
> > > +		break;
> > > +	default:
> > > +		pr_warn("Trying to remove ioeventfd type %x\n",
> > > +			arch->data.type);
> > > +	}
> > > +}
> > > +
> > > +int kvm_s390_ioeventfd_signal(struct kvm *kvm,
> > > +			      struct kvm_s390_ioeventfd_data *data)
> > > +{
> > > +	struct kvm_arch_ioeventfd *arch, match;
> > > +	int ret;
> > > +
> > > +	if (data->type != KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY)
> > > +		return -ENOENT;
> > > +	down_read(&kvm->arch.sch_fds_sem);
> > > +	if (list_empty(&kvm->arch.sch_fds)) {
> > > +		ret = -ENOENT;
> > > +		goto out_unlock;
> > > +	}
> > > +	memcpy(&match.data, data, sizeof(match.data));
> > > +	list_for_each_entry(arch, &kvm->arch.sch_fds, entry) {
> > > +		if (!kvm_arch_ioeventfd_match(arch, &match))
> > > +			continue;
> > > +		ret = eventfd_signal(kvm_ioeventfd_get_eventfd(arch), 1);
> > > +		goto out_unlock;
> > > +	}
> > > +	ret = -ENOENT;
> > > +out_unlock:
> > > +	if (ret > 0)
> > > +		ret = 0;
> > > +	up_read(&kvm->arch.sch_fds_sem);
> > > +	return ret;
> > > +}
> > > +
> > > +int kvm_arch_ioeventfd_check(struct kvm_ioeventfd *args)
> > > +{
> > > +	struct kvm_s390_ioeventfd_data *data;
> > > +
> > > +	if (!(args->flags & KVM_IOEVENTFD_FLAG_ARCH))
> > > +		return -EINVAL;
> > > +	if (args->flags & (KVM_IOEVENTFD_FLAG_DATAMATCH |
> > > +			   KVM_IOEVENTFD_FLAG_PIO))
> > > +		return -EINVAL;
> > > +
> > > +	data = (struct kvm_s390_ioeventfd_data *) args->data;
> > > +	if (data->type != KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY)
> > > +		return -EINVAL;
> > > +	if (((data->virtio_ccw_vq.schid.m == 1) &&
> > > +	     (data->virtio_ccw_vq.schid.cssid != 0xfe)) ||
> > > +	    ((data->virtio_ccw_vq.schid.m == 0) &&
> > > +	     (data->virtio_ccw_vq.schid.cssid != 0)))
> > > +		return -EINVAL;
> > > +	if (data->virtio_ccw_vq.schid.one != 1)
> > > +		return -EINVAL;
> > > +	if (data->virtio_ccw_vq.vq > 128)
> > 
> > Why 128?
> > Generally maybe add a comment documenting the
> > constants used.
> 
> OK.
> 
> > 
> > > +		return -EINVAL;
> > > +	return 0;
> > > +}
> > > +EXPORT_SYMBOL_GPL(kvm_arch_ioeventfd_check);
> > > +
> > > +void kvm_arch_ioeventfd_init(struct kvm_arch_ioeventfd *arch,
> > > +			     struct kvm_ioeventfd *args)
> > > +{
> > > +	INIT_LIST_HEAD(&arch->entry);
> > > +	memcpy(&arch->data, &args->data, sizeof(arch->data));
> > > +}
> > > +EXPORT_SYMBOL_GPL(kvm_arch_ioeventfd_init);
> > > +
> > > +int kvm_arch_ioeventfd_activate(struct kvm *kvm,
> > > +				struct kvm_arch_ioeventfd *arch,
> > > +				struct kvm_ioeventfd *args)
> > > +{
> > > +	int ret;
> > > +
> > > +	switch (arch->data.type) {
> > > +	case KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY:
> > > +		/* Fail if channel subsystem support is not active. */
> > > +		if (!kvm->arch.css_support)
> > > +			ret = -EINVAL;
> > > +		else {
> > > +			kvm_s390_ioeventfd_add(kvm, arch);
> > > +			ret = 0;
> > > +		}
> > > +		break;
> > > +	default:
> > > +		ret = -EINVAL;
> > > +	}
> > > +	return ret;
> > > +}
> > > +EXPORT_SYMBOL_GPL(kvm_arch_ioeventfd_activate);
> > > +
> > > +bool kvm_arch_ioeventfd_match(struct kvm_arch_ioeventfd *arch,
> > > +			      struct kvm_arch_ioeventfd *to_match)
> > > +{
> > > +	if (arch->data.type != to_match->data.type)
> > > +		return false;
> > > +
> > > +	switch (arch->data.type) {
> > > +	case KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY:
> > > +		if (memcmp(&arch->data.virtio_ccw_vq.schid,
> > > +			   &to_match->data.virtio_ccw_vq.schid,
> > > +			   sizeof(arch->data.virtio_ccw_vq.schid)))
> > > +			return false;
> > > +		if (arch->data.virtio_ccw_vq.vq !=
> > > +		    to_match->data.virtio_ccw_vq.vq)
> > > +			return false;
> > > +		return true;
> > > +	default:
> > > +		return false;
> > > +	}
> > > +}
> > > +EXPORT_SYMBOL_GPL(kvm_arch_ioeventfd_match);
> > > +
> > > +bool kvm_arch_ioeventfd_match_and_release(struct kvm *kvm,
> > > +					  struct kvm_arch_ioeventfd *arch,
> > > +					  struct kvm_ioeventfd *args)
> > > +{
> > > +	struct kvm_s390_ioeventfd_data *data;
> > > +
> > > +	data = (struct kvm_s390_ioeventfd_data *)args->data;
> > > +	if (arch->data.type != data->type)
> > > +		return false;
> > > +
> > > +	switch (arch->data.type) {
> > > +	case KVM_S390_IOEVENTFD_VIRTIO_CCW_NOTIFY:
> > > +		if (memcmp(&arch->data.virtio_ccw_vq.schid,
> > > +			   &data->virtio_ccw_vq.schid,
> > > +			   sizeof(arch->data.virtio_ccw_vq.schid)))
> > > +			return false;
> > > +		if (arch->data.virtio_ccw_vq.vq != data->virtio_ccw_vq.vq)
> > > +			return false;
> > > +		kvm_s390_ioeventfd_remove(kvm, arch);
> > > +		return true;
> > > +	default:
> > > +		return false;
> > > +	}
> > > +}
> > > +EXPORT_SYMBOL_GPL(kvm_arch_ioeventfd_match_and_release);
> > > diff --git a/arch/s390/kvm/kvm-s390.h b/arch/s390/kvm/kvm-s390.h
> > > index 4d89d64..9794906 100644
> > > --- a/arch/s390/kvm/kvm-s390.h
> > > +++ b/arch/s390/kvm/kvm-s390.h
> > > @@ -136,4 +136,7 @@ int kvm_s390_vcpu_store_status(struct kvm_vcpu *vcpu,
> > >  /* implemented in diag.c */
> > >  int kvm_s390_handle_diag(struct kvm_vcpu *vcpu);
> > >  
> > > +int kvm_s390_ioeventfd_signal(struct kvm *kvm,
> > > +			      struct kvm_s390_ioeventfd_data *data);
> > > +
> > >  #endif
> > > -- 
> > > 1.7.12.4
> > > 
> > 
--
To unsubscribe from this list: send the line "unsubscribe kvm" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html


[Index of Archives]     [KVM ARM]     [KVM ia64]     [KVM ppc]     [Virtualization Tools]     [Spice Development]     [Libvirt]     [Libvirt Users]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite Questions]     [Linux Kernel]     [Linux SCSI]     [XFree86]
  Powered by Linux