Re: [PATCH] vfio: fix config virtualization, esp command byte

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Tue, 2010-11-09 at 17:09 -0800, Tom Lyon wrote:
> Cleans up config space virtualization, especially handling of bytes
> which have some virtual and some real bits, like PCI_COMMAND.
> 
> Alex, I hope you can test this with your setups.

Sorry for the delay.  FWIW, I'm not having much luck with this; I'll try
to debug the problem.  Thanks,

Alex

> Signed-off-by: Tom Lyon <pugs@xxxxxxxxx>
> ---
>  drivers/vfio/vfio_pci_config.c |  166 +++++++++++++---------------------------
>  1 files changed, 53 insertions(+), 113 deletions(-)
> 
> diff --git a/drivers/vfio/vfio_pci_config.c b/drivers/vfio/vfio_pci_config.c
> index 8304316..7132ac4 100644
> --- a/drivers/vfio/vfio_pci_config.c
> +++ b/drivers/vfio/vfio_pci_config.c
> @@ -745,6 +745,8 @@ static int vfio_virt_init(struct vfio_dev *vdev)
>   */
>  static void vfio_bar_restore(struct vfio_dev *vdev)
>  {
> +	if (vdev->pdev->is_virtfn)
> +		return;
>  	printk(KERN_WARNING "%s: reset recovery - restoring bars\n", __func__);
>  
>  #define do_bar(off, which) \
> @@ -815,26 +817,15 @@ static inline int vfio_read_config_byte(struct vfio_dev *vdev,
>  static inline int vfio_write_config_byte(struct vfio_dev *vdev,
>  					int pos, u8 val)
>  {
> -	vdev->vconfig[pos] = val;
>  	return pci_user_write_config_byte(vdev->pdev, pos, val);
>  }
>  
>  /* handle virtualized fields in the basic config space */
> -static u8 vfio_virt_basic(struct vfio_dev *vdev, int write,
> -				u16 pos, u16 off, u8 val, u8 newval)
> +static void vfio_virt_basic(struct vfio_dev *vdev, int write, u16 pos, u8 *rbp)
>  {
> -	switch (off) {
> -	/*
> -	 * vendor and device are virt because they don't
> -	 * show up otherwise for sr-iov vfs
> -	 */
> -	case PCI_VENDOR_ID:
> -	case PCI_VENDOR_ID + 1:
> -	case PCI_DEVICE_ID:
> -	case PCI_DEVICE_ID + 1:
> -		/* read only */
> -		val = vdev->vconfig[pos];
> -		break;
> +	u8 val;
> +
> +	switch (pos) {
>  	case PCI_COMMAND:
>  		/*
>  		 * If the real mem or IO enable bits are zero
> @@ -842,100 +833,58 @@ static u8 vfio_virt_basic(struct vfio_dev *vdev, int write,
>  		 * Restore the real BARs before allowing those
>  		 * bits to re-enable
>  		 */
> +		val = vdev->vconfig[pos];
>  		if (vdev->pdev->is_virtfn)
>  			val |= PCI_COMMAND_MEMORY;
>  		if (write) {
> -			int upd = 0;
> -
> -			upd = (newval & PCI_COMMAND_MEMORY) >
> -			      (val & PCI_COMMAND_MEMORY);
> -			upd += (newval & PCI_COMMAND_IO) >
> -			       (val & PCI_COMMAND_IO);
> -			if (upd)
> -				vfio_bar_restore(vdev);
> -			vfio_write_config_byte(vdev, pos, newval);
> -		}
> -		break;
> -	case PCI_BASE_ADDRESS_0:
> -	case PCI_BASE_ADDRESS_0+1:
> -	case PCI_BASE_ADDRESS_0+2:
> -	case PCI_BASE_ADDRESS_0+3:
> -	case PCI_BASE_ADDRESS_1:
> -	case PCI_BASE_ADDRESS_1+1:
> -	case PCI_BASE_ADDRESS_1+2:
> -	case PCI_BASE_ADDRESS_1+3:
> -	case PCI_BASE_ADDRESS_2:
> -	case PCI_BASE_ADDRESS_2+1:
> -	case PCI_BASE_ADDRESS_2+2:
> -	case PCI_BASE_ADDRESS_2+3:
> -	case PCI_BASE_ADDRESS_3:
> -	case PCI_BASE_ADDRESS_3+1:
> -	case PCI_BASE_ADDRESS_3+2:
> -	case PCI_BASE_ADDRESS_3+3:
> -	case PCI_BASE_ADDRESS_4:
> -	case PCI_BASE_ADDRESS_4+1:
> -	case PCI_BASE_ADDRESS_4+2:
> -	case PCI_BASE_ADDRESS_4+3:
> -	case PCI_BASE_ADDRESS_5:
> -	case PCI_BASE_ADDRESS_5+1:
> -	case PCI_BASE_ADDRESS_5+2:
> -	case PCI_BASE_ADDRESS_5+3:
> -	case PCI_ROM_ADDRESS:
> -	case PCI_ROM_ADDRESS+1:
> -	case PCI_ROM_ADDRESS+2:
> -	case PCI_ROM_ADDRESS+3:
> -		if (write) {
> -			vdev->vconfig[pos] = newval;
> -			vdev->bardirty = 1;
> -		} else {
> -			if (vdev->bardirty)
> -				vfio_bar_fixup(vdev);
> -			val = vdev->vconfig[pos];
> +
> +			if (((val & PCI_COMMAND_MEMORY) >
> +				(*rbp & PCI_COMMAND_MEMORY)) ||
> +			    ((val & PCI_COMMAND_IO) >
> +				(*rbp & PCI_COMMAND_IO)))
> +					vfio_bar_restore(vdev);
> +			*rbp &= ~(PCI_COMMAND_MEMORY + PCI_COMMAND_IO);
> +			*rbp |= val & (PCI_COMMAND_MEMORY + PCI_COMMAND_IO);
>  		}
> +		vdev->vconfig[pos] = val;
>  		break;
> -	default:
> +	case PCI_BASE_ADDRESS_0 ... PCI_BASE_ADDRESS_5 + 3:
> +	case PCI_ROM_ADDRESS ... PCI_ROM_ADDRESS + 3:
>  		if (write)
> -			vdev->vconfig[pos] = newval;
> -		else
> -			val = vdev->vconfig[pos];
> +			vdev->bardirty = 1;
> +		else if (vdev->bardirty)
> +			vfio_bar_fixup(vdev);
>  		break;
>  	}
> -	return val;
>  }
>  
>  /*
>   * handle virtualized fields in msi capability
>   * easy, except for multiple-msi fields in flags byte
>   */
> -static u8 vfio_virt_msi(struct vfio_dev *vdev, int write,
> -				u16 pos, u16 off, u8 val, u8 newval)
> +static void vfio_virt_msi(struct vfio_dev *vdev, int write,
> +				u16 pos, u16 off, u8 *rbp)
>  {
> -	if (off == PCI_MSI_FLAGS) {
> -		u8 num;
> +	u8 val;
> +	u8 num;
>  
> +	val = vdev->vconfig[pos];
> +	if (off == PCI_MSI_FLAGS) {
>  		if (write) {
>  			if (!vdev->ev_msi)
> -				newval &= ~PCI_MSI_FLAGS_ENABLE;
> -			num = (newval & PCI_MSI_FLAGS_QSIZE) >> 4;
> +				val &= ~PCI_MSI_FLAGS_ENABLE;
> +			num = (val & PCI_MSI_FLAGS_QSIZE) >> 4;
>  			if (num > vdev->msi_qmax)
>  				num = vdev->msi_qmax;
> -			newval &= ~PCI_MSI_FLAGS_QSIZE;
> -			newval |= num << 4;
> -			vfio_write_config_byte(vdev, pos, newval);
> +			val &= ~PCI_MSI_FLAGS_QSIZE;
> +			val |= num << 4;
> +			*rbp = val;
>  		} else {
> -			if (vfio_read_config_byte(vdev, pos, &val) < 0)
> -				return 0;
>  			val &= ~PCI_MSI_FLAGS_QMASK;
>  			val |= vdev->msi_qmax << 1;
>  		}
> -		return val;
>  	}
> -
> -	if (write)
> -		vdev->vconfig[pos] = newval;
> -	else
> -		val = vdev->vconfig[pos];
> -	return val;
> +	vdev->vconfig[pos] = val;
>  }
>  
>  static int vfio_config_rwbyte(int write,
> @@ -950,6 +899,7 @@ static int vfio_config_rwbyte(int write,
>  	struct perm_bits *perm;
>  	u8 wr, virt;
>  	int ret;
> +	u8 realbits = 0;
>  
>  	cap = map[pos];
>  	if (cap == 0xFF) {	/* unknown region */
> @@ -989,7 +939,7 @@ static int vfio_config_rwbyte(int write,
>  	}
>  	if (write && !wr)		/* no writeable bits */
>  		return 0;
> -	if (!virt) {
> +	if (!virt) {			/* no virtual bits */
>  		if (write) {
>  			if (copy_from_user(&val, buf, 1))
>  				return -EFAULT;
> @@ -1018,54 +968,44 @@ static int vfio_config_rwbyte(int write,
>  		if (copy_from_user(&newval, buf, 1))
>  			return -EFAULT;
>  	}
> -	/*
> -	 * We get here if there are some virt bits
> -	 * handle remaining real bits, if any
> -	 */
> -	if (~virt) {
> -		u8 rbits = (~virt) & wr;
>  
> -		ret = vfio_read_config_byte(vdev, pos, &val);
> +	if (~virt) {	/* mix of real and virt bits */
> +		/* update vconfig with latest hw bits */
> +		ret = vfio_read_config_byte(vdev, pos, &realbits);
>  		if (ret < 0)
>  			return ret;
> -		if (write && rbits) {
> -			val &= ~rbits;
> -			val |= (newval & rbits);
> -			vfio_write_config_byte(vdev, pos, val);
> -		}
> +		vdev->vconfig[pos] =
> +			(vdev->vconfig[pos] & virt) | (realbits & ~virt);
>  	}
> +
> +	/* update vconfig with writeable bits */
> +	vdev->vconfig[pos] =
> +		(vdev->vconfig[pos] & ~wr) | (newval & wr);
> +
>  	/*
> -	 * Now handle entirely virtual fields
> +	 * Now massage virtual fields
>  	 */
>  	if (pos < PCI_CFG_SPACE_SIZE) {
>  		switch (cap) {
>  		case PCI_CAP_ID_BASIC:	/* virtualize BARs */
> -			val = vfio_virt_basic(vdev, write,
> -						pos, off, val, newval);
> +			vfio_virt_basic(vdev, write, pos, &realbits);
>  			break;
>  		case PCI_CAP_ID_MSI:	/* virtualize (parts of) MSI */
> -			val = vfio_virt_msi(vdev, write,
> -						pos, off, val, newval);
> -			break;
> -		default:
> -			if (write)
> -				vdev->vconfig[pos] = newval;
> -			else
> -				val = vdev->vconfig[pos];
> +			vfio_virt_msi(vdev, write, pos, off, &realbits);
>  			break;
>  		}
>  	} else {
>  		/* no virt fields yet in ecaps */
>  		switch (cap) {	/* extended capabilities */
>  		default:
> -			if (write)
> -				vdev->vconfig[pos] = newval;
> -			else
> -				val = vdev->vconfig[pos];
>  			break;
>  		}
>  	}
> -	if (!write && copy_to_user(buf, &val, 1))
> +	if (write && ~virt) {
> +		realbits = (realbits & virt) | (vdev->vconfig[pos] & ~virt);
> +		vfio_write_config_byte(vdev, pos, realbits);
> +	}
> +	if (!write && copy_to_user(buf, &vdev->vconfig[pos], 1))
>  		return -EFAULT;
>  	return 0;
>  }



--
To unsubscribe from this list: send the line "unsubscribe kvm" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html


[Index of Archives]     [KVM ARM]     [KVM ia64]     [KVM ppc]     [Virtualization Tools]     [Spice Development]     [Libvirt]     [Libvirt Users]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite Questions]     [Linux Kernel]     [Linux SCSI]     [XFree86]
  Powered by Linux