Re: [PATCH 2/2] kvm tools: Submit multiple virtio-blk requests in parallel

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On 12/15/2011 08:15 PM, Sasha Levin wrote:
> When using AIO, submit all requests which exists in the vring in a single
> io_submit instead of one io_submit for each descriptor.
> 
> Benchmarks:
> 
> Short version: 15%+ increase in IOPS, small increase in BW.
> 
> Read IOPS:
> Before:
>   vda: ios=291792/0, merge=0/0, ticks=35229/0, in_queue=31025, util=61.30%

I guess you are reading the wrong IOPS number: 'ios' is the number
of I/Os performed by all groups, not the IOPS result. Look for 'iops' ;-)

So, here are the numbers without/with this patch.

(seq-read, seq-write, rand-read, rand-write)

Before:
  read : io=98304KB, bw=63015KB/s, iops=15753, runt=  1560msec
  write: io=98304KB, bw=56823KB/s, iops=14205, runt=  1730msec
  read : io=98304KB, bw=62139KB/s, iops=15534, runt=  1582msec
  write: io=98304KB, bw=53836KB/s, iops=13458, runt=  1826msec

After:
  read : io=98304KB, bw=63096KB/s, iops=15774, runt=  1558msec
  write: io=98304KB, bw=55823KB/s, iops=13955, runt=  1761msec
  read : io=98304KB, bw=59148KB/s, iops=14787, runt=  1662msec
  write: io=98304KB, bw=55072KB/s, iops=13768, runt=  1785msec

Submitting more I/O requests at one time is not supposed to increase the IOPS
or BW so dramatically.

I even tried submitting all read/write ops in one io_submit, which still
ended up with very little IOPS or BW improvement.

> 
> After:
>   vda: ios=333114/0, merge=0/0, ticks=47983/0, in_queue=46630, util=62.22%
> 
> Write IOPS:
> Before:
>   vda: ios=0/271716, merge=0/0, ticks=0/33367, in_queue=26531, util=59.96%
> 
> After:
>   vda: ios=0/327485, merge=0/0, ticks=0/23789, in_queue=22475, util=55.74%
> 
> Read BW:
> Before:
>    READ: io=7526.0MB, aggrb=1246.3MB/s, minb=1275.1MB/s, maxb=1275.1MB/s, mint=6040msec, maxt=6040msec
> After:
>    READ: io=7526.0MB, aggrb=1315.5MB/s, minb=1346.7MB/s, maxb=1346.7MB/s, mint=5723msec, maxt=5723msec
> 
> Write BW:
> Before:
>   WRITE: io=7526.0MB, aggrb=1110.2MB/s, minb=1136.9MB/s, maxb=1136.9MB/s, mint=6779msec, maxt=6779msec
> 
> After:
>   WRITE: io=7526.0MB, aggrb=1113.5MB/s, minb=1140.3MB/s, maxb=1140.3MB/s, mint=6759msec, maxt=6759msec
> 
> Signed-off-by: Sasha Levin <levinsasha928@xxxxxxxxx>
> ---
>  tools/kvm/disk/core.c              |    2 -
>  tools/kvm/disk/raw.c               |   38 +++++++++++++++++++++++++++++------
>  tools/kvm/include/kvm/disk-image.h |    8 +++++-
>  tools/kvm/util/read-write.c        |    8 +-----
>  tools/kvm/virtio/blk.c             |    3 ++
>  5 files changed, 42 insertions(+), 17 deletions(-)
> 
> diff --git a/tools/kvm/disk/core.c b/tools/kvm/disk/core.c
> index 4915efd..b18014e 100644
> --- a/tools/kvm/disk/core.c
> +++ b/tools/kvm/disk/core.c
> @@ -5,8 +5,6 @@
>  #include <sys/eventfd.h>
>  #include <sys/poll.h>
>  
> -#define AIO_MAX 32
> -
>  int debug_iodelay;
>  
>  #ifdef CONFIG_HAS_AIO
> diff --git a/tools/kvm/disk/raw.c b/tools/kvm/disk/raw.c
> index caa023c..1162fb7 100644
> --- a/tools/kvm/disk/raw.c
> +++ b/tools/kvm/disk/raw.c
> @@ -10,9 +10,9 @@ ssize_t raw_image__read_sector(struct disk_image *disk, u64 sector, const struct
>  	u64 offset = sector << SECTOR_SHIFT;
>  
>  #ifdef CONFIG_HAS_AIO
> -	struct iocb iocb;
> +	struct iocb *iocb = &disk->iocb[disk->count++];
>  
> -	return aio_preadv(disk->ctx, &iocb, disk->fd, iov, iovcount, offset,
> +	return aio_preadv(disk->ctx, iocb, disk->fd, iov, iovcount, offset,
>  				disk->evt, param);
>  #else
>  	return preadv_in_full(disk->fd, iov, iovcount, offset);
> @@ -25,9 +25,9 @@ ssize_t raw_image__write_sector(struct disk_image *disk, u64 sector, const struc
>  	u64 offset = sector << SECTOR_SHIFT;
>  
>  #ifdef CONFIG_HAS_AIO
> -	struct iocb iocb;
> +	struct iocb *iocb = &disk->iocb[disk->count++];
>  
> -	return aio_pwritev(disk->ctx, &iocb, disk->fd, iov, iovcount, offset,
> +	return aio_pwritev(disk->ctx, iocb, disk->fd, iov, iovcount, offset,
>  				disk->evt, param);
>  #else
>  	return pwritev_in_full(disk->fd, iov, iovcount, offset);
> @@ -79,19 +79,33 @@ int raw_image__close(struct disk_image *disk)
>  
>  	close(disk->evt);
>  
> -#ifdef CONFIG_HAS_VIRTIO
> +#ifdef CONFIG_HAS_AIO
>  	io_destroy(disk->ctx);
>  #endif
>  
>  	return ret;
>  }
>  
> +static int raw_image__aio_submit(struct disk_image *disk)
> +{
> +	int ret;
> +
> +	ret = io_submit(disk->ctx, disk->count, disk->iocb_ptrs);
> +	if (ret > 0)
> +		disk->count = 0;
> +
> +	return ret;
> +}
> +
>  /*
>   * multiple buffer based disk image operations
>   */
>  static struct disk_image_operations raw_image_regular_ops = {
>  	.read_sector	= raw_image__read_sector,
>  	.write_sector	= raw_image__write_sector,
> +#ifdef CONFIG_HAS_AIO
> +	.submit		= raw_image__aio_submit,
> +#endif
>  };
>  
>  struct disk_image_operations ro_ops = {
> @@ -120,8 +134,13 @@ struct disk_image *raw_image__probe(int fd, struct stat *st, bool readonly)
>  
>  			disk = disk_image__new(fd, st->st_size, &ro_ops_nowrite, DISK_IMAGE_REGULAR);
>  #ifdef CONFIG_HAS_AIO
> -			if (disk)
> +			if (disk) {
> +				int i;
> +
>  				disk->async = 1;
> +				for (i = 0; i < AIO_MAX; i++)
> +					disk->iocb_ptrs[i] = &disk->iocb[i];
> +			}
>  #endif
>  		}
>  
> @@ -132,8 +151,13 @@ struct disk_image *raw_image__probe(int fd, struct stat *st, bool readonly)
>  		 */
>  		disk = disk_image__new(fd, st->st_size, &raw_image_regular_ops, DISK_IMAGE_REGULAR);
>  #ifdef CONFIG_HAS_AIO
> -		if (disk)
> +		if (disk) {
> +			int i;
> +
>  			disk->async = 1;
> +			for (i = 0; i < AIO_MAX; i++)
> +				disk->iocb_ptrs[i] = &disk->iocb[i];
> +		}
>  #endif
>  		return disk;
>  	}
> diff --git a/tools/kvm/include/kvm/disk-image.h b/tools/kvm/include/kvm/disk-image.h
> index 56c08da..6eba950 100644
> --- a/tools/kvm/include/kvm/disk-image.h
> +++ b/tools/kvm/include/kvm/disk-image.h
> @@ -20,14 +20,14 @@
>  
>  #define SECTOR_SHIFT		9
>  #define SECTOR_SIZE		(1UL << SECTOR_SHIFT)
> +#define AIO_MAX			256
> +#define MAX_DISK_IMAGES         4
>  
>  enum {
>  	DISK_IMAGE_REGULAR,
>  	DISK_IMAGE_MMAP,
>  };
>  
> -#define MAX_DISK_IMAGES         4
> -
>  struct disk_image;
>  
>  struct disk_image_operations {
> @@ -37,6 +37,7 @@ struct disk_image_operations {
>  				int iovcount, void *param);
>  	int (*flush)(struct disk_image *disk);
>  	int (*close)(struct disk_image *disk);
> +	int (*submit)(struct disk_image *disk);
>  };
>  
>  struct disk_image {
> @@ -50,6 +51,9 @@ struct disk_image {
>  	int				evt;
>  #ifdef CONFIG_HAS_AIO
>  	io_context_t			ctx;
> +	struct iocb			iocb[AIO_MAX];
> +	struct iocb			*iocb_ptrs[AIO_MAX];
> +	u32				count;
>  #endif
>  };
>  
> diff --git a/tools/kvm/util/read-write.c b/tools/kvm/util/read-write.c
> index 55473ba..4ccd554 100644
> --- a/tools/kvm/util/read-write.c
> +++ b/tools/kvm/util/read-write.c
> @@ -321,24 +321,20 @@ ssize_t pwritev_in_full(int fd, const struct iovec *iov, int iovcnt, off_t offse
>  int aio_pwritev(io_context_t ctx, struct iocb *iocb, int fd, const struct iovec *iov, int iovcnt,
>  		off_t offset, int ev, void *param)
>  {
> -	struct iocb *ios[1] = { iocb };
> -
>  	io_prep_pwritev(iocb, fd, iov, iovcnt, offset);
>  	io_set_eventfd(iocb, ev);
>  	iocb->data = param;
>  
> -	return io_submit(ctx, 1, ios);
> +	return 0;
>  }
>  
>  int aio_preadv(io_context_t ctx, struct iocb *iocb, int fd, const struct iovec *iov, int iovcnt,
>  		off_t offset, int ev, void *param)
>  {
> -	struct iocb *ios[1] = { iocb };
> -
>  	io_prep_preadv(iocb, fd, iov, iovcnt, offset);
>  	io_set_eventfd(iocb, ev);
>  	iocb->data = param;
>  
> -	return io_submit(ctx, 1, ios);
> +	return 0;
>  }
>  #endif
> \ No newline at end of file
> diff --git a/tools/kvm/virtio/blk.c b/tools/kvm/virtio/blk.c
> index d1a0197..153b11b 100644
> --- a/tools/kvm/virtio/blk.c
> +++ b/tools/kvm/virtio/blk.c
> @@ -128,6 +128,9 @@ static void virtio_blk_do_io(struct kvm *kvm, struct virt_queue *vq, struct blk_
>  
>  		virtio_blk_do_io_request(kvm, req);
>  	}
> +
> +	if (bdev->disk->ops->submit)
> +		bdev->disk->ops->submit(bdev->disk);
>  }
>  
>  static void set_config(struct kvm *kvm, void *dev, u8 data, u32 offset)


-- 
Asias He
--
To unsubscribe from this list: send the line "unsubscribe kvm" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html


[Index of Archives]     [KVM ARM]     [KVM ia64]     [KVM ppc]     [Virtualization Tools]     [Spice Development]     [Libvirt]     [Libvirt Users]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite Questions]     [Linux Kernel]     [Linux SCSI]     [XFree86]
  Powered by Linux