RE: [PATCH v2] storvsc: get rid of bounce buffer

From: KY Srinivasan
Date: Wed Sep 23 2015 - 10:39:15 EST




> -----Original Message-----
> From: Vitaly Kuznetsov [mailto:vkuznets@xxxxxxxxxx]
> Sent: Wednesday, September 23, 2015 5:59 AM
> To: linux-scsi@xxxxxxxxxxxxxxx
> Cc: linux-kernel@xxxxxxxxxxxxxxx; devel@xxxxxxxxxxxxxxxxxxxxxx; KY
> Srinivasan <kys@xxxxxxxxxxxxx>; Haiyang Zhang
> <haiyangz@xxxxxxxxxxxxx>; James E.J. Bottomley <JBottomley@xxxxxxxx>;
> Radim KrÄmÃÅ <rkrcmar@xxxxxxxxxx>; Christoph Hellwig
> <hch@xxxxxxxxxxxxx>
> Subject: [PATCH v2] storvsc: get rid of bounce buffer
>
> Storvsc driver needs to ensure there are no 'holes' in the presented
> sg list (all segments in the middle of the list need to be of PAGE_SIZE).
> When a hole is detected storvsc driver creates a 'bounce sgl' without
> holes and copies data over with copy_{to,from}_bounce_buffer() functions.
> Setting virt_boundary_mask to PAGE_SIZE - 1 guarantees we'll never see
> such holes so we can significantly simplify the driver. This is also
> supposed to bring us some performance improvement for certain workloads
> as we eliminate copying.
>
> Reported-by: Radim KrÄmÃÅ <rkrcmar@xxxxxxxxxx>
> Signed-off-by: Vitaly Kuznetsov <vkuznets@xxxxxxxxxx>
> ---
> Changes since v1:
> - This patch is a successor of 'storvsc: get rid of homegrown
> copy_{to,from}_bounce_buffer()'. Use virt_boundary instead to
> eliminate the need for bounce buffer completely [Christoph Hellwig].
> ---
> drivers/scsi/storvsc_drv.c | 286 +--------------------------------------------
> 1 file changed, 5 insertions(+), 281 deletions(-)
>
> diff --git a/drivers/scsi/storvsc_drv.c b/drivers/scsi/storvsc_drv.c
> index 40c43ae..eeade40 100644
> --- a/drivers/scsi/storvsc_drv.c
> +++ b/drivers/scsi/storvsc_drv.c
> @@ -393,9 +393,6 @@ static void storvsc_on_channel_callback(void
> *context);
> struct storvsc_cmd_request {
> struct scsi_cmnd *cmd;
>
> - unsigned int bounce_sgl_count;
> - struct scatterlist *bounce_sgl;
> -
> struct hv_device *device;
>
> /* Synchronize the request/response if needed */
> @@ -586,241 +583,6 @@ get_in_err:
>
> }
>
> -static void destroy_bounce_buffer(struct scatterlist *sgl,
> - unsigned int sg_count)
> -{
> - int i;
> - struct page *page_buf;
> -
> - for (i = 0; i < sg_count; i++) {
> - page_buf = sg_page((&sgl[i]));
> - if (page_buf != NULL)
> - __free_page(page_buf);
> - }
> -
> - kfree(sgl);
> -}
> -
> -static int do_bounce_buffer(struct scatterlist *sgl, unsigned int sg_count)
> -{
> - int i;
> -
> - /* No need to check */
> - if (sg_count < 2)
> - return -1;
> -
> - /* We have at least 2 sg entries */
> - for (i = 0; i < sg_count; i++) {
> - if (i == 0) {
> - /* make sure 1st one does not have hole */
> - if (sgl[i].offset + sgl[i].length != PAGE_SIZE)
> - return i;
> - } else if (i == sg_count - 1) {
> - /* make sure last one does not have hole */
> - if (sgl[i].offset != 0)
> - return i;
> - } else {
> - /* make sure no hole in the middle */
> - if (sgl[i].length != PAGE_SIZE || sgl[i].offset != 0)
> - return i;
> - }
> - }
> - return -1;
> -}
> -
> -static struct scatterlist *create_bounce_buffer(struct scatterlist *sgl,
> - unsigned int sg_count,
> - unsigned int len,
> - int write)
> -{
> - int i;
> - int num_pages;
> - struct scatterlist *bounce_sgl;
> - struct page *page_buf;
> - unsigned int buf_len = ((write == WRITE_TYPE) ? 0 : PAGE_SIZE);
> -
> - num_pages = ALIGN(len, PAGE_SIZE) >> PAGE_SHIFT;
> -
> - bounce_sgl = kcalloc(num_pages, sizeof(struct scatterlist),
> GFP_ATOMIC);
> - if (!bounce_sgl)
> - return NULL;
> -
> - sg_init_table(bounce_sgl, num_pages);
> - for (i = 0; i < num_pages; i++) {
> - page_buf = alloc_page(GFP_ATOMIC);
> - if (!page_buf)
> - goto cleanup;
> - sg_set_page(&bounce_sgl[i], page_buf, buf_len, 0);
> - }
> -
> - return bounce_sgl;
> -
> -cleanup:
> - destroy_bounce_buffer(bounce_sgl, num_pages);
> - return NULL;
> -}
> -
> -/* Assume the original sgl has enough room */
> -static unsigned int copy_from_bounce_buffer(struct scatterlist *orig_sgl,
> - struct scatterlist *bounce_sgl,
> - unsigned int orig_sgl_count,
> - unsigned int bounce_sgl_count)
> -{
> - int i;
> - int j = 0;
> - unsigned long src, dest;
> - unsigned int srclen, destlen, copylen;
> - unsigned int total_copied = 0;
> - unsigned long bounce_addr = 0;
> - unsigned long dest_addr = 0;
> - unsigned long flags;
> - struct scatterlist *cur_dest_sgl;
> - struct scatterlist *cur_src_sgl;
> -
> - local_irq_save(flags);
> - cur_dest_sgl = orig_sgl;
> - cur_src_sgl = bounce_sgl;
> - for (i = 0; i < orig_sgl_count; i++) {
> - dest_addr = (unsigned long)
> - kmap_atomic(sg_page(cur_dest_sgl)) +
> - cur_dest_sgl->offset;
> - dest = dest_addr;
> - destlen = cur_dest_sgl->length;
> -
> - if (bounce_addr == 0)
> - bounce_addr = (unsigned long)kmap_atomic(
> -
> sg_page(cur_src_sgl));
> -
> - while (destlen) {
> - src = bounce_addr + cur_src_sgl->offset;
> - srclen = cur_src_sgl->length - cur_src_sgl->offset;
> -
> - copylen = min(srclen, destlen);
> - memcpy((void *)dest, (void *)src, copylen);
> -
> - total_copied += copylen;
> - cur_src_sgl->offset += copylen;
> - destlen -= copylen;
> - dest += copylen;
> -
> - if (cur_src_sgl->offset == cur_src_sgl->length) {
> - /* full */
> - kunmap_atomic((void *)bounce_addr);
> - j++;
> -
> - /*
> - * It is possible that the number of elements
> - * in the bounce buffer may not be equal to
> - * the number of elements in the original
> - * scatter list. Handle this correctly.
> - */
> -
> - if (j == bounce_sgl_count) {
> - /*
> - * We are done; cleanup and return.
> - */
> - kunmap_atomic((void *)(dest_addr -
> - cur_dest_sgl->offset));
> - local_irq_restore(flags);
> - return total_copied;
> - }
> -
> - /* if we need to use another bounce buffer
> */
> - if (destlen || i != orig_sgl_count - 1) {
> - cur_src_sgl = sg_next(cur_src_sgl);
> - bounce_addr = (unsigned long)
> - kmap_atomic(
> -
> sg_page(cur_src_sgl));
> - }
> - } else if (destlen == 0 && i == orig_sgl_count - 1) {
> - /* unmap the last bounce that is < PAGE_SIZE
> */
> - kunmap_atomic((void *)bounce_addr);
> - }
> - }
> -
> - kunmap_atomic((void *)(dest_addr - cur_dest_sgl->offset));
> - cur_dest_sgl = sg_next(cur_dest_sgl);
> - }
> -
> - local_irq_restore(flags);
> -
> - return total_copied;
> -}
> -
> -/* Assume the bounce_sgl has enough room ie using the
> create_bounce_buffer() */
> -static unsigned int copy_to_bounce_buffer(struct scatterlist *orig_sgl,
> - struct scatterlist *bounce_sgl,
> - unsigned int orig_sgl_count)
> -{
> - int i;
> - int j = 0;
> - unsigned long src, dest;
> - unsigned int srclen, destlen, copylen;
> - unsigned int total_copied = 0;
> - unsigned long bounce_addr = 0;
> - unsigned long src_addr = 0;
> - unsigned long flags;
> - struct scatterlist *cur_src_sgl;
> - struct scatterlist *cur_dest_sgl;
> -
> - local_irq_save(flags);
> -
> - cur_src_sgl = orig_sgl;
> - cur_dest_sgl = bounce_sgl;
> -
> - for (i = 0; i < orig_sgl_count; i++) {
> - src_addr = (unsigned long)
> - kmap_atomic(sg_page(cur_src_sgl)) +
> - cur_src_sgl->offset;
> - src = src_addr;
> - srclen = cur_src_sgl->length;
> -
> - if (bounce_addr == 0)
> - bounce_addr = (unsigned long)
> -
> kmap_atomic(sg_page(cur_dest_sgl));
> -
> - while (srclen) {
> - /* assume bounce offset always == 0 */
> - dest = bounce_addr + cur_dest_sgl->length;
> - destlen = PAGE_SIZE - cur_dest_sgl->length;
> -
> - copylen = min(srclen, destlen);
> - memcpy((void *)dest, (void *)src, copylen);
> -
> - total_copied += copylen;
> - cur_dest_sgl->length += copylen;
> - srclen -= copylen;
> - src += copylen;
> -
> - if (cur_dest_sgl->length == PAGE_SIZE) {
> - /* full..move to next entry */
> - kunmap_atomic((void *)bounce_addr);
> - bounce_addr = 0;
> - j++;
> - }
> -
> - /* if we need to use another bounce buffer */
> - if (srclen && bounce_addr == 0) {
> - cur_dest_sgl = sg_next(cur_dest_sgl);
> - bounce_addr = (unsigned long)
> - kmap_atomic(
> - sg_page(cur_dest_sgl));
> - }
> -
> - }
> -
> - kunmap_atomic((void *)(src_addr - cur_src_sgl->offset));
> - cur_src_sgl = sg_next(cur_src_sgl);
> - }
> -
> - if (bounce_addr)
> - kunmap_atomic((void *)bounce_addr);
> -
> - local_irq_restore(flags);
> -
> - return total_copied;
> -}
> -
> static void handle_sc_creation(struct vmbus_channel *new_sc)
> {
> struct hv_device *device = new_sc->primary_channel->device_obj;
> @@ -1171,15 +933,6 @@ static void storvsc_command_completion(struct
> storvsc_cmd_request *cmd_request)
> host = stor_dev->host;
>
> vm_srb = &cmd_request->vstor_packet.vm_srb;
> - if (cmd_request->bounce_sgl_count) {
> - if (vm_srb->data_in == READ_TYPE)
> - copy_from_bounce_buffer(scsi_sglist(scmnd),
> - cmd_request->bounce_sgl,
> - scsi_sg_count(scmnd),
> - cmd_request->bounce_sgl_count);
> - destroy_bounce_buffer(cmd_request->bounce_sgl,
> - cmd_request->bounce_sgl_count);
> - }
>
> scmnd->result = vm_srb->scsi_status;
>
> @@ -1474,6 +1227,9 @@ static int storvsc_device_configure(struct
> scsi_device *sdevice)
>
> blk_queue_rq_timeout(sdevice->request_queue, (storvsc_timeout
> * HZ));
>
> + /* Ensure there are no gaps in presented sgls */
> + blk_queue_virt_boundary(sdevice->request_queue, PAGE_SIZE - 1);
> +
> sdevice->no_write_same = 1;
>
> /*
> @@ -1692,40 +1448,13 @@ static int storvsc_queuecommand(struct
> Scsi_Host *host, struct scsi_cmnd *scmnd)
> payload_sz = sizeof(cmd_request->mpb);
>
> if (sg_count) {
> - /* check if we need to bounce the sgl */
> - if (do_bounce_buffer(sgl, scsi_sg_count(scmnd)) != -1) {
> - cmd_request->bounce_sgl =
> - create_bounce_buffer(sgl, sg_count,
> - length,
> - vm_srb->data_in);
> - if (!cmd_request->bounce_sgl)
> - return SCSI_MLQUEUE_HOST_BUSY;
> -
> - cmd_request->bounce_sgl_count =
> - ALIGN(length, PAGE_SIZE) >> PAGE_SHIFT;
> -
> - if (vm_srb->data_in == WRITE_TYPE)
> - copy_to_bounce_buffer(sgl,
> - cmd_request->bounce_sgl,
> sg_count);
> -
> - sgl = cmd_request->bounce_sgl;
> - sg_count = cmd_request->bounce_sgl_count;
> - }
> -
> -
> if (sg_count > MAX_PAGE_BUFFER_COUNT) {
>
> payload_sz = (sg_count * sizeof(void *) +
> sizeof(struct vmbus_packet_mpb_array));
> payload = kmalloc(payload_sz, GFP_ATOMIC);
> - if (!payload) {
> - if (cmd_request->bounce_sgl_count)
> - destroy_bounce_buffer(
> - cmd_request->bounce_sgl,
> - cmd_request->bounce_sgl_count);
> -
> - return
> SCSI_MLQUEUE_DEVICE_BUSY;
> - }
> + if (!payload)
> + return SCSI_MLQUEUE_DEVICE_BUSY;
> }
>
> payload->range.len = length;
> @@ -1754,11 +1483,6 @@ static int storvsc_queuecommand(struct Scsi_Host
> *host, struct scsi_cmnd *scmnd)
>
> if (ret == -EAGAIN) {
> /* no more space */
> -
> - if (cmd_request->bounce_sgl_count)
> - destroy_bounce_buffer(cmd_request->bounce_sgl,
> - cmd_request->bounce_sgl_count);
> -
> return SCSI_MLQUEUE_DEVICE_BUSY;
> }
>
> --
> 2.4.3
Thanks Vitaly and Christoph. We will run this patch through our testing.

Regards,

K. Y