From: Ming Lei <ming.lei@redhat.com>
To: Damien Le Moal <damien.lemoal@wdc.com>
Cc: linux-scsi@vger.kernel.org,
"Martin K . Petersen" <martin.petersen@oracle.com>,
linux-block@vger.kernel.org, Jens Axboe <axboe@kernel.dk>,
Christoph Hellwig <hch@lst.de>,
Bart Van Assche <bvanassche@acm.org>
Subject: Re: [PATCH V4 1/3] block: Allow mapping of vmalloc-ed buffers
Date: Thu, 27 Jun 2019 15:47:21 +0800 [thread overview]
Message-ID: <20190627074720.GB24671@ming.t460p> (raw)
In-Reply-To: <20190627024910.23987-2-damien.lemoal@wdc.com>
On Thu, Jun 27, 2019 at 11:49:08AM +0900, Damien Le Moal wrote:
> To allow the SCSI subsystem scsi_execute_req() function to issue
> requests using large buffers that are better allocated with vmalloc()
> rather than kmalloc(), modify bio_map_kern() and bio_copy_kern() to
> allow passing a buffer allocated with vmalloc(). To do so, detect
> vmalloc-ed buffers using is_vmalloc_addr(). For vmalloc-ed buffers,
> flush the buffer using flush_kernel_vmap_range(), use vmalloc_to_page()
> instead of virt_to_page() to obtain the pages of the buffer, and
> invalidate the buffer addresses with invalidate_kernel_vmap_range() on
> completion of read BIOs. This last point is executed using the function
> bio_invalidate_vmalloc_pages() which is defined only if the
> architecture defines ARCH_HAS_FLUSH_KERNEL_DCACHE_PAGE, that is, if the
> architecture actually needs the invalidation done.
>
> Fixes: 515ce6061312 ("scsi: sd_zbc: Fix sd_zbc_report_zones() buffer allocation")
> Fixes: e76239a3748c ("block: add a report_zones method")
> Cc: stable@vger.kernel.org
> Signed-off-by: Damien Le Moal <damien.lemoal@wdc.com>
> ---
> block/bio.c | 43 ++++++++++++++++++++++++++++++++++++++++++-
> 1 file changed, 42 insertions(+), 1 deletion(-)
>
> diff --git a/block/bio.c b/block/bio.c
> index ce797d73bb43..1c21d1e7f1b8 100644
> --- a/block/bio.c
> +++ b/block/bio.c
> @@ -16,6 +16,7 @@
> #include <linux/workqueue.h>
> #include <linux/cgroup.h>
> #include <linux/blk-cgroup.h>
> +#include <linux/highmem.h>
>
> #include <trace/events/block.h>
> #include "blk.h"
> @@ -1479,8 +1480,26 @@ void bio_unmap_user(struct bio *bio)
> bio_put(bio);
> }
>
> +#ifdef ARCH_HAS_FLUSH_KERNEL_DCACHE_PAGE
> +static void bio_invalidate_vmalloc_pages(struct bio *bio)
> +{
> + if (bio->bi_private) {
> + struct bvec_iter_all iter_all;
> + struct bio_vec *bvec;
> + unsigned long len = 0;
> +
> + bio_for_each_segment_all(bvec, bio, iter_all)
> + len += bvec->bv_len;
> + invalidate_kernel_vmap_range(bio->bi_private, len);
> + }
> +}
> +#else
> +static void bio_invalidate_vmalloc_pages(struct bio *bio) {}
> +#endif
> +
> static void bio_map_kern_endio(struct bio *bio)
> {
> + bio_invalidate_vmalloc_pages(bio);
> bio_put(bio);
> }
>
> @@ -1501,6 +1520,8 @@ struct bio *bio_map_kern(struct request_queue *q, void *data, unsigned int len,
> unsigned long end = (kaddr + len + PAGE_SIZE - 1) >> PAGE_SHIFT;
> unsigned long start = kaddr >> PAGE_SHIFT;
> const int nr_pages = end - start;
> + bool is_vmalloc = is_vmalloc_addr(data);
> + struct page *page;
> int offset, i;
> struct bio *bio;
>
> @@ -1508,6 +1529,12 @@ struct bio *bio_map_kern(struct request_queue *q, void *data, unsigned int len,
> if (!bio)
> return ERR_PTR(-ENOMEM);
>
> + if (is_vmalloc) {
> + flush_kernel_vmap_range(data, len);
> + if ((!op_is_write(bio_op(bio))))
> + bio->bi_private = data;
> + }
> +
> offset = offset_in_page(kaddr);
> for (i = 0; i < nr_pages; i++) {
> unsigned int bytes = PAGE_SIZE - offset;
> @@ -1518,7 +1545,11 @@ struct bio *bio_map_kern(struct request_queue *q, void *data, unsigned int len,
> if (bytes > len)
> bytes = len;
>
> - if (bio_add_pc_page(q, bio, virt_to_page(data), bytes,
> + if (!is_vmalloc)
> + page = virt_to_page(data);
> + else
> + page = vmalloc_to_page(data);
> + if (bio_add_pc_page(q, bio, page, bytes,
> offset) < bytes) {
> /* we don't support partial mappings */
> bio_put(bio);
> @@ -1531,6 +1562,7 @@ struct bio *bio_map_kern(struct request_queue *q, void *data, unsigned int len,
> }
>
> bio->bi_end_io = bio_map_kern_endio;
> +
> return bio;
> }
> EXPORT_SYMBOL(bio_map_kern);
> @@ -1543,6 +1575,7 @@ static void bio_copy_kern_endio(struct bio *bio)
>
> static void bio_copy_kern_endio_read(struct bio *bio)
> {
> + unsigned long len = 0;
> char *p = bio->bi_private;
> struct bio_vec *bvec;
> struct bvec_iter_all iter_all;
> @@ -1550,8 +1583,12 @@ static void bio_copy_kern_endio_read(struct bio *bio)
> bio_for_each_segment_all(bvec, bio, iter_all) {
> memcpy(p, page_address(bvec->bv_page), bvec->bv_len);
> p += bvec->bv_len;
> + len += bvec->bv_len;
> }
>
> + if (is_vmalloc_addr(bio->bi_private))
> + invalidate_kernel_vmap_range(bio->bi_private, len);
> +
> bio_copy_kern_endio(bio);
> }
>
> @@ -1572,6 +1609,7 @@ struct bio *bio_copy_kern(struct request_queue *q, void *data, unsigned int len,
> unsigned long kaddr = (unsigned long)data;
> unsigned long end = (kaddr + len + PAGE_SIZE - 1) >> PAGE_SHIFT;
> unsigned long start = kaddr >> PAGE_SHIFT;
> + bool is_vmalloc = is_vmalloc_addr(data);
> struct bio *bio;
> void *p = data;
> int nr_pages = 0;
> @@ -1587,6 +1625,9 @@ struct bio *bio_copy_kern(struct request_queue *q, void *data, unsigned int len,
> if (!bio)
> return ERR_PTR(-ENOMEM);
>
> + if (is_vmalloc)
> + flush_kernel_vmap_range(data, len);
> +
Are you sure that invalidate[|flush]_kernel_vmap_range is needed for
bio_copy_kern()? The vmalloc buffer isn't involved in IO, and is only
accessed by the CPU.
Thanks,
Ming
next prev parent reply other threads:[~2019-06-27 7:47 UTC|newest]
Thread overview: 12+ messages / expand[flat|nested] mbox.gz Atom feed top
2019-06-27 2:49 [PATCH V4 0/3] Fix zone revalidation memory allocation failures Damien Le Moal
2019-06-27 2:49 ` [PATCH V4 1/3] block: Allow mapping of vmalloc-ed buffers Damien Le Moal
2019-06-27 7:28 ` Christoph Hellwig
2019-06-27 8:14 ` Damien Le Moal
2019-06-27 8:25 ` Christoph Hellwig
2019-06-27 8:37 ` Damien Le Moal
2019-06-27 7:47 ` Ming Lei [this message]
2019-06-27 8:17 ` Damien Le Moal
2019-06-27 8:25 ` Christoph Hellwig
2019-06-27 8:36 ` Damien Le Moal
2019-06-27 2:49 ` [PATCH V4 2/3] sd_zbc: Fix report zones buffer allocation Damien Le Moal
2019-06-27 2:49 ` [PATCH V4 3/3] block: Limit zone array allocation size Damien Le Moal
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20190627074720.GB24671@ming.t460p \
--to=ming.lei@redhat.com \
--cc=axboe@kernel.dk \
--cc=bvanassche@acm.org \
--cc=damien.lemoal@wdc.com \
--cc=hch@lst.de \
--cc=linux-block@vger.kernel.org \
--cc=linux-scsi@vger.kernel.org \
--cc=martin.petersen@oracle.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox