From: Jason Wang <jasowang@redhat.com>
To: Hawkins Jiawei <yin31149@gmail.com>
Cc: eperezma@redhat.com, 18801353760@163.com, qemu-devel@nongnu.org
Subject: Re: [PATCH v2 2/2] vdpa: send CVQ state load commands in parallel
Date: Wed, 17 May 2023 13:22:06 +0800 [thread overview]
Message-ID: <CACGkMEuj=HY0YWHoXcw+qBLm4ctfTgj3P5cfWbueVFrOP1B2uQ@mail.gmail.com> (raw)
In-Reply-To: <7d800315d04359d0bb91f61ec348eda1bdb972be.1683371965.git.yin31149@gmail.com>
On Sat, May 6, 2023 at 10:07 PM Hawkins Jiawei <yin31149@gmail.com> wrote:
>
> This patch introduces the vhost_vdpa_net_cvq_add() and
> refactors the vhost_vdpa_net_load*(), so that QEMU can
> send CVQ state load commands in parallel.
>
> To be more specific, this patch introduces vhost_vdpa_net_cvq_add()
> to add SVQ control commands to SVQ and kick the device,
> but does not poll the device used buffers. QEMU will not
> poll and check the device used buffers in vhost_vdpa_net_load()
> until all CVQ state load commands have been sent to the device.
>
> What's more, in order to avoid buffer overwriting caused by
> using `svq->cvq_cmd_out_buffer` and `svq->status` as the
> buffer for all CVQ state load commands when sending
> CVQ state load commands in parallel, this patch introduces
> `out_cursor` and `in_cursor` in vhost_vdpa_net_load(),
> pointing to the available buffer for in descriptor and
> out descriptor, so that different CVQ state load commands can
> use their unique buffer.
>
> Resolves: https://gitlab.com/qemu-project/qemu/-/issues/1578
> Signed-off-by: Hawkins Jiawei <yin31149@gmail.com>
> ---
> net/vhost-vdpa.c | 152 +++++++++++++++++++++++++++++++++++++----------
> 1 file changed, 120 insertions(+), 32 deletions(-)
>
> diff --git a/net/vhost-vdpa.c b/net/vhost-vdpa.c
> index 10804c7200..14e31ca5c5 100644
> --- a/net/vhost-vdpa.c
> +++ b/net/vhost-vdpa.c
> @@ -590,6 +590,44 @@ static void vhost_vdpa_net_cvq_stop(NetClientState *nc)
> vhost_vdpa_net_client_stop(nc);
> }
>
> +/**
> + * vhost_vdpa_net_cvq_add() adds SVQ control commands to SVQ,
> + * kicks the device but does not poll the device used buffers.
> + *
> + * Return the number of elements added to SVQ if success.
> + */
> +static int vhost_vdpa_net_cvq_add(VhostVDPAState *s,
> + void **out_cursor, size_t out_len,
Can we track things like cursors in e.g VhostVDPAState ?
> + virtio_net_ctrl_ack **in_cursor, size_t in_len)
> +{
> + /* Buffers for the device */
> + const struct iovec out = {
> + .iov_base = *out_cursor,
> + .iov_len = out_len,
> + };
> + const struct iovec in = {
> + .iov_base = *in_cursor,
> + .iov_len = sizeof(virtio_net_ctrl_ack),
> + };
> + VhostShadowVirtqueue *svq = g_ptr_array_index(s->vhost_vdpa.shadow_vqs, 0);
> + int r;
> +
> + r = vhost_svq_add(svq, &out, 1, &in, 1, NULL);
> + if (unlikely(r != 0)) {
> + if (unlikely(r == -ENOSPC)) {
> + qemu_log_mask(LOG_GUEST_ERROR, "%s: No space on device queue\n",
> + __func__);
> + }
> + return r;
> + }
> +
> + /* Update the cursor */
> + *out_cursor += out_len;
> + *in_cursor += 1;
> +
> + return 1;
> +}
> +
> /**
> * vhost_vdpa_net_cvq_add_and_wait() adds SVQ control commands to SVQ,
> * kicks the device and polls the device used buffers.
> @@ -628,69 +666,82 @@ static ssize_t vhost_vdpa_net_cvq_add_and_wait(VhostVDPAState *s,
> return vhost_svq_poll(svq);
> }
>
> -static ssize_t vhost_vdpa_net_load_cmd(VhostVDPAState *s, uint8_t class,
> - uint8_t cmd, const void *data,
> - size_t data_size)
> +
> +/**
> + * vhost_vdpa_net_load_cmd() restores the NIC state through SVQ.
> + *
> + * Return the number of elements added to SVQ if success.
> + */
> +static int vhost_vdpa_net_load_cmd(VhostVDPAState *s,
> + void **out_cursor, uint8_t class, uint8_t cmd,
> + const void *data, size_t data_size,
> + virtio_net_ctrl_ack **in_cursor)
> {
> const struct virtio_net_ctrl_hdr ctrl = {
> .class = class,
> .cmd = cmd,
> };
>
> - assert(data_size < vhost_vdpa_net_cvq_cmd_page_len() - sizeof(ctrl));
> + assert(sizeof(ctrl) < vhost_vdpa_net_cvq_cmd_page_len() -
> + (*out_cursor - s->cvq_cmd_out_buffer));
> + assert(data_size < vhost_vdpa_net_cvq_cmd_page_len() - sizeof(ctrl) -
> + (*out_cursor - s->cvq_cmd_out_buffer));
>
> - memcpy(s->cvq_cmd_out_buffer, &ctrl, sizeof(ctrl));
> - memcpy(s->cvq_cmd_out_buffer + sizeof(ctrl), data, data_size);
> + memcpy(*out_cursor, &ctrl, sizeof(ctrl));
> + memcpy(*out_cursor + sizeof(ctrl), data, data_size);
>
> - return vhost_vdpa_net_cvq_add_and_wait(s, sizeof(ctrl) + data_size,
> - sizeof(virtio_net_ctrl_ack));
> + return vhost_vdpa_net_cvq_add(s, out_cursor, sizeof(ctrl) + data_size,
> + in_cursor, sizeof(virtio_net_ctrl_ack));
> }
>
> -static int vhost_vdpa_net_load_mac(VhostVDPAState *s, const VirtIONet *n)
> +/**
> + * vhost_vdpa_net_load_mac() restores the NIC mac through SVQ.
> + *
> + * Return the number of elements added to SVQ if success.
> + */
> +static int vhost_vdpa_net_load_mac(VhostVDPAState *s, const VirtIONet *n,
> + void **out_cursor, virtio_net_ctrl_ack **in_cursor)
> {
> uint64_t features = n->parent_obj.guest_features;
> if (features & BIT_ULL(VIRTIO_NET_F_CTRL_MAC_ADDR)) {
> - ssize_t dev_written = vhost_vdpa_net_load_cmd(s, VIRTIO_NET_CTRL_MAC,
> - VIRTIO_NET_CTRL_MAC_ADDR_SET,
> - n->mac, sizeof(n->mac));
> - if (unlikely(dev_written < 0)) {
> - return dev_written;
> - }
> -
> - return *s->status != VIRTIO_NET_OK;
> + return vhost_vdpa_net_load_cmd(s, out_cursor, VIRTIO_NET_CTRL_MAC,
> + VIRTIO_NET_CTRL_MAC_ADDR_SET,
> + n->mac, sizeof(n->mac), in_cursor);
> }
>
> return 0;
> }
>
> -static int vhost_vdpa_net_load_mq(VhostVDPAState *s,
> - const VirtIONet *n)
> +/**
> + * vhost_vdpa_net_load_mac() restores the NIC mq state through SVQ.
> + *
> + * Return the number of elements added to SVQ if success.
> + */
> +static int vhost_vdpa_net_load_mq(VhostVDPAState *s, const VirtIONet *n,
> + void **out_cursor, virtio_net_ctrl_ack **in_cursor)
> {
> struct virtio_net_ctrl_mq mq;
> uint64_t features = n->parent_obj.guest_features;
> - ssize_t dev_written;
>
> if (!(features & BIT_ULL(VIRTIO_NET_F_MQ))) {
> return 0;
> }
>
> mq.virtqueue_pairs = cpu_to_le16(n->curr_queue_pairs);
> - dev_written = vhost_vdpa_net_load_cmd(s, VIRTIO_NET_CTRL_MQ,
> - VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET, &mq,
> - sizeof(mq));
> - if (unlikely(dev_written < 0)) {
> - return dev_written;
> - }
> -
> - return *s->status != VIRTIO_NET_OK;
> + return vhost_vdpa_net_load_cmd(s, out_cursor, VIRTIO_NET_CTRL_MQ,
> + VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET,
> + &mq, sizeof(mq), in_cursor);
> }
>
> static int vhost_vdpa_net_load(NetClientState *nc)
> {
> VhostVDPAState *s = DO_UPCAST(VhostVDPAState, nc, nc);
> + VhostShadowVirtqueue *svq;
> + void *out_cursor;
> + virtio_net_ctrl_ack *in_cursor;
> struct vhost_vdpa *v = &s->vhost_vdpa;
> const VirtIONet *n;
> - int r;
> + ssize_t cmds_in_flight = 0, dev_written, r;
>
> assert(nc->info->type == NET_CLIENT_DRIVER_VHOST_VDPA);
>
> @@ -699,14 +750,51 @@ static int vhost_vdpa_net_load(NetClientState *nc)
> }
>
> n = VIRTIO_NET(v->dev->vdev);
> - r = vhost_vdpa_net_load_mac(s, n);
> + out_cursor = s->cvq_cmd_out_buffer;
> + in_cursor = s->status;
> +
> + r = vhost_vdpa_net_load_mac(s, n, &out_cursor, &in_cursor);
> if (unlikely(r < 0))
> return r;
> }
> - r = vhost_vdpa_net_load_mq(s, n);
> - if (unlikely(r)) {
> + cmds_in_flight += r;
> +
> + r = vhost_vdpa_net_load_mq(s, n, &out_cursor, &in_cursor);
> + if (unlikely(r < 0)) {
> return r;
> }
> + cmds_in_flight += r;
> +
> + /* Poll for all used buffer from device */
> + svq = g_ptr_array_index(s->vhost_vdpa.shadow_vqs, 0);
> + while (cmds_in_flight > 0) {
> + /*
> + * We can poll here since we've had BQL from the time we sent the
> + * descriptor. Also, we need to take the answer before SVQ pulls
> + * by itself, when BQL is released
> + */
> + dev_written = vhost_svq_poll(svq);
I'd tweak vhost_svq_poll to accept cmds_in_flight.
Thanks
> +
> + if (unlikely(!dev_written)) {
> + /*
> + * vhost_svq_poll() return 0 when something wrong, such as
> + * QEMU waits for too long time or no available used buffer
> + * from device, and there is no need to continue polling
> + * in this case.
> + */
> + return -EINVAL;
> + }
> +
> + --cmds_in_flight;
> + }
> +
> + /* Check the buffers written by device */
> + for (virtio_net_ctrl_ack *status = s->status; status < in_cursor;
> + ++status) {
> + if (*status != VIRTIO_NET_OK) {
> + return -EINVAL;
> + }
> + }
>
> return 0;
> }
> --
> 2.25.1
>
next prev parent reply other threads:[~2023-05-17 5:23 UTC|newest]
Thread overview: 12+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-05-06 14:06 [PATCH v2 0/2] Send all the SVQ control commands in parallel Hawkins Jiawei
2023-05-06 14:06 ` [PATCH v2 1/2] vdpa: rename vhost_vdpa_net_cvq_add() Hawkins Jiawei
2023-05-17 4:12 ` Jason Wang
2023-05-17 15:11 ` Hawkins Jiawei
2023-05-06 14:06 ` [PATCH v2 2/2] vdpa: send CVQ state load commands in parallel Hawkins Jiawei
2023-05-17 5:22 ` Jason Wang [this message]
2023-05-17 8:21 ` Eugenio Perez Martin
2023-05-17 15:01 ` Hawkins Jiawei
2023-05-18 5:46 ` Jason Wang
2023-05-18 6:00 ` Eugenio Perez Martin
2023-05-18 6:12 ` Jason Wang
2023-05-18 6:54 ` Hawkins Jiawei
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to='CACGkMEuj=HY0YWHoXcw+qBLm4ctfTgj3P5cfWbueVFrOP1B2uQ@mail.gmail.com' \
--to=jasowang@redhat.com \
--cc=18801353760@163.com \
--cc=eperezma@redhat.com \
--cc=qemu-devel@nongnu.org \
--cc=yin31149@gmail.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).