From: Anthony Liguori <aliguori@us.ibm.com>
To: Alexey Kardashevskiy <aik@ozlabs.ru>, qemu-devel@nongnu.org
Cc: Alexander Graf <agraf@suse.de>,
qemu-ppc@nongnu.org, Paolo Bonzini <pbonzini@redhat.com>,
Paul Mackerras <paulus@samba.org>,
David Gibson <david@gibson.dropbear.id.au>
Subject: Re: [Qemu-devel] [PATCH 09/17] pseries: rework PAPR virtual SCSI
Date: Mon, 08 Jul 2013 13:42:36 -0500 [thread overview]
Message-ID: <87ppuszyeb.fsf@codemonkey.ws> (raw)
In-Reply-To: <1372315560-5478-10-git-send-email-aik@ozlabs.ru>
Alexey Kardashevskiy <aik@ozlabs.ru> writes:
> The patch reimplements handling of indirect requests in order to
> simplify upcoming live migration support.
> - all pointers (except SCSIRequest*) were replaces with integer
> indexes and offsets;
> - DMA'ed srp_direct_buf kept untouched (ie. BE format);
> - vscsi_fetch_desc() is added, now it is the only place where
> descriptors are fetched and byteswapped;
> - vscsi_req struct fields converted to migration-friendly types;
> - many dprintf()'s fixed.
>
> This also removed an unused field 'lun' from the spapr_vscsi device
> which is assigned, but never used. So, remove it.
>
> [David Gibson: removed unused 'lun']
> Signed-off-by: Alexey Kardashevskiy <aik@ozlabs.ru>
> Cc: David Gibson <david@gibson.dropbear.id.au>
> ---
> hw/scsi/spapr_vscsi.c | 224 +++++++++++++++++++++++++++++--------------------
> 1 file changed, 131 insertions(+), 93 deletions(-)
>
> diff --git a/hw/scsi/spapr_vscsi.c b/hw/scsi/spapr_vscsi.c
> index e8978bf..1e93102 100644
> --- a/hw/scsi/spapr_vscsi.c
> +++ b/hw/scsi/spapr_vscsi.c
> @@ -75,20 +75,19 @@ typedef struct vscsi_req {
> /* SCSI request tracking */
> SCSIRequest *sreq;
> uint32_t qtag; /* qemu tag != srp tag */
> - int lun;
> - int active;
> - long data_len;
> - int writing;
> - int senselen;
> + bool active;
> + uint32_t data_len;
> + bool writing;
> + uint32_t senselen;
> uint8_t sense[SCSI_SENSE_BUF_SIZE];
>
> /* RDMA related bits */
> uint8_t dma_fmt;
> - struct srp_direct_buf ext_desc;
> - struct srp_direct_buf *cur_desc;
> - struct srp_indirect_buf *ind_desc;
> - int local_desc;
> - int total_desc;
> + uint16_t local_desc;
> + uint16_t total_desc;
> + uint16_t cdb_offset;
> + uint16_t cur_desc_num;
> + uint16_t cur_desc_offset;
> } vscsi_req;
>
> #define TYPE_VIO_SPAPR_VSCSI_DEVICE "spapr-vscsi"
> @@ -264,93 +263,139 @@ static int vscsi_send_rsp(VSCSIState *s, vscsi_req *req,
> return 0;
> }
>
> -static inline void vscsi_swap_desc(struct srp_direct_buf *desc)
> +static inline struct srp_direct_buf vscsi_swap_desc(struct srp_direct_buf desc)
> {
> - desc->va = be64_to_cpu(desc->va);
> - desc->len = be32_to_cpu(desc->len);
> + desc.va = be64_to_cpu(desc.va);
> + desc.len = be32_to_cpu(desc.len);
> + return desc;
> +}
> +
> +static int vscsi_fetch_desc(VSCSIState *s, struct vscsi_req *req,
> + unsigned n, unsigned buf_offset,
> + struct srp_direct_buf *ret)
> +{
> + struct srp_cmd *cmd = &req->iu.srp.cmd;
> +
> + switch (req->dma_fmt) {
> + case SRP_NO_DATA_DESC: {
> + dprintf("VSCSI: no data descriptor\n");
> + return 0;
> + }
> + case SRP_DATA_DESC_DIRECT: {
> + *ret = *(struct srp_direct_buf *)(cmd->add_data +
> req->cdb_offset);
If you're reworking this code, you should remove these casts. It's not
safe to assume that cdb_offset is aligned properly. memcpy()'ing would
be much safer.
Regards,
Anthony Liguori
> + assert(req->cur_desc_num == 0);
> + dprintf("VSCSI: direct segment");
> + break;
> + }
> + case SRP_DATA_DESC_INDIRECT: {
> + struct srp_indirect_buf *tmp = (struct srp_indirect_buf *)
> + (cmd->add_data + req->cdb_offset);
> + if (n < req->local_desc) {
> + *ret = tmp->desc_list[n];
> + dprintf("VSCSI: indirect segment local tag=0x%x desc#%d/%d",
> + req->qtag, n, req->local_desc);
> +
> + } else if (n < req->total_desc) {
> + int rc;
> + struct srp_direct_buf tbl_desc = vscsi_swap_desc(tmp->table_desc);
> + unsigned desc_offset = (n - req->local_desc) *
> + sizeof(struct srp_direct_buf);
> +
> + if (desc_offset > tbl_desc.len) {
> + dprintf("VSCSI: #%d is ouf of range (%d bytes)\n",
> + n, desc_offset);
> + return -1;
> + }
> + rc = spapr_vio_dma_read(&s->vdev, tbl_desc.va + desc_offset,
> + ret, sizeof(struct srp_direct_buf));
> + if (rc) {
> + dprintf("VSCSI: spapr_vio_dma_read -> %d reading ext_desc\n",
> + rc);
> + return rc;
> + }
> + dprintf("VSCSI: indirect segment ext. tag=0x%x desc#%d/%d { va=%"PRIx64" len=%x }",
> + req->qtag, n, req->total_desc, tbl_desc.va, tbl_desc.len);
> + } else {
> + dprintf("VSCSI: Out of descriptors !\n");
> + return 0;
> + }
> + break;
> + }
> + default:
> + fprintf(stderr, "VSCSI: Unknown format %x\n", req->dma_fmt);
> + return -1;
> + }
> +
> + *ret = vscsi_swap_desc(*ret);
> + if (buf_offset > ret->len) {
> + dprintf(" offset=%x is out of a descriptor #%d boundary=%x\n",
> + buf_offset, req->cur_desc_num, ret->len);
> + return -1;
> + }
> + ret->va += buf_offset;
> + ret->len -= buf_offset;
> +
> + dprintf(" cur=%d offs=%x ret { va=%"PRIx64" len=%x }\n",
> + req->cur_desc_num, req->cur_desc_offset, ret->va, ret->len);
> +
> + return ret->len ? 1 : 0;
> }
>
> static int vscsi_srp_direct_data(VSCSIState *s, vscsi_req *req,
> uint8_t *buf, uint32_t len)
> {
> - struct srp_direct_buf *md = req->cur_desc;
> + struct srp_direct_buf md;
> uint32_t llen;
> int rc = 0;
>
> - dprintf("VSCSI: direct segment 0x%x bytes, va=0x%llx desc len=0x%x\n",
> - len, (unsigned long long)md->va, md->len);
> + rc = vscsi_fetch_desc(s, req, req->cur_desc_num, req->cur_desc_offset, &md);
> + if (rc < 0) {
> + return -1;
> + } else if (rc == 0) {
> + return 0;
> + }
>
> - llen = MIN(len, md->len);
> + llen = MIN(len, md.len);
> if (llen) {
> if (req->writing) { /* writing = to device = reading from memory */
> - rc = spapr_vio_dma_read(&s->vdev, md->va, buf, llen);
> + rc = spapr_vio_dma_read(&s->vdev, md.va, buf, llen);
> } else {
> - rc = spapr_vio_dma_write(&s->vdev, md->va, buf, llen);
> + rc = spapr_vio_dma_write(&s->vdev, md.va, buf, llen);
> }
> }
> - md->len -= llen;
> - md->va += llen;
>
> if (rc) {
> return -1;
> }
> + req->cur_desc_offset += llen;
> +
> return llen;
> }
>
> static int vscsi_srp_indirect_data(VSCSIState *s, vscsi_req *req,
> uint8_t *buf, uint32_t len)
> {
> - struct srp_direct_buf *td = &req->ind_desc->table_desc;
> - struct srp_direct_buf *md = req->cur_desc;
> + struct srp_direct_buf md;
> int rc = 0;
> uint32_t llen, total = 0;
>
> - dprintf("VSCSI: indirect segment 0x%x bytes, td va=0x%llx len=0x%x\n",
> - len, (unsigned long long)td->va, td->len);
> + dprintf("VSCSI: indirect segment 0x%x bytes\n", len);
>
> /* While we have data ... */
> while (len) {
> - /* If we have a descriptor but it's empty, go fetch a new one */
> - if (md && md->len == 0) {
> - /* More local available, use one */
> - if (req->local_desc) {
> - md = ++req->cur_desc;
> - --req->local_desc;
> - --req->total_desc;
> - td->va += sizeof(struct srp_direct_buf);
> - } else {
> - md = req->cur_desc = NULL;
> - }
> - }
> - /* No descriptor at hand, fetch one */
> - if (!md) {
> - if (!req->total_desc) {
> - dprintf("VSCSI: Out of descriptors !\n");
> - break;
> - }
> - md = req->cur_desc = &req->ext_desc;
> - dprintf("VSCSI: Reading desc from 0x%llx\n",
> - (unsigned long long)td->va);
> - rc = spapr_vio_dma_read(&s->vdev, td->va, md,
> - sizeof(struct srp_direct_buf));
> - if (rc) {
> - dprintf("VSCSI: spapr_vio_dma_read -> %d reading ext_desc\n",
> - rc);
> - break;
> - }
> - vscsi_swap_desc(md);
> - td->va += sizeof(struct srp_direct_buf);
> - --req->total_desc;
> + rc = vscsi_fetch_desc(s, req, req->cur_desc_num, req->cur_desc_offset, &md);
> + if (rc < 0) {
> + return -1;
> + } else if (rc == 0) {
> + break;
> }
> - dprintf("VSCSI: [desc va=0x%llx,len=0x%x] remaining=0x%x\n",
> - (unsigned long long)md->va, md->len, len);
>
> /* Perform transfer */
> - llen = MIN(len, md->len);
> + llen = MIN(len, md.len);
> if (req->writing) { /* writing = to device = reading from memory */
> - rc = spapr_vio_dma_read(&s->vdev, md->va, buf, llen);
> + rc = spapr_vio_dma_read(&s->vdev, md.va, buf, llen);
> } else {
> - rc = spapr_vio_dma_write(&s->vdev, md->va, buf, llen);
> + rc = spapr_vio_dma_write(&s->vdev, md.va, buf, llen);
> }
> if (rc) {
> dprintf("VSCSI: spapr_vio_dma_r/w(%d) -> %d\n", req->writing, rc);
> @@ -361,10 +406,18 @@ static int vscsi_srp_indirect_data(VSCSIState *s, vscsi_req *req,
>
> len -= llen;
> buf += llen;
> +
> total += llen;
> - md->va += llen;
> - md->len -= llen;
> +
> + /* Update current position in the current descriptor */
> + req->cur_desc_offset += llen;
> + if (md.len == llen) {
> + /* Go to the next descriptor if the current one finished */
> + ++req->cur_desc_num;
> + req->cur_desc_offset = 0;
> + }
> }
> +
> return rc ? -1 : total;
> }
>
> @@ -412,14 +465,13 @@ static int data_out_desc_size(struct srp_cmd *cmd)
> static int vscsi_preprocess_desc(vscsi_req *req)
> {
> struct srp_cmd *cmd = &req->iu.srp.cmd;
> - int offset, i;
>
> - offset = cmd->add_cdb_len & ~3;
> + req->cdb_offset = cmd->add_cdb_len & ~3;
>
> if (req->writing) {
> req->dma_fmt = cmd->buf_fmt >> 4;
> } else {
> - offset += data_out_desc_size(cmd);
> + req->cdb_offset += data_out_desc_size(cmd);
> req->dma_fmt = cmd->buf_fmt & ((1U << 4) - 1);
> }
>
> @@ -427,31 +479,18 @@ static int vscsi_preprocess_desc(vscsi_req *req)
> case SRP_NO_DATA_DESC:
> break;
> case SRP_DATA_DESC_DIRECT:
> - req->cur_desc = (struct srp_direct_buf *)(cmd->add_data + offset);
> req->total_desc = req->local_desc = 1;
> - vscsi_swap_desc(req->cur_desc);
> - dprintf("VSCSI: using direct RDMA %s, 0x%x bytes MD: 0x%llx\n",
> - req->writing ? "write" : "read",
> - req->cur_desc->len, (unsigned long long)req->cur_desc->va);
> break;
> - case SRP_DATA_DESC_INDIRECT:
> - req->ind_desc = (struct srp_indirect_buf *)(cmd->add_data + offset);
> - vscsi_swap_desc(&req->ind_desc->table_desc);
> - req->total_desc = req->ind_desc->table_desc.len /
> - sizeof(struct srp_direct_buf);
> + case SRP_DATA_DESC_INDIRECT: {
> + struct srp_indirect_buf *ind_tmp = (struct srp_indirect_buf *)
> + (cmd->add_data + req->cdb_offset);
> +
> + req->total_desc = be32_to_cpu(ind_tmp->table_desc.len) /
> + sizeof(struct srp_direct_buf);
> req->local_desc = req->writing ? cmd->data_out_desc_cnt :
> - cmd->data_in_desc_cnt;
> - for (i = 0; i < req->local_desc; i++) {
> - vscsi_swap_desc(&req->ind_desc->desc_list[i]);
> - }
> - req->cur_desc = req->local_desc ? &req->ind_desc->desc_list[0] : NULL;
> - dprintf("VSCSI: using indirect RDMA %s, 0x%x bytes %d descs "
> - "(%d local) VA: 0x%llx\n",
> - req->writing ? "read" : "write",
> - be32_to_cpu(req->ind_desc->len),
> - req->total_desc, req->local_desc,
> - (unsigned long long)req->ind_desc->table_desc.va);
> + cmd->data_in_desc_cnt;
> break;
> + }
> default:
> fprintf(stderr,
> "vscsi_preprocess_desc: Unknown format %x\n", req->dma_fmt);
> @@ -499,8 +538,8 @@ static void vscsi_command_complete(SCSIRequest *sreq, uint32_t status, size_t re
> vscsi_req *req = sreq->hba_private;
> int32_t res_in = 0, res_out = 0;
>
> - dprintf("VSCSI: SCSI cmd complete, r=0x%x tag=0x%x status=0x%x, req=%p\n",
> - reason, sreq->tag, status, req);
> + dprintf("VSCSI: SCSI cmd complete, tag=0x%x status=0x%x, req=%p\n",
> + sreq->tag, status, req);
> if (req == NULL) {
> fprintf(stderr, "VSCSI: Can't find request for tag 0x%x\n", sreq->tag);
> return;
> @@ -509,7 +548,7 @@ static void vscsi_command_complete(SCSIRequest *sreq, uint32_t status, size_t re
> if (status == CHECK_CONDITION) {
> req->senselen = scsi_req_get_sense(req->sreq, req->sense,
> sizeof(req->sense));
> - dprintf("VSCSI: Sense data, %d bytes:\n", len);
> + dprintf("VSCSI: Sense data, %d bytes:\n", req->senselen);
> dprintf(" %02x %02x %02x %02x %02x %02x %02x %02x\n",
> req->sense[0], req->sense[1], req->sense[2], req->sense[3],
> req->sense[4], req->sense[5], req->sense[6], req->sense[7]);
> @@ -621,12 +660,11 @@ static int vscsi_queue_cmd(VSCSIState *s, vscsi_req *req)
> } return 1;
> }
>
> - req->lun = lun;
> req->sreq = scsi_req_new(sdev, req->qtag, lun, srp->cmd.cdb, req);
> n = scsi_req_enqueue(req->sreq);
>
> - dprintf("VSCSI: Queued command tag 0x%x CMD 0x%x ID %d LUN %d ret: %d\n",
> - req->qtag, srp->cmd.cdb[0], id, lun, n);
> + dprintf("VSCSI: Queued command tag 0x%x CMD 0x%x LUN %d ret: %d\n",
> + req->qtag, srp->cmd.cdb[0], lun, n);
>
> if (n) {
> /* Transfer direction must be set before preprocessing the
> --
> 1.7.10.4
next prev parent reply other threads:[~2013-07-08 18:56 UTC|newest]
Thread overview: 92+ messages / expand[flat|nested] mbox.gz Atom feed top
2013-06-27 6:45 [Qemu-devel] [PATCH 00/17 v3] spapr: migration, pci, msi, power8 Alexey Kardashevskiy
2013-06-27 6:45 ` [Qemu-devel] [PATCH 01/17] pseries: move interrupt controllers to hw/intc/ Alexey Kardashevskiy
2013-07-02 20:54 ` Andreas Färber
2013-07-08 18:15 ` Anthony Liguori
2013-07-08 18:34 ` Alexander Graf
2013-06-27 6:45 ` [Qemu-devel] [PATCH 02/17] pseries: rework XICS Alexey Kardashevskiy
2013-06-27 11:47 ` David Gibson
2013-06-27 12:17 ` Alexey Kardashevskiy
2013-07-02 0:06 ` David Gibson
2013-07-02 0:21 ` Alexander Graf
2013-07-02 2:08 ` Alexey Kardashevskiy
2013-07-08 18:24 ` Anthony Liguori
2013-07-08 18:22 ` Anthony Liguori
2013-07-09 3:40 ` Alexey Kardashevskiy
2013-07-09 4:48 ` Benjamin Herrenschmidt
2013-07-09 13:58 ` Anthony Liguori
2013-07-10 3:06 ` Alexey Kardashevskiy
2013-07-10 3:26 ` Benjamin Herrenschmidt
2013-07-10 12:09 ` Anthony Liguori
2013-06-27 6:45 ` [Qemu-devel] [PATCH 03/17] savevm: Implement VMS_DIVIDE flag Alexey Kardashevskiy
2013-07-08 18:27 ` Anthony Liguori
2013-07-08 23:57 ` David Gibson
2013-07-09 14:06 ` Anthony Liguori
2013-07-09 14:38 ` David Gibson
2013-06-27 6:45 ` [Qemu-devel] [PATCH 04/17] target-ppc: Convert ppc cpu savevm to VMStateDescription Alexey Kardashevskiy
2013-07-08 18:29 ` Anthony Liguori
2013-07-09 5:14 ` Alexey Kardashevskiy
2013-07-09 14:08 ` Anthony Liguori
2013-07-09 15:11 ` David Gibson
2013-07-10 3:31 ` Benjamin Herrenschmidt
2013-07-10 7:49 ` David Gibson
2013-07-15 13:24 ` Paolo Bonzini
2013-06-27 6:45 ` [Qemu-devel] [PATCH 05/17] pseries: savevm support for XICS interrupt controller Alexey Kardashevskiy
2013-07-08 18:31 ` Anthony Liguori
2013-07-09 0:06 ` Alexey Kardashevskiy
2013-07-09 0:49 ` Anthony Liguori
2013-07-09 0:59 ` Alexey Kardashevskiy
2013-07-09 1:25 ` Anthony Liguori
2013-07-09 3:37 ` Alexey Kardashevskiy
2013-07-15 13:05 ` Paolo Bonzini
2013-07-15 13:13 ` Alexey Kardashevskiy
2013-07-15 13:17 ` Paolo Bonzini
2013-07-09 7:17 ` David Gibson
2013-07-15 13:10 ` Paolo Bonzini
2013-06-27 6:45 ` [Qemu-devel] [PATCH 06/17] pseries: savevm support for VIO devices Alexey Kardashevskiy
2013-07-08 18:35 ` Anthony Liguori
2013-06-27 6:45 ` [Qemu-devel] [PATCH 07/17] pseries: savevm support for PAPR VIO logical lan Alexey Kardashevskiy
2013-07-08 18:36 ` Anthony Liguori
2013-06-27 6:45 ` [Qemu-devel] [PATCH 08/17] pseries: savevm support for PAPR TCE tables Alexey Kardashevskiy
2013-07-08 18:39 ` Anthony Liguori
2013-07-08 21:45 ` Benjamin Herrenschmidt
2013-07-08 22:15 ` Anthony Liguori
2013-07-08 22:41 ` Benjamin Herrenschmidt
2013-07-09 7:20 ` David Gibson
2013-07-09 15:22 ` Anthony Liguori
2013-07-10 7:42 ` David Gibson
2013-07-09 16:26 ` Anthony Liguori
2013-07-15 13:26 ` Paolo Bonzini
2013-07-15 15:06 ` Anthony Liguori
2013-06-27 6:45 ` [Qemu-devel] [PATCH 09/17] pseries: rework PAPR virtual SCSI Alexey Kardashevskiy
2013-07-08 18:42 ` Anthony Liguori [this message]
2013-07-15 13:11 ` Paolo Bonzini
2013-06-27 6:45 ` [Qemu-devel] [PATCH 10/17] pseries: savevm support for " Alexey Kardashevskiy
2013-06-27 6:45 ` [Qemu-devel] [PATCH 11/17] pseries: savevm support for pseries machine Alexey Kardashevskiy
2013-07-08 18:45 ` Anthony Liguori
2013-07-08 18:50 ` Alexander Graf
2013-07-08 19:01 ` Anthony Liguori
2013-07-08 21:48 ` Benjamin Herrenschmidt
2013-07-08 22:23 ` Anthony Liguori
2013-06-27 6:45 ` [Qemu-devel] [PATCH 12/17] pseries: savevm support for PCI host bridge Alexey Kardashevskiy
2013-07-08 18:45 ` Anthony Liguori
2013-06-27 6:45 ` [Qemu-devel] [PATCH 13/17] target-ppc: Add helper for KVM_PPC_RTAS_DEFINE_TOKEN Alexey Kardashevskiy
2013-06-27 6:45 ` [Qemu-devel] [PATCH 14/17] pseries: Support for in-kernel XICS interrupt controller Alexey Kardashevskiy
2013-07-08 18:50 ` Anthony Liguori
2013-07-09 3:21 ` Alexey Kardashevskiy
2013-07-09 7:21 ` David Gibson
2013-07-10 3:24 ` Benjamin Herrenschmidt
2013-07-10 7:48 ` David Gibson
2013-06-27 6:45 ` [Qemu-devel] [PATCH 15/17] pseries: savevm support with KVM Alexey Kardashevskiy
2013-06-27 6:45 ` [Qemu-devel] [PATCH 16/17] ppc64: Enable QEMU to run on POWER 8 DD1 chip Alexey Kardashevskiy
2013-07-04 5:54 ` Andreas Färber
2013-07-04 6:26 ` [Qemu-devel] [Qemu-ppc] " Benjamin Herrenschmidt
2013-07-04 6:42 ` [Qemu-devel] " Prerna Saxena
2013-07-10 11:19 ` Alexander Graf
2013-06-27 6:46 ` [Qemu-devel] [PATCH 17/17] spapr-pci: rework MSI/MSIX Alexey Kardashevskiy
2013-07-04 2:31 ` [Qemu-devel] [PATCH 00/17 v3] spapr: migration, pci, msi, power8 Alexey Kardashevskiy
2013-07-04 2:40 ` Anthony Liguori
2013-07-04 2:48 ` Alexey Kardashevskiy
2013-07-08 18:01 ` Anthony Liguori
2013-07-09 6:37 ` Alexey Kardashevskiy
2013-07-09 15:26 ` Anthony Liguori
2013-07-09 14:04 ` Anthony Liguori
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=87ppuszyeb.fsf@codemonkey.ws \
--to=aliguori@us.ibm.com \
--cc=agraf@suse.de \
--cc=aik@ozlabs.ru \
--cc=david@gibson.dropbear.id.au \
--cc=paulus@samba.org \
--cc=pbonzini@redhat.com \
--cc=qemu-devel@nongnu.org \
--cc=qemu-ppc@nongnu.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).