From: Stefan Hajnoczi <stefanha@redhat.com>
To: qemu-devel@nongnu.org
Cc: Kevin Wolf <kwolf@redhat.com>,
Peter Maydell <peter.maydell@linaro.org>,
qemu-block@nongnu.org, Peter Lieven <pl@kamp.de>,
Julia Suvorova <jusual@redhat.com>,
Markus Armbruster <armbru@redhat.com>,
Max Reitz <mreitz@redhat.com>,
Stefan Hajnoczi <stefanha@redhat.com>,
Paolo Bonzini <pbonzini@redhat.com>, Fam Zheng <fam@euphon.net>,
Aarushi Mehta <mehta.aaru20@gmail.com>
Subject: [PULL 03/18] block/io: take bs->reqs_lock in bdrv_mark_request_serialising
Date: Thu, 30 Jan 2020 21:30:59 +0000 [thread overview]
Message-ID: <20200130213114.325157-4-stefanha@redhat.com> (raw)
In-Reply-To: <20200130213114.325157-1-stefanha@redhat.com>
From: Paolo Bonzini <pbonzini@redhat.com>
bdrv_mark_request_serialising is writing the overlap_offset and
overlap_bytes fields of BdrvTrackedRequest. Take bs->reqs_lock
for the whole duration of it, and not just when waiting for
serialising requests, so that tracked_request_overlaps does not
look at a half-updated request.
The new code does not unlock/relock around retries. Doing so is unnecessary
because a retry is always preceded by a CoQueue wait, which already
releases and reacquires bs->reqs_lock.
Reported-by: Peter Lieven <pl@kamp.de>
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
Message-id: 1578495356-46219-4-git-send-email-pbonzini@redhat.com
Message-Id: <1578495356-46219-4-git-send-email-pbonzini@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
---
block/io.c | 112 ++++++++++++++++++++++++++++++-----------------------
1 file changed, 63 insertions(+), 49 deletions(-)
diff --git a/block/io.c b/block/io.c
index c466df8ed5..1eb2b2bddc 100644
--- a/block/io.c
+++ b/block/io.c
@@ -41,7 +41,6 @@
#define MAX_BOUNCE_BUFFER (32768 << BDRV_SECTOR_BITS)
static void bdrv_parent_cb_resize(BlockDriverState *bs);
-static bool coroutine_fn bdrv_wait_serialising_requests(BdrvTrackedRequest *self);
static int coroutine_fn bdrv_co_do_pwrite_zeroes(BlockDriverState *bs,
int64_t offset, int bytes, BdrvRequestFlags flags);
@@ -716,12 +715,69 @@ static void tracked_request_begin(BdrvTrackedRequest *req,
qemu_co_mutex_unlock(&bs->reqs_lock);
}
+static bool tracked_request_overlaps(BdrvTrackedRequest *req,
+ int64_t offset, uint64_t bytes)
+{
+ /* aaaa bbbb */
+ if (offset >= req->overlap_offset + req->overlap_bytes) {
+ return false;
+ }
+ /* bbbb aaaa */
+ if (req->overlap_offset >= offset + bytes) {
+ return false;
+ }
+ return true;
+}
+
+static bool coroutine_fn
+bdrv_wait_serialising_requests_locked(BlockDriverState *bs,
+ BdrvTrackedRequest *self)
+{
+ BdrvTrackedRequest *req;
+ bool retry;
+ bool waited = false;
+
+ do {
+ retry = false;
+ QLIST_FOREACH(req, &bs->tracked_requests, list) {
+ if (req == self || (!req->serialising && !self->serialising)) {
+ continue;
+ }
+ if (tracked_request_overlaps(req, self->overlap_offset,
+ self->overlap_bytes))
+ {
+ /* Hitting this means there was a reentrant request, for
+ * example, a block driver issuing nested requests. This must
+ * never happen since it means deadlock.
+ */
+ assert(qemu_coroutine_self() != req->co);
+
+ /* If the request is already (indirectly) waiting for us, or
+ * will wait for us as soon as it wakes up, then just go on
+ * (instead of producing a deadlock in the former case). */
+ if (!req->waiting_for) {
+ self->waiting_for = req;
+ qemu_co_queue_wait(&req->wait_queue, &bs->reqs_lock);
+ self->waiting_for = NULL;
+ retry = true;
+ waited = true;
+ break;
+ }
+ }
+ }
+ } while (retry);
+ return waited;
+}
+
bool bdrv_mark_request_serialising(BdrvTrackedRequest *req, uint64_t align)
{
+ BlockDriverState *bs = req->bs;
int64_t overlap_offset = req->offset & ~(align - 1);
uint64_t overlap_bytes = ROUND_UP(req->offset + req->bytes, align)
- overlap_offset;
+ bool waited;
+ qemu_co_mutex_lock(&bs->reqs_lock);
if (!req->serialising) {
atomic_inc(&req->bs->serialising_in_flight);
req->serialising = true;
@@ -729,7 +785,9 @@ bool bdrv_mark_request_serialising(BdrvTrackedRequest *req, uint64_t align)
req->overlap_offset = MIN(req->overlap_offset, overlap_offset);
req->overlap_bytes = MAX(req->overlap_bytes, overlap_bytes);
- return bdrv_wait_serialising_requests(req);
+ waited = bdrv_wait_serialising_requests_locked(bs, req);
+ qemu_co_mutex_unlock(&bs->reqs_lock);
+ return waited;
}
/**
@@ -783,20 +841,6 @@ static int bdrv_get_cluster_size(BlockDriverState *bs)
}
}
-static bool tracked_request_overlaps(BdrvTrackedRequest *req,
- int64_t offset, uint64_t bytes)
-{
- /* aaaa bbbb */
- if (offset >= req->overlap_offset + req->overlap_bytes) {
- return false;
- }
- /* bbbb aaaa */
- if (req->overlap_offset >= offset + bytes) {
- return false;
- }
- return true;
-}
-
void bdrv_inc_in_flight(BlockDriverState *bs)
{
atomic_inc(&bs->in_flight);
@@ -816,45 +860,15 @@ void bdrv_dec_in_flight(BlockDriverState *bs)
static bool coroutine_fn bdrv_wait_serialising_requests(BdrvTrackedRequest *self)
{
BlockDriverState *bs = self->bs;
- BdrvTrackedRequest *req;
- bool retry;
bool waited = false;
if (!atomic_read(&bs->serialising_in_flight)) {
return false;
}
- do {
- retry = false;
- qemu_co_mutex_lock(&bs->reqs_lock);
- QLIST_FOREACH(req, &bs->tracked_requests, list) {
- if (req == self || (!req->serialising && !self->serialising)) {
- continue;
- }
- if (tracked_request_overlaps(req, self->overlap_offset,
- self->overlap_bytes))
- {
- /* Hitting this means there was a reentrant request, for
- * example, a block driver issuing nested requests. This must
- * never happen since it means deadlock.
- */
- assert(qemu_coroutine_self() != req->co);
-
- /* If the request is already (indirectly) waiting for us, or
- * will wait for us as soon as it wakes up, then just go on
- * (instead of producing a deadlock in the former case). */
- if (!req->waiting_for) {
- self->waiting_for = req;
- qemu_co_queue_wait(&req->wait_queue, &bs->reqs_lock);
- self->waiting_for = NULL;
- retry = true;
- waited = true;
- break;
- }
- }
- }
- qemu_co_mutex_unlock(&bs->reqs_lock);
- } while (retry);
+ qemu_co_mutex_lock(&bs->reqs_lock);
+ waited = bdrv_wait_serialising_requests_locked(bs, self);
+ qemu_co_mutex_unlock(&bs->reqs_lock);
return waited;
}
--
2.24.1
next prev parent reply other threads:[~2020-01-30 21:33 UTC|newest]
Thread overview: 22+ messages / expand[flat|nested] mbox.gz Atom feed top
2020-01-30 21:30 [PULL 00/18] Block patches Stefan Hajnoczi
2020-01-30 21:30 ` [PULL 01/18] block: eliminate BDRV_REQ_NO_SERIALISING Stefan Hajnoczi
2020-01-30 21:30 ` [PULL 02/18] block/io: wait for serialising requests when a request becomes serialising Stefan Hajnoczi
2020-01-30 21:30 ` Stefan Hajnoczi [this message]
2020-01-30 21:31 ` [PULL 04/18] configure: permit use of io_uring Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 05/18] qapi/block-core: add option for io_uring Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 06/18] block/block: add BDRV flag " Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 07/18] block/io_uring: implements interfaces " Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 08/18] stubs: add stubs for io_uring interface Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 09/18] util/async: add aio interfaces for io_uring Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 10/18] blockdev: adds bdrv_parse_aio to use io_uring Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 11/18] block/file-posix.c: extend " Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 12/18] block: add trace events for io_uring Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 13/18] block/io_uring: adds userspace completion polling Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 14/18] qemu-io: adds option to use aio engine Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 15/18] qemu-img: adds option to use aio engine for benchmarking Stefan Hajnoczi
2020-02-03 10:55 ` Peter Maydell
2020-02-05 15:55 ` Julia Suvorova
2020-01-30 21:31 ` [PULL 16/18] qemu-nbd: adds option for aio engines Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 17/18] tests/qemu-iotests: enable testing with aio options Stefan Hajnoczi
2020-01-30 21:31 ` [PULL 18/18] tests/qemu-iotests: use AIOMODE with various tests Stefan Hajnoczi
2020-01-31 11:39 ` [PULL 00/18] Block patches Peter Maydell
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20200130213114.325157-4-stefanha@redhat.com \
--to=stefanha@redhat.com \
--cc=armbru@redhat.com \
--cc=fam@euphon.net \
--cc=jusual@redhat.com \
--cc=kwolf@redhat.com \
--cc=mehta.aaru20@gmail.com \
--cc=mreitz@redhat.com \
--cc=pbonzini@redhat.com \
--cc=peter.maydell@linaro.org \
--cc=pl@kamp.de \
--cc=qemu-block@nongnu.org \
--cc=qemu-devel@nongnu.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).