block: Don't manually poll in bdrv_drain_all()

All involved nodes are already idle because we called bdrv_do_drained_begin() on them.

The comment in the code suggested that this was not correct because the completion of a request on one node could spawn a new request on a different node (which might have been drained before, so we wouldn't drain the new request). In reality, new requests to different nodes aren't spawned out of nothing, but only in the context of a parent request, and they aren't submitted to random nodes, but only to child nodes. As long as we still poll for the completion of the parent request (which we do), draining each root node separately is good enough.

Remove the additional polling code from bdrv_drain_all_begin() and replace it with an assertion that all nodes are already idle after we drained them separately.

Signed-off-by: Kevin Wolf <kwolf@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
author: Kevin Wolf <kwolf@redhat.com> 2017-12-14 11:25:16 +0100
committer: Kevin Wolf <kwolf@redhat.com> 2018-06-18 15:03:25 +0200
commit: c13ad59f012cbbccb866a10477458e69bc868dbb (patch)
tree: 8e1e5c96e0f1f98c19e5419fda528d2c26c2e4e4
parent: 7d40d9ef9dfb4948a857bfc6ec8408eed1d1d9e7 (diff)
download: qemu-c13ad59f012cbbccb866a10477458e69bc868dbb.zip
qemu-c13ad59f012cbbccb866a10477458e69bc868dbb.tar.gz
qemu-c13ad59f012cbbccb866a10477458e69bc868dbb.tar.bz2
1 file changed, 12 insertions, 29 deletions
diff --git a/block/io.c b/block/io.c
index b75d688..983307c 100644
--- a/block/io.c
+++ b/block/io.c
@@ -377,6 +377,16 @@ void bdrv_drain(BlockDriverState *bs)
     bdrv_drained_end(bs);
 }
 
+static void bdrv_drain_assert_idle(BlockDriverState *bs)
+{
+    BdrvChild *child, *next;
+
+    assert(atomic_read(&bs->in_flight) == 0);
+    QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
+        bdrv_drain_assert_idle(child->bs);
+    }
+}
+
 /*
  * Wait for pending requests to complete across all BlockDriverStates
  *
@@ -391,11 +401,8 @@ void bdrv_drain(BlockDriverState *bs)
  */
 void bdrv_drain_all_begin(void)
 {
-    /* Always run first iteration so any pending completion BHs run */
-    bool waited = true;
     BlockDriverState *bs;
     BdrvNextIterator it;
-    GSList *aio_ctxs = NULL, *ctx;
 
     /* BDRV_POLL_WHILE() for a node can only be called from its own I/O thread
      * or the main loop AioContext. We potentially use BDRV_POLL_WHILE() on
@@ -409,35 +416,11 @@ void bdrv_drain_all_begin(void)
         aio_context_acquire(aio_context);
         bdrv_do_drained_begin(bs, true, NULL);
         aio_context_release(aio_context);
-
-        if (!g_slist_find(aio_ctxs, aio_context)) {
-            aio_ctxs = g_slist_prepend(aio_ctxs, aio_context);
-        }
     }
 
-    /* Note that completion of an asynchronous I/O operation can trigger any
-     * number of other I/O operations on other devices---for example a
-     * coroutine can submit an I/O request to another device in response to
-     * request completion.  Therefore we must keep looping until there was no
-     * more activity rather than simply draining each device independently.
-     */
-    while (waited) {
-        waited = false;
-
-        for (ctx = aio_ctxs; ctx != NULL; ctx = ctx->next) {
-            AioContext *aio_context = ctx->data;
-
-            aio_context_acquire(aio_context);
-            for (bs = bdrv_first(&it); bs; bs = bdrv_next(&it)) {
-                if (aio_context == bdrv_get_aio_context(bs)) {
-                    waited |= bdrv_drain_recurse(bs);
-                }
-            }
-            aio_context_release(aio_context);
-        }
+    for (bs = bdrv_first(&it); bs; bs = bdrv_next(&it)) {
+        bdrv_drain_assert_idle(bs);
     }
-
-    g_slist_free(aio_ctxs);
 }
 
 void bdrv_drain_all_end(void)
author	Kevin Wolf <kwolf@redhat.com>	2017-12-14 11:25:16 +0100
committer	Kevin Wolf <kwolf@redhat.com>	2018-06-18 15:03:25 +0200
commit	c13ad59f012cbbccb866a10477458e69bc868dbb (patch)
tree	8e1e5c96e0f1f98c19e5419fda528d2c26c2e4e4
parent	7d40d9ef9dfb4948a857bfc6ec8408eed1d1d9e7 (diff)
download	qemu-c13ad59f012cbbccb866a10477458e69bc868dbb.zip qemu-c13ad59f012cbbccb866a10477458e69bc868dbb.tar.gz qemu-c13ad59f012cbbccb866a10477458e69bc868dbb.tar.bz2