Blame SOURCES/kvm-test-bdrv-drain-bdrv_drain-works-with-cross-AioConte.patch

1bdc94
From 6ad2df3cb4ec0fbabc5d3e1beab138a071415bba Mon Sep 17 00:00:00 2001
1bdc94
From: Kevin Wolf <kwolf@redhat.com>
1bdc94
Date: Fri, 14 Sep 2018 10:54:59 +0200
1bdc94
Subject: [PATCH 08/49] test-bdrv-drain: bdrv_drain() works with
1bdc94
 cross-AioContext events
1bdc94
1bdc94
RH-Author: Kevin Wolf <kwolf@redhat.com>
1bdc94
Message-id: <20180914105540.18077-2-kwolf@redhat.com>
1bdc94
Patchwork-id: 82152
1bdc94
O-Subject: [RHV-7.6 qemu-kvm-rhev PATCH 01/42] test-bdrv-drain: bdrv_drain() works with cross-AioContext events
1bdc94
Bugzilla: 1601212
1bdc94
RH-Acked-by: John Snow <jsnow@redhat.com>
1bdc94
RH-Acked-by: Max Reitz <mreitz@redhat.com>
1bdc94
RH-Acked-by: Fam Zheng <famz@redhat.com>
1bdc94
1bdc94
As long as nobody keeps the other I/O thread from working, there is no
1bdc94
reason why bdrv_drain() wouldn't work with cross-AioContext events. The
1bdc94
key is that the root request we're waiting for is in the AioContext
1bdc94
we're polling (which it always is for bdrv_drain()) so that aio_poll()
1bdc94
is woken up in the end.
1bdc94
1bdc94
Add a test case that shows that it works. Remove the comment in
1bdc94
bdrv_drain() that claims otherwise.
1bdc94
1bdc94
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
1bdc94
(cherry picked from commit bb6756895459f181e2f25e877d3d7a10c297b5c8)
1bdc94
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
1bdc94
Signed-off-by: Miroslav Rezanina <mrezanin@redhat.com>
1bdc94
---
1bdc94
 block/io.c              |   4 --
1bdc94
 tests/test-bdrv-drain.c | 187 +++++++++++++++++++++++++++++++++++++++++++++++-
1bdc94
 2 files changed, 186 insertions(+), 5 deletions(-)
1bdc94
1bdc94
diff --git a/block/io.c b/block/io.c
1bdc94
index bb617de..7e0a169 100644
1bdc94
--- a/block/io.c
1bdc94
+++ b/block/io.c
1bdc94
@@ -369,10 +369,6 @@ void bdrv_unapply_subtree_drain(BdrvChild *child, BlockDriverState *old_parent)
1bdc94
  *
1bdc94
  * Note that unlike bdrv_drain_all(), the caller must hold the BlockDriverState
1bdc94
  * AioContext.
1bdc94
- *
1bdc94
- * Only this BlockDriverState's AioContext is run, so in-flight requests must
1bdc94
- * not depend on events in other AioContexts.  In that case, use
1bdc94
- * bdrv_drain_all() instead.
1bdc94
  */
1bdc94
 void coroutine_fn bdrv_co_drain(BlockDriverState *bs)
1bdc94
 {
1bdc94
diff --git a/tests/test-bdrv-drain.c b/tests/test-bdrv-drain.c
1bdc94
index 403446e..dee0a10 100644
1bdc94
--- a/tests/test-bdrv-drain.c
1bdc94
+++ b/tests/test-bdrv-drain.c
1bdc94
@@ -27,9 +27,13 @@
1bdc94
 #include "block/blockjob_int.h"
1bdc94
 #include "sysemu/block-backend.h"
1bdc94
 #include "qapi/error.h"
1bdc94
+#include "iothread.h"
1bdc94
+
1bdc94
+static QemuEvent done_event;
1bdc94
 
1bdc94
 typedef struct BDRVTestState {
1bdc94
     int drain_count;
1bdc94
+    AioContext *bh_indirection_ctx;
1bdc94
 } BDRVTestState;
1bdc94
 
1bdc94
 static void coroutine_fn bdrv_test_co_drain_begin(BlockDriverState *bs)
1bdc94
@@ -50,16 +54,29 @@ static void bdrv_test_close(BlockDriverState *bs)
1bdc94
     g_assert_cmpint(s->drain_count, >, 0);
1bdc94
 }
1bdc94
 
1bdc94
+static void co_reenter_bh(void *opaque)
1bdc94
+{
1bdc94
+    aio_co_wake(opaque);
1bdc94
+}
1bdc94
+
1bdc94
 static int coroutine_fn bdrv_test_co_preadv(BlockDriverState *bs,
1bdc94
                                             uint64_t offset, uint64_t bytes,
1bdc94
                                             QEMUIOVector *qiov, int flags)
1bdc94
 {
1bdc94
+    BDRVTestState *s = bs->opaque;
1bdc94
+
1bdc94
     /* We want this request to stay until the polling loop in drain waits for
1bdc94
      * it to complete. We need to sleep a while as bdrv_drain_invoke() comes
1bdc94
      * first and polls its result, too, but it shouldn't accidentally complete
1bdc94
      * this request yet. */
1bdc94
     qemu_co_sleep_ns(QEMU_CLOCK_REALTIME, 100000);
1bdc94
 
1bdc94
+    if (s->bh_indirection_ctx) {
1bdc94
+        aio_bh_schedule_oneshot(s->bh_indirection_ctx, co_reenter_bh,
1bdc94
+                                qemu_coroutine_self());
1bdc94
+        qemu_coroutine_yield();
1bdc94
+    }
1bdc94
+
1bdc94
     return 0;
1bdc94
 }
1bdc94
 
1bdc94
@@ -490,6 +507,164 @@ static void test_graph_change(void)
1bdc94
     blk_unref(blk_b);
1bdc94
 }
1bdc94
 
1bdc94
+struct test_iothread_data {
1bdc94
+    BlockDriverState *bs;
1bdc94
+    enum drain_type drain_type;
1bdc94
+    int *aio_ret;
1bdc94
+};
1bdc94
+
1bdc94
+static void test_iothread_drain_entry(void *opaque)
1bdc94
+{
1bdc94
+    struct test_iothread_data *data = opaque;
1bdc94
+
1bdc94
+    aio_context_acquire(bdrv_get_aio_context(data->bs));
1bdc94
+    do_drain_begin(data->drain_type, data->bs);
1bdc94
+    g_assert_cmpint(*data->aio_ret, ==, 0);
1bdc94
+    do_drain_end(data->drain_type, data->bs);
1bdc94
+    aio_context_release(bdrv_get_aio_context(data->bs));
1bdc94
+
1bdc94
+    qemu_event_set(&done_event);
1bdc94
+}
1bdc94
+
1bdc94
+static void test_iothread_aio_cb(void *opaque, int ret)
1bdc94
+{
1bdc94
+    int *aio_ret = opaque;
1bdc94
+    *aio_ret = ret;
1bdc94
+    qemu_event_set(&done_event);
1bdc94
+}
1bdc94
+
1bdc94
+/*
1bdc94
+ * Starts an AIO request on a BDS that runs in the AioContext of iothread 1.
1bdc94
+ * The request involves a BH on iothread 2 before it can complete.
1bdc94
+ *
1bdc94
+ * @drain_thread = 0 means that do_drain_begin/end are called from the main
1bdc94
+ * thread, @drain_thread = 1 means that they are called from iothread 1. Drain
1bdc94
+ * for this BDS cannot be called from iothread 2 because only the main thread
1bdc94
+ * may do cross-AioContext polling.
1bdc94
+ */
1bdc94
+static void test_iothread_common(enum drain_type drain_type, int drain_thread)
1bdc94
+{
1bdc94
+    BlockBackend *blk;
1bdc94
+    BlockDriverState *bs;
1bdc94
+    BDRVTestState *s;
1bdc94
+    BlockAIOCB *acb;
1bdc94
+    int aio_ret;
1bdc94
+    struct test_iothread_data data;
1bdc94
+
1bdc94
+    IOThread *a = iothread_new();
1bdc94
+    IOThread *b = iothread_new();
1bdc94
+    AioContext *ctx_a = iothread_get_aio_context(a);
1bdc94
+    AioContext *ctx_b = iothread_get_aio_context(b);
1bdc94
+
1bdc94
+    QEMUIOVector qiov;
1bdc94
+    struct iovec iov = {
1bdc94
+        .iov_base = NULL,
1bdc94
+        .iov_len = 0,
1bdc94
+    };
1bdc94
+    qemu_iovec_init_external(&qiov, &iov, 1);
1bdc94
+
1bdc94
+    /* bdrv_drain_all() may only be called from the main loop thread */
1bdc94
+    if (drain_type == BDRV_DRAIN_ALL && drain_thread != 0) {
1bdc94
+        goto out;
1bdc94
+    }
1bdc94
+
1bdc94
+    blk = blk_new(BLK_PERM_ALL, BLK_PERM_ALL);
1bdc94
+    bs = bdrv_new_open_driver(&bdrv_test, "test-node", BDRV_O_RDWR,
1bdc94
+                              &error_abort);
1bdc94
+    s = bs->opaque;
1bdc94
+    blk_insert_bs(blk, bs, &error_abort);
1bdc94
+
1bdc94
+    blk_set_aio_context(blk, ctx_a);
1bdc94
+    aio_context_acquire(ctx_a);
1bdc94
+
1bdc94
+    s->bh_indirection_ctx = ctx_b;
1bdc94
+
1bdc94
+    aio_ret = -EINPROGRESS;
1bdc94
+    if (drain_thread == 0) {
1bdc94
+        acb = blk_aio_preadv(blk, 0, &qiov, 0, test_iothread_aio_cb, &aio_ret);
1bdc94
+    } else {
1bdc94
+        acb = blk_aio_preadv(blk, 0, &qiov, 0, aio_ret_cb, &aio_ret);
1bdc94
+    }
1bdc94
+    g_assert(acb != NULL);
1bdc94
+    g_assert_cmpint(aio_ret, ==, -EINPROGRESS);
1bdc94
+
1bdc94
+    aio_context_release(ctx_a);
1bdc94
+
1bdc94
+    data = (struct test_iothread_data) {
1bdc94
+        .bs         = bs,
1bdc94
+        .drain_type = drain_type,
1bdc94
+        .aio_ret    = &aio_ret,
1bdc94
+    };
1bdc94
+
1bdc94
+    switch (drain_thread) {
1bdc94
+    case 0:
1bdc94
+        if (drain_type != BDRV_DRAIN_ALL) {
1bdc94
+            aio_context_acquire(ctx_a);
1bdc94
+        }
1bdc94
+
1bdc94
+        /* The request is running on the IOThread a. Draining its block device
1bdc94
+         * will make sure that it has completed as far as the BDS is concerned,
1bdc94
+         * but the drain in this thread can continue immediately after
1bdc94
+         * bdrv_dec_in_flight() and aio_ret might be assigned only slightly
1bdc94
+         * later. */
1bdc94
+        qemu_event_reset(&done_event);
1bdc94
+        do_drain_begin(drain_type, bs);
1bdc94
+        g_assert_cmpint(bs->in_flight, ==, 0);
1bdc94
+
1bdc94
+        if (drain_type != BDRV_DRAIN_ALL) {
1bdc94
+            aio_context_release(ctx_a);
1bdc94
+        }
1bdc94
+        qemu_event_wait(&done_event);
1bdc94
+        if (drain_type != BDRV_DRAIN_ALL) {
1bdc94
+            aio_context_acquire(ctx_a);
1bdc94
+        }
1bdc94
+
1bdc94
+        g_assert_cmpint(aio_ret, ==, 0);
1bdc94
+        do_drain_end(drain_type, bs);
1bdc94
+
1bdc94
+        if (drain_type != BDRV_DRAIN_ALL) {
1bdc94
+            aio_context_release(ctx_a);
1bdc94
+        }
1bdc94
+        break;
1bdc94
+    case 1:
1bdc94
+        qemu_event_reset(&done_event);
1bdc94
+        aio_bh_schedule_oneshot(ctx_a, test_iothread_drain_entry, &data);
1bdc94
+        qemu_event_wait(&done_event);
1bdc94
+        break;
1bdc94
+    default:
1bdc94
+        g_assert_not_reached();
1bdc94
+    }
1bdc94
+
1bdc94
+    aio_context_acquire(ctx_a);
1bdc94
+    blk_set_aio_context(blk, qemu_get_aio_context());
1bdc94
+    aio_context_release(ctx_a);
1bdc94
+
1bdc94
+    bdrv_unref(bs);
1bdc94
+    blk_unref(blk);
1bdc94
+
1bdc94
+out:
1bdc94
+    iothread_join(a);
1bdc94
+    iothread_join(b);
1bdc94
+}
1bdc94
+
1bdc94
+static void test_iothread_drain_all(void)
1bdc94
+{
1bdc94
+    test_iothread_common(BDRV_DRAIN_ALL, 0);
1bdc94
+    test_iothread_common(BDRV_DRAIN_ALL, 1);
1bdc94
+}
1bdc94
+
1bdc94
+static void test_iothread_drain(void)
1bdc94
+{
1bdc94
+    test_iothread_common(BDRV_DRAIN, 0);
1bdc94
+    test_iothread_common(BDRV_DRAIN, 1);
1bdc94
+}
1bdc94
+
1bdc94
+static void test_iothread_drain_subtree(void)
1bdc94
+{
1bdc94
+    test_iothread_common(BDRV_SUBTREE_DRAIN, 0);
1bdc94
+    test_iothread_common(BDRV_SUBTREE_DRAIN, 1);
1bdc94
+}
1bdc94
+
1bdc94
 
1bdc94
 typedef struct TestBlockJob {
1bdc94
     BlockJob common;
1bdc94
@@ -613,10 +788,13 @@ static void test_blockjob_drain_subtree(void)
1bdc94
 
1bdc94
 int main(int argc, char **argv)
1bdc94
 {
1bdc94
+    int ret;
1bdc94
+
1bdc94
     bdrv_init();
1bdc94
     qemu_init_main_loop(&error_abort);
1bdc94
 
1bdc94
     g_test_init(&argc, &argv, NULL);
1bdc94
+    qemu_event_init(&done_event, false);
1bdc94
 
1bdc94
     g_test_add_func("/bdrv-drain/driver-cb/drain_all", test_drv_cb_drain_all);
1bdc94
     g_test_add_func("/bdrv-drain/driver-cb/drain", test_drv_cb_drain);
1bdc94
@@ -643,10 +821,17 @@ int main(int argc, char **argv)
1bdc94
     g_test_add_func("/bdrv-drain/multiparent", test_multiparent);
1bdc94
     g_test_add_func("/bdrv-drain/graph-change", test_graph_change);
1bdc94
 
1bdc94
+    g_test_add_func("/bdrv-drain/iothread/drain_all", test_iothread_drain_all);
1bdc94
+    g_test_add_func("/bdrv-drain/iothread/drain", test_iothread_drain);
1bdc94
+    g_test_add_func("/bdrv-drain/iothread/drain_subtree",
1bdc94
+                    test_iothread_drain_subtree);
1bdc94
+
1bdc94
     g_test_add_func("/bdrv-drain/blockjob/drain_all", test_blockjob_drain_all);
1bdc94
     g_test_add_func("/bdrv-drain/blockjob/drain", test_blockjob_drain);
1bdc94
     g_test_add_func("/bdrv-drain/blockjob/drain_subtree",
1bdc94
                     test_blockjob_drain_subtree);
1bdc94
 
1bdc94
-    return g_test_run();
1bdc94
+    ret = g_test_run();
1bdc94
+    qemu_event_destroy(&done_event);
1bdc94
+    return ret;
1bdc94
 }
1bdc94
-- 
1bdc94
1.8.3.1
1bdc94