xref: /qemu/tests/unit/test-bdrv-drain.c (revision 487b91870face8973e78d82cd312a77d8f9f5363)
1881cfd17SKevin Wolf /*
2881cfd17SKevin Wolf  * Block node draining tests
3881cfd17SKevin Wolf  *
4881cfd17SKevin Wolf  * Copyright (c) 2017 Kevin Wolf <kwolf@redhat.com>
5881cfd17SKevin Wolf  *
6881cfd17SKevin Wolf  * Permission is hereby granted, free of charge, to any person obtaining a copy
7881cfd17SKevin Wolf  * of this software and associated documentation files (the "Software"), to deal
8881cfd17SKevin Wolf  * in the Software without restriction, including without limitation the rights
9881cfd17SKevin Wolf  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10881cfd17SKevin Wolf  * copies of the Software, and to permit persons to whom the Software is
11881cfd17SKevin Wolf  * furnished to do so, subject to the following conditions:
12881cfd17SKevin Wolf  *
13881cfd17SKevin Wolf  * The above copyright notice and this permission notice shall be included in
14881cfd17SKevin Wolf  * all copies or substantial portions of the Software.
15881cfd17SKevin Wolf  *
16881cfd17SKevin Wolf  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17881cfd17SKevin Wolf  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18881cfd17SKevin Wolf  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19881cfd17SKevin Wolf  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20881cfd17SKevin Wolf  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21881cfd17SKevin Wolf  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22881cfd17SKevin Wolf  * THE SOFTWARE.
23881cfd17SKevin Wolf  */
24881cfd17SKevin Wolf 
25881cfd17SKevin Wolf #include "qemu/osdep.h"
26e2c1c34fSMarkus Armbruster #include "block/block_int.h"
277253220dSKevin Wolf #include "block/blockjob_int.h"
28881cfd17SKevin Wolf #include "sysemu/block-backend.h"
29881cfd17SKevin Wolf #include "qapi/error.h"
30db725815SMarkus Armbruster #include "qemu/main-loop.h"
31bb675689SKevin Wolf #include "iothread.h"
32bb675689SKevin Wolf 
33bb675689SKevin Wolf static QemuEvent done_event;
34881cfd17SKevin Wolf 
35881cfd17SKevin Wolf typedef struct BDRVTestState {
36881cfd17SKevin Wolf     int drain_count;
37bb675689SKevin Wolf     AioContext *bh_indirection_ctx;
3857320ca9SKevin Wolf     bool sleep_in_drain_begin;
39881cfd17SKevin Wolf } BDRVTestState;
40881cfd17SKevin Wolf 
417bce1c29SKevin Wolf static void coroutine_fn sleep_in_drain_begin(void *opaque)
427bce1c29SKevin Wolf {
437bce1c29SKevin Wolf     BlockDriverState *bs = opaque;
447bce1c29SKevin Wolf 
457bce1c29SKevin Wolf     qemu_co_sleep_ns(QEMU_CLOCK_REALTIME, 100000);
467bce1c29SKevin Wolf     bdrv_dec_in_flight(bs);
477bce1c29SKevin Wolf }
487bce1c29SKevin Wolf 
495e8ac217SKevin Wolf static void bdrv_test_drain_begin(BlockDriverState *bs)
50881cfd17SKevin Wolf {
51881cfd17SKevin Wolf     BDRVTestState *s = bs->opaque;
52881cfd17SKevin Wolf     s->drain_count++;
5357320ca9SKevin Wolf     if (s->sleep_in_drain_begin) {
547bce1c29SKevin Wolf         Coroutine *co = qemu_coroutine_create(sleep_in_drain_begin, bs);
557bce1c29SKevin Wolf         bdrv_inc_in_flight(bs);
567bce1c29SKevin Wolf         aio_co_enter(bdrv_get_aio_context(bs), co);
5757320ca9SKevin Wolf     }
58881cfd17SKevin Wolf }
59881cfd17SKevin Wolf 
605e8ac217SKevin Wolf static void bdrv_test_drain_end(BlockDriverState *bs)
61881cfd17SKevin Wolf {
62881cfd17SKevin Wolf     BDRVTestState *s = bs->opaque;
63881cfd17SKevin Wolf     s->drain_count--;
64881cfd17SKevin Wolf }
65881cfd17SKevin Wolf 
66881cfd17SKevin Wolf static void bdrv_test_close(BlockDriverState *bs)
67881cfd17SKevin Wolf {
68881cfd17SKevin Wolf     BDRVTestState *s = bs->opaque;
69881cfd17SKevin Wolf     g_assert_cmpint(s->drain_count, >, 0);
70881cfd17SKevin Wolf }
71881cfd17SKevin Wolf 
72bb675689SKevin Wolf static void co_reenter_bh(void *opaque)
73bb675689SKevin Wolf {
74bb675689SKevin Wolf     aio_co_wake(opaque);
75bb675689SKevin Wolf }
76bb675689SKevin Wolf 
77881cfd17SKevin Wolf static int coroutine_fn bdrv_test_co_preadv(BlockDriverState *bs,
78f7ef38ddSVladimir Sementsov-Ogievskiy                                             int64_t offset, int64_t bytes,
79f7ef38ddSVladimir Sementsov-Ogievskiy                                             QEMUIOVector *qiov,
80f7ef38ddSVladimir Sementsov-Ogievskiy                                             BdrvRequestFlags flags)
81881cfd17SKevin Wolf {
82bb675689SKevin Wolf     BDRVTestState *s = bs->opaque;
83bb675689SKevin Wolf 
84881cfd17SKevin Wolf     /* We want this request to stay until the polling loop in drain waits for
85881cfd17SKevin Wolf      * it to complete. We need to sleep a while as bdrv_drain_invoke() comes
86881cfd17SKevin Wolf      * first and polls its result, too, but it shouldn't accidentally complete
87881cfd17SKevin Wolf      * this request yet. */
88881cfd17SKevin Wolf     qemu_co_sleep_ns(QEMU_CLOCK_REALTIME, 100000);
89881cfd17SKevin Wolf 
90bb675689SKevin Wolf     if (s->bh_indirection_ctx) {
91bb675689SKevin Wolf         aio_bh_schedule_oneshot(s->bh_indirection_ctx, co_reenter_bh,
92bb675689SKevin Wolf                                 qemu_coroutine_self());
93bb675689SKevin Wolf         qemu_coroutine_yield();
94bb675689SKevin Wolf     }
95bb675689SKevin Wolf 
96881cfd17SKevin Wolf     return 0;
97881cfd17SKevin Wolf }
98881cfd17SKevin Wolf 
999746b35cSMax Reitz static int bdrv_test_change_backing_file(BlockDriverState *bs,
1009746b35cSMax Reitz                                          const char *backing_file,
1019746b35cSMax Reitz                                          const char *backing_fmt)
1029746b35cSMax Reitz {
1039746b35cSMax Reitz     return 0;
1049746b35cSMax Reitz }
1059746b35cSMax Reitz 
106881cfd17SKevin Wolf static BlockDriver bdrv_test = {
107881cfd17SKevin Wolf     .format_name            = "test",
108881cfd17SKevin Wolf     .instance_size          = sizeof(BDRVTestState),
10925f78d9eSVladimir Sementsov-Ogievskiy     .supports_backing       = true,
110881cfd17SKevin Wolf 
111881cfd17SKevin Wolf     .bdrv_close             = bdrv_test_close,
112881cfd17SKevin Wolf     .bdrv_co_preadv         = bdrv_test_co_preadv,
113881cfd17SKevin Wolf 
1145e8ac217SKevin Wolf     .bdrv_drain_begin       = bdrv_test_drain_begin,
1155e8ac217SKevin Wolf     .bdrv_drain_end         = bdrv_test_drain_end,
11686e1c840SKevin Wolf 
117e5d8a406SMax Reitz     .bdrv_child_perm        = bdrv_default_perms,
1189746b35cSMax Reitz 
1199746b35cSMax Reitz     .bdrv_change_backing_file = bdrv_test_change_backing_file,
120881cfd17SKevin Wolf };
121881cfd17SKevin Wolf 
/*
 * AIO completion callback: stores the request's return value @ret in the
 * int that @opaque points to.
 */
static void aio_ret_cb(void *opaque, int ret)
{
    *(int *)opaque = ret;
}
127881cfd17SKevin Wolf 
/* Argument block handed to call_in_coroutine_entry(). */
typedef struct CallInCoroutineData {
    /* Function to run inside the coroutine */
    void (*entry)(void);
    /* Set to true by the coroutine once entry() has returned */
    bool done;
} CallInCoroutineData;
1320582eb10SKevin Wolf 
1330582eb10SKevin Wolf static coroutine_fn void call_in_coroutine_entry(void *opaque)
1340582eb10SKevin Wolf {
1350582eb10SKevin Wolf     CallInCoroutineData *data = opaque;
1360582eb10SKevin Wolf 
1370582eb10SKevin Wolf     data->entry();
1380582eb10SKevin Wolf     data->done = true;
1390582eb10SKevin Wolf }
1400582eb10SKevin Wolf 
1410582eb10SKevin Wolf static void call_in_coroutine(void (*entry)(void))
1420582eb10SKevin Wolf {
1430582eb10SKevin Wolf     Coroutine *co;
1440582eb10SKevin Wolf     CallInCoroutineData data = {
1450582eb10SKevin Wolf         .entry  = entry,
1460582eb10SKevin Wolf         .done   = false,
1470582eb10SKevin Wolf     };
1480582eb10SKevin Wolf 
1490582eb10SKevin Wolf     co = qemu_coroutine_create(call_in_coroutine_entry, &data);
1500582eb10SKevin Wolf     qemu_coroutine_enter(co);
1510582eb10SKevin Wolf     while (!data.done) {
1520582eb10SKevin Wolf         aio_poll(qemu_get_aio_context(), true);
1530582eb10SKevin Wolf     }
1540582eb10SKevin Wolf }
1550582eb10SKevin Wolf 
/*
 * The drain flavours exercised by the tests. DRAIN_TYPE_MAX is not a drain
 * type itself; it is the number of real types and serves as loop bound.
 */
enum drain_type {
    BDRV_DRAIN_ALL = 0,     /* bdrv_drain_all_begin() / bdrv_drain_all_end() */
    BDRV_DRAIN,             /* bdrv_drained_begin() / bdrv_drained_end() */
    DRAIN_TYPE_MAX,
};
16186e1c840SKevin Wolf 
16286e1c840SKevin Wolf static void do_drain_begin(enum drain_type drain_type, BlockDriverState *bs)
16386e1c840SKevin Wolf {
16486e1c840SKevin Wolf     switch (drain_type) {
16586e1c840SKevin Wolf     case BDRV_DRAIN_ALL:        bdrv_drain_all_begin(); break;
16686e1c840SKevin Wolf     case BDRV_DRAIN:            bdrv_drained_begin(bs); break;
16786e1c840SKevin Wolf     default:                    g_assert_not_reached();
16886e1c840SKevin Wolf     }
16986e1c840SKevin Wolf }
17086e1c840SKevin Wolf 
17186e1c840SKevin Wolf static void do_drain_end(enum drain_type drain_type, BlockDriverState *bs)
17286e1c840SKevin Wolf {
17386e1c840SKevin Wolf     switch (drain_type) {
17486e1c840SKevin Wolf     case BDRV_DRAIN_ALL:        bdrv_drain_all_end(); break;
17586e1c840SKevin Wolf     case BDRV_DRAIN:            bdrv_drained_end(bs); break;
17686e1c840SKevin Wolf     default:                    g_assert_not_reached();
17786e1c840SKevin Wolf     }
17886e1c840SKevin Wolf }
17986e1c840SKevin Wolf 
180f62c1729SKevin Wolf static void do_drain_begin_unlocked(enum drain_type drain_type, BlockDriverState *bs)
181f62c1729SKevin Wolf {
182f62c1729SKevin Wolf     if (drain_type != BDRV_DRAIN_ALL) {
183f62c1729SKevin Wolf         aio_context_acquire(bdrv_get_aio_context(bs));
184f62c1729SKevin Wolf     }
185f62c1729SKevin Wolf     do_drain_begin(drain_type, bs);
186f62c1729SKevin Wolf     if (drain_type != BDRV_DRAIN_ALL) {
187f62c1729SKevin Wolf         aio_context_release(bdrv_get_aio_context(bs));
188f62c1729SKevin Wolf     }
189f62c1729SKevin Wolf }
190f62c1729SKevin Wolf 
19157f3d07bSKevin Wolf static BlockBackend * no_coroutine_fn test_setup(void)
19257f3d07bSKevin Wolf {
19357f3d07bSKevin Wolf     BlockBackend *blk;
19457f3d07bSKevin Wolf     BlockDriverState *bs, *backing;
19557f3d07bSKevin Wolf 
19657f3d07bSKevin Wolf     blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
19757f3d07bSKevin Wolf     bs = bdrv_new_open_driver(&bdrv_test, "test-node", BDRV_O_RDWR,
19857f3d07bSKevin Wolf                               &error_abort);
19957f3d07bSKevin Wolf     blk_insert_bs(blk, bs, &error_abort);
20057f3d07bSKevin Wolf 
20157f3d07bSKevin Wolf     backing = bdrv_new_open_driver(&bdrv_test, "backing", 0, &error_abort);
20257f3d07bSKevin Wolf     bdrv_set_backing_hd(bs, backing, &error_abort);
20357f3d07bSKevin Wolf 
20457f3d07bSKevin Wolf     bdrv_unref(backing);
20557f3d07bSKevin Wolf     bdrv_unref(bs);
20657f3d07bSKevin Wolf 
20757f3d07bSKevin Wolf     return blk;
20857f3d07bSKevin Wolf }
20957f3d07bSKevin Wolf 
210f62c1729SKevin Wolf static void do_drain_end_unlocked(enum drain_type drain_type, BlockDriverState *bs)
211f62c1729SKevin Wolf {
212f62c1729SKevin Wolf     if (drain_type != BDRV_DRAIN_ALL) {
213f62c1729SKevin Wolf         aio_context_acquire(bdrv_get_aio_context(bs));
214f62c1729SKevin Wolf     }
215f62c1729SKevin Wolf     do_drain_end(drain_type, bs);
216f62c1729SKevin Wolf     if (drain_type != BDRV_DRAIN_ALL) {
217f62c1729SKevin Wolf         aio_context_release(bdrv_get_aio_context(bs));
218f62c1729SKevin Wolf     }
219f62c1729SKevin Wolf }
220f62c1729SKevin Wolf 
22157f3d07bSKevin Wolf static void test_drv_cb_common(BlockBackend *blk, enum drain_type drain_type,
22257f3d07bSKevin Wolf                                bool recursive)
223881cfd17SKevin Wolf {
22457f3d07bSKevin Wolf     BlockDriverState *bs = blk_bs(blk);
22557f3d07bSKevin Wolf     BlockDriverState *backing = bs->backing->bs;
22686e1c840SKevin Wolf     BDRVTestState *s, *backing_s;
227881cfd17SKevin Wolf     BlockAIOCB *acb;
228881cfd17SKevin Wolf     int aio_ret;
229881cfd17SKevin Wolf 
230405d8fe0SVladimir Sementsov-Ogievskiy     QEMUIOVector qiov = QEMU_IOVEC_INIT_BUF(qiov, NULL, 0);
231881cfd17SKevin Wolf 
232881cfd17SKevin Wolf     s = bs->opaque;
23386e1c840SKevin Wolf     backing_s = backing->opaque;
23486e1c840SKevin Wolf 
235881cfd17SKevin Wolf     /* Simple bdrv_drain_all_begin/end pair, check that CBs are called */
236881cfd17SKevin Wolf     g_assert_cmpint(s->drain_count, ==, 0);
23786e1c840SKevin Wolf     g_assert_cmpint(backing_s->drain_count, ==, 0);
23886e1c840SKevin Wolf 
23986e1c840SKevin Wolf     do_drain_begin(drain_type, bs);
24086e1c840SKevin Wolf 
241881cfd17SKevin Wolf     g_assert_cmpint(s->drain_count, ==, 1);
24286e1c840SKevin Wolf     g_assert_cmpint(backing_s->drain_count, ==, !!recursive);
24386e1c840SKevin Wolf 
24486e1c840SKevin Wolf     do_drain_end(drain_type, bs);
24586e1c840SKevin Wolf 
246881cfd17SKevin Wolf     g_assert_cmpint(s->drain_count, ==, 0);
24786e1c840SKevin Wolf     g_assert_cmpint(backing_s->drain_count, ==, 0);
248881cfd17SKevin Wolf 
249881cfd17SKevin Wolf     /* Now do the same while a request is pending */
250881cfd17SKevin Wolf     aio_ret = -EINPROGRESS;
251881cfd17SKevin Wolf     acb = blk_aio_preadv(blk, 0, &qiov, 0, aio_ret_cb, &aio_ret);
252881cfd17SKevin Wolf     g_assert(acb != NULL);
253881cfd17SKevin Wolf     g_assert_cmpint(aio_ret, ==, -EINPROGRESS);
254881cfd17SKevin Wolf 
255881cfd17SKevin Wolf     g_assert_cmpint(s->drain_count, ==, 0);
25686e1c840SKevin Wolf     g_assert_cmpint(backing_s->drain_count, ==, 0);
25786e1c840SKevin Wolf 
25886e1c840SKevin Wolf     do_drain_begin(drain_type, bs);
25986e1c840SKevin Wolf 
260881cfd17SKevin Wolf     g_assert_cmpint(aio_ret, ==, 0);
261881cfd17SKevin Wolf     g_assert_cmpint(s->drain_count, ==, 1);
26286e1c840SKevin Wolf     g_assert_cmpint(backing_s->drain_count, ==, !!recursive);
263881cfd17SKevin Wolf 
26486e1c840SKevin Wolf     do_drain_end(drain_type, bs);
26586e1c840SKevin Wolf 
26686e1c840SKevin Wolf     g_assert_cmpint(s->drain_count, ==, 0);
26786e1c840SKevin Wolf     g_assert_cmpint(backing_s->drain_count, ==, 0);
268881cfd17SKevin Wolf }
269881cfd17SKevin Wolf 
27086e1c840SKevin Wolf static void test_drv_cb_drain_all(void)
27186e1c840SKevin Wolf {
27257f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
27357f3d07bSKevin Wolf     test_drv_cb_common(blk, BDRV_DRAIN_ALL, true);
27457f3d07bSKevin Wolf     blk_unref(blk);
27586e1c840SKevin Wolf }
27686e1c840SKevin Wolf 
27786e1c840SKevin Wolf static void test_drv_cb_drain(void)
27886e1c840SKevin Wolf {
27957f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
28057f3d07bSKevin Wolf     test_drv_cb_common(blk, BDRV_DRAIN, false);
28157f3d07bSKevin Wolf     blk_unref(blk);
28257f3d07bSKevin Wolf }
28357f3d07bSKevin Wolf 
28457f3d07bSKevin Wolf static void coroutine_fn test_drv_cb_co_drain_all_entry(void)
28557f3d07bSKevin Wolf {
28657f3d07bSKevin Wolf     BlockBackend *blk = blk_all_next(NULL);
28757f3d07bSKevin Wolf     test_drv_cb_common(blk, BDRV_DRAIN_ALL, true);
28886e1c840SKevin Wolf }
28986e1c840SKevin Wolf 
2906d0252f2SKevin Wolf static void test_drv_cb_co_drain_all(void)
2916d0252f2SKevin Wolf {
29257f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
29357f3d07bSKevin Wolf     call_in_coroutine(test_drv_cb_co_drain_all_entry);
29457f3d07bSKevin Wolf     blk_unref(blk);
29557f3d07bSKevin Wolf }
29657f3d07bSKevin Wolf 
29757f3d07bSKevin Wolf static void coroutine_fn test_drv_cb_co_drain_entry(void)
29857f3d07bSKevin Wolf {
29957f3d07bSKevin Wolf     BlockBackend *blk = blk_all_next(NULL);
30057f3d07bSKevin Wolf     test_drv_cb_common(blk, BDRV_DRAIN, false);
3016d0252f2SKevin Wolf }
3026d0252f2SKevin Wolf 
3030582eb10SKevin Wolf static void test_drv_cb_co_drain(void)
3040582eb10SKevin Wolf {
30557f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
30657f3d07bSKevin Wolf     call_in_coroutine(test_drv_cb_co_drain_entry);
30757f3d07bSKevin Wolf     blk_unref(blk);
3080582eb10SKevin Wolf }
3090582eb10SKevin Wolf 
31057f3d07bSKevin Wolf static void test_quiesce_common(BlockBackend *blk, enum drain_type drain_type,
31157f3d07bSKevin Wolf                                 bool recursive)
31289a6ceabSKevin Wolf {
31357f3d07bSKevin Wolf     BlockDriverState *bs = blk_bs(blk);
31457f3d07bSKevin Wolf     BlockDriverState *backing = bs->backing->bs;
31589a6ceabSKevin Wolf 
31689a6ceabSKevin Wolf     g_assert_cmpint(bs->quiesce_counter, ==, 0);
31789a6ceabSKevin Wolf     g_assert_cmpint(backing->quiesce_counter, ==, 0);
31889a6ceabSKevin Wolf 
31989a6ceabSKevin Wolf     do_drain_begin(drain_type, bs);
32089a6ceabSKevin Wolf 
32157e05be3SKevin Wolf     if (drain_type == BDRV_DRAIN_ALL) {
32257e05be3SKevin Wolf         g_assert_cmpint(bs->quiesce_counter, ==, 2);
32357e05be3SKevin Wolf     } else {
32489a6ceabSKevin Wolf         g_assert_cmpint(bs->quiesce_counter, ==, 1);
32557e05be3SKevin Wolf     }
32689a6ceabSKevin Wolf     g_assert_cmpint(backing->quiesce_counter, ==, !!recursive);
32789a6ceabSKevin Wolf 
32889a6ceabSKevin Wolf     do_drain_end(drain_type, bs);
32989a6ceabSKevin Wolf 
33089a6ceabSKevin Wolf     g_assert_cmpint(bs->quiesce_counter, ==, 0);
33189a6ceabSKevin Wolf     g_assert_cmpint(backing->quiesce_counter, ==, 0);
33289a6ceabSKevin Wolf }
33389a6ceabSKevin Wolf 
33489a6ceabSKevin Wolf static void test_quiesce_drain_all(void)
33589a6ceabSKevin Wolf {
33657f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
33757f3d07bSKevin Wolf     test_quiesce_common(blk, BDRV_DRAIN_ALL, true);
33857f3d07bSKevin Wolf     blk_unref(blk);
33989a6ceabSKevin Wolf }
34089a6ceabSKevin Wolf 
34189a6ceabSKevin Wolf static void test_quiesce_drain(void)
34289a6ceabSKevin Wolf {
34357f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
34457f3d07bSKevin Wolf     test_quiesce_common(blk, BDRV_DRAIN, false);
34557f3d07bSKevin Wolf     blk_unref(blk);
34657f3d07bSKevin Wolf }
34757f3d07bSKevin Wolf 
34857f3d07bSKevin Wolf static void coroutine_fn test_quiesce_co_drain_all_entry(void)
34957f3d07bSKevin Wolf {
35057f3d07bSKevin Wolf     BlockBackend *blk = blk_all_next(NULL);
35157f3d07bSKevin Wolf     test_quiesce_common(blk, BDRV_DRAIN_ALL, true);
35289a6ceabSKevin Wolf }
35389a6ceabSKevin Wolf 
3546d0252f2SKevin Wolf static void test_quiesce_co_drain_all(void)
3556d0252f2SKevin Wolf {
35657f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
35757f3d07bSKevin Wolf     call_in_coroutine(test_quiesce_co_drain_all_entry);
35857f3d07bSKevin Wolf     blk_unref(blk);
35957f3d07bSKevin Wolf }
36057f3d07bSKevin Wolf 
36157f3d07bSKevin Wolf static void coroutine_fn test_quiesce_co_drain_entry(void)
36257f3d07bSKevin Wolf {
36357f3d07bSKevin Wolf     BlockBackend *blk = blk_all_next(NULL);
36457f3d07bSKevin Wolf     test_quiesce_common(blk, BDRV_DRAIN, false);
3656d0252f2SKevin Wolf }
3666d0252f2SKevin Wolf 
3670582eb10SKevin Wolf static void test_quiesce_co_drain(void)
3680582eb10SKevin Wolf {
36957f3d07bSKevin Wolf     BlockBackend *blk = test_setup();
37057f3d07bSKevin Wolf     call_in_coroutine(test_quiesce_co_drain_entry);
37157f3d07bSKevin Wolf     blk_unref(blk);
3720582eb10SKevin Wolf }
3730582eb10SKevin Wolf 
3746c429a6aSKevin Wolf static void test_nested(void)
3756c429a6aSKevin Wolf {
3766c429a6aSKevin Wolf     BlockBackend *blk;
3776c429a6aSKevin Wolf     BlockDriverState *bs, *backing;
3786c429a6aSKevin Wolf     BDRVTestState *s, *backing_s;
3796c429a6aSKevin Wolf     enum drain_type outer, inner;
3806c429a6aSKevin Wolf 
381d861ab3aSKevin Wolf     blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
3826c429a6aSKevin Wolf     bs = bdrv_new_open_driver(&bdrv_test, "test-node", BDRV_O_RDWR,
3836c429a6aSKevin Wolf                               &error_abort);
3846c429a6aSKevin Wolf     s = bs->opaque;
3856c429a6aSKevin Wolf     blk_insert_bs(blk, bs, &error_abort);
3866c429a6aSKevin Wolf 
3876c429a6aSKevin Wolf     backing = bdrv_new_open_driver(&bdrv_test, "backing", 0, &error_abort);
3886c429a6aSKevin Wolf     backing_s = backing->opaque;
3896c429a6aSKevin Wolf     bdrv_set_backing_hd(bs, backing, &error_abort);
3906c429a6aSKevin Wolf 
3916c429a6aSKevin Wolf     for (outer = 0; outer < DRAIN_TYPE_MAX; outer++) {
3926c429a6aSKevin Wolf         for (inner = 0; inner < DRAIN_TYPE_MAX; inner++) {
39357e05be3SKevin Wolf             int backing_quiesce = (outer == BDRV_DRAIN_ALL) +
39457e05be3SKevin Wolf                                   (inner == BDRV_DRAIN_ALL);
3956c429a6aSKevin Wolf 
3966c429a6aSKevin Wolf             g_assert_cmpint(bs->quiesce_counter, ==, 0);
3976c429a6aSKevin Wolf             g_assert_cmpint(backing->quiesce_counter, ==, 0);
3986c429a6aSKevin Wolf             g_assert_cmpint(s->drain_count, ==, 0);
3996c429a6aSKevin Wolf             g_assert_cmpint(backing_s->drain_count, ==, 0);
4006c429a6aSKevin Wolf 
4016c429a6aSKevin Wolf             do_drain_begin(outer, bs);
4026c429a6aSKevin Wolf             do_drain_begin(inner, bs);
4036c429a6aSKevin Wolf 
40457e05be3SKevin Wolf             g_assert_cmpint(bs->quiesce_counter, ==, 2 + !!backing_quiesce);
4056c429a6aSKevin Wolf             g_assert_cmpint(backing->quiesce_counter, ==, backing_quiesce);
40657e05be3SKevin Wolf             g_assert_cmpint(s->drain_count, ==, 1);
40757e05be3SKevin Wolf             g_assert_cmpint(backing_s->drain_count, ==, !!backing_quiesce);
4086c429a6aSKevin Wolf 
4096c429a6aSKevin Wolf             do_drain_end(inner, bs);
4106c429a6aSKevin Wolf             do_drain_end(outer, bs);
4116c429a6aSKevin Wolf 
4126c429a6aSKevin Wolf             g_assert_cmpint(bs->quiesce_counter, ==, 0);
4136c429a6aSKevin Wolf             g_assert_cmpint(backing->quiesce_counter, ==, 0);
4146c429a6aSKevin Wolf             g_assert_cmpint(s->drain_count, ==, 0);
4156c429a6aSKevin Wolf             g_assert_cmpint(backing_s->drain_count, ==, 0);
4166c429a6aSKevin Wolf         }
4176c429a6aSKevin Wolf     }
4186c429a6aSKevin Wolf 
4196c429a6aSKevin Wolf     bdrv_unref(backing);
4206c429a6aSKevin Wolf     bdrv_unref(bs);
4216c429a6aSKevin Wolf     blk_unref(blk);
4226c429a6aSKevin Wolf }
4236c429a6aSKevin Wolf 
42419f7a7e5SKevin Wolf static void test_graph_change_drain_all(void)
42519f7a7e5SKevin Wolf {
42619f7a7e5SKevin Wolf     BlockBackend *blk_a, *blk_b;
42719f7a7e5SKevin Wolf     BlockDriverState *bs_a, *bs_b;
42819f7a7e5SKevin Wolf     BDRVTestState *a_s, *b_s;
42919f7a7e5SKevin Wolf 
43019f7a7e5SKevin Wolf     /* Create node A with a BlockBackend */
431d861ab3aSKevin Wolf     blk_a = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
43219f7a7e5SKevin Wolf     bs_a = bdrv_new_open_driver(&bdrv_test, "test-node-a", BDRV_O_RDWR,
43319f7a7e5SKevin Wolf                                 &error_abort);
43419f7a7e5SKevin Wolf     a_s = bs_a->opaque;
43519f7a7e5SKevin Wolf     blk_insert_bs(blk_a, bs_a, &error_abort);
43619f7a7e5SKevin Wolf 
43719f7a7e5SKevin Wolf     g_assert_cmpint(bs_a->quiesce_counter, ==, 0);
43819f7a7e5SKevin Wolf     g_assert_cmpint(a_s->drain_count, ==, 0);
43919f7a7e5SKevin Wolf 
44019f7a7e5SKevin Wolf     /* Call bdrv_drain_all_begin() */
44119f7a7e5SKevin Wolf     bdrv_drain_all_begin();
44219f7a7e5SKevin Wolf 
44319f7a7e5SKevin Wolf     g_assert_cmpint(bs_a->quiesce_counter, ==, 1);
44419f7a7e5SKevin Wolf     g_assert_cmpint(a_s->drain_count, ==, 1);
44519f7a7e5SKevin Wolf 
44619f7a7e5SKevin Wolf     /* Create node B with a BlockBackend */
447d861ab3aSKevin Wolf     blk_b = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
44819f7a7e5SKevin Wolf     bs_b = bdrv_new_open_driver(&bdrv_test, "test-node-b", BDRV_O_RDWR,
44919f7a7e5SKevin Wolf                                 &error_abort);
45019f7a7e5SKevin Wolf     b_s = bs_b->opaque;
45119f7a7e5SKevin Wolf     blk_insert_bs(blk_b, bs_b, &error_abort);
45219f7a7e5SKevin Wolf 
45319f7a7e5SKevin Wolf     g_assert_cmpint(bs_a->quiesce_counter, ==, 1);
45419f7a7e5SKevin Wolf     g_assert_cmpint(bs_b->quiesce_counter, ==, 1);
45519f7a7e5SKevin Wolf     g_assert_cmpint(a_s->drain_count, ==, 1);
45619f7a7e5SKevin Wolf     g_assert_cmpint(b_s->drain_count, ==, 1);
45719f7a7e5SKevin Wolf 
45819f7a7e5SKevin Wolf     /* Unref and finally delete node A */
45919f7a7e5SKevin Wolf     blk_unref(blk_a);
46019f7a7e5SKevin Wolf 
46119f7a7e5SKevin Wolf     g_assert_cmpint(bs_a->quiesce_counter, ==, 1);
46219f7a7e5SKevin Wolf     g_assert_cmpint(bs_b->quiesce_counter, ==, 1);
46319f7a7e5SKevin Wolf     g_assert_cmpint(a_s->drain_count, ==, 1);
46419f7a7e5SKevin Wolf     g_assert_cmpint(b_s->drain_count, ==, 1);
46519f7a7e5SKevin Wolf 
46619f7a7e5SKevin Wolf     bdrv_unref(bs_a);
46719f7a7e5SKevin Wolf 
46819f7a7e5SKevin Wolf     g_assert_cmpint(bs_b->quiesce_counter, ==, 1);
46919f7a7e5SKevin Wolf     g_assert_cmpint(b_s->drain_count, ==, 1);
47019f7a7e5SKevin Wolf 
47119f7a7e5SKevin Wolf     /* End the drained section */
47219f7a7e5SKevin Wolf     bdrv_drain_all_end();
47319f7a7e5SKevin Wolf 
47419f7a7e5SKevin Wolf     g_assert_cmpint(bs_b->quiesce_counter, ==, 0);
47519f7a7e5SKevin Wolf     g_assert_cmpint(b_s->drain_count, ==, 0);
47619f7a7e5SKevin Wolf 
47719f7a7e5SKevin Wolf     bdrv_unref(bs_b);
47819f7a7e5SKevin Wolf     blk_unref(blk_b);
47919f7a7e5SKevin Wolf }
48019f7a7e5SKevin Wolf 
481bb675689SKevin Wolf struct test_iothread_data {
482bb675689SKevin Wolf     BlockDriverState *bs;
483bb675689SKevin Wolf     enum drain_type drain_type;
484bb675689SKevin Wolf     int *aio_ret;
485ab613350SStefan Hajnoczi     bool co_done;
486bb675689SKevin Wolf };
487bb675689SKevin Wolf 
488ab613350SStefan Hajnoczi static void coroutine_fn test_iothread_drain_co_entry(void *opaque)
489bb675689SKevin Wolf {
490bb675689SKevin Wolf     struct test_iothread_data *data = opaque;
491bb675689SKevin Wolf 
492bb675689SKevin Wolf     do_drain_begin(data->drain_type, data->bs);
493bb675689SKevin Wolf     g_assert_cmpint(*data->aio_ret, ==, 0);
494bb675689SKevin Wolf     do_drain_end(data->drain_type, data->bs);
495bb675689SKevin Wolf 
496ab613350SStefan Hajnoczi     data->co_done = true;
497ab613350SStefan Hajnoczi     aio_wait_kick();
498bb675689SKevin Wolf }
499bb675689SKevin Wolf 
500bb675689SKevin Wolf static void test_iothread_aio_cb(void *opaque, int ret)
501bb675689SKevin Wolf {
502bb675689SKevin Wolf     int *aio_ret = opaque;
503bb675689SKevin Wolf     *aio_ret = ret;
504bb675689SKevin Wolf     qemu_event_set(&done_event);
505bb675689SKevin Wolf }
506bb675689SKevin Wolf 
507ecc1a5c7SKevin Wolf static void test_iothread_main_thread_bh(void *opaque)
508ecc1a5c7SKevin Wolf {
509ecc1a5c7SKevin Wolf     struct test_iothread_data *data = opaque;
510ecc1a5c7SKevin Wolf 
511ecc1a5c7SKevin Wolf     /* Test that the AioContext is not yet locked in a random BH that is
512ecc1a5c7SKevin Wolf      * executed during drain, otherwise this would deadlock. */
513ecc1a5c7SKevin Wolf     aio_context_acquire(bdrv_get_aio_context(data->bs));
514ecc1a5c7SKevin Wolf     bdrv_flush(data->bs);
515ecc1a5c7SKevin Wolf     aio_context_release(bdrv_get_aio_context(data->bs));
516ecc1a5c7SKevin Wolf }
517ecc1a5c7SKevin Wolf 
518bb675689SKevin Wolf /*
519bb675689SKevin Wolf  * Starts an AIO request on a BDS that runs in the AioContext of iothread 1.
520bb675689SKevin Wolf  * The request involves a BH on iothread 2 before it can complete.
521bb675689SKevin Wolf  *
522bb675689SKevin Wolf  * @drain_thread = 0 means that do_drain_begin/end are called from the main
523bb675689SKevin Wolf  * thread, @drain_thread = 1 means that they are called from iothread 1. Drain
524bb675689SKevin Wolf  * for this BDS cannot be called from iothread 2 because only the main thread
525bb675689SKevin Wolf  * may do cross-AioContext polling.
526bb675689SKevin Wolf  */
527bb675689SKevin Wolf static void test_iothread_common(enum drain_type drain_type, int drain_thread)
528bb675689SKevin Wolf {
529bb675689SKevin Wolf     BlockBackend *blk;
530bb675689SKevin Wolf     BlockDriverState *bs;
531bb675689SKevin Wolf     BDRVTestState *s;
532bb675689SKevin Wolf     BlockAIOCB *acb;
533ab613350SStefan Hajnoczi     Coroutine *co;
534bb675689SKevin Wolf     int aio_ret;
535bb675689SKevin Wolf     struct test_iothread_data data;
536bb675689SKevin Wolf 
537bb675689SKevin Wolf     IOThread *a = iothread_new();
538bb675689SKevin Wolf     IOThread *b = iothread_new();
539bb675689SKevin Wolf     AioContext *ctx_a = iothread_get_aio_context(a);
540bb675689SKevin Wolf     AioContext *ctx_b = iothread_get_aio_context(b);
541bb675689SKevin Wolf 
542405d8fe0SVladimir Sementsov-Ogievskiy     QEMUIOVector qiov = QEMU_IOVEC_INIT_BUF(qiov, NULL, 0);
543bb675689SKevin Wolf 
544bb675689SKevin Wolf     /* bdrv_drain_all() may only be called from the main loop thread */
545bb675689SKevin Wolf     if (drain_type == BDRV_DRAIN_ALL && drain_thread != 0) {
546bb675689SKevin Wolf         goto out;
547bb675689SKevin Wolf     }
548bb675689SKevin Wolf 
549d861ab3aSKevin Wolf     blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
550bb675689SKevin Wolf     bs = bdrv_new_open_driver(&bdrv_test, "test-node", BDRV_O_RDWR,
551bb675689SKevin Wolf                               &error_abort);
552bb675689SKevin Wolf     s = bs->opaque;
553bb675689SKevin Wolf     blk_insert_bs(blk, bs, &error_abort);
554cf312932SKevin Wolf     blk_set_disable_request_queuing(blk, true);
555bb675689SKevin Wolf 
55697896a48SKevin Wolf     blk_set_aio_context(blk, ctx_a, &error_abort);
557bb675689SKevin Wolf     aio_context_acquire(ctx_a);
558bb675689SKevin Wolf 
559bb675689SKevin Wolf     s->bh_indirection_ctx = ctx_b;
560bb675689SKevin Wolf 
561bb675689SKevin Wolf     aio_ret = -EINPROGRESS;
562dd353157SKevin Wolf     qemu_event_reset(&done_event);
563dd353157SKevin Wolf 
564bb675689SKevin Wolf     if (drain_thread == 0) {
565bb675689SKevin Wolf         acb = blk_aio_preadv(blk, 0, &qiov, 0, test_iothread_aio_cb, &aio_ret);
566bb675689SKevin Wolf     } else {
567bb675689SKevin Wolf         acb = blk_aio_preadv(blk, 0, &qiov, 0, aio_ret_cb, &aio_ret);
568bb675689SKevin Wolf     }
569bb675689SKevin Wolf     g_assert(acb != NULL);
570bb675689SKevin Wolf     g_assert_cmpint(aio_ret, ==, -EINPROGRESS);
571bb675689SKevin Wolf 
572bb675689SKevin Wolf     aio_context_release(ctx_a);
573bb675689SKevin Wolf 
574bb675689SKevin Wolf     data = (struct test_iothread_data) {
575bb675689SKevin Wolf         .bs         = bs,
576bb675689SKevin Wolf         .drain_type = drain_type,
577bb675689SKevin Wolf         .aio_ret    = &aio_ret,
578bb675689SKevin Wolf     };
579bb675689SKevin Wolf 
580bb675689SKevin Wolf     switch (drain_thread) {
581bb675689SKevin Wolf     case 0:
582bb675689SKevin Wolf         if (drain_type != BDRV_DRAIN_ALL) {
583bb675689SKevin Wolf             aio_context_acquire(ctx_a);
584bb675689SKevin Wolf         }
585bb675689SKevin Wolf 
586ecc1a5c7SKevin Wolf         aio_bh_schedule_oneshot(ctx_a, test_iothread_main_thread_bh, &data);
587ecc1a5c7SKevin Wolf 
588bb675689SKevin Wolf         /* The request is running on the IOThread a. Draining its block device
589bb675689SKevin Wolf          * will make sure that it has completed as far as the BDS is concerned,
590bb675689SKevin Wolf          * but the drain in this thread can continue immediately after
591bb675689SKevin Wolf          * bdrv_dec_in_flight() and aio_ret might be assigned only slightly
592bb675689SKevin Wolf          * later. */
593bb675689SKevin Wolf         do_drain_begin(drain_type, bs);
594bb675689SKevin Wolf         g_assert_cmpint(bs->in_flight, ==, 0);
595bb675689SKevin Wolf 
596bb675689SKevin Wolf         if (drain_type != BDRV_DRAIN_ALL) {
597bb675689SKevin Wolf             aio_context_release(ctx_a);
598bb675689SKevin Wolf         }
599bb675689SKevin Wolf         qemu_event_wait(&done_event);
600bb675689SKevin Wolf         if (drain_type != BDRV_DRAIN_ALL) {
601bb675689SKevin Wolf             aio_context_acquire(ctx_a);
602bb675689SKevin Wolf         }
603bb675689SKevin Wolf 
604bb675689SKevin Wolf         g_assert_cmpint(aio_ret, ==, 0);
605bb675689SKevin Wolf         do_drain_end(drain_type, bs);
606bb675689SKevin Wolf 
607bb675689SKevin Wolf         if (drain_type != BDRV_DRAIN_ALL) {
608bb675689SKevin Wolf             aio_context_release(ctx_a);
609bb675689SKevin Wolf         }
610bb675689SKevin Wolf         break;
611bb675689SKevin Wolf     case 1:
612ab613350SStefan Hajnoczi         co = qemu_coroutine_create(test_iothread_drain_co_entry, &data);
613ab613350SStefan Hajnoczi         aio_co_enter(ctx_a, co);
614ab613350SStefan Hajnoczi         AIO_WAIT_WHILE_UNLOCKED(NULL, !data.co_done);
615bb675689SKevin Wolf         break;
616bb675689SKevin Wolf     default:
617bb675689SKevin Wolf         g_assert_not_reached();
618bb675689SKevin Wolf     }
619bb675689SKevin Wolf 
620bb675689SKevin Wolf     aio_context_acquire(ctx_a);
62197896a48SKevin Wolf     blk_set_aio_context(blk, qemu_get_aio_context(), &error_abort);
622bb675689SKevin Wolf     aio_context_release(ctx_a);
623bb675689SKevin Wolf 
624bb675689SKevin Wolf     bdrv_unref(bs);
625bb675689SKevin Wolf     blk_unref(blk);
626bb675689SKevin Wolf 
627bb675689SKevin Wolf out:
628bb675689SKevin Wolf     iothread_join(a);
629bb675689SKevin Wolf     iothread_join(b);
630bb675689SKevin Wolf }
631bb675689SKevin Wolf 
632bb675689SKevin Wolf static void test_iothread_drain_all(void)
633bb675689SKevin Wolf {
634bb675689SKevin Wolf     test_iothread_common(BDRV_DRAIN_ALL, 0);
635bb675689SKevin Wolf     test_iothread_common(BDRV_DRAIN_ALL, 1);
636bb675689SKevin Wolf }
637bb675689SKevin Wolf 
638bb675689SKevin Wolf static void test_iothread_drain(void)
639bb675689SKevin Wolf {
640bb675689SKevin Wolf     test_iothread_common(BDRV_DRAIN, 0);
641bb675689SKevin Wolf     test_iothread_common(BDRV_DRAIN, 1);
642bb675689SKevin Wolf }
643bb675689SKevin Wolf 
6447253220dSKevin Wolf 
6457253220dSKevin Wolf typedef struct TestBlockJob {
6467253220dSKevin Wolf     BlockJob common;
6471b177bbeSVladimir Sementsov-Ogievskiy     BlockDriverState *bs;
648d49725afSKevin Wolf     int run_ret;
649d49725afSKevin Wolf     int prepare_ret;
650d8b3afd5SKevin Wolf     bool running;
6517253220dSKevin Wolf     bool should_complete;
6527253220dSKevin Wolf } TestBlockJob;
6537253220dSKevin Wolf 
654ae23dde9SKevin Wolf static int test_job_prepare(Job *job)
655ae23dde9SKevin Wolf {
656ae23dde9SKevin Wolf     TestBlockJob *s = container_of(job, TestBlockJob, common.job);
657ae23dde9SKevin Wolf 
658ae23dde9SKevin Wolf     /* Provoke an AIO_WAIT_WHILE() call to verify there is no deadlock */
6591b177bbeSVladimir Sementsov-Ogievskiy     bdrv_flush(s->bs);
660d49725afSKevin Wolf     return s->prepare_ret;
661d49725afSKevin Wolf }
662d49725afSKevin Wolf 
663d49725afSKevin Wolf static void test_job_commit(Job *job)
664d49725afSKevin Wolf {
665d49725afSKevin Wolf     TestBlockJob *s = container_of(job, TestBlockJob, common.job);
666d49725afSKevin Wolf 
667d49725afSKevin Wolf     /* Provoke an AIO_WAIT_WHILE() call to verify there is no deadlock */
6681b177bbeSVladimir Sementsov-Ogievskiy     bdrv_flush(s->bs);
669d49725afSKevin Wolf }
670d49725afSKevin Wolf 
671d49725afSKevin Wolf static void test_job_abort(Job *job)
672d49725afSKevin Wolf {
673d49725afSKevin Wolf     TestBlockJob *s = container_of(job, TestBlockJob, common.job);
674d49725afSKevin Wolf 
675d49725afSKevin Wolf     /* Provoke an AIO_WAIT_WHILE() call to verify there is no deadlock */
6761b177bbeSVladimir Sementsov-Ogievskiy     bdrv_flush(s->bs);
677ae23dde9SKevin Wolf }
678ae23dde9SKevin Wolf 
679f67432a2SJohn Snow static int coroutine_fn test_job_run(Job *job, Error **errp)
6807253220dSKevin Wolf {
681f67432a2SJohn Snow     TestBlockJob *s = container_of(job, TestBlockJob, common.job);
6827253220dSKevin Wolf 
683d8b3afd5SKevin Wolf     /* We are running the actual job code past the pause point in
684d8b3afd5SKevin Wolf      * job_co_entry(). */
685d8b3afd5SKevin Wolf     s->running = true;
686d8b3afd5SKevin Wolf 
6872e1795b5SKevin Wolf     job_transition_to_ready(&s->common.job);
6887253220dSKevin Wolf     while (!s->should_complete) {
6895599c162SKevin Wolf         /* Avoid job_sleep_ns() because it marks the job as !busy. We want to
6905599c162SKevin Wolf          * emulate some actual activity (probably some I/O) here so that drain
6915599c162SKevin Wolf          * has to wait for this activity to stop. */
692d8b3afd5SKevin Wolf         qemu_co_sleep_ns(QEMU_CLOCK_REALTIME, 1000000);
693d8b3afd5SKevin Wolf 
69489bd0305SKevin Wolf         job_pause_point(&s->common.job);
6957253220dSKevin Wolf     }
6967253220dSKevin Wolf 
697d49725afSKevin Wolf     return s->run_ret;
6987253220dSKevin Wolf }
6997253220dSKevin Wolf 
7003453d972SKevin Wolf static void test_job_complete(Job *job, Error **errp)
7017253220dSKevin Wolf {
7023453d972SKevin Wolf     TestBlockJob *s = container_of(job, TestBlockJob, common.job);
7037253220dSKevin Wolf     s->should_complete = true;
7047253220dSKevin Wolf }
7057253220dSKevin Wolf 
7067253220dSKevin Wolf BlockJobDriver test_job_driver = {
70733e9e9bdSKevin Wolf     .job_driver = {
7087253220dSKevin Wolf         .instance_size  = sizeof(TestBlockJob),
70980fa2c75SKevin Wolf         .free           = block_job_free,
710b15de828SKevin Wolf         .user_resume    = block_job_user_resume,
711f67432a2SJohn Snow         .run            = test_job_run,
7127253220dSKevin Wolf         .complete       = test_job_complete,
713ae23dde9SKevin Wolf         .prepare        = test_job_prepare,
714d49725afSKevin Wolf         .commit         = test_job_commit,
715d49725afSKevin Wolf         .abort          = test_job_abort,
7163453d972SKevin Wolf     },
7177253220dSKevin Wolf };
7187253220dSKevin Wolf 
/* Outcome the test job is configured to produce. */
enum test_job_result {
    /* Neither run_ret nor prepare_ret is changed */
    TEST_JOB_SUCCESS,
    /* run_ret is set to -EIO */
    TEST_JOB_FAIL_RUN,
    /* prepare_ret is set to -EIO */
    TEST_JOB_FAIL_PREPARE,
};
724d49725afSKevin Wolf 
/* Which node of the source chain the blockjob test drains first. */
enum test_job_drain_node {
    /* Drain the job's source node itself */
    TEST_JOB_DRAIN_SRC,
    /* Drain the backing node below the source node */
    TEST_JOB_DRAIN_SRC_CHILD,
};
729d8b3afd5SKevin Wolf 
730d8b3afd5SKevin Wolf static void test_blockjob_common_drain_node(enum drain_type drain_type,
731d8b3afd5SKevin Wolf                                             bool use_iothread,
732d8b3afd5SKevin Wolf                                             enum test_job_result result,
733d8b3afd5SKevin Wolf                                             enum test_job_drain_node drain_node)
7347253220dSKevin Wolf {
7357253220dSKevin Wolf     BlockBackend *blk_src, *blk_target;
736d8b3afd5SKevin Wolf     BlockDriverState *src, *src_backing, *src_overlay, *target, *drain_bs;
7377253220dSKevin Wolf     BlockJob *job;
738d49725afSKevin Wolf     TestBlockJob *tjob;
739f62c1729SKevin Wolf     IOThread *iothread = NULL;
740f62c1729SKevin Wolf     AioContext *ctx;
7417253220dSKevin Wolf     int ret;
7427253220dSKevin Wolf 
7437253220dSKevin Wolf     src = bdrv_new_open_driver(&bdrv_test, "source", BDRV_O_RDWR,
7447253220dSKevin Wolf                                &error_abort);
745d8b3afd5SKevin Wolf     src_backing = bdrv_new_open_driver(&bdrv_test, "source-backing",
746d8b3afd5SKevin Wolf                                        BDRV_O_RDWR, &error_abort);
747d8b3afd5SKevin Wolf     src_overlay = bdrv_new_open_driver(&bdrv_test, "source-overlay",
748d8b3afd5SKevin Wolf                                        BDRV_O_RDWR, &error_abort);
749d8b3afd5SKevin Wolf 
750d8b3afd5SKevin Wolf     bdrv_set_backing_hd(src_overlay, src, &error_abort);
751d8b3afd5SKevin Wolf     bdrv_unref(src);
752d8b3afd5SKevin Wolf     bdrv_set_backing_hd(src, src_backing, &error_abort);
753d8b3afd5SKevin Wolf     bdrv_unref(src_backing);
754d8b3afd5SKevin Wolf 
755d861ab3aSKevin Wolf     blk_src = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
756d8b3afd5SKevin Wolf     blk_insert_bs(blk_src, src_overlay, &error_abort);
757d8b3afd5SKevin Wolf 
758d8b3afd5SKevin Wolf     switch (drain_node) {
759d8b3afd5SKevin Wolf     case TEST_JOB_DRAIN_SRC:
760d8b3afd5SKevin Wolf         drain_bs = src;
761d8b3afd5SKevin Wolf         break;
762d8b3afd5SKevin Wolf     case TEST_JOB_DRAIN_SRC_CHILD:
763d8b3afd5SKevin Wolf         drain_bs = src_backing;
764d8b3afd5SKevin Wolf         break;
765d8b3afd5SKevin Wolf     default:
766d8b3afd5SKevin Wolf         g_assert_not_reached();
767d8b3afd5SKevin Wolf     }
7687253220dSKevin Wolf 
769f62c1729SKevin Wolf     if (use_iothread) {
770f62c1729SKevin Wolf         iothread = iothread_new();
771f62c1729SKevin Wolf         ctx = iothread_get_aio_context(iothread);
77297896a48SKevin Wolf         blk_set_aio_context(blk_src, ctx, &error_abort);
773f62c1729SKevin Wolf     } else {
774f62c1729SKevin Wolf         ctx = qemu_get_aio_context();
775f62c1729SKevin Wolf     }
776f62c1729SKevin Wolf 
7777253220dSKevin Wolf     target = bdrv_new_open_driver(&bdrv_test, "target", BDRV_O_RDWR,
7787253220dSKevin Wolf                                   &error_abort);
779d861ab3aSKevin Wolf     blk_target = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
7807253220dSKevin Wolf     blk_insert_bs(blk_target, target, &error_abort);
781132ada80SKevin Wolf     blk_set_allow_aio_context_change(blk_target, true);
7827253220dSKevin Wolf 
783f62c1729SKevin Wolf     aio_context_acquire(ctx);
784d49725afSKevin Wolf     tjob = block_job_create("job0", &test_job_driver, NULL, src,
785d49725afSKevin Wolf                             0, BLK_PERM_ALL,
78675859b94SJohn Snow                             0, 0, NULL, NULL, &error_abort);
7871b177bbeSVladimir Sementsov-Ogievskiy     tjob->bs = src;
788d49725afSKevin Wolf     job = &tjob->common;
7897253220dSKevin Wolf     block_job_add_bdrv(job, "target", target, 0, BLK_PERM_ALL, &error_abort);
790d49725afSKevin Wolf 
791d49725afSKevin Wolf     switch (result) {
792d49725afSKevin Wolf     case TEST_JOB_SUCCESS:
793d49725afSKevin Wolf         break;
794d49725afSKevin Wolf     case TEST_JOB_FAIL_RUN:
795d49725afSKevin Wolf         tjob->run_ret = -EIO;
796d49725afSKevin Wolf         break;
797d49725afSKevin Wolf     case TEST_JOB_FAIL_PREPARE:
798d49725afSKevin Wolf         tjob->prepare_ret = -EIO;
799d49725afSKevin Wolf         break;
800d49725afSKevin Wolf     }
8016f592e5aSEmanuele Giuseppe Esposito     aio_context_release(ctx);
802d49725afSKevin Wolf 
803da01ff7fSKevin Wolf     job_start(&job->job);
8047253220dSKevin Wolf 
805d8b3afd5SKevin Wolf     if (use_iothread) {
806d8b3afd5SKevin Wolf         /* job_co_entry() is run in the I/O thread, wait for the actual job
807d8b3afd5SKevin Wolf          * code to start (we don't want to catch the job in the pause point in
808d8b3afd5SKevin Wolf          * job_co_entry(). */
809d8b3afd5SKevin Wolf         while (!tjob->running) {
810d8b3afd5SKevin Wolf             aio_poll(qemu_get_aio_context(), false);
811d8b3afd5SKevin Wolf         }
812d8b3afd5SKevin Wolf     }
813d8b3afd5SKevin Wolf 
814191e7af3SEmanuele Giuseppe Esposito     WITH_JOB_LOCK_GUARD() {
815da01ff7fSKevin Wolf         g_assert_cmpint(job->job.pause_count, ==, 0);
816da01ff7fSKevin Wolf         g_assert_false(job->job.paused);
817d8b3afd5SKevin Wolf         g_assert_true(tjob->running);
8185599c162SKevin Wolf         g_assert_true(job->job.busy); /* We're in qemu_co_sleep_ns() */
819191e7af3SEmanuele Giuseppe Esposito     }
8207253220dSKevin Wolf 
821d8b3afd5SKevin Wolf     do_drain_begin_unlocked(drain_type, drain_bs);
8227253220dSKevin Wolf 
823191e7af3SEmanuele Giuseppe Esposito     WITH_JOB_LOCK_GUARD() {
8247253220dSKevin Wolf         if (drain_type == BDRV_DRAIN_ALL) {
82581193349SKevin Wolf             /* bdrv_drain_all() drains both src and target */
826da01ff7fSKevin Wolf             g_assert_cmpint(job->job.pause_count, ==, 2);
8277253220dSKevin Wolf         } else {
828da01ff7fSKevin Wolf             g_assert_cmpint(job->job.pause_count, ==, 1);
8297253220dSKevin Wolf         }
83089bd0305SKevin Wolf         g_assert_true(job->job.paused);
831da01ff7fSKevin Wolf         g_assert_false(job->job.busy); /* The job is paused */
832191e7af3SEmanuele Giuseppe Esposito     }
8337253220dSKevin Wolf 
834d8b3afd5SKevin Wolf     do_drain_end_unlocked(drain_type, drain_bs);
835f62c1729SKevin Wolf 
836f62c1729SKevin Wolf     if (use_iothread) {
837191e7af3SEmanuele Giuseppe Esposito         /*
838191e7af3SEmanuele Giuseppe Esposito          * Here we are waiting for the paused status to change,
839191e7af3SEmanuele Giuseppe Esposito          * so don't bother protecting the read every time.
840191e7af3SEmanuele Giuseppe Esposito          *
841191e7af3SEmanuele Giuseppe Esposito          * paused is reset in the I/O thread, wait for it
842191e7af3SEmanuele Giuseppe Esposito          */
843f62c1729SKevin Wolf         while (job->job.paused) {
844f62c1729SKevin Wolf             aio_poll(qemu_get_aio_context(), false);
845f62c1729SKevin Wolf         }
846f62c1729SKevin Wolf     }
8477253220dSKevin Wolf 
848191e7af3SEmanuele Giuseppe Esposito     WITH_JOB_LOCK_GUARD() {
849da01ff7fSKevin Wolf         g_assert_cmpint(job->job.pause_count, ==, 0);
850da01ff7fSKevin Wolf         g_assert_false(job->job.paused);
85189bd0305SKevin Wolf         g_assert_true(job->job.busy); /* We're in qemu_co_sleep_ns() */
852191e7af3SEmanuele Giuseppe Esposito     }
8537253220dSKevin Wolf 
854132ada80SKevin Wolf     do_drain_begin_unlocked(drain_type, target);
8557253220dSKevin Wolf 
856191e7af3SEmanuele Giuseppe Esposito     WITH_JOB_LOCK_GUARD() {
8577253220dSKevin Wolf         if (drain_type == BDRV_DRAIN_ALL) {
85881193349SKevin Wolf             /* bdrv_drain_all() drains both src and target */
859da01ff7fSKevin Wolf             g_assert_cmpint(job->job.pause_count, ==, 2);
8607253220dSKevin Wolf         } else {
861da01ff7fSKevin Wolf             g_assert_cmpint(job->job.pause_count, ==, 1);
8627253220dSKevin Wolf         }
86389bd0305SKevin Wolf         g_assert_true(job->job.paused);
864da01ff7fSKevin Wolf         g_assert_false(job->job.busy); /* The job is paused */
865191e7af3SEmanuele Giuseppe Esposito     }
8667253220dSKevin Wolf 
867132ada80SKevin Wolf     do_drain_end_unlocked(drain_type, target);
8687253220dSKevin Wolf 
869f62c1729SKevin Wolf     if (use_iothread) {
870191e7af3SEmanuele Giuseppe Esposito         /*
871191e7af3SEmanuele Giuseppe Esposito          * Here we are waiting for the paused status to change,
872191e7af3SEmanuele Giuseppe Esposito          * so don't bother protecting the read every time.
873191e7af3SEmanuele Giuseppe Esposito          *
874191e7af3SEmanuele Giuseppe Esposito          * paused is reset in the I/O thread, wait for it
875191e7af3SEmanuele Giuseppe Esposito          */
876f62c1729SKevin Wolf         while (job->job.paused) {
877f62c1729SKevin Wolf             aio_poll(qemu_get_aio_context(), false);
878f62c1729SKevin Wolf         }
879f62c1729SKevin Wolf     }
880f62c1729SKevin Wolf 
881191e7af3SEmanuele Giuseppe Esposito     WITH_JOB_LOCK_GUARD() {
882da01ff7fSKevin Wolf         g_assert_cmpint(job->job.pause_count, ==, 0);
883da01ff7fSKevin Wolf         g_assert_false(job->job.paused);
8845599c162SKevin Wolf         g_assert_true(job->job.busy); /* We're in qemu_co_sleep_ns() */
885191e7af3SEmanuele Giuseppe Esposito     }
8867253220dSKevin Wolf 
887191e7af3SEmanuele Giuseppe Esposito     WITH_JOB_LOCK_GUARD() {
888191e7af3SEmanuele Giuseppe Esposito         ret = job_complete_sync_locked(&job->job, &error_abort);
889191e7af3SEmanuele Giuseppe Esposito     }
890d49725afSKevin Wolf     g_assert_cmpint(ret, ==, (result == TEST_JOB_SUCCESS ? 0 : -EIO));
8917253220dSKevin Wolf 
8926f592e5aSEmanuele Giuseppe Esposito     aio_context_acquire(ctx);
893f62c1729SKevin Wolf     if (use_iothread) {
89497896a48SKevin Wolf         blk_set_aio_context(blk_src, qemu_get_aio_context(), &error_abort);
895ad943dcbSKevin Wolf         assert(blk_get_aio_context(blk_target) == qemu_get_aio_context());
896f62c1729SKevin Wolf     }
897f62c1729SKevin Wolf     aio_context_release(ctx);
898f62c1729SKevin Wolf 
8997253220dSKevin Wolf     blk_unref(blk_src);
9007253220dSKevin Wolf     blk_unref(blk_target);
901d8b3afd5SKevin Wolf     bdrv_unref(src_overlay);
9027253220dSKevin Wolf     bdrv_unref(target);
903f62c1729SKevin Wolf 
904f62c1729SKevin Wolf     if (iothread) {
905f62c1729SKevin Wolf         iothread_join(iothread);
906f62c1729SKevin Wolf     }
9077253220dSKevin Wolf }
9087253220dSKevin Wolf 
909d8b3afd5SKevin Wolf static void test_blockjob_common(enum drain_type drain_type, bool use_iothread,
910d8b3afd5SKevin Wolf                                  enum test_job_result result)
911d8b3afd5SKevin Wolf {
912d8b3afd5SKevin Wolf     test_blockjob_common_drain_node(drain_type, use_iothread, result,
913d8b3afd5SKevin Wolf                                     TEST_JOB_DRAIN_SRC);
914d8b3afd5SKevin Wolf     test_blockjob_common_drain_node(drain_type, use_iothread, result,
915d8b3afd5SKevin Wolf                                     TEST_JOB_DRAIN_SRC_CHILD);
916d8b3afd5SKevin Wolf }
917d8b3afd5SKevin Wolf 
9187253220dSKevin Wolf static void test_blockjob_drain_all(void)
9197253220dSKevin Wolf {
920d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN_ALL, false, TEST_JOB_SUCCESS);
9217253220dSKevin Wolf }
9227253220dSKevin Wolf 
9237253220dSKevin Wolf static void test_blockjob_drain(void)
9247253220dSKevin Wolf {
925d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN, false, TEST_JOB_SUCCESS);
9267253220dSKevin Wolf }
9277253220dSKevin Wolf 
928d49725afSKevin Wolf static void test_blockjob_error_drain_all(void)
929d49725afSKevin Wolf {
930d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN_ALL, false, TEST_JOB_FAIL_RUN);
931d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN_ALL, false, TEST_JOB_FAIL_PREPARE);
932d49725afSKevin Wolf }
933d49725afSKevin Wolf 
934d49725afSKevin Wolf static void test_blockjob_error_drain(void)
935d49725afSKevin Wolf {
936d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN, false, TEST_JOB_FAIL_RUN);
937d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN, false, TEST_JOB_FAIL_PREPARE);
938d49725afSKevin Wolf }
939d49725afSKevin Wolf 
940f62c1729SKevin Wolf static void test_blockjob_iothread_drain_all(void)
941f62c1729SKevin Wolf {
942d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN_ALL, true, TEST_JOB_SUCCESS);
943f62c1729SKevin Wolf }
944f62c1729SKevin Wolf 
945f62c1729SKevin Wolf static void test_blockjob_iothread_drain(void)
946f62c1729SKevin Wolf {
947d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN, true, TEST_JOB_SUCCESS);
948f62c1729SKevin Wolf }
949f62c1729SKevin Wolf 
950d49725afSKevin Wolf static void test_blockjob_iothread_error_drain_all(void)
951d49725afSKevin Wolf {
952d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN_ALL, true, TEST_JOB_FAIL_RUN);
953d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN_ALL, true, TEST_JOB_FAIL_PREPARE);
954d49725afSKevin Wolf }
955d49725afSKevin Wolf 
956d49725afSKevin Wolf static void test_blockjob_iothread_error_drain(void)
957d49725afSKevin Wolf {
958d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN, true, TEST_JOB_FAIL_RUN);
959d49725afSKevin Wolf     test_blockjob_common(BDRV_DRAIN, true, TEST_JOB_FAIL_PREPARE);
960d49725afSKevin Wolf }
961d49725afSKevin Wolf 
9624c8158e3SMax Reitz 
9634c8158e3SMax Reitz typedef struct BDRVTestTopState {
9644c8158e3SMax Reitz     BdrvChild *wait_child;
9654c8158e3SMax Reitz } BDRVTestTopState;
9664c8158e3SMax Reitz 
9674c8158e3SMax Reitz static void bdrv_test_top_close(BlockDriverState *bs)
9684c8158e3SMax Reitz {
9694c8158e3SMax Reitz     BdrvChild *c, *next_c;
9704c8158e3SMax Reitz     QLIST_FOREACH_SAFE(c, &bs->children, next, next_c) {
9714c8158e3SMax Reitz         bdrv_unref_child(bs, c);
9724c8158e3SMax Reitz     }
9734c8158e3SMax Reitz }
9744c8158e3SMax Reitz 
975b9b10c35SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
976b9b10c35SKevin Wolf bdrv_test_top_co_preadv(BlockDriverState *bs, int64_t offset, int64_t bytes,
977b9b10c35SKevin Wolf                         QEMUIOVector *qiov, BdrvRequestFlags flags)
9784c8158e3SMax Reitz {
9794c8158e3SMax Reitz     BDRVTestTopState *tts = bs->opaque;
9804c8158e3SMax Reitz     return bdrv_co_preadv(tts->wait_child, offset, bytes, qiov, flags);
9814c8158e3SMax Reitz }
9824c8158e3SMax Reitz 
9834c8158e3SMax Reitz static BlockDriver bdrv_test_top_driver = {
9844c8158e3SMax Reitz     .format_name            = "test_top_driver",
9854c8158e3SMax Reitz     .instance_size          = sizeof(BDRVTestTopState),
9864c8158e3SMax Reitz 
9874c8158e3SMax Reitz     .bdrv_close             = bdrv_test_top_close,
9884c8158e3SMax Reitz     .bdrv_co_preadv         = bdrv_test_top_co_preadv,
9894c8158e3SMax Reitz 
99069dca43dSMax Reitz     .bdrv_child_perm        = bdrv_default_perms,
9914c8158e3SMax Reitz };
9924c8158e3SMax Reitz 
9934c8158e3SMax Reitz typedef struct TestCoDeleteByDrainData {
9944c8158e3SMax Reitz     BlockBackend *blk;
9954c8158e3SMax Reitz     bool detach_instead_of_delete;
9964c8158e3SMax Reitz     bool done;
9974c8158e3SMax Reitz } TestCoDeleteByDrainData;
9984c8158e3SMax Reitz 
9994c8158e3SMax Reitz static void coroutine_fn test_co_delete_by_drain(void *opaque)
10004c8158e3SMax Reitz {
10014c8158e3SMax Reitz     TestCoDeleteByDrainData *dbdd = opaque;
10024c8158e3SMax Reitz     BlockBackend *blk = dbdd->blk;
10034c8158e3SMax Reitz     BlockDriverState *bs = blk_bs(blk);
10044c8158e3SMax Reitz     BDRVTestTopState *tts = bs->opaque;
10054c8158e3SMax Reitz     void *buffer = g_malloc(65536);
1006405d8fe0SVladimir Sementsov-Ogievskiy     QEMUIOVector qiov = QEMU_IOVEC_INIT_BUF(qiov, buffer, 65536);
10074c8158e3SMax Reitz 
10084c8158e3SMax Reitz     /* Pretend some internal write operation from parent to child.
10094c8158e3SMax Reitz      * Important: We have to read from the child, not from the parent!
10104c8158e3SMax Reitz      * Draining works by first propagating it all up the tree to the
10114c8158e3SMax Reitz      * root and then waiting for drainage from root to the leaves
10124c8158e3SMax Reitz      * (protocol nodes).  If we have a request waiting on the root,
10134c8158e3SMax Reitz      * everything will be drained before we go back down the tree, but
10144c8158e3SMax Reitz      * we do not want that.  We want to be in the middle of draining
10154c8158e3SMax Reitz      * when this following requests returns. */
101687f130bdSKevin Wolf     bdrv_graph_co_rdlock();
10174c8158e3SMax Reitz     bdrv_co_preadv(tts->wait_child, 0, 65536, &qiov, 0);
101887f130bdSKevin Wolf     bdrv_graph_co_rdunlock();
10194c8158e3SMax Reitz 
10204c8158e3SMax Reitz     g_assert_cmpint(bs->refcnt, ==, 1);
10214c8158e3SMax Reitz 
10224c8158e3SMax Reitz     if (!dbdd->detach_instead_of_delete) {
102301a10c24SKevin Wolf         blk_co_unref(blk);
10244c8158e3SMax Reitz     } else {
10254c8158e3SMax Reitz         BdrvChild *c, *next_c;
10264c8158e3SMax Reitz         QLIST_FOREACH_SAFE(c, &bs->children, next, next_c) {
10274c8158e3SMax Reitz             bdrv_unref_child(bs, c);
10284c8158e3SMax Reitz         }
10294c8158e3SMax Reitz     }
10304c8158e3SMax Reitz 
10314c8158e3SMax Reitz     dbdd->done = true;
10327b43db3cSMarc-André Lureau     g_free(buffer);
10334c8158e3SMax Reitz }
10344c8158e3SMax Reitz 
10354c8158e3SMax Reitz /**
10364c8158e3SMax Reitz  * Test what happens when some BDS has some children, you drain one of
10374c8158e3SMax Reitz  * them and this results in the BDS being deleted.
10384c8158e3SMax Reitz  *
10394c8158e3SMax Reitz  * If @detach_instead_of_delete is set, the BDS is not going to be
10404c8158e3SMax Reitz  * deleted but will only detach all of its children.
10414c8158e3SMax Reitz  */
1042ebd31837SKevin Wolf static void do_test_delete_by_drain(bool detach_instead_of_delete,
1043ebd31837SKevin Wolf                                     enum drain_type drain_type)
10444c8158e3SMax Reitz {
10454c8158e3SMax Reitz     BlockBackend *blk;
10464c8158e3SMax Reitz     BlockDriverState *bs, *child_bs, *null_bs;
10474c8158e3SMax Reitz     BDRVTestTopState *tts;
10484c8158e3SMax Reitz     TestCoDeleteByDrainData dbdd;
10494c8158e3SMax Reitz     Coroutine *co;
10504c8158e3SMax Reitz 
10514c8158e3SMax Reitz     bs = bdrv_new_open_driver(&bdrv_test_top_driver, "top", BDRV_O_RDWR,
10524c8158e3SMax Reitz                               &error_abort);
10534c8158e3SMax Reitz     bs->total_sectors = 65536 >> BDRV_SECTOR_BITS;
10544c8158e3SMax Reitz     tts = bs->opaque;
10554c8158e3SMax Reitz 
10564c8158e3SMax Reitz     null_bs = bdrv_open("null-co://", NULL, NULL, BDRV_O_RDWR | BDRV_O_PROTOCOL,
10574c8158e3SMax Reitz                         &error_abort);
1058a16be3cdSMax Reitz     bdrv_attach_child(bs, null_bs, "null-child", &child_of_bds,
1059a16be3cdSMax Reitz                       BDRV_CHILD_DATA, &error_abort);
10604c8158e3SMax Reitz 
10614c8158e3SMax Reitz     /* This child will be the one to pass to requests through to, and
10624c8158e3SMax Reitz      * it will stall until a drain occurs */
10634c8158e3SMax Reitz     child_bs = bdrv_new_open_driver(&bdrv_test, "child", BDRV_O_RDWR,
10644c8158e3SMax Reitz                                     &error_abort);
10654c8158e3SMax Reitz     child_bs->total_sectors = 65536 >> BDRV_SECTOR_BITS;
10664c8158e3SMax Reitz     /* Takes our reference to child_bs */
1067a16be3cdSMax Reitz     tts->wait_child = bdrv_attach_child(bs, child_bs, "wait-child",
1068a16be3cdSMax Reitz                                         &child_of_bds,
1069a16be3cdSMax Reitz                                         BDRV_CHILD_DATA | BDRV_CHILD_PRIMARY,
1070a16be3cdSMax Reitz                                         &error_abort);
10714c8158e3SMax Reitz 
10724c8158e3SMax Reitz     /* This child is just there to be deleted
10734c8158e3SMax Reitz      * (for detach_instead_of_delete == true) */
10744c8158e3SMax Reitz     null_bs = bdrv_open("null-co://", NULL, NULL, BDRV_O_RDWR | BDRV_O_PROTOCOL,
10754c8158e3SMax Reitz                         &error_abort);
1076a16be3cdSMax Reitz     bdrv_attach_child(bs, null_bs, "null-child", &child_of_bds, BDRV_CHILD_DATA,
1077a16be3cdSMax Reitz                       &error_abort);
10784c8158e3SMax Reitz 
1079d861ab3aSKevin Wolf     blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
10804c8158e3SMax Reitz     blk_insert_bs(blk, bs, &error_abort);
10814c8158e3SMax Reitz 
10824c8158e3SMax Reitz     /* Referenced by blk now */
10834c8158e3SMax Reitz     bdrv_unref(bs);
10844c8158e3SMax Reitz 
10854c8158e3SMax Reitz     g_assert_cmpint(bs->refcnt, ==, 1);
10864c8158e3SMax Reitz     g_assert_cmpint(child_bs->refcnt, ==, 1);
10874c8158e3SMax Reitz     g_assert_cmpint(null_bs->refcnt, ==, 1);
10884c8158e3SMax Reitz 
10894c8158e3SMax Reitz 
10904c8158e3SMax Reitz     dbdd = (TestCoDeleteByDrainData){
10914c8158e3SMax Reitz         .blk = blk,
10924c8158e3SMax Reitz         .detach_instead_of_delete = detach_instead_of_delete,
10934c8158e3SMax Reitz         .done = false,
10944c8158e3SMax Reitz     };
10954c8158e3SMax Reitz     co = qemu_coroutine_create(test_co_delete_by_drain, &dbdd);
10964c8158e3SMax Reitz     qemu_coroutine_enter(co);
10974c8158e3SMax Reitz 
10984c8158e3SMax Reitz     /* Drain the child while the read operation is still pending.
10994c8158e3SMax Reitz      * This should result in the operation finishing and
11004c8158e3SMax Reitz      * test_co_delete_by_drain() resuming.  Thus, @bs will be deleted
11014c8158e3SMax Reitz      * and the coroutine will exit while this drain operation is still
11024c8158e3SMax Reitz      * in progress. */
1103ebd31837SKevin Wolf     switch (drain_type) {
1104ebd31837SKevin Wolf     case BDRV_DRAIN:
11054c8158e3SMax Reitz         bdrv_ref(child_bs);
11064c8158e3SMax Reitz         bdrv_drain(child_bs);
11074c8158e3SMax Reitz         bdrv_unref(child_bs);
1108ebd31837SKevin Wolf         break;
110919f7a7e5SKevin Wolf     case BDRV_DRAIN_ALL:
111019f7a7e5SKevin Wolf         bdrv_drain_all_begin();
111119f7a7e5SKevin Wolf         bdrv_drain_all_end();
111219f7a7e5SKevin Wolf         break;
1113ebd31837SKevin Wolf     default:
1114ebd31837SKevin Wolf         g_assert_not_reached();
1115ebd31837SKevin Wolf     }
11164c8158e3SMax Reitz 
11174c8158e3SMax Reitz     while (!dbdd.done) {
11184c8158e3SMax Reitz         aio_poll(qemu_get_aio_context(), true);
11194c8158e3SMax Reitz     }
11204c8158e3SMax Reitz 
11214c8158e3SMax Reitz     if (detach_instead_of_delete) {
11224c8158e3SMax Reitz         /* Here, the reference has not passed over to the coroutine,
11234c8158e3SMax Reitz          * so we have to delete the BB ourselves */
11244c8158e3SMax Reitz         blk_unref(blk);
11254c8158e3SMax Reitz     }
11264c8158e3SMax Reitz }
11274c8158e3SMax Reitz 
11284c8158e3SMax Reitz static void test_delete_by_drain(void)
11294c8158e3SMax Reitz {
1130ebd31837SKevin Wolf     do_test_delete_by_drain(false, BDRV_DRAIN);
11314c8158e3SMax Reitz }
11324c8158e3SMax Reitz 
113319f7a7e5SKevin Wolf static void test_detach_by_drain_all(void)
113419f7a7e5SKevin Wolf {
113519f7a7e5SKevin Wolf     do_test_delete_by_drain(true, BDRV_DRAIN_ALL);
113619f7a7e5SKevin Wolf }
113719f7a7e5SKevin Wolf 
11384c8158e3SMax Reitz static void test_detach_by_drain(void)
11394c8158e3SMax Reitz {
1140ebd31837SKevin Wolf     do_test_delete_by_drain(true, BDRV_DRAIN);
1141ebd31837SKevin Wolf }
1142ebd31837SKevin Wolf 
11434c8158e3SMax Reitz 
1144231281abSKevin Wolf struct detach_by_parent_data {
1145231281abSKevin Wolf     BlockDriverState *parent_b;
1146231281abSKevin Wolf     BdrvChild *child_b;
1147231281abSKevin Wolf     BlockDriverState *c;
1148231281abSKevin Wolf     BdrvChild *child_c;
114957320ca9SKevin Wolf     bool by_parent_cb;
1150617f3a96SKevin Wolf     bool detach_on_drain;
1151231281abSKevin Wolf };
115257320ca9SKevin Wolf static struct detach_by_parent_data detach_by_parent_data;
1153231281abSKevin Wolf 
115457320ca9SKevin Wolf static void detach_indirect_bh(void *opaque)
1155231281abSKevin Wolf {
1156231281abSKevin Wolf     struct detach_by_parent_data *data = opaque;
1157231281abSKevin Wolf 
1158617f3a96SKevin Wolf     bdrv_dec_in_flight(data->child_b->bs);
1159231281abSKevin Wolf     bdrv_unref_child(data->parent_b, data->child_b);
1160231281abSKevin Wolf 
1161231281abSKevin Wolf     bdrv_ref(data->c);
1162231281abSKevin Wolf     data->child_c = bdrv_attach_child(data->parent_b, data->c, "PB-C",
1163a16be3cdSMax Reitz                                       &child_of_bds, BDRV_CHILD_DATA,
1164a16be3cdSMax Reitz                                       &error_abort);
1165231281abSKevin Wolf }
1166231281abSKevin Wolf 
116757320ca9SKevin Wolf static void detach_by_parent_aio_cb(void *opaque, int ret)
116857320ca9SKevin Wolf {
116957320ca9SKevin Wolf     struct detach_by_parent_data *data = &detach_by_parent_data;
117057320ca9SKevin Wolf 
117157320ca9SKevin Wolf     g_assert_cmpint(ret, ==, 0);
117257320ca9SKevin Wolf     if (data->by_parent_cb) {
1173617f3a96SKevin Wolf         bdrv_inc_in_flight(data->child_b->bs);
117457320ca9SKevin Wolf         detach_indirect_bh(data);
117557320ca9SKevin Wolf     }
117657320ca9SKevin Wolf }
117757320ca9SKevin Wolf 
117857320ca9SKevin Wolf static void detach_by_driver_cb_drained_begin(BdrvChild *child)
117957320ca9SKevin Wolf {
1180617f3a96SKevin Wolf     struct detach_by_parent_data *data = &detach_by_parent_data;
1181617f3a96SKevin Wolf 
1182617f3a96SKevin Wolf     if (!data->detach_on_drain) {
1183617f3a96SKevin Wolf         return;
1184617f3a96SKevin Wolf     }
1185617f3a96SKevin Wolf     data->detach_on_drain = false;
1186617f3a96SKevin Wolf 
1187617f3a96SKevin Wolf     bdrv_inc_in_flight(data->child_b->bs);
118857320ca9SKevin Wolf     aio_bh_schedule_oneshot(qemu_get_current_aio_context(),
118957320ca9SKevin Wolf                             detach_indirect_bh, &detach_by_parent_data);
1190a16be3cdSMax Reitz     child_of_bds.drained_begin(child);
119157320ca9SKevin Wolf }
119257320ca9SKevin Wolf 
1193bd86fb99SMax Reitz static BdrvChildClass detach_by_driver_cb_class;
119457320ca9SKevin Wolf 
1195231281abSKevin Wolf /*
1196231281abSKevin Wolf  * Initial graph:
1197231281abSKevin Wolf  *
1198231281abSKevin Wolf  * PA     PB
1199231281abSKevin Wolf  *    \ /   \
1200231281abSKevin Wolf  *     A     B     C
1201231281abSKevin Wolf  *
120257320ca9SKevin Wolf  * by_parent_cb == true:  Test that parent callbacks don't poll
120357320ca9SKevin Wolf  *
120457320ca9SKevin Wolf  *     PA has a pending read request whose callback changes the child nodes of
120557320ca9SKevin Wolf  *     PB: It removes B and adds C instead. The subtree of PB is drained, which
120657320ca9SKevin Wolf  *     will indirectly drain the read request, too.
120757320ca9SKevin Wolf  *
120857320ca9SKevin Wolf  * by_parent_cb == false: Test that bdrv_drain_invoke() doesn't poll
120957320ca9SKevin Wolf  *
1210bd86fb99SMax Reitz  *     PA's BdrvChildClass has a .drained_begin callback that schedules a BH
121157320ca9SKevin Wolf  *     that does the same graph change. If bdrv_drain_invoke() calls it, the
121257320ca9SKevin Wolf  *     state is messed up, but if it is only polled in the single
121357320ca9SKevin Wolf  *     BDRV_POLL_WHILE() at the end of the drain, this should work fine.
1214231281abSKevin Wolf  */
121557320ca9SKevin Wolf static void test_detach_indirect(bool by_parent_cb)
1216231281abSKevin Wolf {
1217231281abSKevin Wolf     BlockBackend *blk;
1218231281abSKevin Wolf     BlockDriverState *parent_a, *parent_b, *a, *b, *c;
1219231281abSKevin Wolf     BdrvChild *child_a, *child_b;
1220231281abSKevin Wolf     BlockAIOCB *acb;
1221231281abSKevin Wolf 
1222405d8fe0SVladimir Sementsov-Ogievskiy     QEMUIOVector qiov = QEMU_IOVEC_INIT_BUF(qiov, NULL, 0);
1223231281abSKevin Wolf 
122457320ca9SKevin Wolf     if (!by_parent_cb) {
1225a16be3cdSMax Reitz         detach_by_driver_cb_class = child_of_bds;
1226bd86fb99SMax Reitz         detach_by_driver_cb_class.drained_begin =
122757320ca9SKevin Wolf             detach_by_driver_cb_drained_begin;
1228617f3a96SKevin Wolf         detach_by_driver_cb_class.drained_end = NULL;
1229617f3a96SKevin Wolf         detach_by_driver_cb_class.drained_poll = NULL;
123057320ca9SKevin Wolf     }
123157320ca9SKevin Wolf 
1232617f3a96SKevin Wolf     detach_by_parent_data = (struct detach_by_parent_data) {
1233617f3a96SKevin Wolf         .detach_on_drain = false,
1234617f3a96SKevin Wolf     };
1235617f3a96SKevin Wolf 
1236231281abSKevin Wolf     /* Create all involved nodes */
1237231281abSKevin Wolf     parent_a = bdrv_new_open_driver(&bdrv_test, "parent-a", BDRV_O_RDWR,
1238231281abSKevin Wolf                                     &error_abort);
1239231281abSKevin Wolf     parent_b = bdrv_new_open_driver(&bdrv_test, "parent-b", 0,
1240231281abSKevin Wolf                                     &error_abort);
1241231281abSKevin Wolf 
1242231281abSKevin Wolf     a = bdrv_new_open_driver(&bdrv_test, "a", BDRV_O_RDWR, &error_abort);
1243231281abSKevin Wolf     b = bdrv_new_open_driver(&bdrv_test, "b", BDRV_O_RDWR, &error_abort);
1244231281abSKevin Wolf     c = bdrv_new_open_driver(&bdrv_test, "c", BDRV_O_RDWR, &error_abort);
1245231281abSKevin Wolf 
1246231281abSKevin Wolf     /* blk is a BB for parent-a */
1247d861ab3aSKevin Wolf     blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
1248231281abSKevin Wolf     blk_insert_bs(blk, parent_a, &error_abort);
1249231281abSKevin Wolf     bdrv_unref(parent_a);
1250231281abSKevin Wolf 
125157320ca9SKevin Wolf     /* If we want to get bdrv_drain_invoke() to call aio_poll(), the driver
125257320ca9SKevin Wolf      * callback must not return immediately. */
125357320ca9SKevin Wolf     if (!by_parent_cb) {
125457320ca9SKevin Wolf         BDRVTestState *s = parent_a->opaque;
125557320ca9SKevin Wolf         s->sleep_in_drain_begin = true;
125657320ca9SKevin Wolf     }
125757320ca9SKevin Wolf 
1258231281abSKevin Wolf     /* Set child relationships */
1259231281abSKevin Wolf     bdrv_ref(b);
1260231281abSKevin Wolf     bdrv_ref(a);
1261a16be3cdSMax Reitz     child_b = bdrv_attach_child(parent_b, b, "PB-B", &child_of_bds,
1262a16be3cdSMax Reitz                                 BDRV_CHILD_DATA, &error_abort);
126325191e5fSMax Reitz     child_a = bdrv_attach_child(parent_b, a, "PB-A", &child_of_bds,
126425191e5fSMax Reitz                                 BDRV_CHILD_COW, &error_abort);
1265231281abSKevin Wolf 
1266231281abSKevin Wolf     bdrv_ref(a);
126757320ca9SKevin Wolf     bdrv_attach_child(parent_a, a, "PA-A",
1268a16be3cdSMax Reitz                       by_parent_cb ? &child_of_bds : &detach_by_driver_cb_class,
1269a16be3cdSMax Reitz                       BDRV_CHILD_DATA, &error_abort);
1270231281abSKevin Wolf 
1271231281abSKevin Wolf     g_assert_cmpint(parent_a->refcnt, ==, 1);
1272231281abSKevin Wolf     g_assert_cmpint(parent_b->refcnt, ==, 1);
1273231281abSKevin Wolf     g_assert_cmpint(a->refcnt, ==, 3);
1274231281abSKevin Wolf     g_assert_cmpint(b->refcnt, ==, 2);
1275231281abSKevin Wolf     g_assert_cmpint(c->refcnt, ==, 1);
1276231281abSKevin Wolf 
1277231281abSKevin Wolf     g_assert(QLIST_FIRST(&parent_b->children) == child_a);
1278231281abSKevin Wolf     g_assert(QLIST_NEXT(child_a, next) == child_b);
1279231281abSKevin Wolf     g_assert(QLIST_NEXT(child_b, next) == NULL);
1280231281abSKevin Wolf 
1281231281abSKevin Wolf     /* Start the evil write request */
128257320ca9SKevin Wolf     detach_by_parent_data = (struct detach_by_parent_data) {
1283231281abSKevin Wolf         .parent_b = parent_b,
1284231281abSKevin Wolf         .child_b = child_b,
1285231281abSKevin Wolf         .c = c,
128657320ca9SKevin Wolf         .by_parent_cb = by_parent_cb,
1287617f3a96SKevin Wolf         .detach_on_drain = true,
1288231281abSKevin Wolf     };
128957320ca9SKevin Wolf     acb = blk_aio_preadv(blk, 0, &qiov, 0, detach_by_parent_aio_cb, NULL);
1290231281abSKevin Wolf     g_assert(acb != NULL);
1291231281abSKevin Wolf 
1292231281abSKevin Wolf     /* Drain and check the expected result */
1293299403aeSKevin Wolf     bdrv_drained_begin(parent_b);
1294299403aeSKevin Wolf     bdrv_drained_begin(a);
1295299403aeSKevin Wolf     bdrv_drained_begin(b);
1296299403aeSKevin Wolf     bdrv_drained_begin(c);
1297231281abSKevin Wolf 
129857320ca9SKevin Wolf     g_assert(detach_by_parent_data.child_c != NULL);
1299231281abSKevin Wolf 
1300231281abSKevin Wolf     g_assert_cmpint(parent_a->refcnt, ==, 1);
1301231281abSKevin Wolf     g_assert_cmpint(parent_b->refcnt, ==, 1);
1302231281abSKevin Wolf     g_assert_cmpint(a->refcnt, ==, 3);
1303231281abSKevin Wolf     g_assert_cmpint(b->refcnt, ==, 1);
1304231281abSKevin Wolf     g_assert_cmpint(c->refcnt, ==, 2);
1305231281abSKevin Wolf 
130657320ca9SKevin Wolf     g_assert(QLIST_FIRST(&parent_b->children) == detach_by_parent_data.child_c);
130757320ca9SKevin Wolf     g_assert(QLIST_NEXT(detach_by_parent_data.child_c, next) == child_a);
1308231281abSKevin Wolf     g_assert(QLIST_NEXT(child_a, next) == NULL);
1309231281abSKevin Wolf 
1310231281abSKevin Wolf     g_assert_cmpint(parent_a->quiesce_counter, ==, 1);
1311299403aeSKevin Wolf     g_assert_cmpint(parent_b->quiesce_counter, ==, 3);
1312231281abSKevin Wolf     g_assert_cmpint(a->quiesce_counter, ==, 1);
1313299403aeSKevin Wolf     g_assert_cmpint(b->quiesce_counter, ==, 1);
1314231281abSKevin Wolf     g_assert_cmpint(c->quiesce_counter, ==, 1);
1315231281abSKevin Wolf 
1316299403aeSKevin Wolf     bdrv_drained_end(parent_b);
1317299403aeSKevin Wolf     bdrv_drained_end(a);
1318299403aeSKevin Wolf     bdrv_drained_end(b);
1319299403aeSKevin Wolf     bdrv_drained_end(c);
1320231281abSKevin Wolf 
1321231281abSKevin Wolf     bdrv_unref(parent_b);
1322231281abSKevin Wolf     blk_unref(blk);
1323231281abSKevin Wolf 
1324231281abSKevin Wolf     g_assert_cmpint(a->refcnt, ==, 1);
1325231281abSKevin Wolf     g_assert_cmpint(b->refcnt, ==, 1);
1326231281abSKevin Wolf     g_assert_cmpint(c->refcnt, ==, 1);
1327231281abSKevin Wolf     bdrv_unref(a);
1328231281abSKevin Wolf     bdrv_unref(b);
1329231281abSKevin Wolf     bdrv_unref(c);
1330231281abSKevin Wolf }
1331231281abSKevin Wolf 
133257320ca9SKevin Wolf static void test_detach_by_parent_cb(void)
133357320ca9SKevin Wolf {
133457320ca9SKevin Wolf     test_detach_indirect(true);
133557320ca9SKevin Wolf }
133657320ca9SKevin Wolf 
133757320ca9SKevin Wolf static void test_detach_by_driver_cb(void)
133857320ca9SKevin Wolf {
133957320ca9SKevin Wolf     test_detach_indirect(false);
134057320ca9SKevin Wolf }
1341231281abSKevin Wolf 
1342b994c5bcSKevin Wolf static void test_append_to_drained(void)
1343b994c5bcSKevin Wolf {
1344b994c5bcSKevin Wolf     BlockBackend *blk;
1345b994c5bcSKevin Wolf     BlockDriverState *base, *overlay;
1346b994c5bcSKevin Wolf     BDRVTestState *base_s, *overlay_s;
1347b994c5bcSKevin Wolf 
1348d861ab3aSKevin Wolf     blk = blk_new(qemu_get_aio_context(), BLK_PERM_ALL, BLK_PERM_ALL);
1349b994c5bcSKevin Wolf     base = bdrv_new_open_driver(&bdrv_test, "base", BDRV_O_RDWR, &error_abort);
1350b994c5bcSKevin Wolf     base_s = base->opaque;
1351b994c5bcSKevin Wolf     blk_insert_bs(blk, base, &error_abort);
1352b994c5bcSKevin Wolf 
1353b994c5bcSKevin Wolf     overlay = bdrv_new_open_driver(&bdrv_test, "overlay", BDRV_O_RDWR,
1354b994c5bcSKevin Wolf                                    &error_abort);
1355b994c5bcSKevin Wolf     overlay_s = overlay->opaque;
1356b994c5bcSKevin Wolf 
1357b994c5bcSKevin Wolf     do_drain_begin(BDRV_DRAIN, base);
1358b994c5bcSKevin Wolf     g_assert_cmpint(base->quiesce_counter, ==, 1);
1359b994c5bcSKevin Wolf     g_assert_cmpint(base_s->drain_count, ==, 1);
1360b994c5bcSKevin Wolf     g_assert_cmpint(base->in_flight, ==, 0);
1361b994c5bcSKevin Wolf 
1362*487b9187SKevin Wolf     aio_context_acquire(qemu_get_aio_context());
1363b994c5bcSKevin Wolf     bdrv_append(overlay, base, &error_abort);
1364*487b9187SKevin Wolf     aio_context_release(qemu_get_aio_context());
1365*487b9187SKevin Wolf 
1366b994c5bcSKevin Wolf     g_assert_cmpint(base->in_flight, ==, 0);
1367b994c5bcSKevin Wolf     g_assert_cmpint(overlay->in_flight, ==, 0);
1368b994c5bcSKevin Wolf 
1369b994c5bcSKevin Wolf     g_assert_cmpint(base->quiesce_counter, ==, 1);
1370b994c5bcSKevin Wolf     g_assert_cmpint(base_s->drain_count, ==, 1);
1371b994c5bcSKevin Wolf     g_assert_cmpint(overlay->quiesce_counter, ==, 1);
1372b994c5bcSKevin Wolf     g_assert_cmpint(overlay_s->drain_count, ==, 1);
1373b994c5bcSKevin Wolf 
1374b994c5bcSKevin Wolf     do_drain_end(BDRV_DRAIN, base);
1375b994c5bcSKevin Wolf 
1376b994c5bcSKevin Wolf     g_assert_cmpint(base->quiesce_counter, ==, 0);
1377b994c5bcSKevin Wolf     g_assert_cmpint(base_s->drain_count, ==, 0);
1378b994c5bcSKevin Wolf     g_assert_cmpint(overlay->quiesce_counter, ==, 0);
1379b994c5bcSKevin Wolf     g_assert_cmpint(overlay_s->drain_count, ==, 0);
1380b994c5bcSKevin Wolf 
1381ae9d4417SVladimir Sementsov-Ogievskiy     bdrv_unref(overlay);
1382b994c5bcSKevin Wolf     bdrv_unref(base);
1383b994c5bcSKevin Wolf     blk_unref(blk);
1384b994c5bcSKevin Wolf }
1385b994c5bcSKevin Wolf 
1386247d2737SKevin Wolf static void test_set_aio_context(void)
1387247d2737SKevin Wolf {
1388247d2737SKevin Wolf     BlockDriverState *bs;
1389247d2737SKevin Wolf     IOThread *a = iothread_new();
1390247d2737SKevin Wolf     IOThread *b = iothread_new();
1391247d2737SKevin Wolf     AioContext *ctx_a = iothread_get_aio_context(a);
1392247d2737SKevin Wolf     AioContext *ctx_b = iothread_get_aio_context(b);
1393247d2737SKevin Wolf 
1394247d2737SKevin Wolf     bs = bdrv_new_open_driver(&bdrv_test, "test-node", BDRV_O_RDWR,
1395247d2737SKevin Wolf                               &error_abort);
1396247d2737SKevin Wolf 
1397247d2737SKevin Wolf     bdrv_drained_begin(bs);
1398142e6907SEmanuele Giuseppe Esposito     bdrv_try_change_aio_context(bs, ctx_a, NULL, &error_abort);
1399247d2737SKevin Wolf 
1400247d2737SKevin Wolf     aio_context_acquire(ctx_a);
1401247d2737SKevin Wolf     bdrv_drained_end(bs);
1402247d2737SKevin Wolf 
1403247d2737SKevin Wolf     bdrv_drained_begin(bs);
1404142e6907SEmanuele Giuseppe Esposito     bdrv_try_change_aio_context(bs, ctx_b, NULL, &error_abort);
1405247d2737SKevin Wolf     aio_context_release(ctx_a);
1406247d2737SKevin Wolf     aio_context_acquire(ctx_b);
1407142e6907SEmanuele Giuseppe Esposito     bdrv_try_change_aio_context(bs, qemu_get_aio_context(), NULL, &error_abort);
1408247d2737SKevin Wolf     aio_context_release(ctx_b);
1409247d2737SKevin Wolf     bdrv_drained_end(bs);
1410247d2737SKevin Wolf 
1411247d2737SKevin Wolf     bdrv_unref(bs);
1412247d2737SKevin Wolf     iothread_join(a);
1413247d2737SKevin Wolf     iothread_join(b);
1414247d2737SKevin Wolf }
1415247d2737SKevin Wolf 
14168e442810SMax Reitz 
/*
 * Block job that idles until told to complete and whose .commit handler
 * removes the backing files of two nodes.
 */
14178e442810SMax Reitz typedef struct TestDropBackingBlockJob {
14188e442810SMax Reitz     BlockJob common;
    /* test_drop_backing_job_run() loops until this becomes true */
14198e442810SMax Reitz     bool should_complete;
    /* Set to true at the end of test_drop_backing_job_commit() */
14208e442810SMax Reitz     bool *did_complete;
    /* Second node whose backing file the commit handler removes */
14212afdc790SMax Reitz     BlockDriverState *detach_also;
    /* First node whose backing file the commit handler removes */
14221b177bbeSVladimir Sementsov-Ogievskiy     BlockDriverState *bs;
14238e442810SMax Reitz } TestDropBackingBlockJob;
14248e442810SMax Reitz 
14258e442810SMax Reitz static int coroutine_fn test_drop_backing_job_run(Job *job, Error **errp)
14268e442810SMax Reitz {
14278e442810SMax Reitz     TestDropBackingBlockJob *s =
14288e442810SMax Reitz         container_of(job, TestDropBackingBlockJob, common.job);
14298e442810SMax Reitz 
14308e442810SMax Reitz     while (!s->should_complete) {
14318e442810SMax Reitz         job_sleep_ns(job, 0);
14328e442810SMax Reitz     }
14338e442810SMax Reitz 
14348e442810SMax Reitz     return 0;
14358e442810SMax Reitz }
14368e442810SMax Reitz 
14378e442810SMax Reitz static void test_drop_backing_job_commit(Job *job)
14388e442810SMax Reitz {
14398e442810SMax Reitz     TestDropBackingBlockJob *s =
14408e442810SMax Reitz         container_of(job, TestDropBackingBlockJob, common.job);
14418e442810SMax Reitz 
14421b177bbeSVladimir Sementsov-Ogievskiy     bdrv_set_backing_hd(s->bs, NULL, &error_abort);
14432afdc790SMax Reitz     bdrv_set_backing_hd(s->detach_also, NULL, &error_abort);
14448e442810SMax Reitz 
14458e442810SMax Reitz     *s->did_complete = true;
14468e442810SMax Reitz }
14478e442810SMax Reitz 
/*
 * Job driver for TestDropBackingBlockJob: custom .run and .commit handlers,
 * everything else comes from the generic block job helpers.
 */
14488e442810SMax Reitz static const BlockJobDriver test_drop_backing_job_driver = {
14498e442810SMax Reitz     .job_driver = {
14508e442810SMax Reitz         .instance_size  = sizeof(TestDropBackingBlockJob),
14518e442810SMax Reitz         .free           = block_job_free,
14528e442810SMax Reitz         .user_resume    = block_job_user_resume,
14538e442810SMax Reitz         .run            = test_drop_backing_job_run,
14548e442810SMax Reitz         .commit         = test_drop_backing_job_commit,
14558e442810SMax Reitz     }
14568e442810SMax Reitz };
14578e442810SMax Reitz 
14588e442810SMax Reitz /**
14598e442810SMax Reitz  * Creates a child node with three parent nodes on it, and then runs a
14608e442810SMax Reitz  * block job on the final one, parent-node-2.
14618e442810SMax Reitz  *
14628e442810SMax Reitz  * The job is then asked to complete before a section where the child
14638e442810SMax Reitz  * is drained.
14648e442810SMax Reitz  *
14658e442810SMax Reitz  * Ending this section will undrain the child's parents, first
14668e442810SMax Reitz  * parent-node-2, then parent-node-1, then parent-node-0 -- the parent
14678e442810SMax Reitz  * list is in reverse order of how they were added.  Ending the drain
14688e442810SMax Reitz  * on parent-node-2 will resume the job, thus completing it and
14698e442810SMax Reitz  * scheduling job_exit().
14708e442810SMax Reitz  *
14718e442810SMax Reitz  * Ending the drain on parent-node-1 will poll the AioContext, which
14728e442810SMax Reitz  * lets job_exit() and thus test_drop_backing_job_commit() run.  That
14732afdc790SMax Reitz  * function first removes the child as parent-node-2's backing file.
14748e442810SMax Reitz  *
14758e442810SMax Reitz  * In old (and buggy) implementations, there are two problems with
14768e442810SMax Reitz  * that:
14778e442810SMax Reitz  * (A) bdrv_drain_invoke() polls for every node that leaves the
14788e442810SMax Reitz  *     drained section.  This means that job_exit() is scheduled
14798e442810SMax Reitz  *     before the child has left the drained section.  Its
14808e442810SMax Reitz  *     quiesce_counter is therefore still 1 when it is removed from
14818e442810SMax Reitz  *     parent-node-2.
14828e442810SMax Reitz  *
14838e442810SMax Reitz  * (B) bdrv_replace_child_noperm() calls drained_end() on the old
14848e442810SMax Reitz  *     child's parents as many times as the child is quiesced.  This
14858e442810SMax Reitz  *     means it will call drained_end() on parent-node-2 once.
14868e442810SMax Reitz  *     Because parent-node-2 is no longer quiesced at this point, this
14878e442810SMax Reitz  *     will fail.
14888e442810SMax Reitz  *
14898e442810SMax Reitz  * bdrv_replace_child_noperm() therefore must call drained_end() on
14908e442810SMax Reitz  * the parent only if it really is still drained because the child is
14918e442810SMax Reitz  * drained.
14922afdc790SMax Reitz  *
14932afdc790SMax Reitz  * If removing child from parent-node-2 was successful (as it should
14942afdc790SMax Reitz  * be), test_drop_backing_job_commit() will then also remove the child
14952afdc790SMax Reitz  * from parent-node-0.
14962afdc790SMax Reitz  *
14972afdc790SMax Reitz  * With an old version of our drain infrastructure ((A) above), that
14982afdc790SMax Reitz  * resulted in the following flow:
14992afdc790SMax Reitz  *
15002afdc790SMax Reitz  * 1. child attempts to leave its drained section.  The call recurses
15012afdc790SMax Reitz  *    to its parents.
15022afdc790SMax Reitz  *
15032afdc790SMax Reitz  * 2. parent-node-2 leaves the drained section.  Polling in
15042afdc790SMax Reitz  *    bdrv_drain_invoke() will schedule job_exit().
15052afdc790SMax Reitz  *
15062afdc790SMax Reitz  * 3. parent-node-1 leaves the drained section.  Polling in
15072afdc790SMax Reitz  *    bdrv_drain_invoke() will run job_exit(), thus disconnecting
15082afdc790SMax Reitz  *    parent-node-0 from the child node.
15092afdc790SMax Reitz  *
15102afdc790SMax Reitz  * 4. bdrv_parent_drained_end() uses a QLIST_FOREACH_SAFE() loop to
15112afdc790SMax Reitz  *    iterate over the parents.  Thus, it now accesses the BdrvChild
15122afdc790SMax Reitz  *    object that used to connect parent-node-0 and the child node.
15132afdc790SMax Reitz  *    However, that object no longer exists, so it accesses a dangling
15142afdc790SMax Reitz  *    pointer.
15152afdc790SMax Reitz  *
15162afdc790SMax Reitz  * The solution is to only poll once when running a bdrv_drained_end()
15172afdc790SMax Reitz  * operation, specifically at the end when all drained_end()
15182afdc790SMax Reitz  * operations for all involved nodes have been scheduled.
15192afdc790SMax Reitz  * Note that this also solves (A) above, thus hiding (B).
15208e442810SMax Reitz  */
15218e442810SMax Reitz static void test_blockjob_commit_by_drained_end(void)
15228e442810SMax Reitz {
15238e442810SMax Reitz     BlockDriverState *bs_child, *bs_parents[3];
15248e442810SMax Reitz     TestDropBackingBlockJob *job;
15258e442810SMax Reitz     bool job_has_completed = false;
15268e442810SMax Reitz     int i;
15278e442810SMax Reitz 
15288e442810SMax Reitz     bs_child = bdrv_new_open_driver(&bdrv_test, "child-node", BDRV_O_RDWR,
15298e442810SMax Reitz                                     &error_abort);
15308e442810SMax Reitz 
15318e442810SMax Reitz     for (i = 0; i < 3; i++) {
15328e442810SMax Reitz         char name[32];
15338e442810SMax Reitz         snprintf(name, sizeof(name), "parent-node-%i", i);
15348e442810SMax Reitz         bs_parents[i] = bdrv_new_open_driver(&bdrv_test, name, BDRV_O_RDWR,
15358e442810SMax Reitz                                              &error_abort);
15368e442810SMax Reitz         bdrv_set_backing_hd(bs_parents[i], bs_child, &error_abort);
15378e442810SMax Reitz     }
15388e442810SMax Reitz 
15398e442810SMax Reitz     job = block_job_create("job", &test_drop_backing_job_driver, NULL,
15408e442810SMax Reitz                            bs_parents[2], 0, BLK_PERM_ALL, 0, 0, NULL, NULL,
15418e442810SMax Reitz                            &error_abort);
15421b177bbeSVladimir Sementsov-Ogievskiy     job->bs = bs_parents[2];
15438e442810SMax Reitz 
15442afdc790SMax Reitz     job->detach_also = bs_parents[0];
15458e442810SMax Reitz     job->did_complete = &job_has_completed;
15468e442810SMax Reitz 
15478e442810SMax Reitz     job_start(&job->common.job);
15488e442810SMax Reitz 
15498e442810SMax Reitz     job->should_complete = true;
15508e442810SMax Reitz     bdrv_drained_begin(bs_child);
15518e442810SMax Reitz     g_assert(!job_has_completed);
15528e442810SMax Reitz     bdrv_drained_end(bs_child);
15535e8ac217SKevin Wolf     aio_poll(qemu_get_aio_context(), false);
15548e442810SMax Reitz     g_assert(job_has_completed);
15558e442810SMax Reitz 
15568e442810SMax Reitz     bdrv_unref(bs_parents[0]);
15578e442810SMax Reitz     bdrv_unref(bs_parents[1]);
15588e442810SMax Reitz     bdrv_unref(bs_parents[2]);
15598e442810SMax Reitz     bdrv_unref(bs_child);
15608e442810SMax Reitz }
15618e442810SMax Reitz 
15629746b35cSMax Reitz 
/* Block job that idles until told to complete and reports when it is cleaned */
15639746b35cSMax Reitz typedef struct TestSimpleBlockJob {
15649746b35cSMax Reitz     BlockJob common;
    /* test_simple_job_run() loops until this becomes true */
15659746b35cSMax Reitz     bool should_complete;
    /* Set to true by test_simple_job_clean() */
15669746b35cSMax Reitz     bool *did_complete;
15679746b35cSMax Reitz } TestSimpleBlockJob;
15689746b35cSMax Reitz 
15699746b35cSMax Reitz static int coroutine_fn test_simple_job_run(Job *job, Error **errp)
15709746b35cSMax Reitz {
15719746b35cSMax Reitz     TestSimpleBlockJob *s = container_of(job, TestSimpleBlockJob, common.job);
15729746b35cSMax Reitz 
15739746b35cSMax Reitz     while (!s->should_complete) {
15749746b35cSMax Reitz         job_sleep_ns(job, 0);
15759746b35cSMax Reitz     }
15769746b35cSMax Reitz 
15779746b35cSMax Reitz     return 0;
15789746b35cSMax Reitz }
15799746b35cSMax Reitz 
15809746b35cSMax Reitz static void test_simple_job_clean(Job *job)
15819746b35cSMax Reitz {
15829746b35cSMax Reitz     TestSimpleBlockJob *s = container_of(job, TestSimpleBlockJob, common.job);
15839746b35cSMax Reitz     *s->did_complete = true;
15849746b35cSMax Reitz }
15859746b35cSMax Reitz 
/*
 * Job driver for TestSimpleBlockJob: custom .run and .clean handlers,
 * everything else comes from the generic block job helpers.
 */
15869746b35cSMax Reitz static const BlockJobDriver test_simple_job_driver = {
15879746b35cSMax Reitz     .job_driver = {
15889746b35cSMax Reitz         .instance_size  = sizeof(TestSimpleBlockJob),
15899746b35cSMax Reitz         .free           = block_job_free,
15909746b35cSMax Reitz         .user_resume    = block_job_user_resume,
15919746b35cSMax Reitz         .run            = test_simple_job_run,
15929746b35cSMax Reitz         .clean          = test_simple_job_clean,
15939746b35cSMax Reitz     },
15949746b35cSMax Reitz };
15959746b35cSMax Reitz 
15969746b35cSMax Reitz static int drop_intermediate_poll_update_filename(BdrvChild *child,
15979746b35cSMax Reitz                                                   BlockDriverState *new_base,
15989746b35cSMax Reitz                                                   const char *filename,
15999746b35cSMax Reitz                                                   Error **errp)
16009746b35cSMax Reitz {
16019746b35cSMax Reitz     /*
16029746b35cSMax Reitz      * We are free to poll here, which may change the block graph, if
16039746b35cSMax Reitz      * it is not drained.
16049746b35cSMax Reitz      */
16059746b35cSMax Reitz 
16069746b35cSMax Reitz     /* If the job is not drained: Complete it, schedule job_exit() */
16079746b35cSMax Reitz     aio_poll(qemu_get_current_aio_context(), false);
16089746b35cSMax Reitz     /* If the job is not drained: Run job_exit(), finish the job */
16099746b35cSMax Reitz     aio_poll(qemu_get_current_aio_context(), false);
16109746b35cSMax Reitz 
16119746b35cSMax Reitz     return 0;
16129746b35cSMax Reitz }
16139746b35cSMax Reitz 
16149746b35cSMax Reitz /**
16159746b35cSMax Reitz  * Test a poll in the midst of bdrv_drop_intermediate().
16169746b35cSMax Reitz  *
1617bd86fb99SMax Reitz  * bdrv_drop_intermediate() calls BdrvChildClass.update_filename(),
16189746b35cSMax Reitz  * which can yield or poll.  This may lead to graph changes, unless
16199746b35cSMax Reitz  * the whole subtree in question is drained.
16209746b35cSMax Reitz  *
16219746b35cSMax Reitz  * We test this on the following graph:
16229746b35cSMax Reitz  *
16239746b35cSMax Reitz  *                    Job
16249746b35cSMax Reitz  *
16259746b35cSMax Reitz  *                     |
16269746b35cSMax Reitz  *                  job-node
16279746b35cSMax Reitz  *                     |
16289746b35cSMax Reitz  *                     v
16299746b35cSMax Reitz  *
16309746b35cSMax Reitz  *                  job-node
16319746b35cSMax Reitz  *
16329746b35cSMax Reitz  *                     |
16339746b35cSMax Reitz  *                  backing
16349746b35cSMax Reitz  *                     |
16359746b35cSMax Reitz  *                     v
16369746b35cSMax Reitz  *
16379746b35cSMax Reitz  * node-2 --chain--> node-1 --chain--> node-0
16389746b35cSMax Reitz  *
16399746b35cSMax Reitz  * We drop node-1 with bdrv_drop_intermediate(top=node-1, base=node-0).
16409746b35cSMax Reitz  *
16419746b35cSMax Reitz  * This first updates node-2's backing filename by invoking
16429746b35cSMax Reitz  * drop_intermediate_poll_update_filename(), which polls twice.  This
16439746b35cSMax Reitz  * causes the job to finish, which in turn causes the job-node to be
16449746b35cSMax Reitz  * deleted.
16459746b35cSMax Reitz  *
16469746b35cSMax Reitz  * bdrv_drop_intermediate() uses a QLIST_FOREACH_SAFE() loop, so it
16479746b35cSMax Reitz  * already has a pointer to the BdrvChild edge between job-node and
16489746b35cSMax Reitz  * node-1.  When it tries to handle that edge, we probably get a
16499746b35cSMax Reitz  * segmentation fault because the object no longer exists.
16509746b35cSMax Reitz  *
16519746b35cSMax Reitz  *
16529746b35cSMax Reitz  * The solution is for bdrv_drop_intermediate() to drain top's
16539746b35cSMax Reitz  * subtree.  This prevents graph changes from happening just because
1654bd86fb99SMax Reitz  * BdrvChildClass.update_filename() yields or polls.  Thus, the block
16559746b35cSMax Reitz  * job is paused during that drained section and must finish before or
16569746b35cSMax Reitz  * after.
16579746b35cSMax Reitz  *
16589746b35cSMax Reitz  * (In addition, bdrv_replace_child() must keep the job paused.)
16599746b35cSMax Reitz  */
16609746b35cSMax Reitz static void test_drop_intermediate_poll(void)
16619746b35cSMax Reitz {
1662bd86fb99SMax Reitz     static BdrvChildClass chain_child_class;
16639746b35cSMax Reitz     BlockDriverState *chain[3];
16649746b35cSMax Reitz     TestSimpleBlockJob *job;
16659746b35cSMax Reitz     BlockDriverState *job_node;
16669746b35cSMax Reitz     bool job_has_completed = false;
16679746b35cSMax Reitz     int i;
16689746b35cSMax Reitz     int ret;
16699746b35cSMax Reitz 
167025191e5fSMax Reitz     chain_child_class = child_of_bds;
1671bd86fb99SMax Reitz     chain_child_class.update_filename = drop_intermediate_poll_update_filename;
16729746b35cSMax Reitz 
16739746b35cSMax Reitz     for (i = 0; i < 3; i++) {
16749746b35cSMax Reitz         char name[32];
16759746b35cSMax Reitz         snprintf(name, 32, "node-%i", i);
16769746b35cSMax Reitz 
16779746b35cSMax Reitz         chain[i] = bdrv_new_open_driver(&bdrv_test, name, 0, &error_abort);
16789746b35cSMax Reitz     }
16799746b35cSMax Reitz 
16809746b35cSMax Reitz     job_node = bdrv_new_open_driver(&bdrv_test, "job-node", BDRV_O_RDWR,
16819746b35cSMax Reitz                                     &error_abort);
16829746b35cSMax Reitz     bdrv_set_backing_hd(job_node, chain[1], &error_abort);
16839746b35cSMax Reitz 
16849746b35cSMax Reitz     /*
16859746b35cSMax Reitz      * Establish the chain last, so the chain links are the first
16869746b35cSMax Reitz      * elements in the BDS.parents lists
16879746b35cSMax Reitz      */
16889746b35cSMax Reitz     for (i = 0; i < 3; i++) {
16899746b35cSMax Reitz         if (i) {
16909746b35cSMax Reitz             /* Takes the reference to chain[i - 1] */
16915bb04747SVladimir Sementsov-Ogievskiy             bdrv_attach_child(chain[i], chain[i - 1], "chain",
16925bb04747SVladimir Sementsov-Ogievskiy                               &chain_child_class, BDRV_CHILD_COW, &error_abort);
16939746b35cSMax Reitz         }
16949746b35cSMax Reitz     }
16959746b35cSMax Reitz 
16969746b35cSMax Reitz     job = block_job_create("job", &test_simple_job_driver, NULL, job_node,
16979746b35cSMax Reitz                            0, BLK_PERM_ALL, 0, 0, NULL, NULL, &error_abort);
16989746b35cSMax Reitz 
16999746b35cSMax Reitz     /* The job has a reference now */
17009746b35cSMax Reitz     bdrv_unref(job_node);
17019746b35cSMax Reitz 
17029746b35cSMax Reitz     job->did_complete = &job_has_completed;
17039746b35cSMax Reitz 
17049746b35cSMax Reitz     job_start(&job->common.job);
17059746b35cSMax Reitz     job->should_complete = true;
17069746b35cSMax Reitz 
17079746b35cSMax Reitz     g_assert(!job_has_completed);
17089746b35cSMax Reitz     ret = bdrv_drop_intermediate(chain[1], chain[0], NULL);
17095e8ac217SKevin Wolf     aio_poll(qemu_get_aio_context(), false);
17109746b35cSMax Reitz     g_assert(ret == 0);
17119746b35cSMax Reitz     g_assert(job_has_completed);
17129746b35cSMax Reitz 
17139746b35cSMax Reitz     bdrv_unref(chain[2]);
17149746b35cSMax Reitz }
17159746b35cSMax Reitz 
17160513f984SMax Reitz 
/* Per-node state of the replace-test driver */
17170513f984SMax Reitz typedef struct BDRVReplaceTestState {
    /* While false, bdrv_replace_test_drain_begin() returns immediately */
171823987471SKevin Wolf     bool setup_completed;
    /* Set by bdrv_replace_test_drain_begin() when a first drain begins */
17190513f984SMax Reitz     bool was_drained;
    /* NOTE(review): presumably set by the matching drain_end -- confirm */
17200513f984SMax Reitz     bool was_undrained;
    /* Set by bdrv_replace_test_co_preadv() once a read has been handled */
17210513f984SMax Reitz     bool has_read;
17220513f984SMax Reitz 
    /* Incremented by bdrv_replace_test_drain_begin() */
17230513f984SMax Reitz     int drain_count;
17240513f984SMax Reitz 
    /* Makes the next read with a backing child yield once; then cleared */
17250513f984SMax Reitz     bool yield_before_read;
    /* Read coroutine while it may be parked; woken by drain_co */
17260513f984SMax Reitz     Coroutine *io_co;
    /* Coroutine created by drain_begin; woken when a read has finished */
17270513f984SMax Reitz     Coroutine *drain_co;
17280513f984SMax Reitz } BDRVReplaceTestState;
17290513f984SMax Reitz 
/* Close handler of the replace-test driver; intentionally does nothing */
17300513f984SMax Reitz static void bdrv_replace_test_close(BlockDriverState *bs)
17310513f984SMax Reitz {
17320513f984SMax Reitz }
17330513f984SMax Reitz 
17340513f984SMax Reitz /**
17350513f984SMax Reitz  * If @bs has a backing file:
17360513f984SMax Reitz  *   Yield if .yield_before_read is true (and wait for drain_begin to
17370513f984SMax Reitz  *   wake us up).
17380513f984SMax Reitz  *   Forward the read to bs->backing.  Set .has_read to true.
17390513f984SMax Reitz  *   If drain_begin has woken us, wake it in turn.
17400513f984SMax Reitz  *
17410513f984SMax Reitz  * Otherwise:
17420513f984SMax Reitz  *   Set .has_read to true and return success.
17430513f984SMax Reitz  */
1744b9b10c35SKevin Wolf static int coroutine_fn GRAPH_RDLOCK
1745b9b10c35SKevin Wolf bdrv_replace_test_co_preadv(BlockDriverState *bs, int64_t offset, int64_t bytes,
1746b9b10c35SKevin Wolf                             QEMUIOVector *qiov, BdrvRequestFlags flags)
17470513f984SMax Reitz {
17480513f984SMax Reitz     BDRVReplaceTestState *s = bs->opaque;
17490513f984SMax Reitz 
17500513f984SMax Reitz     if (bs->backing) {
17510513f984SMax Reitz         int ret;
17520513f984SMax Reitz 
17530513f984SMax Reitz         g_assert(!s->drain_count);
17540513f984SMax Reitz 
17550513f984SMax Reitz         s->io_co = qemu_coroutine_self();
17560513f984SMax Reitz         if (s->yield_before_read) {
17570513f984SMax Reitz             s->yield_before_read = false;
17580513f984SMax Reitz             qemu_coroutine_yield();
17590513f984SMax Reitz         }
17600513f984SMax Reitz         s->io_co = NULL;
17610513f984SMax Reitz 
1762fae2681aSVladimir Sementsov-Ogievskiy         ret = bdrv_co_preadv(bs->backing, offset, bytes, qiov, 0);
17630513f984SMax Reitz         s->has_read = true;
17640513f984SMax Reitz 
17650513f984SMax Reitz         /* Wake up drain_co if it runs */
17660513f984SMax Reitz         if (s->drain_co) {
17670513f984SMax Reitz             aio_co_wake(s->drain_co);
17680513f984SMax Reitz         }
17690513f984SMax Reitz 
17700513f984SMax Reitz         return ret;
17710513f984SMax Reitz     }
17720513f984SMax Reitz 
17730513f984SMax Reitz     s->has_read = true;
17740513f984SMax Reitz     return 0;
17750513f984SMax Reitz }
17760513f984SMax Reitz 
17777bce1c29SKevin Wolf static void coroutine_fn bdrv_replace_test_drain_co(void *opaque)
17787bce1c29SKevin Wolf {
17797bce1c29SKevin Wolf     BlockDriverState *bs = opaque;
17807bce1c29SKevin Wolf     BDRVReplaceTestState *s = bs->opaque;
17817bce1c29SKevin Wolf 
17827bce1c29SKevin Wolf     /* Keep waking io_co up until it is done */
17837bce1c29SKevin Wolf     while (s->io_co) {
17847bce1c29SKevin Wolf         aio_co_wake(s->io_co);
17857bce1c29SKevin Wolf         s->io_co = NULL;
17867bce1c29SKevin Wolf         qemu_coroutine_yield();
17877bce1c29SKevin Wolf     }
17887bce1c29SKevin Wolf     s->drain_co = NULL;
17897bce1c29SKevin Wolf     bdrv_dec_in_flight(bs);
17907bce1c29SKevin Wolf }
17917bce1c29SKevin Wolf 
17920513f984SMax Reitz /**
17930513f984SMax Reitz  * If .drain_count is 0, wake up .io_co if there is one; and set
17940513f984SMax Reitz  * .was_drained.
17950513f984SMax Reitz  * Increment .drain_count.
17960513f984SMax Reitz  */
17975e8ac217SKevin Wolf static void bdrv_replace_test_drain_begin(BlockDriverState *bs)
17980513f984SMax Reitz {
17990513f984SMax Reitz     BDRVReplaceTestState *s = bs->opaque;
18000513f984SMax Reitz 
180123987471SKevin Wolf     if (!s->setup_completed) {
180223987471SKevin Wolf         return;
180323987471SKevin Wolf     }
180423987471SKevin Wolf 
18050513f984SMax Reitz     if (!s->drain_count) {
18067bce1c29SKevin Wolf         s->drain_co = qemu_coroutine_create(bdrv_replace_test_drain_co, bs);
18077bce1c29SKevin Wolf         bdrv_inc_in_flight(bs);
18087bce1c29SKevin Wolf         aio_co_enter(bdrv_get_aio_context(bs), s->drain_co);
18090513f984SMax Reitz         s->was_drained = true;
18100513f984SMax Reitz     }
18110513f984SMax Reitz     s->drain_count++;
18120513f984SMax Reitz }
18130513f984SMax Reitz 
18147bce1c29SKevin Wolf static void coroutine_fn bdrv_replace_test_read_entry(void *opaque)
18157bce1c29SKevin Wolf {
18167bce1c29SKevin Wolf     BlockDriverState *bs = opaque;
18177bce1c29SKevin Wolf     char data;
18187bce1c29SKevin Wolf     QEMUIOVector qiov = QEMU_IOVEC_INIT_BUF(qiov, &data, 1);
18197bce1c29SKevin Wolf     int ret;
18207bce1c29SKevin Wolf 
18217bce1c29SKevin Wolf     /* Queue a read request post-drain */
1822b9b10c35SKevin Wolf     bdrv_graph_co_rdlock();
18237bce1c29SKevin Wolf     ret = bdrv_replace_test_co_preadv(bs, 0, 1, &qiov, 0);
1824b9b10c35SKevin Wolf     bdrv_graph_co_rdunlock();
1825b9b10c35SKevin Wolf 
18267bce1c29SKevin Wolf     g_assert(ret >= 0);
18277bce1c29SKevin Wolf     bdrv_dec_in_flight(bs);
18287bce1c29SKevin Wolf }
18297bce1c29SKevin Wolf 
18300513f984SMax Reitz /**
18310513f984SMax Reitz  * Reduce .drain_count, set .was_undrained once it reaches 0.
18320513f984SMax Reitz  * If .drain_count reaches 0 and the node has a backing file, issue a
18330513f984SMax Reitz  * read request.
18340513f984SMax Reitz  */
18355e8ac217SKevin Wolf static void bdrv_replace_test_drain_end(BlockDriverState *bs)
18360513f984SMax Reitz {
18370513f984SMax Reitz     BDRVReplaceTestState *s = bs->opaque;
18380513f984SMax Reitz 
183923987471SKevin Wolf     if (!s->setup_completed) {
184023987471SKevin Wolf         return;
184123987471SKevin Wolf     }
184223987471SKevin Wolf 
18430513f984SMax Reitz     g_assert(s->drain_count > 0);
18440513f984SMax Reitz     if (!--s->drain_count) {
18450513f984SMax Reitz         s->was_undrained = true;
18460513f984SMax Reitz 
18470513f984SMax Reitz         if (bs->backing) {
18487bce1c29SKevin Wolf             Coroutine *co = qemu_coroutine_create(bdrv_replace_test_read_entry,
18497bce1c29SKevin Wolf                                                   bs);
18507bce1c29SKevin Wolf             bdrv_inc_in_flight(bs);
18517bce1c29SKevin Wolf             aio_co_enter(bdrv_get_aio_context(bs), co);
18520513f984SMax Reitz         }
18530513f984SMax Reitz     }
18540513f984SMax Reitz }
18550513f984SMax Reitz 
18560513f984SMax Reitz static BlockDriver bdrv_replace_test = {
18570513f984SMax Reitz     .format_name            = "replace_test",
18580513f984SMax Reitz     .instance_size          = sizeof(BDRVReplaceTestState),
18599ebfc111SVladimir Sementsov-Ogievskiy     .supports_backing       = true,
18600513f984SMax Reitz 
18610513f984SMax Reitz     .bdrv_close             = bdrv_replace_test_close,
18620513f984SMax Reitz     .bdrv_co_preadv         = bdrv_replace_test_co_preadv,
18630513f984SMax Reitz 
18645e8ac217SKevin Wolf     .bdrv_drain_begin       = bdrv_replace_test_drain_begin,
18655e8ac217SKevin Wolf     .bdrv_drain_end         = bdrv_replace_test_drain_end,
18660513f984SMax Reitz 
186769dca43dSMax Reitz     .bdrv_child_perm        = bdrv_default_perms,
18680513f984SMax Reitz };
18690513f984SMax Reitz 
18700513f984SMax Reitz static void coroutine_fn test_replace_child_mid_drain_read_co(void *opaque)
18710513f984SMax Reitz {
18720513f984SMax Reitz     int ret;
18730513f984SMax Reitz     char data;
18740513f984SMax Reitz 
18750513f984SMax Reitz     ret = blk_co_pread(opaque, 0, 1, &data, 0);
18760513f984SMax Reitz     g_assert(ret >= 0);
18770513f984SMax Reitz }
18780513f984SMax Reitz 
18790513f984SMax Reitz /**
18800513f984SMax Reitz  * We test two things:
18810513f984SMax Reitz  * (1) bdrv_replace_child_noperm() must not undrain the parent if both
18820513f984SMax Reitz  *     children are drained.
18830513f984SMax Reitz  * (2) bdrv_replace_child_noperm() must never flush I/O requests to a
18840513f984SMax Reitz  *     drained child.  If the old child is drained, it must flush I/O
18850513f984SMax Reitz  *     requests after the new one has been attached.  If the new child
18860513f984SMax Reitz  *     is drained, it must flush I/O requests before the old one is
18870513f984SMax Reitz  *     detached.
18880513f984SMax Reitz  *
18890513f984SMax Reitz  * To do so, we create one parent node and two child nodes; then
18900513f984SMax Reitz  * attach one of the children (old_child_bs) to the parent, then
18910513f984SMax Reitz  * drain both old_child_bs and new_child_bs according to
18920513f984SMax Reitz  * old_drain_count and new_drain_count, respectively, and finally
18930513f984SMax Reitz  * we invoke bdrv_replace_node() to replace old_child_bs by
18940513f984SMax Reitz  * new_child_bs.
18950513f984SMax Reitz  *
18960513f984SMax Reitz  * The test block driver we use here (bdrv_replace_test) has a read
18970513f984SMax Reitz  * function that:
18980513f984SMax Reitz  * - For the parent node, can optionally yield, and then forwards the
18990513f984SMax Reitz  *   read to bdrv_preadv(),
19000513f984SMax Reitz  * - For the child node, just returns immediately.
19010513f984SMax Reitz  *
19020513f984SMax Reitz  * If the read yields, the drain_begin function will wake it up.
19030513f984SMax Reitz  *
19040513f984SMax Reitz  * The drain_end function issues a read on the parent once it is fully
19050513f984SMax Reitz  * undrained (which simulates requests starting to come in again).
19060513f984SMax Reitz  */
19070513f984SMax Reitz static void do_test_replace_child_mid_drain(int old_drain_count,
19080513f984SMax Reitz                                             int new_drain_count)
19090513f984SMax Reitz {
19100513f984SMax Reitz     BlockBackend *parent_blk;
19110513f984SMax Reitz     BlockDriverState *parent_bs;
19120513f984SMax Reitz     BlockDriverState *old_child_bs, *new_child_bs;
19130513f984SMax Reitz     BDRVReplaceTestState *parent_s;
19140513f984SMax Reitz     BDRVReplaceTestState *old_child_s, *new_child_s;
19150513f984SMax Reitz     Coroutine *io_co;
19160513f984SMax Reitz     int i;
19170513f984SMax Reitz 
19180513f984SMax Reitz     parent_bs = bdrv_new_open_driver(&bdrv_replace_test, "parent", 0,
19190513f984SMax Reitz                                      &error_abort);
19200513f984SMax Reitz     parent_s = parent_bs->opaque;
19210513f984SMax Reitz 
19220513f984SMax Reitz     parent_blk = blk_new(qemu_get_aio_context(),
19230513f984SMax Reitz                          BLK_PERM_CONSISTENT_READ, BLK_PERM_ALL);
19240513f984SMax Reitz     blk_insert_bs(parent_blk, parent_bs, &error_abort);
19250513f984SMax Reitz 
19260513f984SMax Reitz     old_child_bs = bdrv_new_open_driver(&bdrv_replace_test, "old-child", 0,
19270513f984SMax Reitz                                         &error_abort);
19280513f984SMax Reitz     new_child_bs = bdrv_new_open_driver(&bdrv_replace_test, "new-child", 0,
19290513f984SMax Reitz                                         &error_abort);
19300513f984SMax Reitz     old_child_s = old_child_bs->opaque;
19310513f984SMax Reitz     new_child_s = new_child_bs->opaque;
19320513f984SMax Reitz 
19330513f984SMax Reitz     /* So that we can read something */
19340513f984SMax Reitz     parent_bs->total_sectors = 1;
19350513f984SMax Reitz     old_child_bs->total_sectors = 1;
19360513f984SMax Reitz     new_child_bs->total_sectors = 1;
19370513f984SMax Reitz 
19380513f984SMax Reitz     bdrv_ref(old_child_bs);
19395bb04747SVladimir Sementsov-Ogievskiy     bdrv_attach_child(parent_bs, old_child_bs, "child", &child_of_bds,
19405bb04747SVladimir Sementsov-Ogievskiy                       BDRV_CHILD_COW, &error_abort);
194123987471SKevin Wolf     parent_s->setup_completed = true;
19420513f984SMax Reitz 
19430513f984SMax Reitz     for (i = 0; i < old_drain_count; i++) {
19440513f984SMax Reitz         bdrv_drained_begin(old_child_bs);
19450513f984SMax Reitz     }
19460513f984SMax Reitz     for (i = 0; i < new_drain_count; i++) {
19470513f984SMax Reitz         bdrv_drained_begin(new_child_bs);
19480513f984SMax Reitz     }
19490513f984SMax Reitz 
19500513f984SMax Reitz     if (!old_drain_count) {
19510513f984SMax Reitz         /*
19520513f984SMax Reitz          * Start a read operation that will yield, so it will not
19530513f984SMax Reitz          * complete before the node is drained.
19540513f984SMax Reitz          */
19550513f984SMax Reitz         parent_s->yield_before_read = true;
19560513f984SMax Reitz         io_co = qemu_coroutine_create(test_replace_child_mid_drain_read_co,
19570513f984SMax Reitz                                       parent_blk);
19580513f984SMax Reitz         qemu_coroutine_enter(io_co);
19590513f984SMax Reitz     }
19600513f984SMax Reitz 
19610513f984SMax Reitz     /* If we have started a read operation, it should have yielded */
19620513f984SMax Reitz     g_assert(!parent_s->has_read);
19630513f984SMax Reitz 
19640513f984SMax Reitz     /* Reset drained status so we can see what bdrv_replace_node() does */
19650513f984SMax Reitz     parent_s->was_drained = false;
19660513f984SMax Reitz     parent_s->was_undrained = false;
19670513f984SMax Reitz 
19680513f984SMax Reitz     g_assert(parent_bs->quiesce_counter == old_drain_count);
19690513f984SMax Reitz     bdrv_replace_node(old_child_bs, new_child_bs, &error_abort);
19700513f984SMax Reitz     g_assert(parent_bs->quiesce_counter == new_drain_count);
19710513f984SMax Reitz 
19720513f984SMax Reitz     if (!old_drain_count && !new_drain_count) {
19730513f984SMax Reitz         /*
19740513f984SMax Reitz          * From undrained to undrained drains and undrains the parent,
19750513f984SMax Reitz          * because bdrv_replace_node() contains a drained section for
19760513f984SMax Reitz          * @old_child_bs.
19770513f984SMax Reitz          */
19780513f984SMax Reitz         g_assert(parent_s->was_drained && parent_s->was_undrained);
19790513f984SMax Reitz     } else if (!old_drain_count && new_drain_count) {
19800513f984SMax Reitz         /*
19810513f984SMax Reitz          * From undrained to drained should drain the parent and keep
19820513f984SMax Reitz          * it that way.
19830513f984SMax Reitz          */
19840513f984SMax Reitz         g_assert(parent_s->was_drained && !parent_s->was_undrained);
19850513f984SMax Reitz     } else if (old_drain_count && !new_drain_count) {
19860513f984SMax Reitz         /*
19870513f984SMax Reitz          * From drained to undrained should undrain the parent and
19880513f984SMax Reitz          * keep it that way.
19890513f984SMax Reitz          */
19900513f984SMax Reitz         g_assert(!parent_s->was_drained && parent_s->was_undrained);
19910513f984SMax Reitz     } else /* if (old_drain_count && new_drain_count) */ {
19920513f984SMax Reitz         /*
19930513f984SMax Reitz          * From drained to drained must not undrain the parent at any
19940513f984SMax Reitz          * point
19950513f984SMax Reitz          */
19960513f984SMax Reitz         g_assert(!parent_s->was_drained && !parent_s->was_undrained);
19970513f984SMax Reitz     }
19980513f984SMax Reitz 
19990513f984SMax Reitz     if (!old_drain_count || !new_drain_count) {
20000513f984SMax Reitz         /*
20010513f984SMax Reitz          * If !old_drain_count, we have started a read request before
20020513f984SMax Reitz          * bdrv_replace_node().  If !new_drain_count, the parent must
20030513f984SMax Reitz          * have been undrained at some point, and
20040513f984SMax Reitz          * bdrv_replace_test_co_drain_end() starts a read request
20050513f984SMax Reitz          * then.
20060513f984SMax Reitz          */
20070513f984SMax Reitz         g_assert(parent_s->has_read);
20080513f984SMax Reitz     } else {
20090513f984SMax Reitz         /*
20100513f984SMax Reitz          * If the parent was never undrained, there is no way to start
20110513f984SMax Reitz          * a read request.
20120513f984SMax Reitz          */
20130513f984SMax Reitz         g_assert(!parent_s->has_read);
20140513f984SMax Reitz     }
20150513f984SMax Reitz 
20160513f984SMax Reitz     /* A drained child must have not received any request */
20170513f984SMax Reitz     g_assert(!(old_drain_count && old_child_s->has_read));
20180513f984SMax Reitz     g_assert(!(new_drain_count && new_child_s->has_read));
20190513f984SMax Reitz 
20200513f984SMax Reitz     for (i = 0; i < new_drain_count; i++) {
20210513f984SMax Reitz         bdrv_drained_end(new_child_bs);
20220513f984SMax Reitz     }
20230513f984SMax Reitz     for (i = 0; i < old_drain_count; i++) {
20240513f984SMax Reitz         bdrv_drained_end(old_child_bs);
20250513f984SMax Reitz     }
20260513f984SMax Reitz 
20270513f984SMax Reitz     /*
20280513f984SMax Reitz      * By now, bdrv_replace_test_co_drain_end() must have been called
20290513f984SMax Reitz      * at some point while the new child was attached to the parent.
20300513f984SMax Reitz      */
20310513f984SMax Reitz     g_assert(parent_s->has_read);
20320513f984SMax Reitz     g_assert(new_child_s->has_read);
20330513f984SMax Reitz 
20340513f984SMax Reitz     blk_unref(parent_blk);
20350513f984SMax Reitz     bdrv_unref(parent_bs);
20360513f984SMax Reitz     bdrv_unref(old_child_bs);
20370513f984SMax Reitz     bdrv_unref(new_child_bs);
20380513f984SMax Reitz }
20390513f984SMax Reitz 
/*
 * Run do_test_replace_child_mid_drain() for every combination of
 * old/new drain count in {0, 1}, old count varying slowest.
 */
static void test_replace_child_mid_drain(void)
{
    int combo;

    /* Bit 1 selects the old child's drain count, bit 0 the new child's */
    for (combo = 0; combo < 4; combo++) {
        do_test_replace_child_mid_drain(combo >> 1, combo & 1);
    }
}
20500513f984SMax Reitz 
2051881cfd17SKevin Wolf int main(int argc, char **argv)
2052881cfd17SKevin Wolf {
2053bb675689SKevin Wolf     int ret;
2054bb675689SKevin Wolf 
2055881cfd17SKevin Wolf     bdrv_init();
2056881cfd17SKevin Wolf     qemu_init_main_loop(&error_abort);
2057881cfd17SKevin Wolf 
2058881cfd17SKevin Wolf     g_test_init(&argc, &argv, NULL);
2059bb675689SKevin Wolf     qemu_event_init(&done_event, false);
2060881cfd17SKevin Wolf 
2061881cfd17SKevin Wolf     g_test_add_func("/bdrv-drain/driver-cb/drain_all", test_drv_cb_drain_all);
206286e1c840SKevin Wolf     g_test_add_func("/bdrv-drain/driver-cb/drain", test_drv_cb_drain);
2063881cfd17SKevin Wolf 
20646d0252f2SKevin Wolf     g_test_add_func("/bdrv-drain/driver-cb/co/drain_all",
20656d0252f2SKevin Wolf                     test_drv_cb_co_drain_all);
20660582eb10SKevin Wolf     g_test_add_func("/bdrv-drain/driver-cb/co/drain", test_drv_cb_co_drain);
20670582eb10SKevin Wolf 
206889a6ceabSKevin Wolf     g_test_add_func("/bdrv-drain/quiesce/drain_all", test_quiesce_drain_all);
206989a6ceabSKevin Wolf     g_test_add_func("/bdrv-drain/quiesce/drain", test_quiesce_drain);
207089a6ceabSKevin Wolf 
20716d0252f2SKevin Wolf     g_test_add_func("/bdrv-drain/quiesce/co/drain_all",
20726d0252f2SKevin Wolf                     test_quiesce_co_drain_all);
20730582eb10SKevin Wolf     g_test_add_func("/bdrv-drain/quiesce/co/drain", test_quiesce_co_drain);
20740582eb10SKevin Wolf 
20756c429a6aSKevin Wolf     g_test_add_func("/bdrv-drain/nested", test_nested);
207619f7a7e5SKevin Wolf 
207719f7a7e5SKevin Wolf     g_test_add_func("/bdrv-drain/graph-change/drain_all",
207819f7a7e5SKevin Wolf                     test_graph_change_drain_all);
20796c429a6aSKevin Wolf 
2080bb675689SKevin Wolf     g_test_add_func("/bdrv-drain/iothread/drain_all", test_iothread_drain_all);
2081bb675689SKevin Wolf     g_test_add_func("/bdrv-drain/iothread/drain", test_iothread_drain);
2082bb675689SKevin Wolf 
20837253220dSKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/drain_all", test_blockjob_drain_all);
20847253220dSKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/drain", test_blockjob_drain);
20857253220dSKevin Wolf 
2086d49725afSKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/error/drain_all",
2087d49725afSKevin Wolf                     test_blockjob_error_drain_all);
2088d49725afSKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/error/drain",
2089d49725afSKevin Wolf                     test_blockjob_error_drain);
2090d49725afSKevin Wolf 
2091f62c1729SKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/iothread/drain_all",
2092f62c1729SKevin Wolf                     test_blockjob_iothread_drain_all);
2093f62c1729SKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/iothread/drain",
2094f62c1729SKevin Wolf                     test_blockjob_iothread_drain);
2095f62c1729SKevin Wolf 
2096d49725afSKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/iothread/error/drain_all",
2097d49725afSKevin Wolf                     test_blockjob_iothread_error_drain_all);
2098d49725afSKevin Wolf     g_test_add_func("/bdrv-drain/blockjob/iothread/error/drain",
2099d49725afSKevin Wolf                     test_blockjob_iothread_error_drain);
2100d49725afSKevin Wolf 
2101ebd31837SKevin Wolf     g_test_add_func("/bdrv-drain/deletion/drain", test_delete_by_drain);
210219f7a7e5SKevin Wolf     g_test_add_func("/bdrv-drain/detach/drain_all", test_detach_by_drain_all);
2103ebd31837SKevin Wolf     g_test_add_func("/bdrv-drain/detach/drain", test_detach_by_drain);
2104231281abSKevin Wolf     g_test_add_func("/bdrv-drain/detach/parent_cb", test_detach_by_parent_cb);
210557320ca9SKevin Wolf     g_test_add_func("/bdrv-drain/detach/driver_cb", test_detach_by_driver_cb);
21064c8158e3SMax Reitz 
2107b994c5bcSKevin Wolf     g_test_add_func("/bdrv-drain/attach/drain", test_append_to_drained);
2108b994c5bcSKevin Wolf 
2109247d2737SKevin Wolf     g_test_add_func("/bdrv-drain/set_aio_context", test_set_aio_context);
2110247d2737SKevin Wolf 
21118e442810SMax Reitz     g_test_add_func("/bdrv-drain/blockjob/commit_by_drained_end",
21128e442810SMax Reitz                     test_blockjob_commit_by_drained_end);
21138e442810SMax Reitz 
21149746b35cSMax Reitz     g_test_add_func("/bdrv-drain/bdrv_drop_intermediate/poll",
21159746b35cSMax Reitz                     test_drop_intermediate_poll);
21169746b35cSMax Reitz 
21170513f984SMax Reitz     g_test_add_func("/bdrv-drain/replace_child/mid-drain",
21180513f984SMax Reitz                     test_replace_child_mid_drain);
21190513f984SMax Reitz 
2120bb675689SKevin Wolf     ret = g_test_run();
2121bb675689SKevin Wolf     qemu_event_destroy(&done_event);
2122bb675689SKevin Wolf     return ret;
2123881cfd17SKevin Wolf }
2124