14f999d05SKevin Wolf /* 2c2b38b27SPaolo Bonzini * Data plane event loop 34f999d05SKevin Wolf * 44f999d05SKevin Wolf * Copyright (c) 2003-2008 Fabrice Bellard 5c2b38b27SPaolo Bonzini * Copyright (c) 2009-2017 QEMU contributors 64f999d05SKevin Wolf * 74f999d05SKevin Wolf * Permission is hereby granted, free of charge, to any person obtaining a copy 84f999d05SKevin Wolf * of this software and associated documentation files (the "Software"), to deal 94f999d05SKevin Wolf * in the Software without restriction, including without limitation the rights 104f999d05SKevin Wolf * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 114f999d05SKevin Wolf * copies of the Software, and to permit persons to whom the Software is 124f999d05SKevin Wolf * furnished to do so, subject to the following conditions: 134f999d05SKevin Wolf * 144f999d05SKevin Wolf * The above copyright notice and this permission notice shall be included in 154f999d05SKevin Wolf * all copies or substantial portions of the Software. 164f999d05SKevin Wolf * 174f999d05SKevin Wolf * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 184f999d05SKevin Wolf * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 194f999d05SKevin Wolf * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 204f999d05SKevin Wolf * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 214f999d05SKevin Wolf * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 224f999d05SKevin Wolf * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 234f999d05SKevin Wolf * THE SOFTWARE. 
244f999d05SKevin Wolf */ 254f999d05SKevin Wolf 26d38ea87aSPeter Maydell #include "qemu/osdep.h" 27da34e65cSMarkus Armbruster #include "qapi/error.h" 28737e150eSPaolo Bonzini #include "block/aio.h" 299b34277dSStefan Hajnoczi #include "block/thread-pool.h" 30587d82faSEmanuele Giuseppe Esposito #include "block/graph-lock.h" 311de7afc9SPaolo Bonzini #include "qemu/main-loop.h" 320ceb849bSPaolo Bonzini #include "qemu/atomic.h" 338c6b0356SStefan Hajnoczi #include "qemu/rcu_queue.h" 340187f5c9SPaolo Bonzini #include "block/raw-aio.h" 350c330a73SPaolo Bonzini #include "qemu/coroutine_int.h" 3647b74464SStefan Hajnoczi #include "qemu/coroutine-tls.h" 3775bbe5e5SPavel Dovgalyuk #include "sysemu/cpu-timers.h" 380c330a73SPaolo Bonzini #include "trace.h" 399a1e9481SKevin Wolf 404f999d05SKevin Wolf /***********************************************************/ 414f999d05SKevin Wolf /* bottom halves (can be seen as timers which expire ASAP) */ 424f999d05SKevin Wolf 438c6b0356SStefan Hajnoczi /* QEMUBH::flags values */ 448c6b0356SStefan Hajnoczi enum { 458c6b0356SStefan Hajnoczi /* Already enqueued and waiting for aio_bh_poll() */ 468c6b0356SStefan Hajnoczi BH_PENDING = (1 << 0), 478c6b0356SStefan Hajnoczi 488c6b0356SStefan Hajnoczi /* Invoke the callback */ 498c6b0356SStefan Hajnoczi BH_SCHEDULED = (1 << 1), 508c6b0356SStefan Hajnoczi 518c6b0356SStefan Hajnoczi /* Delete without invoking callback */ 528c6b0356SStefan Hajnoczi BH_DELETED = (1 << 2), 538c6b0356SStefan Hajnoczi 548c6b0356SStefan Hajnoczi /* Delete after invoking callback */ 558c6b0356SStefan Hajnoczi BH_ONESHOT = (1 << 3), 568c6b0356SStefan Hajnoczi 578c6b0356SStefan Hajnoczi /* Schedule periodically when the event loop is idle */ 588c6b0356SStefan Hajnoczi BH_IDLE = (1 << 4), 598c6b0356SStefan Hajnoczi }; 608c6b0356SStefan Hajnoczi 614f999d05SKevin Wolf struct QEMUBH { 622f4dc3c1SPaolo Bonzini AioContext *ctx; 630f08586cSStefan Hajnoczi const char *name; 644f999d05SKevin Wolf QEMUBHFunc *cb; 654f999d05SKevin Wolf 
void *opaque; 668c6b0356SStefan Hajnoczi QSLIST_ENTRY(QEMUBH) next; 678c6b0356SStefan Hajnoczi unsigned flags; 689c86c97fSAlexander Bulekov MemReentrancyGuard *reentrancy_guard; 694f999d05SKevin Wolf }; 704f999d05SKevin Wolf 718c6b0356SStefan Hajnoczi /* Called concurrently from any thread */ 728c6b0356SStefan Hajnoczi static void aio_bh_enqueue(QEMUBH *bh, unsigned new_flags) 738c6b0356SStefan Hajnoczi { 748c6b0356SStefan Hajnoczi AioContext *ctx = bh->ctx; 758c6b0356SStefan Hajnoczi unsigned old_flags; 768c6b0356SStefan Hajnoczi 778c6b0356SStefan Hajnoczi /* 788dd48650SPaolo Bonzini * Synchronizes with qatomic_fetch_and() in aio_bh_dequeue(), ensuring that 798dd48650SPaolo Bonzini * insertion starts after BH_PENDING is set. 808dd48650SPaolo Bonzini */ 818dd48650SPaolo Bonzini old_flags = qatomic_fetch_or(&bh->flags, BH_PENDING | new_flags); 828dd48650SPaolo Bonzini 838dd48650SPaolo Bonzini if (!(old_flags & BH_PENDING)) { 848dd48650SPaolo Bonzini /* 858dd48650SPaolo Bonzini * At this point the bottom half becomes visible to aio_bh_poll(). 868dd48650SPaolo Bonzini * This insertion thus synchronizes with QSLIST_MOVE_ATOMIC in 878dd48650SPaolo Bonzini * aio_bh_poll(), ensuring that: 888dd48650SPaolo Bonzini * 1. any writes needed by the callback are visible from the callback 898dd48650SPaolo Bonzini * after aio_bh_dequeue() returns bh. 908c6b0356SStefan Hajnoczi * 2. ctx is loaded before the callback has a chance to execute and bh 918c6b0356SStefan Hajnoczi * could be freed. 928c6b0356SStefan Hajnoczi */ 938c6b0356SStefan Hajnoczi QSLIST_INSERT_HEAD_ATOMIC(&ctx->bh_list, bh, next); 948c6b0356SStefan Hajnoczi } 958c6b0356SStefan Hajnoczi 968c6b0356SStefan Hajnoczi aio_notify(ctx); 97*72c603f8SPhilippe Mathieu-Daudé if (unlikely(icount_enabled())) { 9875bbe5e5SPavel Dovgalyuk /* 9975bbe5e5SPavel Dovgalyuk * Workaround for record/replay. 10075bbe5e5SPavel Dovgalyuk * vCPU execution should be suspended when new BH is set. 
10175bbe5e5SPavel Dovgalyuk * This is needed to avoid guest timeouts caused 10275bbe5e5SPavel Dovgalyuk * by the long cycles of the execution. 10375bbe5e5SPavel Dovgalyuk */ 10475bbe5e5SPavel Dovgalyuk icount_notify_exit(); 1058c6b0356SStefan Hajnoczi } 106*72c603f8SPhilippe Mathieu-Daudé } 1078c6b0356SStefan Hajnoczi 1088c6b0356SStefan Hajnoczi /* Only called from aio_bh_poll() and aio_ctx_finalize() */ 1098c6b0356SStefan Hajnoczi static QEMUBH *aio_bh_dequeue(BHList *head, unsigned *flags) 1108c6b0356SStefan Hajnoczi { 1118c6b0356SStefan Hajnoczi QEMUBH *bh = QSLIST_FIRST_RCU(head); 1128c6b0356SStefan Hajnoczi 1138c6b0356SStefan Hajnoczi if (!bh) { 1148c6b0356SStefan Hajnoczi return NULL; 1158c6b0356SStefan Hajnoczi } 1168c6b0356SStefan Hajnoczi 1178c6b0356SStefan Hajnoczi QSLIST_REMOVE_HEAD(head, next); 1188c6b0356SStefan Hajnoczi 1198c6b0356SStefan Hajnoczi /* 1208dd48650SPaolo Bonzini * Synchronizes with qatomic_fetch_or() in aio_bh_enqueue(), ensuring that 1218dd48650SPaolo Bonzini * the removal finishes before BH_PENDING is reset. 
1228c6b0356SStefan Hajnoczi */ 123d73415a3SStefan Hajnoczi *flags = qatomic_fetch_and(&bh->flags, 1248c6b0356SStefan Hajnoczi ~(BH_PENDING | BH_SCHEDULED | BH_IDLE)); 1258c6b0356SStefan Hajnoczi return bh; 1268c6b0356SStefan Hajnoczi } 1278c6b0356SStefan Hajnoczi 1280f08586cSStefan Hajnoczi void aio_bh_schedule_oneshot_full(AioContext *ctx, QEMUBHFunc *cb, 1290f08586cSStefan Hajnoczi void *opaque, const char *name) 1305b8bb359SPaolo Bonzini { 1315b8bb359SPaolo Bonzini QEMUBH *bh; 1325b8bb359SPaolo Bonzini bh = g_new(QEMUBH, 1); 1335b8bb359SPaolo Bonzini *bh = (QEMUBH){ 1345b8bb359SPaolo Bonzini .ctx = ctx, 1355b8bb359SPaolo Bonzini .cb = cb, 1365b8bb359SPaolo Bonzini .opaque = opaque, 1370f08586cSStefan Hajnoczi .name = name, 1385b8bb359SPaolo Bonzini }; 1398c6b0356SStefan Hajnoczi aio_bh_enqueue(bh, BH_SCHEDULED | BH_ONESHOT); 1405b8bb359SPaolo Bonzini } 1415b8bb359SPaolo Bonzini 1420f08586cSStefan Hajnoczi QEMUBH *aio_bh_new_full(AioContext *ctx, QEMUBHFunc *cb, void *opaque, 1439c86c97fSAlexander Bulekov const char *name, MemReentrancyGuard *reentrancy_guard) 1444f999d05SKevin Wolf { 1454f999d05SKevin Wolf QEMUBH *bh; 146ee82310fSPaolo Bonzini bh = g_new(QEMUBH, 1); 147ee82310fSPaolo Bonzini *bh = (QEMUBH){ 148ee82310fSPaolo Bonzini .ctx = ctx, 149ee82310fSPaolo Bonzini .cb = cb, 150ee82310fSPaolo Bonzini .opaque = opaque, 1510f08586cSStefan Hajnoczi .name = name, 1529c86c97fSAlexander Bulekov .reentrancy_guard = reentrancy_guard, 153ee82310fSPaolo Bonzini }; 1544f999d05SKevin Wolf return bh; 1554f999d05SKevin Wolf } 1564f999d05SKevin Wolf 157df281b80SPavel Dovgalyuk void aio_bh_call(QEMUBH *bh) 158df281b80SPavel Dovgalyuk { 1599c86c97fSAlexander Bulekov bool last_engaged_in_io = false; 1609c86c97fSAlexander Bulekov 1617915bd06SAlexander Bulekov /* Make a copy of the guard-pointer as cb may free the bh */ 1627915bd06SAlexander Bulekov MemReentrancyGuard *reentrancy_guard = bh->reentrancy_guard; 1637915bd06SAlexander Bulekov if (reentrancy_guard) { 
1647915bd06SAlexander Bulekov last_engaged_in_io = reentrancy_guard->engaged_in_io; 1657915bd06SAlexander Bulekov if (reentrancy_guard->engaged_in_io) { 1669c86c97fSAlexander Bulekov trace_reentrant_aio(bh->ctx, bh->name); 1679c86c97fSAlexander Bulekov } 1687915bd06SAlexander Bulekov reentrancy_guard->engaged_in_io = true; 1699c86c97fSAlexander Bulekov } 1709c86c97fSAlexander Bulekov 171df281b80SPavel Dovgalyuk bh->cb(bh->opaque); 1729c86c97fSAlexander Bulekov 1737915bd06SAlexander Bulekov if (reentrancy_guard) { 1747915bd06SAlexander Bulekov reentrancy_guard->engaged_in_io = last_engaged_in_io; 1759c86c97fSAlexander Bulekov } 176df281b80SPavel Dovgalyuk } 177df281b80SPavel Dovgalyuk 1788c6b0356SStefan Hajnoczi /* Multiple occurrences of aio_bh_poll cannot be called concurrently. */ 179f627aab1SPaolo Bonzini int aio_bh_poll(AioContext *ctx) 1804f999d05SKevin Wolf { 1818c6b0356SStefan Hajnoczi BHListSlice slice; 1828c6b0356SStefan Hajnoczi BHListSlice *s; 1838c6b0356SStefan Hajnoczi int ret = 0; 184648fb0eaSKevin Wolf 1858dd48650SPaolo Bonzini /* Synchronizes with QSLIST_INSERT_HEAD_ATOMIC in aio_bh_enqueue(). */ 1868c6b0356SStefan Hajnoczi QSLIST_MOVE_ATOMIC(&slice.bh_list, &ctx->bh_list); 187d66ba6dcSCédric Le Goater 188d66ba6dcSCédric Le Goater /* 189d66ba6dcSCédric Le Goater * GCC13 [-Werror=dangling-pointer=] complains that the local variable 190d66ba6dcSCédric Le Goater * 'slice' is being stored in the global 'ctx->bh_slice_list' but the 191d66ba6dcSCédric Le Goater * list is emptied before this function returns. 
192d66ba6dcSCédric Le Goater */ 193d66ba6dcSCédric Le Goater #if !defined(__clang__) 194d66ba6dcSCédric Le Goater #pragma GCC diagnostic push 195d66ba6dcSCédric Le Goater #pragma GCC diagnostic ignored "-Wpragmas" 196d66ba6dcSCédric Le Goater #pragma GCC diagnostic ignored "-Wdangling-pointer=" 197d66ba6dcSCédric Le Goater #endif 1988c6b0356SStefan Hajnoczi QSIMPLEQ_INSERT_TAIL(&ctx->bh_slice_list, &slice, next); 199d66ba6dcSCédric Le Goater #if !defined(__clang__) 200d66ba6dcSCédric Le Goater #pragma GCC diagnostic pop 201d66ba6dcSCédric Le Goater #endif 2028c6b0356SStefan Hajnoczi 2038c6b0356SStefan Hajnoczi while ((s = QSIMPLEQ_FIRST(&ctx->bh_slice_list))) { 2048c6b0356SStefan Hajnoczi QEMUBH *bh; 2058c6b0356SStefan Hajnoczi unsigned flags; 2068c6b0356SStefan Hajnoczi 2078c6b0356SStefan Hajnoczi bh = aio_bh_dequeue(&s->bh_list, &flags); 2088c6b0356SStefan Hajnoczi if (!bh) { 2098c6b0356SStefan Hajnoczi QSIMPLEQ_REMOVE_HEAD(&ctx->bh_slice_list, next); 2108c6b0356SStefan Hajnoczi continue; 2118c6b0356SStefan Hajnoczi } 2128c6b0356SStefan Hajnoczi 2138c6b0356SStefan Hajnoczi if ((flags & (BH_SCHEDULED | BH_DELETED)) == BH_SCHEDULED) { 21465c1b5b6SPaolo Bonzini /* Idle BHs don't count as progress */ 2158c6b0356SStefan Hajnoczi if (!(flags & BH_IDLE)) { 2164f999d05SKevin Wolf ret = 1; 217ca96ac44SStefan Hajnoczi } 218df281b80SPavel Dovgalyuk aio_bh_call(bh); 2194f999d05SKevin Wolf } 2208c6b0356SStefan Hajnoczi if (flags & (BH_DELETED | BH_ONESHOT)) { 2217267c094SAnthony Liguori g_free(bh); 2224f999d05SKevin Wolf } 223648fb0eaSKevin Wolf } 2248c6b0356SStefan Hajnoczi 2254f999d05SKevin Wolf return ret; 2264f999d05SKevin Wolf } 2274f999d05SKevin Wolf 2284f999d05SKevin Wolf void qemu_bh_schedule_idle(QEMUBH *bh) 2294f999d05SKevin Wolf { 2308c6b0356SStefan Hajnoczi aio_bh_enqueue(bh, BH_SCHEDULED | BH_IDLE); 2314f999d05SKevin Wolf } 2324f999d05SKevin Wolf 2334f999d05SKevin Wolf void qemu_bh_schedule(QEMUBH *bh) 2344f999d05SKevin Wolf { 2358c6b0356SStefan Hajnoczi 
aio_bh_enqueue(bh, BH_SCHEDULED); 2364f999d05SKevin Wolf } 237dcc772e2SLiu Ping Fan 238dcc772e2SLiu Ping Fan /* This func is async. 239dcc772e2SLiu Ping Fan */ 2404f999d05SKevin Wolf void qemu_bh_cancel(QEMUBH *bh) 2414f999d05SKevin Wolf { 242d73415a3SStefan Hajnoczi qatomic_and(&bh->flags, ~BH_SCHEDULED); 2434f999d05SKevin Wolf } 2444f999d05SKevin Wolf 245dcc772e2SLiu Ping Fan /* This func is async. The bottom half will do the delete action at the final 246dcc772e2SLiu Ping Fan * end. 247dcc772e2SLiu Ping Fan */ 2484f999d05SKevin Wolf void qemu_bh_delete(QEMUBH *bh) 2494f999d05SKevin Wolf { 2508c6b0356SStefan Hajnoczi aio_bh_enqueue(bh, BH_DELETED); 2514f999d05SKevin Wolf } 2524f999d05SKevin Wolf 2538c6b0356SStefan Hajnoczi static int64_t aio_compute_bh_timeout(BHList *head, int timeout) 2544f999d05SKevin Wolf { 2554f999d05SKevin Wolf QEMUBH *bh; 2564f999d05SKevin Wolf 2578c6b0356SStefan Hajnoczi QSLIST_FOREACH_RCU(bh, head, next) { 2588c6b0356SStefan Hajnoczi if ((bh->flags & (BH_SCHEDULED | BH_DELETED)) == BH_SCHEDULED) { 2598c6b0356SStefan Hajnoczi if (bh->flags & BH_IDLE) { 2604f999d05SKevin Wolf /* idle bottom halves will be polled at least 2614f999d05SKevin Wolf * every 10ms */ 262845ca10dSPaolo Bonzini timeout = 10000000; 2634f999d05SKevin Wolf } else { 2644f999d05SKevin Wolf /* non-idle bottom halves will be executed 2654f999d05SKevin Wolf * immediately */ 266845ca10dSPaolo Bonzini return 0; 2674f999d05SKevin Wolf } 2684f999d05SKevin Wolf } 2694f999d05SKevin Wolf } 2704f999d05SKevin Wolf 2718c6b0356SStefan Hajnoczi return timeout; 2728c6b0356SStefan Hajnoczi } 2738c6b0356SStefan Hajnoczi 2748c6b0356SStefan Hajnoczi int64_t 2758c6b0356SStefan Hajnoczi aio_compute_timeout(AioContext *ctx) 2768c6b0356SStefan Hajnoczi { 2778c6b0356SStefan Hajnoczi BHListSlice *s; 2788c6b0356SStefan Hajnoczi int64_t deadline; 2798c6b0356SStefan Hajnoczi int timeout = -1; 2808c6b0356SStefan Hajnoczi 2818c6b0356SStefan Hajnoczi timeout = aio_compute_bh_timeout(&ctx->bh_list, 
timeout); 2828c6b0356SStefan Hajnoczi if (timeout == 0) { 2838c6b0356SStefan Hajnoczi return 0; 2848c6b0356SStefan Hajnoczi } 2858c6b0356SStefan Hajnoczi 2868c6b0356SStefan Hajnoczi QSIMPLEQ_FOREACH(s, &ctx->bh_slice_list, next) { 2878c6b0356SStefan Hajnoczi timeout = aio_compute_bh_timeout(&s->bh_list, timeout); 2888c6b0356SStefan Hajnoczi if (timeout == 0) { 2898c6b0356SStefan Hajnoczi return 0; 2908c6b0356SStefan Hajnoczi } 2918c6b0356SStefan Hajnoczi } 2928c6b0356SStefan Hajnoczi 293845ca10dSPaolo Bonzini deadline = timerlistgroup_deadline_ns(&ctx->tlg); 294533a8cf3SAlex Bligh if (deadline == 0) { 295845ca10dSPaolo Bonzini return 0; 296533a8cf3SAlex Bligh } else { 297845ca10dSPaolo Bonzini return qemu_soonest_timeout(timeout, deadline); 298845ca10dSPaolo Bonzini } 299533a8cf3SAlex Bligh } 300533a8cf3SAlex Bligh 301845ca10dSPaolo Bonzini static gboolean 302845ca10dSPaolo Bonzini aio_ctx_prepare(GSource *source, gint *timeout) 303845ca10dSPaolo Bonzini { 304845ca10dSPaolo Bonzini AioContext *ctx = (AioContext *) source; 305845ca10dSPaolo Bonzini 306d73415a3SStefan Hajnoczi qatomic_set(&ctx->notify_me, qatomic_read(&ctx->notify_me) | 1); 3075710a3e0SPaolo Bonzini 3085710a3e0SPaolo Bonzini /* 3095710a3e0SPaolo Bonzini * Write ctx->notify_me before computing the timeout 3105710a3e0SPaolo Bonzini * (reading bottom half flags, etc.). Pairs with 3115710a3e0SPaolo Bonzini * smp_mb in aio_notify(). 
3125710a3e0SPaolo Bonzini */ 3135710a3e0SPaolo Bonzini smp_mb(); 314eabc9779SPaolo Bonzini 315845ca10dSPaolo Bonzini /* We assume there is no timeout already supplied */ 316845ca10dSPaolo Bonzini *timeout = qemu_timeout_ns_to_ms(aio_compute_timeout(ctx)); 317a3462c65SPaolo Bonzini 318a3462c65SPaolo Bonzini if (aio_prepare(ctx)) { 319a3462c65SPaolo Bonzini *timeout = 0; 320a3462c65SPaolo Bonzini } 321a3462c65SPaolo Bonzini 322845ca10dSPaolo Bonzini return *timeout == 0; 323e3713e00SPaolo Bonzini } 324e3713e00SPaolo Bonzini 325e3713e00SPaolo Bonzini static gboolean 326e3713e00SPaolo Bonzini aio_ctx_check(GSource *source) 327e3713e00SPaolo Bonzini { 328e3713e00SPaolo Bonzini AioContext *ctx = (AioContext *) source; 329e3713e00SPaolo Bonzini QEMUBH *bh; 3308c6b0356SStefan Hajnoczi BHListSlice *s; 331e3713e00SPaolo Bonzini 3325710a3e0SPaolo Bonzini /* Finish computing the timeout before clearing the flag. */ 333d73415a3SStefan Hajnoczi qatomic_store_release(&ctx->notify_me, qatomic_read(&ctx->notify_me) & ~1); 33405e514b1SPaolo Bonzini aio_notify_accept(ctx); 33521a03d17SPaolo Bonzini 3368c6b0356SStefan Hajnoczi QSLIST_FOREACH_RCU(bh, &ctx->bh_list, next) { 3378c6b0356SStefan Hajnoczi if ((bh->flags & (BH_SCHEDULED | BH_DELETED)) == BH_SCHEDULED) { 338e3713e00SPaolo Bonzini return true; 339e3713e00SPaolo Bonzini } 340e3713e00SPaolo Bonzini } 3418c6b0356SStefan Hajnoczi 3428c6b0356SStefan Hajnoczi QSIMPLEQ_FOREACH(s, &ctx->bh_slice_list, next) { 3438c6b0356SStefan Hajnoczi QSLIST_FOREACH_RCU(bh, &s->bh_list, next) { 3448c6b0356SStefan Hajnoczi if ((bh->flags & (BH_SCHEDULED | BH_DELETED)) == BH_SCHEDULED) { 3458c6b0356SStefan Hajnoczi return true; 3468c6b0356SStefan Hajnoczi } 3478c6b0356SStefan Hajnoczi } 3488c6b0356SStefan Hajnoczi } 349533a8cf3SAlex Bligh return aio_pending(ctx) || (timerlistgroup_deadline_ns(&ctx->tlg) == 0); 350e3713e00SPaolo Bonzini } 351e3713e00SPaolo Bonzini 352e3713e00SPaolo Bonzini static gboolean 353e3713e00SPaolo Bonzini 
aio_ctx_dispatch(GSource *source, 354e3713e00SPaolo Bonzini GSourceFunc callback, 355e3713e00SPaolo Bonzini gpointer user_data) 356e3713e00SPaolo Bonzini { 357e3713e00SPaolo Bonzini AioContext *ctx = (AioContext *) source; 358e3713e00SPaolo Bonzini 359e3713e00SPaolo Bonzini assert(callback == NULL); 360a153bf52SPaolo Bonzini aio_dispatch(ctx); 361e3713e00SPaolo Bonzini return true; 362e3713e00SPaolo Bonzini } 363e3713e00SPaolo Bonzini 3642f4dc3c1SPaolo Bonzini static void 3652f4dc3c1SPaolo Bonzini aio_ctx_finalize(GSource *source) 3662f4dc3c1SPaolo Bonzini { 3672f4dc3c1SPaolo Bonzini AioContext *ctx = (AioContext *) source; 3688c6b0356SStefan Hajnoczi QEMUBH *bh; 3698c6b0356SStefan Hajnoczi unsigned flags; 3702f4dc3c1SPaolo Bonzini 3719b34277dSStefan Hajnoczi thread_pool_free(ctx->thread_pool); 372a076972aSStefan Hajnoczi 3730187f5c9SPaolo Bonzini #ifdef CONFIG_LINUX_AIO 3740187f5c9SPaolo Bonzini if (ctx->linux_aio) { 3750187f5c9SPaolo Bonzini laio_detach_aio_context(ctx->linux_aio, ctx); 3760187f5c9SPaolo Bonzini laio_cleanup(ctx->linux_aio); 3770187f5c9SPaolo Bonzini ctx->linux_aio = NULL; 3780187f5c9SPaolo Bonzini } 3790187f5c9SPaolo Bonzini #endif 3800187f5c9SPaolo Bonzini 381fcb7a4a4SAarushi Mehta #ifdef CONFIG_LINUX_IO_URING 382fcb7a4a4SAarushi Mehta if (ctx->linux_io_uring) { 383fcb7a4a4SAarushi Mehta luring_detach_aio_context(ctx->linux_io_uring, ctx); 384fcb7a4a4SAarushi Mehta luring_cleanup(ctx->linux_io_uring); 385fcb7a4a4SAarushi Mehta ctx->linux_io_uring = NULL; 386fcb7a4a4SAarushi Mehta } 387fcb7a4a4SAarushi Mehta #endif 388fcb7a4a4SAarushi Mehta 3890c330a73SPaolo Bonzini assert(QSLIST_EMPTY(&ctx->scheduled_coroutines)); 3900c330a73SPaolo Bonzini qemu_bh_delete(ctx->co_schedule_bh); 3910c330a73SPaolo Bonzini 3928c6b0356SStefan Hajnoczi /* There must be no aio_bh_poll() calls going on */ 3938c6b0356SStefan Hajnoczi assert(QSIMPLEQ_EMPTY(&ctx->bh_slice_list)); 394a076972aSStefan Hajnoczi 3958c6b0356SStefan Hajnoczi while ((bh = 
aio_bh_dequeue(&ctx->bh_list, &flags))) { 396023ca420SStefan Hajnoczi /* 397023ca420SStefan Hajnoczi * qemu_bh_delete() must have been called on BHs in this AioContext. In 398023ca420SStefan Hajnoczi * many cases memory leaks, hangs, or inconsistent state occur when a 399023ca420SStefan Hajnoczi * BH is leaked because something still expects it to run. 400023ca420SStefan Hajnoczi * 401023ca420SStefan Hajnoczi * If you hit this, fix the lifecycle of the BH so that 402023ca420SStefan Hajnoczi * qemu_bh_delete() and any associated cleanup is called before the 403023ca420SStefan Hajnoczi * AioContext is finalized. 404023ca420SStefan Hajnoczi */ 405023ca420SStefan Hajnoczi if (unlikely(!(flags & BH_DELETED))) { 406023ca420SStefan Hajnoczi fprintf(stderr, "%s: BH '%s' leaked, aborting...\n", 407023ca420SStefan Hajnoczi __func__, bh->name); 408023ca420SStefan Hajnoczi abort(); 409023ca420SStefan Hajnoczi } 410a076972aSStefan Hajnoczi 4118c6b0356SStefan Hajnoczi g_free(bh); 412a076972aSStefan Hajnoczi } 413a076972aSStefan Hajnoczi 41460f782b6SStefan Hajnoczi aio_set_event_notifier(ctx, &ctx->notifier, NULL, NULL, NULL); 4152f4dc3c1SPaolo Bonzini event_notifier_cleanup(&ctx->notifier); 4163fe71223SPaolo Bonzini qemu_rec_mutex_destroy(&ctx->lock); 417d7c99a12SPaolo Bonzini qemu_lockcnt_destroy(&ctx->list_lock); 418dae21b98SAlex Bligh timerlistgroup_deinit(&ctx->tlg); 419587d82faSEmanuele Giuseppe Esposito unregister_aiocontext(ctx); 420cd0a6d2bSJie Wang aio_context_destroy(ctx); 4212f4dc3c1SPaolo Bonzini } 4222f4dc3c1SPaolo Bonzini 423e3713e00SPaolo Bonzini static GSourceFuncs aio_source_funcs = { 424e3713e00SPaolo Bonzini aio_ctx_prepare, 425e3713e00SPaolo Bonzini aio_ctx_check, 426e3713e00SPaolo Bonzini aio_ctx_dispatch, 4272f4dc3c1SPaolo Bonzini aio_ctx_finalize 428e3713e00SPaolo Bonzini }; 429e3713e00SPaolo Bonzini 430e3713e00SPaolo Bonzini GSource *aio_get_g_source(AioContext *ctx) 431e3713e00SPaolo Bonzini { 432ba607ca8SStefan Hajnoczi aio_context_use_g_source(ctx); 
433e3713e00SPaolo Bonzini g_source_ref(&ctx->source); 434e3713e00SPaolo Bonzini return &ctx->source; 435e3713e00SPaolo Bonzini } 436a915f4bcSPaolo Bonzini 4379b34277dSStefan Hajnoczi ThreadPool *aio_get_thread_pool(AioContext *ctx) 4389b34277dSStefan Hajnoczi { 4399b34277dSStefan Hajnoczi if (!ctx->thread_pool) { 4409b34277dSStefan Hajnoczi ctx->thread_pool = thread_pool_new(ctx); 4419b34277dSStefan Hajnoczi } 4429b34277dSStefan Hajnoczi return ctx->thread_pool; 4439b34277dSStefan Hajnoczi } 4449b34277dSStefan Hajnoczi 4450187f5c9SPaolo Bonzini #ifdef CONFIG_LINUX_AIO 446ed6e2161SNishanth Aravamudan LinuxAioState *aio_setup_linux_aio(AioContext *ctx, Error **errp) 4470187f5c9SPaolo Bonzini { 4480187f5c9SPaolo Bonzini if (!ctx->linux_aio) { 449ed6e2161SNishanth Aravamudan ctx->linux_aio = laio_init(errp); 450ed6e2161SNishanth Aravamudan if (ctx->linux_aio) { 4510187f5c9SPaolo Bonzini laio_attach_aio_context(ctx->linux_aio, ctx); 4520187f5c9SPaolo Bonzini } 453ed6e2161SNishanth Aravamudan } 454ed6e2161SNishanth Aravamudan return ctx->linux_aio; 455ed6e2161SNishanth Aravamudan } 456ed6e2161SNishanth Aravamudan 457ed6e2161SNishanth Aravamudan LinuxAioState *aio_get_linux_aio(AioContext *ctx) 458ed6e2161SNishanth Aravamudan { 459ed6e2161SNishanth Aravamudan assert(ctx->linux_aio); 4600187f5c9SPaolo Bonzini return ctx->linux_aio; 4610187f5c9SPaolo Bonzini } 4620187f5c9SPaolo Bonzini #endif 4630187f5c9SPaolo Bonzini 464fcb7a4a4SAarushi Mehta #ifdef CONFIG_LINUX_IO_URING 465fcb7a4a4SAarushi Mehta LuringState *aio_setup_linux_io_uring(AioContext *ctx, Error **errp) 466fcb7a4a4SAarushi Mehta { 467fcb7a4a4SAarushi Mehta if (ctx->linux_io_uring) { 468fcb7a4a4SAarushi Mehta return ctx->linux_io_uring; 469fcb7a4a4SAarushi Mehta } 470fcb7a4a4SAarushi Mehta 471fcb7a4a4SAarushi Mehta ctx->linux_io_uring = luring_init(errp); 472fcb7a4a4SAarushi Mehta if (!ctx->linux_io_uring) { 473fcb7a4a4SAarushi Mehta return NULL; 474fcb7a4a4SAarushi Mehta } 475fcb7a4a4SAarushi Mehta 
476fcb7a4a4SAarushi Mehta luring_attach_aio_context(ctx->linux_io_uring, ctx); 477fcb7a4a4SAarushi Mehta return ctx->linux_io_uring; 478fcb7a4a4SAarushi Mehta } 479fcb7a4a4SAarushi Mehta 480fcb7a4a4SAarushi Mehta LuringState *aio_get_linux_io_uring(AioContext *ctx) 481fcb7a4a4SAarushi Mehta { 482fcb7a4a4SAarushi Mehta assert(ctx->linux_io_uring); 483fcb7a4a4SAarushi Mehta return ctx->linux_io_uring; 484fcb7a4a4SAarushi Mehta } 485fcb7a4a4SAarushi Mehta #endif 486fcb7a4a4SAarushi Mehta 4872f4dc3c1SPaolo Bonzini void aio_notify(AioContext *ctx) 4882f4dc3c1SPaolo Bonzini { 489601829f8SStefan Hajnoczi /* 4908dd48650SPaolo Bonzini * Write e.g. ctx->bh_list before writing ctx->notified. Pairs with 4918dd48650SPaolo Bonzini * smp_mb() in aio_notify_accept(). 492601829f8SStefan Hajnoczi */ 493601829f8SStefan Hajnoczi smp_wmb(); 494d73415a3SStefan Hajnoczi qatomic_set(&ctx->notified, true); 495601829f8SStefan Hajnoczi 496601829f8SStefan Hajnoczi /* 4978dd48650SPaolo Bonzini * Write ctx->notified (and also ctx->bh_list) before reading ctx->notify_me. 4988dd48650SPaolo Bonzini * Pairs with smp_mb() in aio_ctx_prepare or aio_poll. 499eabc9779SPaolo Bonzini */ 5000ceb849bSPaolo Bonzini smp_mb(); 501d73415a3SStefan Hajnoczi if (qatomic_read(&ctx->notify_me)) { 5022f4dc3c1SPaolo Bonzini event_notifier_set(&ctx->notifier); 50305e514b1SPaolo Bonzini } 50405e514b1SPaolo Bonzini } 50505e514b1SPaolo Bonzini 50605e514b1SPaolo Bonzini void aio_notify_accept(AioContext *ctx) 50705e514b1SPaolo Bonzini { 508d73415a3SStefan Hajnoczi qatomic_set(&ctx->notified, false); 509601829f8SStefan Hajnoczi 510601829f8SStefan Hajnoczi /* 5116229438cSPaolo Bonzini * Order reads of ctx->notified (in aio_context_notifier_poll()) and the 5126229438cSPaolo Bonzini * above clearing of ctx->notified before reads of e.g. bh->flags. Pairs 5136229438cSPaolo Bonzini * with smp_wmb() in aio_notify. 
514601829f8SStefan Hajnoczi */ 515601829f8SStefan Hajnoczi smp_mb(); 5160ceb849bSPaolo Bonzini } 5172f4dc3c1SPaolo Bonzini 5183f53bc61SPaolo Bonzini static void aio_timerlist_notify(void *opaque, QEMUClockType type) 519d5541d86SAlex Bligh { 520d5541d86SAlex Bligh aio_notify(opaque); 521d5541d86SAlex Bligh } 522d5541d86SAlex Bligh 523601829f8SStefan Hajnoczi static void aio_context_notifier_cb(EventNotifier *e) 52421a03d17SPaolo Bonzini { 525601829f8SStefan Hajnoczi AioContext *ctx = container_of(e, AioContext, notifier); 526601829f8SStefan Hajnoczi 527601829f8SStefan Hajnoczi event_notifier_test_and_clear(&ctx->notifier); 52821a03d17SPaolo Bonzini } 52921a03d17SPaolo Bonzini 5304a1cba38SStefan Hajnoczi /* Returns true if aio_notify() was called (e.g. a BH was scheduled) */ 531c13be5a1SStefan Hajnoczi static bool aio_context_notifier_poll(void *opaque) 5324a1cba38SStefan Hajnoczi { 5334a1cba38SStefan Hajnoczi EventNotifier *e = opaque; 5344a1cba38SStefan Hajnoczi AioContext *ctx = container_of(e, AioContext, notifier); 5354a1cba38SStefan Hajnoczi 5366229438cSPaolo Bonzini /* 5376229438cSPaolo Bonzini * No need for load-acquire because we just want to kick the 5386229438cSPaolo Bonzini * event loop. aio_notify_accept() takes care of synchronizing 5396229438cSPaolo Bonzini * the event loop with the producers. 
5406229438cSPaolo Bonzini */ 541d73415a3SStefan Hajnoczi return qatomic_read(&ctx->notified); 5424a1cba38SStefan Hajnoczi } 5434a1cba38SStefan Hajnoczi 544826cc324SStefan Hajnoczi static void aio_context_notifier_poll_ready(EventNotifier *e) 545826cc324SStefan Hajnoczi { 546826cc324SStefan Hajnoczi /* Do nothing, we just wanted to kick the event loop */ 547826cc324SStefan Hajnoczi } 548826cc324SStefan Hajnoczi 5490c330a73SPaolo Bonzini static void co_schedule_bh_cb(void *opaque) 5500c330a73SPaolo Bonzini { 5510c330a73SPaolo Bonzini AioContext *ctx = opaque; 5520c330a73SPaolo Bonzini QSLIST_HEAD(, Coroutine) straight, reversed; 5530c330a73SPaolo Bonzini 5540c330a73SPaolo Bonzini QSLIST_MOVE_ATOMIC(&reversed, &ctx->scheduled_coroutines); 5550c330a73SPaolo Bonzini QSLIST_INIT(&straight); 5560c330a73SPaolo Bonzini 5570c330a73SPaolo Bonzini while (!QSLIST_EMPTY(&reversed)) { 5580c330a73SPaolo Bonzini Coroutine *co = QSLIST_FIRST(&reversed); 5590c330a73SPaolo Bonzini QSLIST_REMOVE_HEAD(&reversed, co_scheduled_next); 5600c330a73SPaolo Bonzini QSLIST_INSERT_HEAD(&straight, co, co_scheduled_next); 5610c330a73SPaolo Bonzini } 5620c330a73SPaolo Bonzini 5630c330a73SPaolo Bonzini while (!QSLIST_EMPTY(&straight)) { 5640c330a73SPaolo Bonzini Coroutine *co = QSLIST_FIRST(&straight); 5650c330a73SPaolo Bonzini QSLIST_REMOVE_HEAD(&straight, co_scheduled_next); 5660c330a73SPaolo Bonzini trace_aio_co_schedule_bh_cb(ctx, co); 5676133b39fSJeff Cody 5686133b39fSJeff Cody /* Protected by write barrier in qemu_aio_coroutine_enter */ 569d73415a3SStefan Hajnoczi qatomic_set(&co->scheduled, NULL); 5706808ae04SSergio Lopez qemu_aio_coroutine_enter(ctx, co); 5710c330a73SPaolo Bonzini } 5720c330a73SPaolo Bonzini } 5730c330a73SPaolo Bonzini 5742f78e491SChrysostomos Nanakos AioContext *aio_context_new(Error **errp) 575f627aab1SPaolo Bonzini { 5762f78e491SChrysostomos Nanakos int ret; 5772f4dc3c1SPaolo Bonzini AioContext *ctx; 57837fcee5dSFam Zheng 5792f4dc3c1SPaolo Bonzini ctx = (AioContext *) 
g_source_new(&aio_source_funcs, sizeof(AioContext)); 5808c6b0356SStefan Hajnoczi QSLIST_INIT(&ctx->bh_list); 5818c6b0356SStefan Hajnoczi QSIMPLEQ_INIT(&ctx->bh_slice_list); 5827e003465SCao jin aio_context_setup(ctx); 5837e003465SCao jin 5842f78e491SChrysostomos Nanakos ret = event_notifier_init(&ctx->notifier, false); 5852f78e491SChrysostomos Nanakos if (ret < 0) { 5862f78e491SChrysostomos Nanakos error_setg_errno(errp, -ret, "Failed to initialize event notifier"); 58737fcee5dSFam Zheng goto fail; 5882f78e491SChrysostomos Nanakos } 589fcf5def1SPaolo Bonzini g_source_set_can_recurse(&ctx->source, true); 590d7c99a12SPaolo Bonzini qemu_lockcnt_init(&ctx->list_lock); 5910c330a73SPaolo Bonzini 5920c330a73SPaolo Bonzini ctx->co_schedule_bh = aio_bh_new(ctx, co_schedule_bh_cb, ctx); 5930c330a73SPaolo Bonzini QSLIST_INIT(&ctx->scheduled_coroutines); 5940c330a73SPaolo Bonzini 5952f78e491SChrysostomos Nanakos aio_set_event_notifier(ctx, &ctx->notifier, 596601829f8SStefan Hajnoczi aio_context_notifier_cb, 597826cc324SStefan Hajnoczi aio_context_notifier_poll, 598826cc324SStefan Hajnoczi aio_context_notifier_poll_ready); 5990187f5c9SPaolo Bonzini #ifdef CONFIG_LINUX_AIO 6000187f5c9SPaolo Bonzini ctx->linux_aio = NULL; 6010187f5c9SPaolo Bonzini #endif 602fcb7a4a4SAarushi Mehta 603fcb7a4a4SAarushi Mehta #ifdef CONFIG_LINUX_IO_URING 604fcb7a4a4SAarushi Mehta ctx->linux_io_uring = NULL; 605fcb7a4a4SAarushi Mehta #endif 606fcb7a4a4SAarushi Mehta 6079b34277dSStefan Hajnoczi ctx->thread_pool = NULL; 6083fe71223SPaolo Bonzini qemu_rec_mutex_init(&ctx->lock); 609d5541d86SAlex Bligh timerlistgroup_init(&ctx->tlg, aio_timerlist_notify, ctx); 6102f4dc3c1SPaolo Bonzini 61182a41186SStefan Hajnoczi ctx->poll_ns = 0; 6124a1cba38SStefan Hajnoczi ctx->poll_max_ns = 0; 61382a41186SStefan Hajnoczi ctx->poll_grow = 0; 61482a41186SStefan Hajnoczi ctx->poll_shrink = 0; 6154a1cba38SStefan Hajnoczi 6161793ad02SStefano Garzarella ctx->aio_max_batch = 0; 6171793ad02SStefano Garzarella 
61871ad4713SNicolas Saenz Julienne ctx->thread_pool_min = 0; 61971ad4713SNicolas Saenz Julienne ctx->thread_pool_max = THREAD_POOL_MAX_THREADS_DEFAULT; 62071ad4713SNicolas Saenz Julienne 621587d82faSEmanuele Giuseppe Esposito register_aiocontext(ctx); 622587d82faSEmanuele Giuseppe Esposito 6232f4dc3c1SPaolo Bonzini return ctx; 62437fcee5dSFam Zheng fail: 62537fcee5dSFam Zheng g_source_destroy(&ctx->source); 62637fcee5dSFam Zheng return NULL; 627e3713e00SPaolo Bonzini } 628e3713e00SPaolo Bonzini 6290c330a73SPaolo Bonzini void aio_co_schedule(AioContext *ctx, Coroutine *co) 6300c330a73SPaolo Bonzini { 6310c330a73SPaolo Bonzini trace_aio_co_schedule(ctx, co); 632d73415a3SStefan Hajnoczi const char *scheduled = qatomic_cmpxchg(&co->scheduled, NULL, 6336133b39fSJeff Cody __func__); 6346133b39fSJeff Cody 6356133b39fSJeff Cody if (scheduled) { 6366133b39fSJeff Cody fprintf(stderr, 6376133b39fSJeff Cody "%s: Co-routine was already scheduled in '%s'\n", 6386133b39fSJeff Cody __func__, scheduled); 6396133b39fSJeff Cody abort(); 6406133b39fSJeff Cody } 6416133b39fSJeff Cody 642f0f81002SStefan Hajnoczi /* The coroutine might run and release the last ctx reference before we 643f0f81002SStefan Hajnoczi * invoke qemu_bh_schedule(). Take a reference to keep ctx alive until 644f0f81002SStefan Hajnoczi * we're done. 
645f0f81002SStefan Hajnoczi */ 646f0f81002SStefan Hajnoczi aio_context_ref(ctx); 647f0f81002SStefan Hajnoczi 6480c330a73SPaolo Bonzini QSLIST_INSERT_HEAD_ATOMIC(&ctx->scheduled_coroutines, 6490c330a73SPaolo Bonzini co, co_scheduled_next); 6500c330a73SPaolo Bonzini qemu_bh_schedule(ctx->co_schedule_bh); 651f0f81002SStefan Hajnoczi 652f0f81002SStefan Hajnoczi aio_context_unref(ctx); 6530c330a73SPaolo Bonzini } 6540c330a73SPaolo Bonzini 65526b0b698SKevin Wolf typedef struct AioCoRescheduleSelf { 65626b0b698SKevin Wolf Coroutine *co; 65726b0b698SKevin Wolf AioContext *new_ctx; 65826b0b698SKevin Wolf } AioCoRescheduleSelf; 65926b0b698SKevin Wolf 66026b0b698SKevin Wolf static void aio_co_reschedule_self_bh(void *opaque) 66126b0b698SKevin Wolf { 66226b0b698SKevin Wolf AioCoRescheduleSelf *data = opaque; 66326b0b698SKevin Wolf aio_co_schedule(data->new_ctx, data->co); 66426b0b698SKevin Wolf } 66526b0b698SKevin Wolf 66626b0b698SKevin Wolf void coroutine_fn aio_co_reschedule_self(AioContext *new_ctx) 66726b0b698SKevin Wolf { 66826b0b698SKevin Wolf AioContext *old_ctx = qemu_get_current_aio_context(); 66926b0b698SKevin Wolf 67026b0b698SKevin Wolf if (old_ctx != new_ctx) { 67126b0b698SKevin Wolf AioCoRescheduleSelf data = { 67226b0b698SKevin Wolf .co = qemu_coroutine_self(), 67326b0b698SKevin Wolf .new_ctx = new_ctx, 67426b0b698SKevin Wolf }; 67526b0b698SKevin Wolf /* 67626b0b698SKevin Wolf * We can't directly schedule the coroutine in the target context 67726b0b698SKevin Wolf * because this would be racy: The other thread could try to enter the 67826b0b698SKevin Wolf * coroutine before it has yielded in this one. 
67926b0b698SKevin Wolf */ 68026b0b698SKevin Wolf aio_bh_schedule_oneshot(old_ctx, aio_co_reschedule_self_bh, &data); 68126b0b698SKevin Wolf qemu_coroutine_yield(); 68226b0b698SKevin Wolf } 68326b0b698SKevin Wolf } 68426b0b698SKevin Wolf 68543695601SMarkus Armbruster void aio_co_wake(Coroutine *co) 6860c330a73SPaolo Bonzini { 6870c330a73SPaolo Bonzini AioContext *ctx; 6880c330a73SPaolo Bonzini 6890c330a73SPaolo Bonzini /* Read coroutine before co->ctx. Matches smp_wmb in 6900c330a73SPaolo Bonzini * qemu_coroutine_enter. 6910c330a73SPaolo Bonzini */ 6920c330a73SPaolo Bonzini smp_read_barrier_depends(); 693d73415a3SStefan Hajnoczi ctx = qatomic_read(&co->ctx); 6940c330a73SPaolo Bonzini 6958865852eSFam Zheng aio_co_enter(ctx, co); 6968865852eSFam Zheng } 6978865852eSFam Zheng 69843695601SMarkus Armbruster void aio_co_enter(AioContext *ctx, Coroutine *co) 6998865852eSFam Zheng { 7000c330a73SPaolo Bonzini if (ctx != qemu_get_current_aio_context()) { 7010c330a73SPaolo Bonzini aio_co_schedule(ctx, co); 7020c330a73SPaolo Bonzini return; 7030c330a73SPaolo Bonzini } 7040c330a73SPaolo Bonzini 7050c330a73SPaolo Bonzini if (qemu_in_coroutine()) { 7060c330a73SPaolo Bonzini Coroutine *self = qemu_coroutine_self(); 7070c330a73SPaolo Bonzini assert(self != co); 7080c330a73SPaolo Bonzini QSIMPLEQ_INSERT_TAIL(&self->co_queue_wakeup, co, co_queue_next); 7090c330a73SPaolo Bonzini } else { 7108865852eSFam Zheng qemu_aio_coroutine_enter(ctx, co); 7110c330a73SPaolo Bonzini } 7120c330a73SPaolo Bonzini } 7130c330a73SPaolo Bonzini 714e3713e00SPaolo Bonzini void aio_context_ref(AioContext *ctx) 715e3713e00SPaolo Bonzini { 716e3713e00SPaolo Bonzini g_source_ref(&ctx->source); 717e3713e00SPaolo Bonzini } 718e3713e00SPaolo Bonzini 719e3713e00SPaolo Bonzini void aio_context_unref(AioContext *ctx) 720e3713e00SPaolo Bonzini { 721e3713e00SPaolo Bonzini g_source_unref(&ctx->source); 722f627aab1SPaolo Bonzini } 72398563fc3SStefan Hajnoczi 72447b74464SStefan Hajnoczi QEMU_DEFINE_STATIC_CO_TLS(AioContext 
*, my_aiocontext) 7255f50be9bSPaolo Bonzini 7265f50be9bSPaolo Bonzini AioContext *qemu_get_current_aio_context(void) 7275f50be9bSPaolo Bonzini { 72847b74464SStefan Hajnoczi AioContext *ctx = get_my_aiocontext(); 72947b74464SStefan Hajnoczi if (ctx) { 73047b74464SStefan Hajnoczi return ctx; 7315f50be9bSPaolo Bonzini } 732195801d7SStefan Hajnoczi if (bql_locked()) { 7335f50be9bSPaolo Bonzini /* Possibly in a vCPU thread. */ 7345f50be9bSPaolo Bonzini return qemu_get_aio_context(); 7355f50be9bSPaolo Bonzini } 7365f50be9bSPaolo Bonzini return NULL; 7375f50be9bSPaolo Bonzini } 7385f50be9bSPaolo Bonzini 7395f50be9bSPaolo Bonzini void qemu_set_current_aio_context(AioContext *ctx) 7405f50be9bSPaolo Bonzini { 74147b74464SStefan Hajnoczi assert(!get_my_aiocontext()); 74247b74464SStefan Hajnoczi set_my_aiocontext(ctx); 7435f50be9bSPaolo Bonzini } 74471ad4713SNicolas Saenz Julienne 74571ad4713SNicolas Saenz Julienne void aio_context_set_thread_pool_params(AioContext *ctx, int64_t min, 74671ad4713SNicolas Saenz Julienne int64_t max, Error **errp) 74771ad4713SNicolas Saenz Julienne { 74871ad4713SNicolas Saenz Julienne 74971ad4713SNicolas Saenz Julienne if (min > max || !max || min > INT_MAX || max > INT_MAX) { 75071ad4713SNicolas Saenz Julienne error_setg(errp, "bad thread-pool-min/thread-pool-max values"); 75171ad4713SNicolas Saenz Julienne return; 75271ad4713SNicolas Saenz Julienne } 75371ad4713SNicolas Saenz Julienne 75471ad4713SNicolas Saenz Julienne ctx->thread_pool_min = min; 75571ad4713SNicolas Saenz Julienne ctx->thread_pool_max = max; 75671ad4713SNicolas Saenz Julienne 75771ad4713SNicolas Saenz Julienne if (ctx->thread_pool) { 75871ad4713SNicolas Saenz Julienne thread_pool_update_params(ctx->thread_pool, ctx); 75971ad4713SNicolas Saenz Julienne } 76071ad4713SNicolas Saenz Julienne } 761