qemu/util/aio-posix.c
/*
 * QEMU aio implementation
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 * Contributions after 2012-01-13 are licensed under the terms of the
 * GNU GPL, version 2 or (at your option) any later version.
 */

#include "qemu/osdep.h"
#include "block/block.h"
#include "block/thread-pool.h"
#include "qemu/main-loop.h"
#include "qemu/rcu.h"
#include "qemu/rcu_queue.h"
#include "qemu/sockets.h"
#include "qemu/cutils.h"
#include "trace.h"
#include "aio-posix.h"

/* Stop userspace polling on a handler if it isn't active for some time */
#define POLL_IDLE_INTERVAL_NS (7 * NANOSECONDS_PER_SECOND)
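
/*
 * aio_poll_disabled() serves as the ->need_wait() callback for the fdmon-poll
 * implementation.  A non-zero poll_disable_cnt means at least one handler was
 * registered without an io_poll() callback, so userspace polling alone cannot
 * detect all events.
 */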
bool aio_poll_disabled(AioContext *ctx)
{
    return qatomic_read(&ctx->poll_disable_cnt);
}
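
/*
 * Place @node on @ready_list with the given @revents so that it is dispatched
 * by aio_dispatch_ready_handlers().
 */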
void aio_add_ready_handler(AioHandlerList *ready_list,
                           AioHandler *node,
                           int revents)
{
    QLIST_SAFE_REMOVE(node, node_ready); /* remove from nested parent's list */
    node->pfd.revents = revents;
    QLIST_INSERT_HEAD(ready_list, node, node_ready);
}
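
/*
 * Like aio_add_ready_handler(), but mark the node ready because io_poll()
 * succeeded so that dispatch invokes its io_poll_ready() callback.
 */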
static void aio_add_poll_ready_handler(AioHandlerList *ready_list,
                                       AioHandler *node)
{
    QLIST_SAFE_REMOVE(node, node_ready); /* remove from nested parent's list */
    node->poll_ready = true;
    QLIST_INSERT_HEAD(ready_list, node, node_ready);
}
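
/* Find the handler for @fd, skipping nodes already marked for deletion */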
static AioHandler *find_aio_handler(AioContext *ctx, int fd)
{
    AioHandler *node;

    QLIST_FOREACH(node, &ctx->aio_handlers, node) {
        if (node->pfd.fd == fd) {
            if (!QLIST_IS_INSERTED(node, node_deleted)) {
                return node;
            }
        }
    }

    return NULL;
}
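
/*
 * Remove @node from the GSource and the handler lists.  Returns true if the
 * caller may free the node, false if freeing was deferred because the handler
 * list is currently being walked.
 */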
static bool aio_remove_fd_handler(AioContext *ctx, AioHandler *node)
{
    /* If the GSource is in the process of being destroyed then
     * g_source_remove_poll() causes an assertion failure.  Skip
     * removal in that case, because glib cleans up its state during
     * destruction anyway.
     */
    if (!g_source_is_destroyed(&ctx->source)) {
        g_source_remove_poll(&ctx->source, &node->pfd);
    }

    node->pfd.revents = 0;
    node->poll_ready = false;

    /* If the fd monitor has already marked it deleted, leave it alone */
    if (QLIST_IS_INSERTED(node, node_deleted)) {
        return false;
    }

    /* If a read is in progress, just mark the node as deleted */
    if (qemu_lockcnt_count(&ctx->list_lock)) {
        QLIST_INSERT_HEAD_RCU(&ctx->deleted_aio_handlers, node, node_deleted);
        return false;
    }
    /* Otherwise, delete it for real.  We can't just mark it as
     * deleted because deleted nodes are only cleaned up while
     * no one is walking the handlers list.
     */
    QLIST_SAFE_REMOVE(node, node_poll);
    QLIST_REMOVE(node, node);
    return true;
}
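
/*
 * Register, update or remove the handlers for @fd.  Passing NULL for io_read,
 * io_write and io_poll unregisters the fd.  Existing registrations are never
 * modified in place: a new node is inserted and the old one removed, so
 * concurrent list walkers always see a consistent handler.
 */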
void aio_set_fd_handler(AioContext *ctx,
                        int fd,
                        bool is_external,
                        IOHandler *io_read,
                        IOHandler *io_write,
                        AioPollFn *io_poll,
                        IOHandler *io_poll_ready,
                        void *opaque)
{
    AioHandler *node;
    AioHandler *new_node = NULL;
    bool is_new = false;
    bool deleted = false;
    int poll_disable_change;

    if (io_poll && !io_poll_ready) {
        io_poll = NULL; /* polling only makes sense if there is a handler */
    }

    qemu_lockcnt_lock(&ctx->list_lock);

    node = find_aio_handler(ctx, fd);

    /* Are we deleting the fd handler? */
    if (!io_read && !io_write && !io_poll) {
        if (node == NULL) {
            qemu_lockcnt_unlock(&ctx->list_lock);
            return;
        }
        /* Clean events in order to unregister fd from the ctx epoll. */
        node->pfd.events = 0;

        poll_disable_change = -!node->io_poll;
    } else {
        poll_disable_change = !io_poll - (node && !node->io_poll);
        if (node == NULL) {
            is_new = true;
        }
        /* Alloc and insert if it's not already there */
        new_node = g_new0(AioHandler, 1);

        /* Update handler with latest information */
        new_node->io_read = io_read;
        new_node->io_write = io_write;
        new_node->io_poll = io_poll;
        new_node->io_poll_ready = io_poll_ready;
        new_node->opaque = opaque;
        new_node->is_external = is_external;

        if (is_new) {
            new_node->pfd.fd = fd;
        } else {
            new_node->pfd = node->pfd;
        }
        g_source_add_poll(&ctx->source, &new_node->pfd);

        new_node->pfd.events = (io_read ? G_IO_IN | G_IO_HUP | G_IO_ERR : 0);
        new_node->pfd.events |= (io_write ? G_IO_OUT | G_IO_ERR : 0);

        QLIST_INSERT_HEAD_RCU(&ctx->aio_handlers, new_node, node);
    }

    /* No need to order poll_disable_cnt writes against other updates;
     * the counter is only used to avoid wasting time and latency on
     * iterated polling when the system call will be ultimately necessary.
     * Changing handlers is a rare event, and a little wasted polling until
     * the aio_notify below is not an issue.
     */
    qatomic_set(&ctx->poll_disable_cnt,
               qatomic_read(&ctx->poll_disable_cnt) + poll_disable_change);

    ctx->fdmon_ops->update(ctx, node, new_node);
    if (node) {
        deleted = aio_remove_fd_handler(ctx, node);
    }
    qemu_lockcnt_unlock(&ctx->list_lock);
    aio_notify(ctx);

    if (deleted) {
        g_free(node);
    }
}

void aio_set_fd_poll(AioContext *ctx, int fd,
                     IOHandler *io_poll_begin,
                     IOHandler *io_poll_end)
{
    AioHandler *node = find_aio_handler(ctx, fd);

    if (!node) {
        return;
    }

    node->io_poll_begin = io_poll_begin;
    node->io_poll_end = io_poll_end;
}

void aio_set_event_notifier(AioContext *ctx,
                            EventNotifier *notifier,
                            bool is_external,
                            EventNotifierHandler *io_read,
                            AioPollFn *io_poll,
                            EventNotifierHandler *io_poll_ready)
{
    aio_set_fd_handler(ctx, event_notifier_get_fd(notifier), is_external,
                       (IOHandler *)io_read, NULL, io_poll,
                       (IOHandler *)io_poll_ready, notifier);
}

void aio_set_event_notifier_poll(AioContext *ctx,
                                 EventNotifier *notifier,
                                 EventNotifierHandler *io_poll_begin,
                                 EventNotifierHandler *io_poll_end)
{
    aio_set_fd_poll(ctx, event_notifier_get_fd(notifier),
                    (IOHandler *)io_poll_begin,
                    (IOHandler *)io_poll_end);
}
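
/*
 * Enter or leave poll mode by calling io_poll_begin()/io_poll_end() on every
 * polling handler.  When leaving poll mode, handlers are polled one final time
 * in case io_poll_end() raced with an event; returns true if that check made
 * progress.
 */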
static bool poll_set_started(AioContext *ctx, AioHandlerList *ready_list,
                             bool started)
{
    AioHandler *node;
    bool progress = false;

    if (started == ctx->poll_started) {
        return false;
    }

    ctx->poll_started = started;

    qemu_lockcnt_inc(&ctx->list_lock);
    QLIST_FOREACH(node, &ctx->poll_aio_handlers, node_poll) {
        IOHandler *fn;

        if (QLIST_IS_INSERTED(node, node_deleted)) {
            continue;
        }

        if (started) {
            fn = node->io_poll_begin;
        } else {
            fn = node->io_poll_end;
        }

        if (fn) {
            fn(node->opaque);
        }

        /* Poll one last time in case ->io_poll_end() raced with the event */
        if (!started && node->io_poll(node->opaque)) {
            aio_add_poll_ready_handler(ready_list, node);
            progress = true;
        }
    }
    qemu_lockcnt_dec(&ctx->list_lock);

    return progress;
}


bool aio_prepare(AioContext *ctx)
{
    AioHandlerList ready_list = QLIST_HEAD_INITIALIZER(ready_list);

    /* Poll mode cannot be used with glib's event loop, disable it. */
    poll_set_started(ctx, &ready_list, false);
    /* TODO what to do with this list? */

    return false;
}

bool aio_pending(AioContext *ctx)
{
    AioHandler *node;
    bool result = false;

    /*
     * We have to walk very carefully in case aio_set_fd_handler is
     * called while we're walking.
     */
    qemu_lockcnt_inc(&ctx->list_lock);

    QLIST_FOREACH_RCU(node, &ctx->aio_handlers, node) {
        int revents;

        /* TODO should this check poll ready? */
        revents = node->pfd.revents & node->pfd.events;
        if (revents & (G_IO_IN | G_IO_HUP | G_IO_ERR) && node->io_read &&
            aio_node_check(ctx, node->is_external)) {
            result = true;
            break;
        }
        if (revents & (G_IO_OUT | G_IO_ERR) && node->io_write &&
            aio_node_check(ctx, node->is_external)) {
            result = true;
            break;
        }
    }
    qemu_lockcnt_dec(&ctx->list_lock);

    return result;
}

static void aio_free_deleted_handlers(AioContext *ctx)
{
    AioHandler *node;

    if (QLIST_EMPTY_RCU(&ctx->deleted_aio_handlers)) {
        return;
    }
    if (!qemu_lockcnt_dec_if_lock(&ctx->list_lock)) {
        return; /* we are nested, let the parent do the freeing */
    }

    while ((node = QLIST_FIRST_RCU(&ctx->deleted_aio_handlers))) {
        QLIST_REMOVE(node, node);
        QLIST_REMOVE(node, node_deleted);
        QLIST_SAFE_REMOVE(node, node_poll);
        g_free(node);
    }

    qemu_lockcnt_inc_and_unlock(&ctx->list_lock);
}
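
/*
 * Run the callbacks of a single handler based on its revents and poll_ready
 * state.  Returns true if progress was made; events on the internal
 * ctx->notifier do not count as progress.
 */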
static bool aio_dispatch_handler(AioContext *ctx, AioHandler *node)
{
    bool progress = false;
    bool poll_ready;
    int revents;

    revents = node->pfd.revents & node->pfd.events;
    node->pfd.revents = 0;

    poll_ready = node->poll_ready;
    node->poll_ready = false;

    /*
     * Start polling AioHandlers when they become ready because activity is
     * likely to continue.  Note that starvation is theoretically possible when
     * fdmon_supports_polling(), but only until the fd fires for the first
     * time.
     */
    if (!QLIST_IS_INSERTED(node, node_deleted) &&
        !QLIST_IS_INSERTED(node, node_poll) &&
        node->io_poll) {
        trace_poll_add(ctx, node, node->pfd.fd, revents);
        if (ctx->poll_started && node->io_poll_begin) {
            node->io_poll_begin(node->opaque);
        }
        QLIST_INSERT_HEAD(&ctx->poll_aio_handlers, node, node_poll);
    }
    if (!QLIST_IS_INSERTED(node, node_deleted) &&
        poll_ready && revents == 0 &&
        aio_node_check(ctx, node->is_external) &&
        node->io_poll_ready) {
        node->io_poll_ready(node->opaque);

        /*
         * Return early since revents was zero. aio_notify() does not count as
         * progress.
         */
        return node->opaque != &ctx->notifier;
    }

    if (!QLIST_IS_INSERTED(node, node_deleted) &&
        (revents & (G_IO_IN | G_IO_HUP | G_IO_ERR)) &&
        aio_node_check(ctx, node->is_external) &&
        node->io_read) {
        node->io_read(node->opaque);

        /* aio_notify() does not count as progress */
        if (node->opaque != &ctx->notifier) {
            progress = true;
        }
    }
    if (!QLIST_IS_INSERTED(node, node_deleted) &&
        (revents & (G_IO_OUT | G_IO_ERR)) &&
        aio_node_check(ctx, node->is_external) &&
        node->io_write) {
        node->io_write(node->opaque);
        progress = true;
    }

    return progress;
}

/*
 * If we have a list of ready handlers then this is more efficient than
 * scanning all handlers with aio_dispatch_handlers().
 */
static bool aio_dispatch_ready_handlers(AioContext *ctx,
                                        AioHandlerList *ready_list)
{
    bool progress = false;
    AioHandler *node;

    while ((node = QLIST_FIRST(ready_list))) {
        QLIST_REMOVE(node, node_ready);
        progress = aio_dispatch_handler(ctx, node) || progress;
    }

    return progress;
}

/* Slower than aio_dispatch_ready_handlers() but only used via glib */
static bool aio_dispatch_handlers(AioContext *ctx)
{
    AioHandler *node, *tmp;
    bool progress = false;

    QLIST_FOREACH_SAFE_RCU(node, &ctx->aio_handlers, node, tmp) {
        progress = aio_dispatch_handler(ctx, node) || progress;
    }

    return progress;
}

void aio_dispatch(AioContext *ctx)
{
    qemu_lockcnt_inc(&ctx->list_lock);
    aio_bh_poll(ctx);
    aio_dispatch_handlers(ctx);
    aio_free_deleted_handlers(ctx);
    qemu_lockcnt_dec(&ctx->list_lock);

    timerlistgroup_run_timers(&ctx->tlg);
}
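
/*
 * Call io_poll() once on every polling handler.  Handlers that report
 * readiness are moved to @ready_list and *timeout is cleared so the caller
 * will not block.  Returns true if progress was made.
 */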
static bool run_poll_handlers_once(AioContext *ctx,
                                   AioHandlerList *ready_list,
                                   int64_t now,
                                   int64_t *timeout)
{
    bool progress = false;
    AioHandler *node;
    AioHandler *tmp;

    QLIST_FOREACH_SAFE(node, &ctx->poll_aio_handlers, node_poll, tmp) {
        if (aio_node_check(ctx, node->is_external) &&
            node->io_poll(node->opaque)) {
            aio_add_poll_ready_handler(ready_list, node);

            node->poll_idle_timeout = now + POLL_IDLE_INTERVAL_NS;

            /*
             * Polling was successful, exit try_poll_mode immediately
             * to adjust the next polling time.
             */
            *timeout = 0;
            if (node->opaque != &ctx->notifier) {
                progress = true;
            }
        }

        /* Caller handles freeing deleted nodes.  Don't do it here. */
    }

    return progress;
}
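
/*
 * fdmon-poll is the only fd monitoring implementation whose ->need_wait()
 * callback is aio_poll_disabled(), so this effectively checks whether a
 * backend that keeps monitoring fds in the kernel (epoll or io_uring) is in
 * use.
 */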
static bool fdmon_supports_polling(AioContext *ctx)
{
    return ctx->fdmon_ops->need_wait != aio_poll_disabled;
}
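
/*
 * Stop userspace polling on handlers whose io_poll() has not succeeded for
 * POLL_IDLE_INTERVAL_NS.  Returns true if a final io_poll() call made progress
 * while poll mode was being torn down for a handler.
 */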
static bool remove_idle_poll_handlers(AioContext *ctx,
                                      AioHandlerList *ready_list,
                                      int64_t now)
{
    AioHandler *node;
    AioHandler *tmp;
    bool progress = false;

    /*
     * File descriptor monitoring implementations without userspace polling
     * support suffer from starvation when a subset of handlers is polled
     * because fds will not be processed in a timely fashion.  Don't remove
     * idle poll handlers.
     */
    if (!fdmon_supports_polling(ctx)) {
        return false;
    }

    QLIST_FOREACH_SAFE(node, &ctx->poll_aio_handlers, node_poll, tmp) {
        if (node->poll_idle_timeout == 0LL) {
            node->poll_idle_timeout = now + POLL_IDLE_INTERVAL_NS;
        } else if (now >= node->poll_idle_timeout) {
            trace_poll_remove(ctx, node, node->pfd.fd);
            node->poll_idle_timeout = 0LL;
            QLIST_SAFE_REMOVE(node, node_poll);
            if (ctx->poll_started && node->io_poll_end) {
                node->io_poll_end(node->opaque);

                /*
                 * Final poll in case ->io_poll_end() races with an event.
                 * Nevermind about re-adding the handler in the rare case where
                 * this causes progress.
                 */
                if (node->io_poll(node->opaque)) {
                    aio_add_poll_ready_handler(ready_list, node);
                    progress = true;
                }
            }
        }
    }

    return progress;
}

/* run_poll_handlers:
 * @ctx: the AioContext
 * @ready_list: the list to place ready handlers on
 * @max_ns: maximum time to poll for, in nanoseconds
 *
 * Polls for a given time.
 *
 * Note that the caller must have incremented ctx->list_lock.
 *
 * Returns: true if progress was made, false otherwise
 */
static bool run_poll_handlers(AioContext *ctx, AioHandlerList *ready_list,
                              int64_t max_ns, int64_t *timeout)
{
    bool progress;
    int64_t start_time, elapsed_time;

    assert(qemu_lockcnt_count(&ctx->list_lock) > 0);

    trace_run_poll_handlers_begin(ctx, max_ns, *timeout);

    /*
     * Optimization: ->io_poll() handlers often contain RCU read critical
     * sections and we therefore see many rcu_read_lock() -> rcu_read_unlock()
     * -> rcu_read_lock() -> ... sequences with expensive memory
     * synchronization primitives.  Make the entire polling loop an RCU
     * critical section because nested rcu_read_lock()/rcu_read_unlock() calls
     * are cheap.
     */
    RCU_READ_LOCK_GUARD();

    start_time = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
    do {
        progress = run_poll_handlers_once(ctx, ready_list,
                                          start_time, timeout);
        elapsed_time = qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - start_time;
        max_ns = qemu_soonest_timeout(*timeout, max_ns);
        assert(!(max_ns && progress));
    } while (elapsed_time < max_ns && !ctx->fdmon_ops->need_wait(ctx));

    if (remove_idle_poll_handlers(ctx, ready_list,
                                  start_time + elapsed_time)) {
        *timeout = 0;
        progress = true;
    }

    /* If time has passed with no successful polling, adjust *timeout to
     * keep the same ending time.
     */
    if (*timeout != -1) {
        *timeout -= MIN(*timeout, elapsed_time);
    }

    trace_run_poll_handlers_end(ctx, progress, *timeout);
    return progress;
}

/* try_poll_mode:
 * @ctx: the AioContext
 * @ready_list: list to add handlers that need to be run
 * @timeout: timeout for blocking wait, computed by the caller and updated if
 *    polling succeeds.
 *
 * Note that the caller must have incremented ctx->list_lock.
 *
 * Returns: true if progress was made, false otherwise
 */
static bool try_poll_mode(AioContext *ctx, AioHandlerList *ready_list,
                          int64_t *timeout)
{
    int64_t max_ns;

    if (QLIST_EMPTY_RCU(&ctx->poll_aio_handlers)) {
        return false;
    }

    max_ns = qemu_soonest_timeout(*timeout, ctx->poll_ns);
    if (max_ns && !ctx->fdmon_ops->need_wait(ctx)) {
        poll_set_started(ctx, ready_list, true);

        if (run_poll_handlers(ctx, ready_list, max_ns, timeout)) {
            return true;
        }
    }

    if (poll_set_started(ctx, ready_list, false)) {
        *timeout = 0;
        return true;
    }

    return false;
}
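
/*
 * Run one iteration of the event loop for @ctx: try userspace polling, wait
 * for fd events (without blocking when @blocking is false), then dispatch
 * ready handlers, bottom halves and timers.  Returns true if progress was
 * made.
 */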
bool aio_poll(AioContext *ctx, bool blocking)
{
    AioHandlerList ready_list = QLIST_HEAD_INITIALIZER(ready_list);
    bool progress;
    bool use_notify_me;
    int64_t timeout;
    int64_t start = 0;

    /*
     * There cannot be two concurrent aio_poll calls for the same AioContext (or
     * an aio_poll concurrent with a GSource prepare/check/dispatch callback).
     * We rely on this below to avoid slow locked accesses to ctx->notify_me.
     *
     * aio_poll() may only be called in the AioContext's thread. iohandler_ctx
     * is special in that it runs in the main thread, but that thread's context
     * is qemu_aio_context.
     */
    assert(in_aio_context_home_thread(ctx == iohandler_get_aio_context() ?
                                      qemu_get_aio_context() : ctx));

    qemu_lockcnt_inc(&ctx->list_lock);

    if (ctx->poll_max_ns) {
        start = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
    }

    timeout = blocking ? aio_compute_timeout(ctx) : 0;
    progress = try_poll_mode(ctx, &ready_list, &timeout);
    assert(!(timeout && progress));

    /*
     * aio_notify can avoid the expensive event_notifier_set if
     * everything (file descriptors, bottom halves, timers) will
     * be re-evaluated before the next blocking poll().  This is
     * already true when aio_poll is called with blocking == false;
     * if blocking == true, it is only true after poll() returns,
     * so disable the optimization now.
     */
    use_notify_me = timeout != 0;
    if (use_notify_me) {
        qatomic_set(&ctx->notify_me, qatomic_read(&ctx->notify_me) + 2);
        /*
         * Write ctx->notify_me before reading ctx->notified.  Pairs with
         * smp_mb in aio_notify().
         */
        smp_mb();

        /* Don't block if aio_notify() was called */
        if (qatomic_read(&ctx->notified)) {
            timeout = 0;
        }
    }

    /* If polling is allowed, non-blocking aio_poll does not need the
     * system call---a single round of run_poll_handlers_once suffices.
     */
    if (timeout || ctx->fdmon_ops->need_wait(ctx)) {
        ctx->fdmon_ops->wait(ctx, &ready_list, timeout);
    }

    if (use_notify_me) {
        /* Finish the poll before clearing the flag.  */
        qatomic_store_release(&ctx->notify_me,
                             qatomic_read(&ctx->notify_me) - 2);
    }

    aio_notify_accept(ctx);

    /* Adjust polling time */
    if (ctx->poll_max_ns) {
        int64_t block_ns = qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - start;

        if (block_ns <= ctx->poll_ns) {
            /* This is the sweet spot, no adjustment needed */
        } else if (block_ns > ctx->poll_max_ns) {
            /* We'd have to poll for too long, poll less */
            int64_t old = ctx->poll_ns;

            if (ctx->poll_shrink) {
                ctx->poll_ns /= ctx->poll_shrink;
            } else {
                ctx->poll_ns = 0;
            }

            trace_poll_shrink(ctx, old, ctx->poll_ns);
        } else if (ctx->poll_ns < ctx->poll_max_ns &&
                   block_ns < ctx->poll_max_ns) {
            /* There is room to grow, poll longer */
            int64_t old = ctx->poll_ns;
            int64_t grow = ctx->poll_grow;

            if (grow == 0) {
                grow = 2;
            }

            if (ctx->poll_ns) {
                ctx->poll_ns *= grow;
            } else {
                ctx->poll_ns = 4000; /* start polling at 4 microseconds */
            }

            if (ctx->poll_ns > ctx->poll_max_ns) {
                ctx->poll_ns = ctx->poll_max_ns;
            }

            trace_poll_grow(ctx, old, ctx->poll_ns);
        }
    }

    progress |= aio_bh_poll(ctx);
    progress |= aio_dispatch_ready_handlers(ctx, &ready_list);

    aio_free_deleted_handlers(ctx);

    qemu_lockcnt_dec(&ctx->list_lock);

    progress |= timerlistgroup_run_timers(&ctx->tlg);

    return progress;
}
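
/*
 * Choose the fd monitoring backend when the AioContext is created: poll() is
 * the fallback, with io_uring preferred over epoll when available.
 */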
void aio_context_setup(AioContext *ctx)
{
    ctx->fdmon_ops = &fdmon_poll_ops;
    ctx->epollfd = -1;

    /* Use the fastest fd monitoring implementation if available */
    if (fdmon_io_uring_setup(ctx)) {
        return;
    }

    fdmon_epoll_setup(ctx);
}

void aio_context_destroy(AioContext *ctx)
{
    fdmon_io_uring_destroy(ctx);
    fdmon_epoll_disable(ctx);
    aio_free_deleted_handlers(ctx);
}

void aio_context_use_g_source(AioContext *ctx)
{
    /*
     * Disable io_uring when the glib main loop is used because it doesn't
     * support mixed glib/aio_poll() usage. It relies on aio_poll() being
     * called regularly so that changes to the monitored file descriptors are
     * submitted, otherwise a list of pending fd handlers builds up.
     */
    fdmon_io_uring_destroy(ctx);
    aio_free_deleted_handlers(ctx);
}

void aio_context_set_poll_params(AioContext *ctx, int64_t max_ns,
                                 int64_t grow, int64_t shrink, Error **errp)
{
    /* No thread synchronization here, it doesn't matter if an incorrect value
     * is used once.
     */
    ctx->poll_max_ns = max_ns;
    ctx->poll_ns = 0;
    ctx->poll_grow = grow;
    ctx->poll_shrink = shrink;

    aio_notify(ctx);
}

void aio_context_set_aio_params(AioContext *ctx, int64_t max_batch,
                                Error **errp)
{
    /*
     * No thread synchronization here, it doesn't matter if an incorrect value
     * is used once.
     */
    ctx->aio_max_batch = max_batch;

    aio_notify(ctx);
}