On Fri, 01/13 14:17, Paolo Bonzini wrote:
> aio_co_wake provides the infrastructure to start a coroutine on a "home"
> AioContext.  It will be used by CoMutex and CoQueue, so that coroutines
> don't jump from one context to another when they go to sleep on a
> mutex or waitqueue.  However, it can also be used as a more efficient
> alternative to one-shot bottom halves, and saves the effort of tracking
> which AioContext a coroutine is running on.
> 
> aio_co_schedule is the part of aio_co_wake that starts a coroutine
> on a remove AioContext, but it is also useful to implement e.g.

s/remove/remote/ and maybe s/but/and/ ?

> bdrv_set_aio_context callbacks.
> 
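
Just to check my reading of the intended usage: today one bounces a
coroutine to another AioContext with a one-shot BH whose callback
re-enters it, and with this patch the same thing becomes a single call.
A rough sketch, with made-up helper names (not code from this patch):

#include "qemu/osdep.h"
#include "block/aio.h"
#include "qemu/coroutine.h"

/* Before: re-enter a coroutine in another AioContext via a one-shot BH.
 * Helper names here are made up for illustration. */
static void enter_co_bh(void *opaque)
{
    Coroutine *co = opaque;

    qemu_coroutine_enter(co);
}

static void move_co_with_bh(AioContext *target, Coroutine *co)
{
    aio_bh_schedule_oneshot(target, enter_co_bh, co);
}

/* With this patch, as I read it, the same thing is simply: */
static void move_co_with_schedule(AioContext *target, Coroutine *co)
{
    aio_co_schedule(target, co);
}
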
> The implementation of aio_co_schedule is based on a lock-free
> multiple-producer, single-consumer queue.  The multiple producers use
> cmpxchg to add to a LIFO stack.  The consumer (a per-AioContext bottom
> half) grabs all items added so far, inverts the list to make it FIFO,
> and goes through it one item at a time until it's empty.  The data
> structure was inspired by OSv, which uses it in the very code we'll
> "port" to QEMU for the thread-safe CoMutex.
> 
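
For readers who haven't seen the pattern before, my understanding of the
scheme is roughly the following (a simplified sketch with a generic node
type and QEMU's atomic helpers; the actual patch uses the QSLIST macros
and Coroutine instead):

#include "qemu/osdep.h"
#include "qemu/atomic.h"

typedef struct Node {
    struct Node *next;
} Node;

typedef struct MPSCQueue {
    Node *head;                 /* LIFO stack of pending items */
} MPSCQueue;

/* Producers (any thread): push onto the stack with cmpxchg, retrying
 * if another producer got in between. */
static void mpsc_push(MPSCQueue *q, Node *n)
{
    Node *old;

    do {
        old = atomic_read(&q->head);
        n->next = old;
    } while (atomic_cmpxchg(&q->head, old, n) != old);
}

/* Consumer (the per-AioContext bottom half): grab the whole stack at
 * once, then reverse it so items come out in FIFO order. */
static Node *mpsc_pop_all_fifo(MPSCQueue *q)
{
    Node *reversed = atomic_xchg(&q->head, NULL);
    Node *fifo = NULL;

    while (reversed) {
        Node *n = reversed;
        reversed = n->next;
        n->next = fifo;
        fifo = n;
    }
    return fifo;
}
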
> Most of the new code is really tests.
> 
> Signed-off-by: Paolo Bonzini <pbonz...@redhat.com>
> ---
>  async.c                      |  65 +++++++++++++
>  include/block/aio.h          |  32 +++++++
>  include/qemu/coroutine_int.h |  10 +-
>  tests/Makefile.include       |  13 ++-
>  tests/iothread.c             |  91 ++++++++++++++++++
>  tests/iothread.h             |  25 +++++
>  tests/test-aio-multithread.c | 213 +++++++++++++++++++++++++++++++++++++++++++
>  tests/test-vmstate.c         |  11 ---
>  trace-events                 |   4 +
>  util/qemu-coroutine.c        |   8 ++
>  10 files changed, 456 insertions(+), 16 deletions(-)
>  create mode 100644 tests/iothread.c
>  create mode 100644 tests/iothread.h
>  create mode 100644 tests/test-aio-multithread.c
> 
> diff --git a/async.c b/async.c
> index 0d218ab..1338682 100644
> --- a/async.c
> +++ b/async.c
> @@ -30,6 +30,8 @@
>  #include "qemu/main-loop.h"
>  #include "qemu/atomic.h"
>  #include "block/raw-aio.h"
> +#include "trace/generated-tracers.h"
> +#include "qemu/coroutine_int.h"
>  
>  /***********************************************************/
>  /* bottom halves (can be seen as timers which expire ASAP) */
> @@ -274,6 +276,9 @@ aio_ctx_finalize(GSource     *source)
>      }
>  #endif
>  
> +    assert(QSLIST_EMPTY(&ctx->scheduled_coroutines));
> +    qemu_bh_delete(ctx->co_schedule_bh);
> +
>      qemu_lockcnt_lock(&ctx->list_lock);
>      assert(!qemu_lockcnt_count(&ctx->list_lock));
>      while (ctx->first_bh) {
> @@ -363,6 +368,28 @@ static bool event_notifier_poll(void *opaque)
>      return atomic_read(&ctx->notified);
>  }
>  
> +static void co_schedule_bh_cb(void *opaque)
> +{
> +    AioContext *ctx = opaque;
> +    QSLIST_HEAD(, Coroutine) straight, reversed;
> +
> +    QSLIST_MOVE_ATOMIC(&reversed, &ctx->scheduled_coroutines);
> +    QSLIST_INIT(&straight);

Worth special-casing the 1-element case?

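Something like the following right after the QSLIST_MOVE_ATOMIC, I mean
(untested, and I haven't measured whether it actually buys anything):

    /* Untested sketch: if exactly one coroutine was queued, enter it
     * directly and skip the reversal loop. */
    if (!QSLIST_EMPTY(&reversed) &&
        !QSLIST_NEXT(QSLIST_FIRST(&reversed), co_scheduled_next)) {
        Coroutine *co = QSLIST_FIRST(&reversed);

        QSLIST_REMOVE_HEAD(&reversed, co_scheduled_next);
        trace_aio_co_schedule_bh_cb(ctx, co);
        qemu_coroutine_enter(co);
        return;
    }
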
> +
> +    while (!QSLIST_EMPTY(&reversed)) {
> +        Coroutine *co = QSLIST_FIRST(&reversed);
> +        QSLIST_REMOVE_HEAD(&reversed, co_scheduled_next);
> +        QSLIST_INSERT_HEAD(&straight, co, co_scheduled_next);
> +    }
> +
> +    while (!QSLIST_EMPTY(&straight)) {
> +        Coroutine *co = QSLIST_FIRST(&straight);
> +        QSLIST_REMOVE_HEAD(&straight, co_scheduled_next);
> +        trace_aio_co_schedule_bh_cb(ctx, co);
> +        qemu_coroutine_enter(co);
> +    }
> +}
> +
> diff --git a/tests/iothread.c b/tests/iothread.c
> new file mode 100644
> index 0000000..777d9ee
> --- /dev/null
> +++ b/tests/iothread.c
> @@ -0,0 +1,91 @@
> +/*
> + * Event loop thread implementation for unit tests

Curious: what is preventing us from (perhaps enhancing and then) using the
top-level iothread.c implementation?

> + *
> + * Copyright Red Hat Inc., 2013, 2016
> + *
> + * Authors:
> + *  Stefan Hajnoczi   <stefa...@redhat.com>
> + *  Paolo Bonzini     <pbonz...@redhat.com>
> + *
> + * This work is licensed under the terms of the GNU GPL, version 2 or later.
> + * See the COPYING file in the top-level directory.
> + *
> + */
> +
> +#include "qemu/osdep.h"
> +#include "qapi/error.h"
> +#include "block/aio.h"
> +#include "qemu/main-loop.h"
> +#include "qemu/rcu.h"
> +#include "iothread.h"
> +
> +struct IOThread {
> +    AioContext *ctx;
> +
> +    QemuThread thread;
> +    QemuMutex init_done_lock;
> +    QemuCond init_done_cond;    /* is thread initialization done? */
> +    bool stopping;
> +};
> +
> +static __thread IOThread *my_iothread;
> +
> +AioContext *qemu_get_current_aio_context(void)
> +{
> +    return my_iothread ? my_iothread->ctx : qemu_get_aio_context();
> +}
> +
> +static void *iothread_run(void *opaque)
> +{
> +    IOThread *iothread = opaque;
> +
> +    rcu_register_thread();
> +
> +    my_iothread = iothread;
> +    qemu_mutex_lock(&iothread->init_done_lock);
> +    iothread->ctx = aio_context_new(&error_abort);
> +    qemu_cond_signal(&iothread->init_done_cond);
> +    qemu_mutex_unlock(&iothread->init_done_lock);
> +
> +    while (!atomic_read(&iothread->stopping)) {
> +        aio_poll(iothread->ctx, true);
> +    }
> +
> +    rcu_unregister_thread();
> +    return NULL;
> +}
> +
> +void iothread_join(IOThread *iothread)
> +{
> +    iothread->stopping = true;
> +    aio_notify(iothread->ctx);
> +    qemu_thread_join(&iothread->thread);
> +    qemu_cond_destroy(&iothread->init_done_cond);
> +    qemu_mutex_destroy(&iothread->init_done_lock);
> +    aio_context_unref(iothread->ctx);
> +    g_free(iothread);
> +}
> +
> +IOThread *iothread_new(void)
> +{
> +    IOThread *iothread = g_new0(IOThread, 1);
> +
> +    qemu_mutex_init(&iothread->init_done_lock);
> +    qemu_cond_init(&iothread->init_done_cond);
> +    qemu_thread_create(&iothread->thread, NULL, iothread_run,
> +                       iothread, QEMU_THREAD_JOINABLE);
> +
> +    /* Wait for initialization to complete */
> +    qemu_mutex_lock(&iothread->init_done_lock);
> +    while (iothread->ctx == NULL) {
> +        qemu_cond_wait(&iothread->init_done_cond,
> +                       &iothread->init_done_lock);
> +    }
> +    qemu_mutex_unlock(&iothread->init_done_lock);
> +    return iothread;
> +}
> +
> +AioContext *iothread_get_aio_context(IOThread *iothread)
> +{
> +    return iothread->ctx;
> +}
> diff --git a/tests/test-aio-multithread.c b/tests/test-aio-multithread.c
> new file mode 100644
> index 0000000..17e81f9
> --- /dev/null
> +++ b/tests/test-aio-multithread.c
> @@ -0,0 +1,213 @@
> +/*
> + * AioContext multithreading tests
> + *
> + * Copyright Red Hat, Inc. 2016
> + *
> + * Authors:
> + *  Paolo Bonzini    <pbonz...@redhat.com>
> + *
> + * This work is licensed under the terms of the GNU LGPL, version 2 or later.
> + * See the COPYING.LIB file in the top-level directory.
> + */
> +
> +#include "qemu/osdep.h"
> +#include <glib.h>
> +#include "block/aio.h"
> +#include "qapi/error.h"
> +#include "qemu/coroutine.h"
> +#include "qemu/thread.h"
> +#include "qemu/error-report.h"
> +#include "iothread.h"
> +
> +/* AioContext management */
> +
> +#define NUM_CONTEXTS 5
> +
> +static IOThread *threads[NUM_CONTEXTS];
> +static AioContext *ctx[NUM_CONTEXTS];
> +static __thread int id = -1;
> +
> +static QemuEvent done_event;
> +
> +/* Run a function synchronously on a remote iothread. */
> +
> +typedef struct CtxRunData {
> +    QEMUBHFunc *cb;
> +    void *arg;
> +} CtxRunData;
> +
> +static void ctx_run_bh_cb(void *opaque)
> +{
> +    CtxRunData *data = opaque;
> +
> +    data->cb(data->arg);
> +    qemu_event_set(&done_event);
> +}
> +
> +static void ctx_run(int i, QEMUBHFunc *cb, void *opaque)
> +{
> +    CtxRunData data = {
> +        .cb = cb,
> +        .arg = opaque
> +    };
> +
> +    qemu_event_reset(&done_event);
> +    aio_bh_schedule_oneshot(ctx[i], ctx_run_bh_cb, &data);
> +    qemu_event_wait(&done_event);
> +}
> +
> +/* Starting the iothreads. */
> +
> +static void set_id_cb(void *opaque)
> +{
> +    int *i = opaque;
> +
> +    id = *i;
> +}
> +
> +static void create_aio_contexts(void)
> +{
> +    int i;
> +
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        threads[i] = iothread_new();
> +        ctx[i] = iothread_get_aio_context(threads[i]);
> +    }
> +
> +    qemu_event_init(&done_event, false);
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        ctx_run(i, set_id_cb, &i);
> +    }
> +}
> +
> +/* Stopping the iothreads. */
> +
> +static void join_aio_contexts(void)
> +{
> +    int i;
> +
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        aio_context_ref(ctx[i]);
> +    }
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        iothread_join(threads[i]);
> +    }
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        aio_context_unref(ctx[i]);
> +    }
> +    qemu_event_destroy(&done_event);
> +}
> +
> +/* Basic test for the stuff above. */
> +
> +static void test_lifecycle(void)
> +{
> +    create_aio_contexts();
> +    join_aio_contexts();
> +}
> +
> +/* aio_co_schedule test.  */
> +
> +static Coroutine *to_schedule[NUM_CONTEXTS];
> +
> +static bool now_stopping;
> +
> +static int count_retry;
> +static int count_here;
> +static int count_other;
> +
> +static bool schedule_next(int n)
> +{
> +    Coroutine *co;
> +
> +    co = atomic_xchg(&to_schedule[n], NULL);
> +    if (!co) {
> +        atomic_inc(&count_retry);
> +        return false;
> +    }
> +
> +    if (n == id) {
> +        atomic_inc(&count_here);
> +    } else {
> +        atomic_inc(&count_other);
> +    }
> +
> +    aio_co_schedule(ctx[n], co);
> +    return true;
> +}
> +
> +static void finish_cb(void *opaque)
> +{
> +    schedule_next(id);
> +}
> +
> +static void test_multi_co_schedule_entry(void *opaque)
> +{
> +    g_assert(to_schedule[id] == NULL);
> +    atomic_mb_set(&to_schedule[id], qemu_coroutine_self());
> +
> +    while (!atomic_mb_read(&now_stopping)) {
> +        int n;
> +
> +        n = g_test_rand_int_range(0, NUM_CONTEXTS);
> +        schedule_next(n);
> +        qemu_coroutine_yield();
> +
> +        g_assert(to_schedule[id] == NULL);
> +        atomic_mb_set(&to_schedule[id], qemu_coroutine_self());
> +    }
> +}
> +
> +
> +static void test_multi_co_schedule(int seconds)
> +{
> +    int i;
> +
> +    count_here = count_other = count_retry = 0;
> +    now_stopping = false;
> +
> +    create_aio_contexts();
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        Coroutine *co1 = qemu_coroutine_create(test_multi_co_schedule_entry, NULL);
> +        aio_co_schedule(ctx[i], co1);
> +    }
> +
> +    g_usleep(seconds * 1000000);
> +
> +    atomic_mb_set(&now_stopping, true);
> +    for (i = 0; i < NUM_CONTEXTS; i++) {
> +        ctx_run(i, finish_cb, NULL);
> +        to_schedule[i] = NULL;
> +    }
> +
> +    join_aio_contexts();
> +    g_test_message("scheduled %d, queued %d, retry %d, total %d\n",
> +                  count_other, count_here, count_retry,
> +                  count_here + count_other + count_retry);
> +}
> +
> +static void test_multi_co_schedule_1(void)
> +{
> +    test_multi_co_schedule(1);
> +}
> +
> +static void test_multi_co_schedule_10(void)
> +{
> +    test_multi_co_schedule(10);
> +}
> +
> +/* End of tests.  */
> +
> +int main(int argc, char **argv)
> +{
> +    init_clocks();
> +
> +    g_test_init(&argc, &argv, NULL);
> +    g_test_add_func("/aio/multi/lifecycle", test_lifecycle);
> +    if (g_test_quick()) {
> +        g_test_add_func("/aio/multi/schedule", test_multi_co_schedule_1);
> +    } else {
> +        g_test_add_func("/aio/multi/schedule", test_multi_co_schedule_10);
> +    }
> +    return g_test_run();
> +}

Fam
