From: Paolo Bonzini
Subject: Re: [Qemu-devel] [PATCH 01/16] aio: introduce aio_co_schedule and aio_co_wake
Date: Mon, 16 Jan 2017 13:19:44 +0100
User-agent: Mozilla/5.0 (X11; Linux x86_64; rv:45.0) Gecko/20100101 Thunderbird/45.5.1


On 16/01/2017 12:09, Fam Zheng wrote:
> On Fri, 01/13 14:17, Paolo Bonzini wrote:
>> aio_co_wake provides the infrastructure to start a coroutine on a "home"
>> AioContext.  It will be used by CoMutex and CoQueue, so that coroutines
>> don't jump from one context to another when they go to sleep on a
>> mutex or waitqueue.  However, it can also be used as a more efficient
>> alternative to one-shot bottom halves, and saves the effort of tracking
>> which AioContext a coroutine is running on.
>>
>> aio_co_schedule is the part of aio_co_wake that starts a coroutine
>> on a remove AioContext, but it is also useful to implement e.g.
> 
> s/remove/remote/ and maybe s/but/and/ ?
> 
>> bdrv_set_aio_context callbacks.
>>
>> The implementation of aio_co_schedule is based on a lock-free
>> multiple-producer, single-consumer queue.  The multiple producers use
>> cmpxchg to add to a LIFO stack.  The consumer (a per-AioContext bottom
>> half) grabs all items added so far, inverts the list to make it FIFO,
>> and goes through it one item at a time until it's empty.  The data
>> structure was inspired by OSv, which uses it in the very code we'll
>> "port" to QEMU for the thread-safe CoMutex.
>>
>> Most of the new code is really tests.
>>
>> Signed-off-by: Paolo Bonzini <address@hidden>
>> ---
>>  async.c                      |  65 +++++++++++++
>>  include/block/aio.h          |  32 +++++++
>>  include/qemu/coroutine_int.h |  10 +-
>>  tests/Makefile.include       |  13 ++-
>>  tests/iothread.c             |  91 ++++++++++++++++++
>>  tests/iothread.h             |  25 +++++
>>  tests/test-aio-multithread.c | 213 +++++++++++++++++++++++++++++++++++++++++++
>>  tests/test-vmstate.c         |  11 ---
>>  trace-events                 |   4 +
>>  util/qemu-coroutine.c        |   8 ++
>>  10 files changed, 456 insertions(+), 16 deletions(-)
>>  create mode 100644 tests/iothread.c
>>  create mode 100644 tests/iothread.h
>>  create mode 100644 tests/test-aio-multithread.c
>>
>> diff --git a/async.c b/async.c
>> index 0d218ab..1338682 100644
>> --- a/async.c
>> +++ b/async.c
>> @@ -30,6 +30,8 @@
>>  #include "qemu/main-loop.h"
>>  #include "qemu/atomic.h"
>>  #include "block/raw-aio.h"
>> +#include "trace/generated-tracers.h"
>> +#include "qemu/coroutine_int.h"
>>  
>>  /***********************************************************/
>>  /* bottom halves (can be seen as timers which expire ASAP) */
>> @@ -274,6 +276,9 @@ aio_ctx_finalize(GSource     *source)
>>      }
>>  #endif
>>  
>> +    assert(QSLIST_EMPTY(&ctx->scheduled_coroutines));
>> +    qemu_bh_delete(ctx->co_schedule_bh);
>> +
>>      qemu_lockcnt_lock(&ctx->list_lock);
>>      assert(!qemu_lockcnt_count(&ctx->list_lock));
>>      while (ctx->first_bh) {
>> @@ -363,6 +368,28 @@ static bool event_notifier_poll(void *opaque)
>>      return atomic_read(&ctx->notified);
>>  }
>>  
>> +static void co_schedule_bh_cb(void *opaque)
>> +{
>> +    AioContext *ctx = opaque;
>> +    QSLIST_HEAD(, Coroutine) straight, reversed;
>> +
>> +    QSLIST_MOVE_ATOMIC(&reversed, &ctx->scheduled_coroutines);
>> +    QSLIST_INIT(&straight);
> 
> Worth special casing 1 element case?

Sounds like premature optimization; the QSLIST_MOVE_ATOMIC is going to
be pretty expensive anyway.  Do you mean something like:

        if (QSLIST_EMPTY(&reversed)) {
            return;
        }
        Coroutine *co = QSLIST_FIRST(&reversed);
        if (!QSLIST_NEXT(co, co_scheduled_next)) {
            straight = reversed;
        } else {
            do {
                ...
            } while (!QSLIST_EMPTY(&reversed));
        }

        do {
            ...
        } while (!QSLIST_EMPTY(&straight));

?  Looks a bit busy.  However, removing the QSLIST_EMPTY case and then
using do/while may be a nice middle ground.
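
A minimal sketch of that middle ground, assuming the bottom half only
runs when at least one coroutine has been scheduled (so both lists are
non-empty when the loops start):

    static void co_schedule_bh_cb(void *opaque)
    {
        AioContext *ctx = opaque;
        QSLIST_HEAD(, Coroutine) straight, reversed;

        QSLIST_MOVE_ATOMIC(&reversed, &ctx->scheduled_coroutines);
        QSLIST_INIT(&straight);

        /* Reverse the LIFO snapshot into FIFO order. */
        do {
            Coroutine *co = QSLIST_FIRST(&reversed);
            QSLIST_REMOVE_HEAD(&reversed, co_scheduled_next);
            QSLIST_INSERT_HEAD(&straight, co, co_scheduled_next);
        } while (!QSLIST_EMPTY(&reversed));

        /* Enter the coroutines in the order they were scheduled. */
        do {
            Coroutine *co = QSLIST_FIRST(&straight);
            QSLIST_REMOVE_HEAD(&straight, co_scheduled_next);
            trace_aio_co_schedule_bh_cb(ctx, co);
            qemu_coroutine_enter(co);
        } while (!QSLIST_EMPTY(&straight));
    }

That drops the early-return branch while keeping both loops compact.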

Paolo

>> +
>> +    while (!QSLIST_EMPTY(&reversed)) {
>> +        Coroutine *co = QSLIST_FIRST(&reversed);
>> +        QSLIST_REMOVE_HEAD(&reversed, co_scheduled_next);
>> +        QSLIST_INSERT_HEAD(&straight, co, co_scheduled_next);
>> +    }
>> +
>> +    while (!QSLIST_EMPTY(&straight)) {
>> +        Coroutine *co = QSLIST_FIRST(&straight);
>> +        QSLIST_REMOVE_HEAD(&straight, co_scheduled_next);
>> +        trace_aio_co_schedule_bh_cb(ctx, co);
>> +        qemu_coroutine_enter(co);
>> +    }
>> +}
>> +
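
(For context, aio_co_schedule itself is not quoted in this hunk.  A rough
sketch of the producer side the commit message describes, a cmpxchg-based
push onto the LIFO followed by kicking the consumer bottom half, would
look something like:

    void aio_co_schedule(AioContext *ctx, Coroutine *co)
    {
        /* Lock-free push; multiple producers may race here. */
        QSLIST_INSERT_HEAD_ATOMIC(&ctx->scheduled_coroutines,
                                  co, co_scheduled_next);
        /* Wake the consumer: the per-AioContext co_schedule_bh above. */
        qemu_bh_schedule(ctx->co_schedule_bh);
    }

The field and bottom-half names are taken from the hunks above.)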
>> diff --git a/tests/iothread.c b/tests/iothread.c
>> new file mode 100644
>> index 0000000..777d9ee
>> --- /dev/null
>> +++ b/tests/iothread.c
>> @@ -0,0 +1,91 @@
>> +/*
>> + * Event loop thread implementation for unit tests
> 
> Curious: what is preventing from (perhaps enhancing and then) using the top
> iothread.c implementation?

Mostly the dependency of iothread.c on QOM.  iothread_new is much
simpler than creating a new object, adding it to the QOM tree, calling
user_creatable_complete, etc.  A wrapper wouldn't be much smaller than
this file.

Paolo

>> + *
>> + * Copyright Red Hat Inc., 2013, 2016
>> + *
>> + * Authors:
>> + *  Stefan Hajnoczi   <address@hidden>
>> + *  Paolo Bonzini     <address@hidden>
>> + *
>> + * This work is licensed under the terms of the GNU GPL, version 2 or later.
>> + * See the COPYING file in the top-level directory.
>> + *
>> + */
>> +
>> +#include "qemu/osdep.h"
>> +#include "qapi/error.h"
>> +#include "block/aio.h"
>> +#include "qemu/main-loop.h"
>> +#include "qemu/rcu.h"
>> +#include "iothread.h"
>> +
>> +struct IOThread {
>> +    AioContext *ctx;
>> +
>> +    QemuThread thread;
>> +    QemuMutex init_done_lock;
>> +    QemuCond init_done_cond;    /* is thread initialization done? */
>> +    bool stopping;
>> +};
>> +
>> +static __thread IOThread *my_iothread;
>> +
>> +AioContext *qemu_get_current_aio_context(void)
>> +{
>> +    return my_iothread ? my_iothread->ctx : qemu_get_aio_context();
>> +}
>> +
>> +static void *iothread_run(void *opaque)
>> +{
>> +    IOThread *iothread = opaque;
>> +
>> +    rcu_register_thread();
>> +
>> +    my_iothread = iothread;
>> +    qemu_mutex_lock(&iothread->init_done_lock);
>> +    iothread->ctx = aio_context_new(&error_abort);
>> +    qemu_cond_signal(&iothread->init_done_cond);
>> +    qemu_mutex_unlock(&iothread->init_done_lock);
>> +
>> +    while (!atomic_read(&iothread->stopping)) {
>> +        aio_poll(iothread->ctx, true);
>> +    }
>> +
>> +    rcu_unregister_thread();
>> +    return NULL;
>> +}
>> +
>> +void iothread_join(IOThread *iothread)
>> +{
>> +    iothread->stopping = true;
>> +    aio_notify(iothread->ctx);
>> +    qemu_thread_join(&iothread->thread);
>> +    qemu_cond_destroy(&iothread->init_done_cond);
>> +    qemu_mutex_destroy(&iothread->init_done_lock);
>> +    aio_context_unref(iothread->ctx);
>> +    g_free(iothread);
>> +}
>> +
>> +IOThread *iothread_new(void)
>> +{
>> +    IOThread *iothread = g_new0(IOThread, 1);
>> +
>> +    qemu_mutex_init(&iothread->init_done_lock);
>> +    qemu_cond_init(&iothread->init_done_cond);
>> +    qemu_thread_create(&iothread->thread, NULL, iothread_run,
>> +                       iothread, QEMU_THREAD_JOINABLE);
>> +
>> +    /* Wait for initialization to complete */
>> +    qemu_mutex_lock(&iothread->init_done_lock);
>> +    while (iothread->ctx == NULL) {
>> +        qemu_cond_wait(&iothread->init_done_cond,
>> +                       &iothread->init_done_lock);
>> +    }
>> +    qemu_mutex_unlock(&iothread->init_done_lock);
>> +    return iothread;
>> +}
>> +
>> +AioContext *iothread_get_aio_context(IOThread *iothread)
>> +{
>> +    return iothread->ctx;
>> +}
>> diff --git a/tests/test-aio-multithread.c b/tests/test-aio-multithread.c
>> new file mode 100644
>> index 0000000..17e81f9
>> --- /dev/null
>> +++ b/tests/test-aio-multithread.c
>> @@ -0,0 +1,213 @@
>> +/*
>> + * AioContext multithreading tests
>> + *
>> + * Copyright Red Hat, Inc. 2016
>> + *
>> + * Authors:
>> + *  Paolo Bonzini    <address@hidden>
>> + *
>> + * This work is licensed under the terms of the GNU LGPL, version 2 or later.
>> + * See the COPYING.LIB file in the top-level directory.
>> + */
>> +
>> +#include "qemu/osdep.h"
>> +#include <glib.h>
>> +#include "block/aio.h"
>> +#include "qapi/error.h"
>> +#include "qemu/coroutine.h"
>> +#include "qemu/thread.h"
>> +#include "qemu/error-report.h"
>> +#include "iothread.h"
>> +
>> +/* AioContext management */
>> +
>> +#define NUM_CONTEXTS 5
>> +
>> +static IOThread *threads[NUM_CONTEXTS];
>> +static AioContext *ctx[NUM_CONTEXTS];
>> +static __thread int id = -1;
>> +
>> +static QemuEvent done_event;
>> +
>> +/* Run a function synchronously on a remote iothread. */
>> +
>> +typedef struct CtxRunData {
>> +    QEMUBHFunc *cb;
>> +    void *arg;
>> +} CtxRunData;
>> +
>> +static void ctx_run_bh_cb(void *opaque)
>> +{
>> +    CtxRunData *data = opaque;
>> +
>> +    data->cb(data->arg);
>> +    qemu_event_set(&done_event);
>> +}
>> +
>> +static void ctx_run(int i, QEMUBHFunc *cb, void *opaque)
>> +{
>> +    CtxRunData data = {
>> +        .cb = cb,
>> +        .arg = opaque
>> +    };
>> +
>> +    qemu_event_reset(&done_event);
>> +    aio_bh_schedule_oneshot(ctx[i], ctx_run_bh_cb, &data);
>> +    qemu_event_wait(&done_event);
>> +}
>> +
>> +/* Starting the iothreads. */
>> +
>> +static void set_id_cb(void *opaque)
>> +{
>> +    int *i = opaque;
>> +
>> +    id = *i;
>> +}
>> +
>> +static void create_aio_contexts(void)
>> +{
>> +    int i;
>> +
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        threads[i] = iothread_new();
>> +        ctx[i] = iothread_get_aio_context(threads[i]);
>> +    }
>> +
>> +    qemu_event_init(&done_event, false);
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        ctx_run(i, set_id_cb, &i);
>> +    }
>> +}
>> +
>> +/* Stopping the iothreads. */
>> +
>> +static void join_aio_contexts(void)
>> +{
>> +    int i;
>> +
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        aio_context_ref(ctx[i]);
>> +    }
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        iothread_join(threads[i]);
>> +    }
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        aio_context_unref(ctx[i]);
>> +    }
>> +    qemu_event_destroy(&done_event);
>> +}
>> +
>> +/* Basic test for the stuff above. */
>> +
>> +static void test_lifecycle(void)
>> +{
>> +    create_aio_contexts();
>> +    join_aio_contexts();
>> +}
>> +
>> +/* aio_co_schedule test.  */
>> +
>> +static Coroutine *to_schedule[NUM_CONTEXTS];
>> +
>> +static bool now_stopping;
>> +
>> +static int count_retry;
>> +static int count_here;
>> +static int count_other;
>> +
>> +static bool schedule_next(int n)
>> +{
>> +    Coroutine *co;
>> +
>> +    co = atomic_xchg(&to_schedule[n], NULL);
>> +    if (!co) {
>> +        atomic_inc(&count_retry);
>> +        return false;
>> +    }
>> +
>> +    if (n == id) {
>> +        atomic_inc(&count_here);
>> +    } else {
>> +        atomic_inc(&count_other);
>> +    }
>> +
>> +    aio_co_schedule(ctx[n], co);
>> +    return true;
>> +}
>> +
>> +static void finish_cb(void *opaque)
>> +{
>> +    schedule_next(id);
>> +}
>> +
>> +static void test_multi_co_schedule_entry(void *opaque)
>> +{
>> +    g_assert(to_schedule[id] == NULL);
>> +    atomic_mb_set(&to_schedule[id], qemu_coroutine_self());
>> +
>> +    while (!atomic_mb_read(&now_stopping)) {
>> +        int n;
>> +
>> +        n = g_test_rand_int_range(0, NUM_CONTEXTS);
>> +        schedule_next(n);
>> +        qemu_coroutine_yield();
>> +
>> +        g_assert(to_schedule[id] == NULL);
>> +        atomic_mb_set(&to_schedule[id], qemu_coroutine_self());
>> +    }
>> +}
>> +
>> +
>> +static void test_multi_co_schedule(int seconds)
>> +{
>> +    int i;
>> +
>> +    count_here = count_other = count_retry = 0;
>> +    now_stopping = false;
>> +
>> +    create_aio_contexts();
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        Coroutine *co1 = qemu_coroutine_create(test_multi_co_schedule_entry, NULL);
>> +        aio_co_schedule(ctx[i], co1);
>> +    }
>> +
>> +    g_usleep(seconds * 1000000);
>> +
>> +    atomic_mb_set(&now_stopping, true);
>> +    for (i = 0; i < NUM_CONTEXTS; i++) {
>> +        ctx_run(i, finish_cb, NULL);
>> +        to_schedule[i] = NULL;
>> +    }
>> +
>> +    join_aio_contexts();
>> +    g_test_message("scheduled %d, queued %d, retry %d, total %d\n",
>> +                  count_other, count_here, count_retry,
>> +                  count_here + count_other + count_retry);
>> +}
>> +
>> +static void test_multi_co_schedule_1(void)
>> +{
>> +    test_multi_co_schedule(1);
>> +}
>> +
>> +static void test_multi_co_schedule_10(void)
>> +{
>> +    test_multi_co_schedule(10);
>> +}
>> +
>> +/* End of tests.  */
>> +
>> +int main(int argc, char **argv)
>> +{
>> +    init_clocks();
>> +
>> +    g_test_init(&argc, &argv, NULL);
>> +    g_test_add_func("/aio/multi/lifecycle", test_lifecycle);
>> +    if (g_test_quick()) {
>> +        g_test_add_func("/aio/multi/schedule", test_multi_co_schedule_1);
>> +    } else {
>> +        g_test_add_func("/aio/multi/schedule", test_multi_co_schedule_10);
>> +    }
>> +    return g_test_run();
>> +}
> 
> Fam
> 
> 


