Statistics
| Branch: | Revision:

root / thread-pool.c @ 737e150e

History | View | Annotate | Download (7.6 kB)

1 d354c7ec Paolo Bonzini
/*
2 d354c7ec Paolo Bonzini
 * QEMU block layer thread pool
3 d354c7ec Paolo Bonzini
 *
4 d354c7ec Paolo Bonzini
 * Copyright IBM, Corp. 2008
5 d354c7ec Paolo Bonzini
 * Copyright Red Hat, Inc. 2012
6 d354c7ec Paolo Bonzini
 *
7 d354c7ec Paolo Bonzini
 * Authors:
8 d354c7ec Paolo Bonzini
 *  Anthony Liguori   <aliguori@us.ibm.com>
9 d354c7ec Paolo Bonzini
 *  Paolo Bonzini     <pbonzini@redhat.com>
10 d354c7ec Paolo Bonzini
 *
11 d354c7ec Paolo Bonzini
 * This work is licensed under the terms of the GNU GPL, version 2.  See
12 d354c7ec Paolo Bonzini
 * the COPYING file in the top-level directory.
13 d354c7ec Paolo Bonzini
 *
14 d354c7ec Paolo Bonzini
 * Contributions after 2012-01-13 are licensed under the terms of the
15 d354c7ec Paolo Bonzini
 * GNU GPL, version 2 or (at your option) any later version.
16 d354c7ec Paolo Bonzini
 */
17 d354c7ec Paolo Bonzini
#include "qemu-common.h"
18 d354c7ec Paolo Bonzini
#include "qemu-queue.h"
19 d354c7ec Paolo Bonzini
#include "qemu-thread.h"
20 d354c7ec Paolo Bonzini
#include "osdep.h"
21 737e150e Paolo Bonzini
#include "block/coroutine.h"
22 d354c7ec Paolo Bonzini
#include "trace.h"
23 737e150e Paolo Bonzini
#include "block/block_int.h"
24 d354c7ec Paolo Bonzini
#include "event_notifier.h"
25 737e150e Paolo Bonzini
#include "block/thread-pool.h"
26 d354c7ec Paolo Bonzini
27 d354c7ec Paolo Bonzini
static void do_spawn_thread(void);
28 d354c7ec Paolo Bonzini
29 d354c7ec Paolo Bonzini
typedef struct ThreadPoolElement ThreadPoolElement;
30 d354c7ec Paolo Bonzini
31 d354c7ec Paolo Bonzini
enum ThreadState {
32 d354c7ec Paolo Bonzini
    THREAD_QUEUED,
33 d354c7ec Paolo Bonzini
    THREAD_ACTIVE,
34 d354c7ec Paolo Bonzini
    THREAD_DONE,
35 d354c7ec Paolo Bonzini
    THREAD_CANCELED,
36 d354c7ec Paolo Bonzini
};
37 d354c7ec Paolo Bonzini
38 d354c7ec Paolo Bonzini
struct ThreadPoolElement {
39 d354c7ec Paolo Bonzini
    BlockDriverAIOCB common;
40 d354c7ec Paolo Bonzini
    ThreadPoolFunc *func;
41 d354c7ec Paolo Bonzini
    void *arg;
42 19d092cf Paolo Bonzini
43 19d092cf Paolo Bonzini
    /* Moving state out of THREAD_QUEUED is protected by lock.  After
44 19d092cf Paolo Bonzini
     * that, only the worker thread can write to it.  Reads and writes
45 19d092cf Paolo Bonzini
     * of state and ret are ordered with memory barriers.
46 19d092cf Paolo Bonzini
     */
47 d354c7ec Paolo Bonzini
    enum ThreadState state;
48 d354c7ec Paolo Bonzini
    int ret;
49 d354c7ec Paolo Bonzini
50 d354c7ec Paolo Bonzini
    /* Access to this list is protected by lock.  */
51 d354c7ec Paolo Bonzini
    QTAILQ_ENTRY(ThreadPoolElement) reqs;
52 d354c7ec Paolo Bonzini
53 d354c7ec Paolo Bonzini
    /* Access to this list is protected by the global mutex.  */
54 d354c7ec Paolo Bonzini
    QLIST_ENTRY(ThreadPoolElement) all;
55 d354c7ec Paolo Bonzini
};
56 d354c7ec Paolo Bonzini
57 d354c7ec Paolo Bonzini
static EventNotifier notifier;
58 d354c7ec Paolo Bonzini
static QemuMutex lock;
59 d354c7ec Paolo Bonzini
static QemuCond check_cancel;
60 d354c7ec Paolo Bonzini
static QemuSemaphore sem;
61 d354c7ec Paolo Bonzini
static int max_threads = 64;
62 d354c7ec Paolo Bonzini
static QEMUBH *new_thread_bh;
63 d354c7ec Paolo Bonzini
64 d354c7ec Paolo Bonzini
/* The following variables are protected by the global mutex.  */
65 d354c7ec Paolo Bonzini
static QLIST_HEAD(, ThreadPoolElement) head;
66 d354c7ec Paolo Bonzini
67 d354c7ec Paolo Bonzini
/* The following variables are protected by lock.  */
68 d354c7ec Paolo Bonzini
static QTAILQ_HEAD(, ThreadPoolElement) request_list;
69 d354c7ec Paolo Bonzini
static int cur_threads;
70 d354c7ec Paolo Bonzini
static int idle_threads;
71 d354c7ec Paolo Bonzini
static int new_threads;     /* backlog of threads we need to create */
72 d354c7ec Paolo Bonzini
static int pending_threads; /* threads created but not running yet */
73 d354c7ec Paolo Bonzini
static int pending_cancellations; /* whether we need a cond_broadcast */
74 d354c7ec Paolo Bonzini
75 d354c7ec Paolo Bonzini
static void *worker_thread(void *unused)
76 d354c7ec Paolo Bonzini
{
77 d354c7ec Paolo Bonzini
    qemu_mutex_lock(&lock);
78 d354c7ec Paolo Bonzini
    pending_threads--;
79 d354c7ec Paolo Bonzini
    do_spawn_thread();
80 d354c7ec Paolo Bonzini
81 d354c7ec Paolo Bonzini
    while (1) {
82 d354c7ec Paolo Bonzini
        ThreadPoolElement *req;
83 d354c7ec Paolo Bonzini
        int ret;
84 d354c7ec Paolo Bonzini
85 d354c7ec Paolo Bonzini
        do {
86 d354c7ec Paolo Bonzini
            idle_threads++;
87 d354c7ec Paolo Bonzini
            qemu_mutex_unlock(&lock);
88 d354c7ec Paolo Bonzini
            ret = qemu_sem_timedwait(&sem, 10000);
89 d354c7ec Paolo Bonzini
            qemu_mutex_lock(&lock);
90 d354c7ec Paolo Bonzini
            idle_threads--;
91 d354c7ec Paolo Bonzini
        } while (ret == -1 && !QTAILQ_EMPTY(&request_list));
92 d354c7ec Paolo Bonzini
        if (ret == -1) {
93 d354c7ec Paolo Bonzini
            break;
94 d354c7ec Paolo Bonzini
        }
95 d354c7ec Paolo Bonzini
96 d354c7ec Paolo Bonzini
        req = QTAILQ_FIRST(&request_list);
97 d354c7ec Paolo Bonzini
        QTAILQ_REMOVE(&request_list, req, reqs);
98 d354c7ec Paolo Bonzini
        req->state = THREAD_ACTIVE;
99 d354c7ec Paolo Bonzini
        qemu_mutex_unlock(&lock);
100 d354c7ec Paolo Bonzini
101 d354c7ec Paolo Bonzini
        ret = req->func(req->arg);
102 d354c7ec Paolo Bonzini
103 d354c7ec Paolo Bonzini
        req->ret = ret;
104 19d092cf Paolo Bonzini
        /* Write ret before state.  */
105 19d092cf Paolo Bonzini
        smp_wmb();
106 19d092cf Paolo Bonzini
        req->state = THREAD_DONE;
107 19d092cf Paolo Bonzini
108 19d092cf Paolo Bonzini
        qemu_mutex_lock(&lock);
109 d354c7ec Paolo Bonzini
        if (pending_cancellations) {
110 d354c7ec Paolo Bonzini
            qemu_cond_broadcast(&check_cancel);
111 d354c7ec Paolo Bonzini
        }
112 d354c7ec Paolo Bonzini
113 d354c7ec Paolo Bonzini
        event_notifier_set(&notifier);
114 d354c7ec Paolo Bonzini
    }
115 d354c7ec Paolo Bonzini
116 d354c7ec Paolo Bonzini
    cur_threads--;
117 d354c7ec Paolo Bonzini
    qemu_mutex_unlock(&lock);
118 d354c7ec Paolo Bonzini
    return NULL;
119 d354c7ec Paolo Bonzini
}
120 d354c7ec Paolo Bonzini
121 d354c7ec Paolo Bonzini
static void do_spawn_thread(void)
122 d354c7ec Paolo Bonzini
{
123 d354c7ec Paolo Bonzini
    QemuThread t;
124 d354c7ec Paolo Bonzini
125 d354c7ec Paolo Bonzini
    /* Runs with lock taken.  */
126 d354c7ec Paolo Bonzini
    if (!new_threads) {
127 d354c7ec Paolo Bonzini
        return;
128 d354c7ec Paolo Bonzini
    }
129 d354c7ec Paolo Bonzini
130 d354c7ec Paolo Bonzini
    new_threads--;
131 d354c7ec Paolo Bonzini
    pending_threads++;
132 d354c7ec Paolo Bonzini
133 d354c7ec Paolo Bonzini
    qemu_thread_create(&t, worker_thread, NULL, QEMU_THREAD_DETACHED);
134 d354c7ec Paolo Bonzini
}
135 d354c7ec Paolo Bonzini
136 d354c7ec Paolo Bonzini
static void spawn_thread_bh_fn(void *opaque)
137 d354c7ec Paolo Bonzini
{
138 d354c7ec Paolo Bonzini
    qemu_mutex_lock(&lock);
139 d354c7ec Paolo Bonzini
    do_spawn_thread();
140 d354c7ec Paolo Bonzini
    qemu_mutex_unlock(&lock);
141 d354c7ec Paolo Bonzini
}
142 d354c7ec Paolo Bonzini
143 d354c7ec Paolo Bonzini
static void spawn_thread(void)
144 d354c7ec Paolo Bonzini
{
145 d354c7ec Paolo Bonzini
    cur_threads++;
146 d354c7ec Paolo Bonzini
    new_threads++;
147 d354c7ec Paolo Bonzini
    /* If there are threads being created, they will spawn new workers, so
148 d354c7ec Paolo Bonzini
     * we don't spend time creating many threads in a loop holding a mutex or
149 d354c7ec Paolo Bonzini
     * starving the current vcpu.
150 d354c7ec Paolo Bonzini
     *
151 d354c7ec Paolo Bonzini
     * If there are no idle threads, ask the main thread to create one, so we
152 d354c7ec Paolo Bonzini
     * inherit the correct affinity instead of the vcpu affinity.
153 d354c7ec Paolo Bonzini
     */
154 d354c7ec Paolo Bonzini
    if (!pending_threads) {
155 d354c7ec Paolo Bonzini
        qemu_bh_schedule(new_thread_bh);
156 d354c7ec Paolo Bonzini
    }
157 d354c7ec Paolo Bonzini
}
158 d354c7ec Paolo Bonzini
159 d354c7ec Paolo Bonzini
static void event_notifier_ready(EventNotifier *notifier)
160 d354c7ec Paolo Bonzini
{
161 d354c7ec Paolo Bonzini
    ThreadPoolElement *elem, *next;
162 d354c7ec Paolo Bonzini
163 d354c7ec Paolo Bonzini
    event_notifier_test_and_clear(notifier);
164 d354c7ec Paolo Bonzini
restart:
165 d354c7ec Paolo Bonzini
    QLIST_FOREACH_SAFE(elem, &head, all, next) {
166 d354c7ec Paolo Bonzini
        if (elem->state != THREAD_CANCELED && elem->state != THREAD_DONE) {
167 d354c7ec Paolo Bonzini
            continue;
168 d354c7ec Paolo Bonzini
        }
169 d354c7ec Paolo Bonzini
        if (elem->state == THREAD_DONE) {
170 d354c7ec Paolo Bonzini
            trace_thread_pool_complete(elem, elem->common.opaque, elem->ret);
171 d354c7ec Paolo Bonzini
        }
172 d354c7ec Paolo Bonzini
        if (elem->state == THREAD_DONE && elem->common.cb) {
173 d354c7ec Paolo Bonzini
            QLIST_REMOVE(elem, all);
174 19d092cf Paolo Bonzini
            /* Read state before ret.  */
175 19d092cf Paolo Bonzini
            smp_rmb();
176 19d092cf Paolo Bonzini
            elem->common.cb(elem->common.opaque, elem->ret);
177 d354c7ec Paolo Bonzini
            qemu_aio_release(elem);
178 d354c7ec Paolo Bonzini
            goto restart;
179 d354c7ec Paolo Bonzini
        } else {
180 d354c7ec Paolo Bonzini
            /* remove the request */
181 d354c7ec Paolo Bonzini
            QLIST_REMOVE(elem, all);
182 d354c7ec Paolo Bonzini
            qemu_aio_release(elem);
183 d354c7ec Paolo Bonzini
        }
184 d354c7ec Paolo Bonzini
    }
185 d354c7ec Paolo Bonzini
}
186 d354c7ec Paolo Bonzini
187 d354c7ec Paolo Bonzini
static int thread_pool_active(EventNotifier *notifier)
188 d354c7ec Paolo Bonzini
{
189 d354c7ec Paolo Bonzini
    return !QLIST_EMPTY(&head);
190 d354c7ec Paolo Bonzini
}
191 d354c7ec Paolo Bonzini
192 d354c7ec Paolo Bonzini
static void thread_pool_cancel(BlockDriverAIOCB *acb)
193 d354c7ec Paolo Bonzini
{
194 d354c7ec Paolo Bonzini
    ThreadPoolElement *elem = (ThreadPoolElement *)acb;
195 d354c7ec Paolo Bonzini
196 d354c7ec Paolo Bonzini
    trace_thread_pool_cancel(elem, elem->common.opaque);
197 d354c7ec Paolo Bonzini
198 d354c7ec Paolo Bonzini
    qemu_mutex_lock(&lock);
199 d354c7ec Paolo Bonzini
    if (elem->state == THREAD_QUEUED &&
200 d354c7ec Paolo Bonzini
        /* No thread has yet started working on elem. we can try to "steal"
201 d354c7ec Paolo Bonzini
         * the item from the worker if we can get a signal from the
202 d354c7ec Paolo Bonzini
         * semaphore.  Because this is non-blocking, we can do it with
203 d354c7ec Paolo Bonzini
         * the lock taken and ensure that elem will remain THREAD_QUEUED.
204 d354c7ec Paolo Bonzini
         */
205 d354c7ec Paolo Bonzini
        qemu_sem_timedwait(&sem, 0) == 0) {
206 d354c7ec Paolo Bonzini
        QTAILQ_REMOVE(&request_list, elem, reqs);
207 d354c7ec Paolo Bonzini
        elem->state = THREAD_CANCELED;
208 d354c7ec Paolo Bonzini
        event_notifier_set(&notifier);
209 d354c7ec Paolo Bonzini
    } else {
210 d354c7ec Paolo Bonzini
        pending_cancellations++;
211 d354c7ec Paolo Bonzini
        while (elem->state != THREAD_CANCELED && elem->state != THREAD_DONE) {
212 d354c7ec Paolo Bonzini
            qemu_cond_wait(&check_cancel, &lock);
213 d354c7ec Paolo Bonzini
        }
214 d354c7ec Paolo Bonzini
        pending_cancellations--;
215 d354c7ec Paolo Bonzini
    }
216 d354c7ec Paolo Bonzini
    qemu_mutex_unlock(&lock);
217 d354c7ec Paolo Bonzini
}
218 d354c7ec Paolo Bonzini
219 d7331bed Stefan Hajnoczi
static const AIOCBInfo thread_pool_aiocb_info = {
220 d354c7ec Paolo Bonzini
    .aiocb_size         = sizeof(ThreadPoolElement),
221 d354c7ec Paolo Bonzini
    .cancel             = thread_pool_cancel,
222 d354c7ec Paolo Bonzini
};
223 d354c7ec Paolo Bonzini
224 d354c7ec Paolo Bonzini
BlockDriverAIOCB *thread_pool_submit_aio(ThreadPoolFunc *func, void *arg,
225 d354c7ec Paolo Bonzini
        BlockDriverCompletionFunc *cb, void *opaque)
226 d354c7ec Paolo Bonzini
{
227 d354c7ec Paolo Bonzini
    ThreadPoolElement *req;
228 d354c7ec Paolo Bonzini
229 d7331bed Stefan Hajnoczi
    req = qemu_aio_get(&thread_pool_aiocb_info, NULL, cb, opaque);
230 d354c7ec Paolo Bonzini
    req->func = func;
231 d354c7ec Paolo Bonzini
    req->arg = arg;
232 d354c7ec Paolo Bonzini
    req->state = THREAD_QUEUED;
233 d354c7ec Paolo Bonzini
234 d354c7ec Paolo Bonzini
    QLIST_INSERT_HEAD(&head, req, all);
235 d354c7ec Paolo Bonzini
236 d354c7ec Paolo Bonzini
    trace_thread_pool_submit(req, arg);
237 d354c7ec Paolo Bonzini
238 d354c7ec Paolo Bonzini
    qemu_mutex_lock(&lock);
239 d354c7ec Paolo Bonzini
    if (idle_threads == 0 && cur_threads < max_threads) {
240 d354c7ec Paolo Bonzini
        spawn_thread();
241 d354c7ec Paolo Bonzini
    }
242 d354c7ec Paolo Bonzini
    QTAILQ_INSERT_TAIL(&request_list, req, reqs);
243 d354c7ec Paolo Bonzini
    qemu_mutex_unlock(&lock);
244 d354c7ec Paolo Bonzini
    qemu_sem_post(&sem);
245 d354c7ec Paolo Bonzini
    return &req->common;
246 d354c7ec Paolo Bonzini
}
247 d354c7ec Paolo Bonzini
248 d354c7ec Paolo Bonzini
typedef struct ThreadPoolCo {
249 d354c7ec Paolo Bonzini
    Coroutine *co;
250 d354c7ec Paolo Bonzini
    int ret;
251 d354c7ec Paolo Bonzini
} ThreadPoolCo;
252 d354c7ec Paolo Bonzini
253 d354c7ec Paolo Bonzini
static void thread_pool_co_cb(void *opaque, int ret)
254 d354c7ec Paolo Bonzini
{
255 d354c7ec Paolo Bonzini
    ThreadPoolCo *co = opaque;
256 d354c7ec Paolo Bonzini
257 d354c7ec Paolo Bonzini
    co->ret = ret;
258 d354c7ec Paolo Bonzini
    qemu_coroutine_enter(co->co, NULL);
259 d354c7ec Paolo Bonzini
}
260 d354c7ec Paolo Bonzini
261 d354c7ec Paolo Bonzini
int coroutine_fn thread_pool_submit_co(ThreadPoolFunc *func, void *arg)
262 d354c7ec Paolo Bonzini
{
263 d354c7ec Paolo Bonzini
    ThreadPoolCo tpc = { .co = qemu_coroutine_self(), .ret = -EINPROGRESS };
264 d354c7ec Paolo Bonzini
    assert(qemu_in_coroutine());
265 d354c7ec Paolo Bonzini
    thread_pool_submit_aio(func, arg, thread_pool_co_cb, &tpc);
266 d354c7ec Paolo Bonzini
    qemu_coroutine_yield();
267 d354c7ec Paolo Bonzini
    return tpc.ret;
268 d354c7ec Paolo Bonzini
}
269 d354c7ec Paolo Bonzini
270 d354c7ec Paolo Bonzini
void thread_pool_submit(ThreadPoolFunc *func, void *arg)
271 d354c7ec Paolo Bonzini
{
272 d354c7ec Paolo Bonzini
    thread_pool_submit_aio(func, arg, NULL, NULL);
273 d354c7ec Paolo Bonzini
}
274 d354c7ec Paolo Bonzini
275 d354c7ec Paolo Bonzini
static void thread_pool_init(void)
276 d354c7ec Paolo Bonzini
{
277 d354c7ec Paolo Bonzini
    QLIST_INIT(&head);
278 d354c7ec Paolo Bonzini
    event_notifier_init(&notifier, false);
279 d354c7ec Paolo Bonzini
    qemu_mutex_init(&lock);
280 d354c7ec Paolo Bonzini
    qemu_cond_init(&check_cancel);
281 d354c7ec Paolo Bonzini
    qemu_sem_init(&sem, 0);
282 d354c7ec Paolo Bonzini
    qemu_aio_set_event_notifier(&notifier, event_notifier_ready,
283 d354c7ec Paolo Bonzini
                                thread_pool_active);
284 d354c7ec Paolo Bonzini
285 d354c7ec Paolo Bonzini
    QTAILQ_INIT(&request_list);
286 d354c7ec Paolo Bonzini
    new_thread_bh = qemu_bh_new(spawn_thread_bh_fn, NULL);
287 d354c7ec Paolo Bonzini
}
288 d354c7ec Paolo Bonzini
289 d354c7ec Paolo Bonzini
block_init(thread_pool_init)