2 * QEMU block layer thread pool
4 * Copyright IBM, Corp. 2008
5 * Copyright Red Hat, Inc. 2012
8 * Anthony Liguori <aliguori@us.ibm.com>
9 * Paolo Bonzini <pbonzini@redhat.com>
11 * This work is licensed under the terms of the GNU GPL, version 2. See
12 * the COPYING file in the top-level directory.
14 * Contributions after 2012-01-13 are licensed under the terms of the
15 * GNU GPL, version 2 or (at your option) any later version.
17 #include "qemu-common.h"
18 #include "qemu-queue.h"
19 #include "qemu-thread.h"
21 #include "qemu-coroutine.h"
23 #include "block_int.h"
24 #include "event_notifier.h"
25 #include "thread-pool.h"
27 static void do_spawn_thread(void);
29 typedef struct ThreadPoolElement ThreadPoolElement
;
38 struct ThreadPoolElement
{
39 BlockDriverAIOCB common
;
43 /* Moving state out of THREAD_QUEUED is protected by lock. After
44 * that, only the worker thread can write to it. Reads and writes
45 * of state and ret are ordered with memory barriers.
47 enum ThreadState state
;
50 /* Access to this list is protected by lock. */
51 QTAILQ_ENTRY(ThreadPoolElement
) reqs
;
53 /* Access to this list is protected by the global mutex. */
54 QLIST_ENTRY(ThreadPoolElement
) all
;
57 static EventNotifier notifier
;
58 static QemuMutex lock
;
59 static QemuCond check_cancel
;
60 static QemuSemaphore sem
;
61 static int max_threads
= 64;
62 static QEMUBH
*new_thread_bh
;
64 /* The following variables are protected by the global mutex. */
65 static QLIST_HEAD(, ThreadPoolElement
) head
;
67 /* The following variables are protected by lock. */
68 static QTAILQ_HEAD(, ThreadPoolElement
) request_list
;
69 static int cur_threads
;
70 static int idle_threads
;
71 static int new_threads
; /* backlog of threads we need to create */
72 static int pending_threads
; /* threads created but not running yet */
73 static int pending_cancellations
; /* whether we need a cond_broadcast */
75 static void *worker_thread(void *unused
)
77 qemu_mutex_lock(&lock
);
82 ThreadPoolElement
*req
;
87 qemu_mutex_unlock(&lock
);
88 ret
= qemu_sem_timedwait(&sem
, 10000);
89 qemu_mutex_lock(&lock
);
91 } while (ret
== -1 && !QTAILQ_EMPTY(&request_list
));
96 req
= QTAILQ_FIRST(&request_list
);
97 QTAILQ_REMOVE(&request_list
, req
, reqs
);
98 req
->state
= THREAD_ACTIVE
;
99 qemu_mutex_unlock(&lock
);
101 ret
= req
->func(req
->arg
);
104 /* Write ret before state. */
106 req
->state
= THREAD_DONE
;
108 qemu_mutex_lock(&lock
);
109 if (pending_cancellations
) {
110 qemu_cond_broadcast(&check_cancel
);
113 event_notifier_set(¬ifier
);
117 qemu_mutex_unlock(&lock
);
121 static void do_spawn_thread(void)
125 /* Runs with lock taken. */
133 qemu_thread_create(&t
, worker_thread
, NULL
, QEMU_THREAD_DETACHED
);
136 static void spawn_thread_bh_fn(void *opaque
)
138 qemu_mutex_lock(&lock
);
140 qemu_mutex_unlock(&lock
);
143 static void spawn_thread(void)
147 /* If there are threads being created, they will spawn new workers, so
148 * we don't spend time creating many threads in a loop holding a mutex or
149 * starving the current vcpu.
151 * If there are no idle threads, ask the main thread to create one, so we
152 * inherit the correct affinity instead of the vcpu affinity.
154 if (!pending_threads
) {
155 qemu_bh_schedule(new_thread_bh
);
159 static void event_notifier_ready(EventNotifier
*notifier
)
161 ThreadPoolElement
*elem
, *next
;
163 event_notifier_test_and_clear(notifier
);
165 QLIST_FOREACH_SAFE(elem
, &head
, all
, next
) {
166 if (elem
->state
!= THREAD_CANCELED
&& elem
->state
!= THREAD_DONE
) {
169 if (elem
->state
== THREAD_DONE
) {
170 trace_thread_pool_complete(elem
, elem
->common
.opaque
, elem
->ret
);
172 if (elem
->state
== THREAD_DONE
&& elem
->common
.cb
) {
173 QLIST_REMOVE(elem
, all
);
174 /* Read state before ret. */
176 elem
->common
.cb(elem
->common
.opaque
, elem
->ret
);
177 qemu_aio_release(elem
);
180 /* remove the request */
181 QLIST_REMOVE(elem
, all
);
182 qemu_aio_release(elem
);
187 static int thread_pool_active(EventNotifier
*notifier
)
189 return !QLIST_EMPTY(&head
);
192 static void thread_pool_cancel(BlockDriverAIOCB
*acb
)
194 ThreadPoolElement
*elem
= (ThreadPoolElement
*)acb
;
196 trace_thread_pool_cancel(elem
, elem
->common
.opaque
);
198 qemu_mutex_lock(&lock
);
199 if (elem
->state
== THREAD_QUEUED
&&
200 /* No thread has yet started working on elem. we can try to "steal"
201 * the item from the worker if we can get a signal from the
202 * semaphore. Because this is non-blocking, we can do it with
203 * the lock taken and ensure that elem will remain THREAD_QUEUED.
205 qemu_sem_timedwait(&sem
, 0) == 0) {
206 QTAILQ_REMOVE(&request_list
, elem
, reqs
);
207 elem
->state
= THREAD_CANCELED
;
208 event_notifier_set(¬ifier
);
210 pending_cancellations
++;
211 while (elem
->state
!= THREAD_CANCELED
&& elem
->state
!= THREAD_DONE
) {
212 qemu_cond_wait(&check_cancel
, &lock
);
214 pending_cancellations
--;
216 qemu_mutex_unlock(&lock
);
219 static AIOPool thread_pool_cb_pool
= {
220 .aiocb_size
= sizeof(ThreadPoolElement
),
221 .cancel
= thread_pool_cancel
,
224 BlockDriverAIOCB
*thread_pool_submit_aio(ThreadPoolFunc
*func
, void *arg
,
225 BlockDriverCompletionFunc
*cb
, void *opaque
)
227 ThreadPoolElement
*req
;
229 req
= qemu_aio_get(&thread_pool_cb_pool
, NULL
, cb
, opaque
);
232 req
->state
= THREAD_QUEUED
;
234 QLIST_INSERT_HEAD(&head
, req
, all
);
236 trace_thread_pool_submit(req
, arg
);
238 qemu_mutex_lock(&lock
);
239 if (idle_threads
== 0 && cur_threads
< max_threads
) {
242 QTAILQ_INSERT_TAIL(&request_list
, req
, reqs
);
243 qemu_mutex_unlock(&lock
);
248 typedef struct ThreadPoolCo
{
253 static void thread_pool_co_cb(void *opaque
, int ret
)
255 ThreadPoolCo
*co
= opaque
;
258 qemu_coroutine_enter(co
->co
, NULL
);
261 int coroutine_fn
thread_pool_submit_co(ThreadPoolFunc
*func
, void *arg
)
263 ThreadPoolCo tpc
= { .co
= qemu_coroutine_self(), .ret
= -EINPROGRESS
};
264 assert(qemu_in_coroutine());
265 thread_pool_submit_aio(func
, arg
, thread_pool_co_cb
, &tpc
);
266 qemu_coroutine_yield();
270 void thread_pool_submit(ThreadPoolFunc
*func
, void *arg
)
272 thread_pool_submit_aio(func
, arg
, NULL
, NULL
);
275 static void thread_pool_init(void)
278 event_notifier_init(¬ifier
, false);
279 qemu_mutex_init(&lock
);
280 qemu_cond_init(&check_cancel
);
281 qemu_sem_init(&sem
, 0);
282 qemu_aio_set_event_notifier(¬ifier
, event_notifier_ready
,
285 QTAILQ_INIT(&request_list
);
286 new_thread_bh
= qemu_bh_new(spawn_thread_bh_fn
, NULL
);
289 block_init(thread_pool_init
)