]> git.proxmox.com Git - mirror_qemu.git/blame - iothread.c
Merge remote-tracking branch 'remotes/bonzini/tags/for-upstream' into staging
[mirror_qemu.git] / iothread.c
CommitLineData
be8d8537
SH
/*
 * Event loop thread
 *
 * Copyright Red Hat Inc., 2013
 *
 * Authors:
 *  Stefan Hajnoczi   <stefanha@redhat.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2 or later.
 * See the COPYING file in the top-level directory.
 *
 */
13
d38ea87a 14#include "qemu/osdep.h"
be8d8537
SH
15#include "qom/object.h"
16#include "qom/object_interfaces.h"
17#include "qemu/module.h"
be8d8537 18#include "block/aio.h"
d16341fa 19#include "block/block.h"
be8d8537 20#include "sysemu/iothread.h"
e688df6b 21#include "qapi/error.h"
112ed241 22#include "qapi/qapi-commands-misc.h"
2f78e491 23#include "qemu/error-report.h"
ab28bd23 24#include "qemu/rcu.h"
e4370165 25#include "qemu/main-loop.h"
be8d8537 26
be8d8537 27typedef ObjectClass IOThreadClass;
be8d8537
SH
28
29#define IOTHREAD_GET_CLASS(obj) \
30 OBJECT_GET_CLASS(IOThreadClass, obj, TYPE_IOTHREAD)
31#define IOTHREAD_CLASS(klass) \
32 OBJECT_CLASS_CHECK(IOThreadClass, klass, TYPE_IOTHREAD)
33
/*
 * Default maximum polling time, in nanoseconds.
 *
 * Benchmark results from 2016 on NVMe SSD drives show max polling times
 * around 16-32 microseconds yield IOPS improvements for both iodepth=1 and
 * iodepth=32 workloads, so builds with CONFIG_POSIX default to 32768 ns.
 * Builds without CONFIG_POSIX default to 0.
 */
#ifndef CONFIG_POSIX
#define IOTHREAD_POLL_MAX_NS_DEFAULT 0ULL
#else
#define IOTHREAD_POLL_MAX_NS_DEFAULT 32768ULL
#endif
cdd7abfd 43
e4370165
PB
44static __thread IOThread *my_iothread;
45
46AioContext *qemu_get_current_aio_context(void)
47{
48 return my_iothread ? my_iothread->ctx : qemu_get_aio_context();
49}
50
be8d8537
SH
51static void *iothread_run(void *opaque)
52{
53 IOThread *iothread = opaque;
54
ab28bd23 55 rcu_register_thread();
b60ec76a
PX
56 /*
57 * g_main_context_push_thread_default() must be called before anything
58 * in this new thread uses glib.
59 */
60 g_main_context_push_thread_default(iothread->worker_context);
e4370165 61 my_iothread = iothread;
88eb7c29 62 iothread->thread_id = qemu_get_thread_id();
21c4d15b 63 qemu_sem_post(&iothread->init_done_sem);
88eb7c29 64
2362a28e 65 while (iothread->running) {
6ca20620
PX
66 /*
67 * Note: from functional-wise the g_main_loop_run() below can
68 * already cover the aio_poll() events, but we can't run the
69 * main loop unconditionally because explicit aio_poll() here
70 * is faster than g_main_loop_run() when we do not need the
71 * gcontext at all (e.g., pure block layer iothreads). In
72 * other words, when we want to run the gcontext with the
73 * iothread we need to pay some performance for functionality.
74 */
65c1b5b6 75 aio_poll(iothread->ctx, true);
329163cb 76
6c95363d
PX
77 /*
78 * We must check the running state again in case it was
79 * changed in previous aio_poll()
80 */
b506e0f1 81 if (iothread->running && atomic_read(&iothread->run_gcontext)) {
329163cb 82 g_main_loop_run(iothread->main_loop);
329163cb 83 }
be8d8537 84 }
ab28bd23 85
b60ec76a 86 g_main_context_pop_thread_default(iothread->worker_context);
ab28bd23 87 rcu_unregister_thread();
be8d8537
SH
88 return NULL;
89}
90
2362a28e
SH
91/* Runs in iothread_run() thread */
92static void iothread_stop_bh(void *opaque)
93{
94 IOThread *iothread = opaque;
95
96 iothread->running = false; /* stop iothread_run() */
97
98 if (iothread->main_loop) {
99 g_main_loop_quit(iothread->main_loop);
100 }
101}
102
82d90705 103void iothread_stop(IOThread *iothread)
be8d8537 104{
82d90705
PX
105 if (!iothread->ctx || iothread->stopping) {
106 return;
2f78e491 107 }
be8d8537 108 iothread->stopping = true;
2362a28e 109 aio_bh_schedule_oneshot(iothread->ctx, iothread_stop_bh, iothread);
be8d8537 110 qemu_thread_join(&iothread->thread);
82d90705
PX
111}
112
cdd7abfd
SH
113static void iothread_instance_init(Object *obj)
114{
115 IOThread *iothread = IOTHREAD(obj);
116
117 iothread->poll_max_ns = IOTHREAD_POLL_MAX_NS_DEFAULT;
14a2d118 118 iothread->thread_id = -1;
21c4d15b 119 qemu_sem_init(&iothread->init_done_sem, 0);
b506e0f1
PX
120 /* By default, we don't run gcontext */
121 atomic_set(&iothread->run_gcontext, 0);
cdd7abfd
SH
122}
123
dce8921b
FZ
124static void iothread_instance_finalize(Object *obj)
125{
126 IOThread *iothread = IOTHREAD(obj);
127
82d90705 128 iothread_stop(iothread);
14a2d118 129
15544349
PX
130 /*
131 * Before glib2 2.33.10, there is a glib2 bug that GSource context
132 * pointer may not be cleared even if the context has already been
133 * destroyed (while it should). Here let's free the AIO context
134 * earlier to bypass that glib bug.
135 *
136 * We can remove this comment after the minimum supported glib2
137 * version boosts to 2.33.10. Before that, let's free the
138 * GSources first before destroying any GMainContext.
139 */
140 if (iothread->ctx) {
141 aio_context_unref(iothread->ctx);
142 iothread->ctx = NULL;
143 }
5b3ac23f
PX
144 if (iothread->worker_context) {
145 g_main_context_unref(iothread->worker_context);
146 iothread->worker_context = NULL;
0bd2d233
PX
147 g_main_loop_unref(iothread->main_loop);
148 iothread->main_loop = NULL;
5b3ac23f 149 }
21c4d15b 150 qemu_sem_destroy(&iothread->init_done_sem);
be8d8537
SH
151}
152
b506e0f1
PX
153static void iothread_init_gcontext(IOThread *iothread)
154{
155 GSource *source;
156
157 iothread->worker_context = g_main_context_new();
158 source = aio_get_g_source(iothread_get_aio_context(iothread));
159 g_source_attach(source, iothread->worker_context);
160 g_source_unref(source);
0bd2d233 161 iothread->main_loop = g_main_loop_new(iothread->worker_context, TRUE);
b506e0f1
PX
162}
163
be8d8537
SH
164static void iothread_complete(UserCreatable *obj, Error **errp)
165{
2f78e491 166 Error *local_error = NULL;
be8d8537 167 IOThread *iothread = IOTHREAD(obj);
d21e8776 168 char *name, *thread_name;
be8d8537
SH
169
170 iothread->stopping = false;
2362a28e 171 iothread->running = true;
2f78e491
CN
172 iothread->ctx = aio_context_new(&local_error);
173 if (!iothread->ctx) {
174 error_propagate(errp, local_error);
175 return;
176 }
88eb7c29 177
b506e0f1
PX
178 /*
179 * Init one GMainContext for the iothread unconditionally, even if
180 * it's not used
181 */
182 iothread_init_gcontext(iothread);
183
5e5db499
SH
184 aio_context_set_poll_params(iothread->ctx,
185 iothread->poll_max_ns,
186 iothread->poll_grow,
187 iothread->poll_shrink,
0d9d86fb
SH
188 &local_error);
189 if (local_error) {
190 error_propagate(errp, local_error);
191 aio_context_unref(iothread->ctx);
192 iothread->ctx = NULL;
193 return;
194 }
195
be8d8537
SH
196 /* This assumes we are called from a thread with useful CPU affinity for us
197 * to inherit.
198 */
d21e8776
PB
199 name = object_get_canonical_path_component(OBJECT(obj));
200 thread_name = g_strdup_printf("IO %s", name);
201 qemu_thread_create(&iothread->thread, thread_name, iothread_run,
be8d8537 202 iothread, QEMU_THREAD_JOINABLE);
d21e8776
PB
203 g_free(thread_name);
204 g_free(name);
88eb7c29
SH
205
206 /* Wait for initialization to complete */
88eb7c29 207 while (iothread->thread_id == -1) {
21c4d15b 208 qemu_sem_wait(&iothread->init_done_sem);
88eb7c29 209 }
be8d8537
SH
210}
211
5e5db499
SH
212typedef struct {
213 const char *name;
214 ptrdiff_t offset; /* field's byte offset in IOThread struct */
215} PollParamInfo;
216
217static PollParamInfo poll_max_ns_info = {
218 "poll-max-ns", offsetof(IOThread, poll_max_ns),
219};
220static PollParamInfo poll_grow_info = {
221 "poll-grow", offsetof(IOThread, poll_grow),
222};
223static PollParamInfo poll_shrink_info = {
224 "poll-shrink", offsetof(IOThread, poll_shrink),
225};
226
227static void iothread_get_poll_param(Object *obj, Visitor *v,
0d9d86fb
SH
228 const char *name, void *opaque, Error **errp)
229{
230 IOThread *iothread = IOTHREAD(obj);
5e5db499
SH
231 PollParamInfo *info = opaque;
232 int64_t *field = (void *)iothread + info->offset;
0d9d86fb 233
5e5db499 234 visit_type_int64(v, name, field, errp);
0d9d86fb
SH
235}
236
5e5db499 237static void iothread_set_poll_param(Object *obj, Visitor *v,
0d9d86fb
SH
238 const char *name, void *opaque, Error **errp)
239{
240 IOThread *iothread = IOTHREAD(obj);
5e5db499
SH
241 PollParamInfo *info = opaque;
242 int64_t *field = (void *)iothread + info->offset;
0d9d86fb
SH
243 Error *local_err = NULL;
244 int64_t value;
245
246 visit_type_int64(v, name, &value, &local_err);
247 if (local_err) {
248 goto out;
249 }
250
251 if (value < 0) {
5e5db499
SH
252 error_setg(&local_err, "%s value must be in range [0, %"PRId64"]",
253 info->name, INT64_MAX);
0d9d86fb
SH
254 goto out;
255 }
256
5e5db499 257 *field = value;
0d9d86fb
SH
258
259 if (iothread->ctx) {
5e5db499
SH
260 aio_context_set_poll_params(iothread->ctx,
261 iothread->poll_max_ns,
262 iothread->poll_grow,
263 iothread->poll_shrink,
264 &local_err);
0d9d86fb
SH
265 }
266
267out:
268 error_propagate(errp, local_err);
269}
270
be8d8537
SH
271static void iothread_class_init(ObjectClass *klass, void *class_data)
272{
273 UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
274 ucc->complete = iothread_complete;
0d9d86fb
SH
275
276 object_class_property_add(klass, "poll-max-ns", "int",
5e5db499
SH
277 iothread_get_poll_param,
278 iothread_set_poll_param,
279 NULL, &poll_max_ns_info, &error_abort);
280 object_class_property_add(klass, "poll-grow", "int",
281 iothread_get_poll_param,
282 iothread_set_poll_param,
283 NULL, &poll_grow_info, &error_abort);
284 object_class_property_add(klass, "poll-shrink", "int",
285 iothread_get_poll_param,
286 iothread_set_poll_param,
287 NULL, &poll_shrink_info, &error_abort);
be8d8537
SH
288}
289
290static const TypeInfo iothread_info = {
291 .name = TYPE_IOTHREAD,
292 .parent = TYPE_OBJECT,
293 .class_init = iothread_class_init,
294 .instance_size = sizeof(IOThread),
cdd7abfd 295 .instance_init = iothread_instance_init,
be8d8537
SH
296 .instance_finalize = iothread_instance_finalize,
297 .interfaces = (InterfaceInfo[]) {
298 {TYPE_USER_CREATABLE},
299 {}
300 },
301};
302
303static void iothread_register_types(void)
304{
305 type_register_static(&iothread_info);
306}
307
308type_init(iothread_register_types)
309
be8d8537
SH
310char *iothread_get_id(IOThread *iothread)
311{
312 return object_get_canonical_path_component(OBJECT(iothread));
313}
314
315AioContext *iothread_get_aio_context(IOThread *iothread)
316{
317 return iothread->ctx;
318}
dc3dd0d2
SH
319
320static int query_one_iothread(Object *object, void *opaque)
321{
322 IOThreadInfoList ***prev = opaque;
323 IOThreadInfoList *elem;
324 IOThreadInfo *info;
325 IOThread *iothread;
326
327 iothread = (IOThread *)object_dynamic_cast(object, TYPE_IOTHREAD);
328 if (!iothread) {
329 return 0;
330 }
331
332 info = g_new0(IOThreadInfo, 1);
333 info->id = iothread_get_id(iothread);
334 info->thread_id = iothread->thread_id;
5fc00480
PH
335 info->poll_max_ns = iothread->poll_max_ns;
336 info->poll_grow = iothread->poll_grow;
337 info->poll_shrink = iothread->poll_shrink;
dc3dd0d2
SH
338
339 elem = g_new0(IOThreadInfoList, 1);
340 elem->value = info;
341 elem->next = NULL;
342
343 **prev = elem;
344 *prev = &elem->next;
345 return 0;
346}
347
348IOThreadInfoList *qmp_query_iothreads(Error **errp)
349{
350 IOThreadInfoList *head = NULL;
351 IOThreadInfoList **prev = &head;
bc2256c4 352 Object *container = object_get_objects_root();
dc3dd0d2
SH
353
354 object_child_foreach(container, query_one_iothread, &prev);
355 return head;
356}
dce8921b 357
329163cb
WY
358GMainContext *iothread_get_g_main_context(IOThread *iothread)
359{
b506e0f1
PX
360 atomic_set(&iothread->run_gcontext, 1);
361 aio_notify(iothread->ctx);
329163cb
WY
362 return iothread->worker_context;
363}
0173e21b
PX
364
365IOThread *iothread_create(const char *id, Error **errp)
366{
367 Object *obj;
368
369 obj = object_new_with_props(TYPE_IOTHREAD,
370 object_get_internal_root(),
371 id, errp, NULL);
372
373 return IOTHREAD(obj);
374}
375
376void iothread_destroy(IOThread *iothread)
377{
378 object_unparent(OBJECT(iothread));
379}
fbcc6923
SH
380
381/* Lookup IOThread by its id. Only finds user-created objects, not internal
382 * iothread_create() objects. */
383IOThread *iothread_by_id(const char *id)
384{
385 return IOTHREAD(object_resolve_path_type(id, TYPE_IOTHREAD, NULL));
386}