]> git.proxmox.com Git - qemu.git/blame - main-loop.c
target-i386: Introduce X86CPU::filtered_features field
[qemu.git] / main-loop.c
CommitLineData
d3b12f5d
PB
1/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
d3b12f5d 24
0ec024f6 25#include "qemu-common.h"
1de7afc9 26#include "qemu/timer.h"
0ec024f6 27#include "slirp/slirp.h"
1de7afc9 28#include "qemu/main-loop.h"
737e150e 29#include "block/aio.h"
d3b12f5d
PB
30
31#ifndef _WIN32
32
1de7afc9 33#include "qemu/compatfd.h"
0ec024f6 34
d3b12f5d
PB
35/* If we have signalfd, we mask out the signals we want to handle and then
36 * use signalfd to listen for them. We rely on whatever the current signal
37 * handler is to dispatch the signals when we receive them.
38 */
39static void sigfd_handler(void *opaque)
40{
41 int fd = (intptr_t)opaque;
42 struct qemu_signalfd_siginfo info;
43 struct sigaction action;
44 ssize_t len;
45
46 while (1) {
47 do {
48 len = read(fd, &info, sizeof(info));
49 } while (len == -1 && errno == EINTR);
50
51 if (len == -1 && errno == EAGAIN) {
52 break;
53 }
54
55 if (len != sizeof(info)) {
56 printf("read from sigfd returned %zd: %m\n", len);
57 return;
58 }
59
60 sigaction(info.ssi_signo, NULL, &action);
61 if ((action.sa_flags & SA_SIGINFO) && action.sa_sigaction) {
62 action.sa_sigaction(info.ssi_signo,
63 (siginfo_t *)&info, NULL);
64 } else if (action.sa_handler) {
65 action.sa_handler(info.ssi_signo);
66 }
67 }
68}
69
70static int qemu_signal_init(void)
71{
72 int sigfd;
73 sigset_t set;
74
75 /*
76 * SIG_IPI must be blocked in the main thread and must not be caught
77 * by sigwait() in the signal thread. Otherwise, the cpu thread will
78 * not catch it reliably.
79 */
80 sigemptyset(&set);
81 sigaddset(&set, SIG_IPI);
d3b12f5d
PB
82 sigaddset(&set, SIGIO);
83 sigaddset(&set, SIGALRM);
84 sigaddset(&set, SIGBUS);
85 pthread_sigmask(SIG_BLOCK, &set, NULL);
86
4aa7534d 87 sigdelset(&set, SIG_IPI);
d3b12f5d
PB
88 sigfd = qemu_signalfd(&set);
89 if (sigfd == -1) {
90 fprintf(stderr, "failed to create signalfd\n");
91 return -errno;
92 }
93
94 fcntl_setfl(sigfd, O_NONBLOCK);
95
96 qemu_set_fd_handler2(sigfd, NULL, sigfd_handler, NULL,
97 (void *)(intptr_t)sigfd);
98
99 return 0;
100}
101
102#else /* _WIN32 */
103
/*
 * Windows build: no signal setup is performed here; always reports
 * success (0).
 */
static int qemu_signal_init(void)
{
    const int success = 0;

    return success;
}
4c8d0d27
PB
108#endif
109
110static AioContext *qemu_aio_context;
d3b12f5d 111
5f3aa1ff
SH
112AioContext *qemu_get_aio_context(void)
113{
114 return qemu_aio_context;
115}
116
d3b12f5d
PB
117void qemu_notify_event(void)
118{
4c8d0d27 119 if (!qemu_aio_context) {
ee77dfb2
MR
120 return;
121 }
4c8d0d27 122 aio_notify(qemu_aio_context);
d3b12f5d
PB
123}
124
cbff4b34
SH
125static GArray *gpollfds;
126
172061a0 127int qemu_init_main_loop(void)
d3b12f5d
PB
128{
129 int ret;
82cbbdc6 130 GSource *src;
d3b12f5d 131
172061a0 132 init_clocks();
f9ab4654
PB
133 if (init_timer_alarm() < 0) {
134 fprintf(stderr, "could not initialize alarm timer\n");
135 exit(1);
136 }
172061a0 137
d3b12f5d
PB
138 ret = qemu_signal_init();
139 if (ret) {
140 return ret;
141 }
142
cbff4b34 143 gpollfds = g_array_new(FALSE, FALSE, sizeof(GPollFD));
f627aab1 144 qemu_aio_context = aio_context_new();
82cbbdc6
PB
145 src = aio_get_g_source(qemu_aio_context);
146 g_source_attach(src, NULL);
147 g_source_unref(src);
d3b12f5d
PB
148 return 0;
149}
150
d3b12f5d
PB
151static int max_priority;
152
ea26ce76 153#ifndef _WIN32
48ce11ff
SH
154static int glib_pollfds_idx;
155static int glib_n_poll_fds;
156
157static void glib_pollfds_fill(uint32_t *cur_timeout)
d3b12f5d
PB
158{
159 GMainContext *context = g_main_context_default();
4dae83ae 160 int timeout = 0;
48ce11ff 161 int n;
d3b12f5d
PB
162
163 g_main_context_prepare(context, &max_priority);
164
48ce11ff
SH
165 glib_pollfds_idx = gpollfds->len;
166 n = glib_n_poll_fds;
167 do {
168 GPollFD *pfds;
169 glib_n_poll_fds = n;
170 g_array_set_size(gpollfds, glib_pollfds_idx + glib_n_poll_fds);
171 pfds = &g_array_index(gpollfds, GPollFD, glib_pollfds_idx);
172 n = g_main_context_query(context, max_priority, &timeout, pfds,
173 glib_n_poll_fds);
174 } while (n != glib_n_poll_fds);
d3b12f5d 175
4dae83ae
PB
176 if (timeout >= 0 && timeout < *cur_timeout) {
177 *cur_timeout = timeout;
d3b12f5d
PB
178 }
179}
180
48ce11ff 181static void glib_pollfds_poll(void)
d3b12f5d
PB
182{
183 GMainContext *context = g_main_context_default();
48ce11ff 184 GPollFD *pfds = &g_array_index(gpollfds, GPollFD, glib_pollfds_idx);
d3b12f5d 185
48ce11ff 186 if (g_main_context_check(context, max_priority, pfds, glib_n_poll_fds)) {
d3b12f5d
PB
187 g_main_context_dispatch(context);
188 }
189}
190
893986fe
AL
191#define MAX_MAIN_LOOP_SPIN (1000)
192
7c7db755 193static int os_host_main_loop_wait(uint32_t timeout)
15455536 194{
15455536 195 int ret;
893986fe 196 static int spin_counter;
15455536 197
48ce11ff 198 glib_pollfds_fill(&timeout);
15455536 199
893986fe
AL
200 /* If the I/O thread is very busy or we are incorrectly busy waiting in
201 * the I/O thread, this can lead to starvation of the BQL such that the
202 * VCPU threads never run. To make sure we can detect the later case,
203 * print a message to the screen. If we run into this condition, create
204 * a fake timeout in order to give the VCPU threads a chance to run.
205 */
206 if (spin_counter > MAX_MAIN_LOOP_SPIN) {
207 static bool notified;
208
209 if (!notified) {
210 fprintf(stderr,
211 "main-loop: WARNING: I/O thread spun for %d iterations\n",
212 MAX_MAIN_LOOP_SPIN);
213 notified = true;
214 }
215
216 timeout = 1;
217 }
218
15455536 219 if (timeout > 0) {
893986fe 220 spin_counter = 0;
15455536 221 qemu_mutex_unlock_iothread();
893986fe
AL
222 } else {
223 spin_counter++;
15455536
PB
224 }
225
cbff4b34
SH
226 ret = g_poll((GPollFD *)gpollfds->data, gpollfds->len, timeout);
227
15455536
PB
228 if (timeout > 0) {
229 qemu_mutex_lock_iothread();
230 }
231
48ce11ff 232 glib_pollfds_poll();
15455536
PB
233 return ret;
234}
235#else
d3b12f5d
PB
236/***********************************************************/
237/* Polling handling */
238
239typedef struct PollingEntry {
240 PollingFunc *func;
241 void *opaque;
242 struct PollingEntry *next;
243} PollingEntry;
244
245static PollingEntry *first_polling_entry;
246
247int qemu_add_polling_cb(PollingFunc *func, void *opaque)
248{
249 PollingEntry **ppe, *pe;
250 pe = g_malloc0(sizeof(PollingEntry));
251 pe->func = func;
252 pe->opaque = opaque;
253 for(ppe = &first_polling_entry; *ppe != NULL; ppe = &(*ppe)->next);
254 *ppe = pe;
255 return 0;
256}
257
258void qemu_del_polling_cb(PollingFunc *func, void *opaque)
259{
260 PollingEntry **ppe, *pe;
261 for(ppe = &first_polling_entry; *ppe != NULL; ppe = &(*ppe)->next) {
262 pe = *ppe;
263 if (pe->func == func && pe->opaque == opaque) {
264 *ppe = pe->next;
265 g_free(pe);
266 break;
267 }
268 }
269}
270
271/***********************************************************/
272/* Wait objects support */
273typedef struct WaitObjects {
274 int num;
06ac7d49 275 int revents[MAXIMUM_WAIT_OBJECTS + 1];
d3b12f5d
PB
276 HANDLE events[MAXIMUM_WAIT_OBJECTS + 1];
277 WaitObjectFunc *func[MAXIMUM_WAIT_OBJECTS + 1];
278 void *opaque[MAXIMUM_WAIT_OBJECTS + 1];
279} WaitObjects;
280
281static WaitObjects wait_objects = {0};
282
283int qemu_add_wait_object(HANDLE handle, WaitObjectFunc *func, void *opaque)
284{
285 WaitObjects *w = &wait_objects;
286 if (w->num >= MAXIMUM_WAIT_OBJECTS) {
287 return -1;
288 }
289 w->events[w->num] = handle;
290 w->func[w->num] = func;
291 w->opaque[w->num] = opaque;
06ac7d49 292 w->revents[w->num] = 0;
d3b12f5d
PB
293 w->num++;
294 return 0;
295}
296
297void qemu_del_wait_object(HANDLE handle, WaitObjectFunc *func, void *opaque)
298{
299 int i, found;
300 WaitObjects *w = &wait_objects;
301
302 found = 0;
303 for (i = 0; i < w->num; i++) {
304 if (w->events[i] == handle) {
305 found = 1;
306 }
307 if (found) {
308 w->events[i] = w->events[i + 1];
309 w->func[i] = w->func[i + 1];
310 w->opaque[i] = w->opaque[i + 1];
06ac7d49 311 w->revents[i] = w->revents[i + 1];
d3b12f5d
PB
312 }
313 }
314 if (found) {
315 w->num--;
316 }
317}
318
d3385eb4
PB
319void qemu_fd_register(int fd)
320{
4c8d0d27
PB
321 WSAEventSelect(fd, event_notifier_get_handle(&qemu_aio_context->notifier),
322 FD_READ | FD_ACCEPT | FD_CLOSE |
d3385eb4
PB
323 FD_CONNECT | FD_WRITE | FD_OOB);
324}
325
cbff4b34
SH
326static int pollfds_fill(GArray *pollfds, fd_set *rfds, fd_set *wfds,
327 fd_set *xfds)
328{
329 int nfds = -1;
330 int i;
331
332 for (i = 0; i < pollfds->len; i++) {
333 GPollFD *pfd = &g_array_index(pollfds, GPollFD, i);
334 int fd = pfd->fd;
335 int events = pfd->events;
336 if (events & (G_IO_IN | G_IO_HUP | G_IO_ERR)) {
337 FD_SET(fd, rfds);
338 nfds = MAX(nfds, fd);
339 }
340 if (events & (G_IO_OUT | G_IO_ERR)) {
341 FD_SET(fd, wfds);
342 nfds = MAX(nfds, fd);
343 }
344 if (events & G_IO_PRI) {
345 FD_SET(fd, xfds);
346 nfds = MAX(nfds, fd);
347 }
348 }
349 return nfds;
350}
351
352static void pollfds_poll(GArray *pollfds, int nfds, fd_set *rfds,
353 fd_set *wfds, fd_set *xfds)
354{
355 int i;
356
357 for (i = 0; i < pollfds->len; i++) {
358 GPollFD *pfd = &g_array_index(pollfds, GPollFD, i);
359 int fd = pfd->fd;
360 int revents = 0;
361
362 if (FD_ISSET(fd, rfds)) {
363 revents |= G_IO_IN | G_IO_HUP | G_IO_ERR;
364 }
365 if (FD_ISSET(fd, wfds)) {
366 revents |= G_IO_OUT | G_IO_ERR;
367 }
368 if (FD_ISSET(fd, xfds)) {
369 revents |= G_IO_PRI;
370 }
371 pfd->revents = revents & pfd->events;
372 }
373}
374
7c7db755 375static int os_host_main_loop_wait(uint32_t timeout)
d3b12f5d 376{
ea26ce76 377 GMainContext *context = g_main_context_default();
48ce11ff 378 GPollFD poll_fds[1024 * 2]; /* this is probably overkill */
134a03e0 379 int select_ret = 0;
48ce11ff 380 int g_poll_ret, ret, i, n_poll_fds;
d3b12f5d 381 PollingEntry *pe;
d3385eb4 382 WaitObjects *w = &wait_objects;
42fe1c24 383 gint poll_timeout;
15455536 384 static struct timeval tv0;
9cbaacf9
SH
385 fd_set rfds, wfds, xfds;
386 int nfds;
d3b12f5d
PB
387
388 /* XXX: need to suppress polling by better using win32 events */
389 ret = 0;
390 for (pe = first_polling_entry; pe != NULL; pe = pe->next) {
391 ret |= pe->func(pe->opaque);
392 }
d3385eb4
PB
393 if (ret != 0) {
394 return ret;
395 }
d3b12f5d 396
ea26ce76 397 g_main_context_prepare(context, &max_priority);
42fe1c24 398 n_poll_fds = g_main_context_query(context, max_priority, &poll_timeout,
ea26ce76
PB
399 poll_fds, ARRAY_SIZE(poll_fds));
400 g_assert(n_poll_fds <= ARRAY_SIZE(poll_fds));
401
06ac7d49 402 for (i = 0; i < w->num; i++) {
58b9630d 403 poll_fds[n_poll_fds + i].fd = (DWORD_PTR)w->events[i];
ea26ce76 404 poll_fds[n_poll_fds + i].events = G_IO_IN;
06ac7d49
PB
405 }
406
3239ad04
SW
407 if (poll_timeout < 0 || timeout < poll_timeout) {
408 poll_timeout = timeout;
409 }
410
d3385eb4 411 qemu_mutex_unlock_iothread();
5e3bc735 412 g_poll_ret = g_poll(poll_fds, n_poll_fds + w->num, poll_timeout);
d3385eb4 413 qemu_mutex_lock_iothread();
5e3bc735 414 if (g_poll_ret > 0) {
06ac7d49 415 for (i = 0; i < w->num; i++) {
ea26ce76 416 w->revents[i] = poll_fds[n_poll_fds + i].revents;
d3385eb4 417 }
06ac7d49
PB
418 for (i = 0; i < w->num; i++) {
419 if (w->revents[i] && w->func[i]) {
420 w->func[i](w->opaque[i]);
d3b12f5d 421 }
d3b12f5d
PB
422 }
423 }
424
ea26ce76
PB
425 if (g_main_context_check(context, max_priority, poll_fds, n_poll_fds)) {
426 g_main_context_dispatch(context);
427 }
428
5e3bc735
FC
429 /* Call select after g_poll to avoid a useless iteration and therefore
430 * improve socket latency.
d3385eb4
PB
431 */
432
cbff4b34
SH
433 FD_ZERO(&rfds);
434 FD_ZERO(&wfds);
435 FD_ZERO(&xfds);
436 nfds = pollfds_fill(gpollfds, &rfds, &wfds, &xfds);
5e3bc735
FC
437 if (nfds >= 0) {
438 select_ret = select(nfds + 1, &rfds, &wfds, &xfds, &tv0);
439 if (select_ret != 0) {
440 timeout = 0;
441 }
cbff4b34
SH
442 if (select_ret > 0) {
443 pollfds_poll(gpollfds, nfds, &rfds, &wfds, &xfds);
444 }
5e3bc735
FC
445 }
446
447 return select_ret || g_poll_ret;
d3b12f5d
PB
448}
449#endif
450
451int main_loop_wait(int nonblocking)
452{
7c7db755
SS
453 int ret;
454 uint32_t timeout = UINT32_MAX;
d3b12f5d
PB
455
456 if (nonblocking) {
457 timeout = 0;
d3b12f5d
PB
458 }
459
d3b12f5d 460 /* poll any events */
cbff4b34 461 g_array_set_size(gpollfds, 0); /* reset for new iteration */
d3b12f5d 462 /* XXX: separate device handlers from system ones */
d3b12f5d 463#ifdef CONFIG_SLIRP
7c7db755 464 slirp_update_timeout(&timeout);
8917c3bd 465 slirp_pollfds_fill(gpollfds);
d3b12f5d 466#endif
a3e4b4a8 467 qemu_iohandler_fill(gpollfds);
15455536 468 ret = os_host_main_loop_wait(timeout);
a3e4b4a8 469 qemu_iohandler_poll(gpollfds, ret);
d3b12f5d 470#ifdef CONFIG_SLIRP
8917c3bd 471 slirp_pollfds_poll(gpollfds, (ret < 0));
d3b12f5d
PB
472#endif
473
474 qemu_run_all_timers();
475
d3b12f5d
PB
476 return ret;
477}
f627aab1
PB
478
479/* Functions to operate on the main QEMU AioContext. */
480
481QEMUBH *qemu_bh_new(QEMUBHFunc *cb, void *opaque)
482{
483 return aio_bh_new(qemu_aio_context, cb, opaque);
484}
485
a915f4bc
PB
486bool qemu_aio_wait(void)
487{
7c0628b2 488 return aio_poll(qemu_aio_context, true);
a915f4bc
PB
489}
490
f42b2207 491#ifdef CONFIG_POSIX
a915f4bc
PB
492void qemu_aio_set_fd_handler(int fd,
493 IOHandler *io_read,
494 IOHandler *io_write,
495 AioFlushHandler *io_flush,
496 void *opaque)
497{
498 aio_set_fd_handler(qemu_aio_context, fd, io_read, io_write, io_flush,
499 opaque);
a915f4bc 500}
82cbbdc6 501#endif
a915f4bc 502
a915f4bc
PB
503void qemu_aio_set_event_notifier(EventNotifier *notifier,
504 EventNotifierHandler *io_read,
505 AioFlushEventNotifierHandler *io_flush)
506{
82cbbdc6 507 aio_set_event_notifier(qemu_aio_context, notifier, io_read, io_flush);
a915f4bc 508}