]> git.proxmox.com Git - mirror_qemu.git/blame - include/block/aio.h
aio-posix: move pollfds to thread-local storage
[mirror_qemu.git] / include / block / aio.h
CommitLineData
a76bab49
AL
1/*
2 * QEMU aio implementation
3 *
4 * Copyright IBM, Corp. 2008
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
14#ifndef QEMU_AIO_H
15#define QEMU_AIO_H
16
6a1751b7 17#include "qemu/typedefs.h"
a76bab49 18#include "qemu-common.h"
1de7afc9
PB
19#include "qemu/queue.h"
20#include "qemu/event_notifier.h"
dcc772e2 21#include "qemu/thread.h"
98563fc3 22#include "qemu/rfifolock.h"
dae21b98 23#include "qemu/timer.h"
a76bab49 24
/* Forward declaration; struct BlockAIOCB is defined further down. */
typedef struct BlockAIOCB BlockAIOCB;

/* Completion callback type: called with the caller-supplied @opaque pointer
 * and an int @ret (presumably the result code of the operation; confirm
 * against callers).
 */
typedef void BlockCompletionFunc(void *opaque, int ret);
85e8dab1 27
d7331bed 28typedef struct AIOCBInfo {
7c84b1b8
MA
29 void (*cancel_async)(BlockAIOCB *acb);
30 AioContext *(*get_aio_context)(BlockAIOCB *acb);
8c82e9a4 31 size_t aiocb_size;
d7331bed 32} AIOCBInfo;
85e8dab1 33
7c84b1b8 34struct BlockAIOCB {
d7331bed 35 const AIOCBInfo *aiocb_info;
85e8dab1 36 BlockDriverState *bs;
097310b5 37 BlockCompletionFunc *cb;
85e8dab1 38 void *opaque;
f197fe2b 39 int refcnt;
85e8dab1
PB
40};
41
d7331bed 42void *qemu_aio_get(const AIOCBInfo *aiocb_info, BlockDriverState *bs,
097310b5 43 BlockCompletionFunc *cb, void *opaque);
8007429a 44void qemu_aio_unref(void *p);
f197fe2b 45void qemu_aio_ref(void *p);
85e8dab1 46
f627aab1
PB
/* Opaque handler record; the structure is not defined in this header. */
typedef struct AioHandler AioHandler;
/* Bottom-half callback: receives the opaque pointer given at creation. */
typedef void QEMUBHFunc(void *opaque);
/* File-descriptor callback: receives the opaque pointer given at
 * registration.
 */
typedef void IOHandler(void *opaque);
50
6a1751b7 51struct AioContext {
e3713e00
PB
52 GSource source;
53
98563fc3
SH
54 /* Protects all fields from multi-threaded access */
55 RFifoLock lock;
56
a915f4bc
PB
57 /* The list of registered AIO handlers */
58 QLIST_HEAD(, AioHandler) aio_handlers;
59
60 /* This is a simple lock used to protect the aio_handlers list.
61 * Specifically, it's used to ensure that no callbacks are removed while
62 * we're walking and dispatching callbacks.
63 */
64 int walking_handlers;
65
0ceb849b
PB
66 /* Used to avoid unnecessary event_notifier_set calls in aio_notify.
67 * Writes protected by lock or BQL, reads are lockless.
68 */
69 bool dispatching;
70
dcc772e2
LPF
71 /* lock to protect between bh's adders and deleter */
72 QemuMutex bh_lock;
0ceb849b 73
f627aab1
PB
74 /* Anchor of the list of Bottom Halves belonging to the context */
75 struct QEMUBH *first_bh;
76
77 /* A simple lock used to protect the first_bh list, and ensure that
78 * no callbacks are removed while we're walking and dispatching callbacks.
79 */
80 int walking_bh;
2f4dc3c1
PB
81
82 /* Used for aio_notify. */
83 EventNotifier notifier;
6b5f8762 84
9b34277d
SH
85 /* Thread pool for performing work and receiving completion callbacks */
86 struct ThreadPool *thread_pool;
dae21b98
AB
87
88 /* TimerLists for calling timers - one per clock type */
89 QEMUTimerListGroup tlg;
6a1751b7 90};
f627aab1 91
0ceb849b
PB
92/* Used internally to synchronize aio_poll against qemu_bh_schedule. */
93void aio_set_dispatching(AioContext *ctx, bool dispatching);
94
f627aab1
PB
95/**
96 * aio_context_new: Allocate a new AioContext.
97 *
98 * AioContext provide a mini event-loop that can be waited on synchronously.
99 * They also provide bottom halves, a service to execute a piece of code
100 * as soon as possible.
101 */
2f78e491 102AioContext *aio_context_new(Error **errp);
f627aab1 103
e3713e00
PB
104/**
105 * aio_context_ref:
106 * @ctx: The AioContext to operate on.
107 *
108 * Add a reference to an AioContext.
109 */
110void aio_context_ref(AioContext *ctx);
111
112/**
113 * aio_context_unref:
114 * @ctx: The AioContext to operate on.
115 *
116 * Drop a reference to an AioContext.
117 */
118void aio_context_unref(AioContext *ctx);
119
98563fc3
SH
120/* Take ownership of the AioContext. If the AioContext will be shared between
121 * threads, a thread must have ownership when calling aio_poll().
122 *
123 * Note that multiple threads calling aio_poll() means timers, BHs, and
124 * callbacks may be invoked from a different thread than they were registered
125 * from. Therefore, code must use AioContext acquire/release or use
126 * fine-grained synchronization to protect shared state if other threads will
127 * be accessing it simultaneously.
128 */
129void aio_context_acquire(AioContext *ctx);
130
131/* Relinquish ownership of the AioContext. */
132void aio_context_release(AioContext *ctx);
133
f627aab1
PB
134/**
135 * aio_bh_new: Allocate a new bottom half structure.
136 *
137 * Bottom halves are lightweight callbacks whose invocation is guaranteed
138 * to be wait-free, thread-safe and signal-safe. The #QEMUBH structure
139 * is opaque and must be allocated prior to its use.
140 */
141QEMUBH *aio_bh_new(AioContext *ctx, QEMUBHFunc *cb, void *opaque);
142
2f4dc3c1
PB
143/**
144 * aio_notify: Force processing of pending events.
145 *
146 * Similar to signaling a condition variable, aio_notify forces
147 * aio_wait to exit, so that the next call will re-examine pending events.
148 * The caller of aio_notify will usually call aio_wait again very soon,
149 * or go through another iteration of the GLib main loop. Hence, aio_notify
150 * also has the side effect of recalculating the sets of file descriptors
151 * that the main loop waits for.
152 *
153 * Calling aio_notify is rarely necessary, because for example scheduling
154 * a bottom half calls it already.
155 */
156void aio_notify(AioContext *ctx);
157
f627aab1
PB
158/**
159 * aio_bh_poll: Poll bottom halves for an AioContext.
160 *
161 * These are internal functions used by the QEMU main loop.
dcc772e2
LPF
162 * And notice that multiple occurrences of aio_bh_poll cannot
163 * be called concurrently
f627aab1
PB
164 */
165int aio_bh_poll(AioContext *ctx);
f627aab1
PB
166
167/**
168 * qemu_bh_schedule: Schedule a bottom half.
169 *
170 * Scheduling a bottom half interrupts the main loop and causes the
171 * execution of the callback that was passed to qemu_bh_new.
172 *
173 * Bottom halves that are scheduled from a bottom half handler are instantly
174 * invoked. This can create an infinite loop if a bottom half handler
175 * schedules itself.
176 *
177 * @bh: The bottom half to be scheduled.
178 */
179void qemu_bh_schedule(QEMUBH *bh);
180
181/**
182 * qemu_bh_cancel: Cancel execution of a bottom half.
183 *
184 * Canceling execution of a bottom half undoes the effect of calls to
185 * qemu_bh_schedule without freeing its resources yet. While cancellation
186 * itself is also wait-free and thread-safe, it can of course race with the
187 * loop that executes bottom halves unless you are holding the iothread
188 * mutex. This makes it mostly useless if you are not holding the mutex.
189 *
190 * @bh: The bottom half to be canceled.
191 */
192void qemu_bh_cancel(QEMUBH *bh);
193
194/**
195 *qemu_bh_delete: Cancel execution of a bottom half and free its resources.
196 *
197 * Deleting a bottom half frees the memory that was allocated for it by
198 * qemu_bh_new. It also implies canceling the bottom half if it was
199 * scheduled.
dcc772e2
LPF
200 * This func is async. The bottom half will do the delete action at the finial
201 * end.
f627aab1
PB
202 *
203 * @bh: The bottom half to be deleted.
204 */
205void qemu_bh_delete(QEMUBH *bh);
206
cd9ba1eb 207/* Return whether there are any pending callbacks from the GSource
a3462c65
PB
208 * attached to the AioContext, before g_poll is invoked.
209 *
210 * This is used internally in the implementation of the GSource.
211 */
212bool aio_prepare(AioContext *ctx);
213
214/* Return whether there are any pending callbacks from the GSource
215 * attached to the AioContext, after g_poll is invoked.
cd9ba1eb
PB
216 *
217 * This is used internally in the implementation of the GSource.
218 */
219bool aio_pending(AioContext *ctx);
220
e4c7e2d1
PB
221/* Dispatch any pending callbacks from the GSource attached to the AioContext.
222 *
223 * This is used internally in the implementation of the GSource.
224 */
225bool aio_dispatch(AioContext *ctx);
226
7c0628b2
PB
227/* Progress in completing AIO work to occur. This can issue new pending
228 * aio as a result of executing I/O completion or bh callbacks.
bcdc1857 229 *
acfb23ad
PB
230 * Return whether any progress was made by executing AIO or bottom half
231 * handlers. If @blocking == true, this should always be true except
232 * if someone called aio_notify.
7c0628b2
PB
233 *
234 * If there are no pending bottom halves, but there are pending AIO
235 * operations, it may not be possible to make any progress without
236 * blocking. If @blocking is true, this function will wait until one
237 * or more AIO events have completed, to ensure something has moved
238 * before returning.
7c0628b2
PB
239 */
240bool aio_poll(AioContext *ctx, bool blocking);
a76bab49
AL
241
242/* Register a file descriptor and associated callbacks. Behaves very similarly
243 * to qemu_set_fd_handler2. Unlike qemu_set_fd_handler2, these callbacks will
87f68d31 244 * be invoked when using aio_poll().
a76bab49
AL
245 *
246 * Code that invokes AIO completion functions should rely on this function
247 * instead of qemu_set_fd_handler[2].
248 */
a915f4bc
PB
249void aio_set_fd_handler(AioContext *ctx,
250 int fd,
251 IOHandler *io_read,
252 IOHandler *io_write,
a915f4bc 253 void *opaque);
9958c351
PB
254
255/* Register an event notifier and associated callbacks. Behaves very similarly
256 * to event_notifier_set_handler. Unlike event_notifier_set_handler, these callbacks
87f68d31 257 * will be invoked when using aio_poll().
9958c351
PB
258 *
259 * Code that invokes AIO completion functions should rely on this function
260 * instead of event_notifier_set_handler.
261 */
a915f4bc
PB
262void aio_set_event_notifier(AioContext *ctx,
263 EventNotifier *notifier,
f2e5dca4 264 EventNotifierHandler *io_read);
a915f4bc 265
e3713e00
PB
266/* Return a GSource that lets the main loop poll the file descriptors attached
267 * to this AioContext.
268 */
269GSource *aio_get_g_source(AioContext *ctx);
270
9b34277d
SH
271/* Return the ThreadPool bound to this AioContext */
272struct ThreadPool *aio_get_thread_pool(AioContext *ctx);
273
4e29e831
AB
274/**
275 * aio_timer_new:
276 * @ctx: the aio context
277 * @type: the clock type
278 * @scale: the scale
279 * @cb: the callback to call on timer expiry
280 * @opaque: the opaque pointer to pass to the callback
281 *
282 * Allocate a new timer attached to the context @ctx.
283 * The function is responsible for memory allocation.
284 *
285 * The preferred interface is aio_timer_init. Use that
286 * unless you really need dynamic memory allocation.
287 *
288 * Returns: a pointer to the new timer
289 */
290static inline QEMUTimer *aio_timer_new(AioContext *ctx, QEMUClockType type,
291 int scale,
292 QEMUTimerCB *cb, void *opaque)
293{
294 return timer_new_tl(ctx->tlg.tl[type], scale, cb, opaque);
295}
296
297/**
298 * aio_timer_init:
299 * @ctx: the aio context
300 * @ts: the timer
301 * @type: the clock type
302 * @scale: the scale
303 * @cb: the callback to call on timer expiry
304 * @opaque: the opaque pointer to pass to the callback
305 *
306 * Initialise a new timer attached to the context @ctx.
307 * The caller is responsible for memory allocation.
308 */
309static inline void aio_timer_init(AioContext *ctx,
310 QEMUTimer *ts, QEMUClockType type,
311 int scale,
312 QEMUTimerCB *cb, void *opaque)
313{
f186aa97 314 timer_init_tl(ts, ctx->tlg.tl[type], scale, cb, opaque);
4e29e831
AB
315}
316
845ca10d
PB
317/**
318 * aio_compute_timeout:
319 * @ctx: the aio context
320 *
321 * Compute the timeout that a blocking aio_poll should use.
322 */
323int64_t aio_compute_timeout(AioContext *ctx);
324
a76bab49 325#endif