]> git.proxmox.com Git - mirror_qemu.git/blame - block/throttle-groups.c
CODING_STYLE: specify the indent rule for multiline code
[mirror_qemu.git] / block / throttle-groups.c
CommitLineData
2ff1f2e3
AG
1/*
2 * QEMU block throttling group infrastructure
3 *
4 * Copyright (C) Nodalink, EURL. 2014
5 * Copyright (C) Igalia, S.L. 2015
6 *
7 * Authors:
8 * Benoît Canet <benoit.canet@nodalink.com>
9 * Alberto Garcia <berto@igalia.com>
10 *
11 * This program is free software; you can redistribute it and/or
12 * modify it under the terms of the GNU General Public License as
13 * published by the Free Software Foundation; either version 2 or
14 * (at your option) version 3 of the License.
15 *
16 * This program is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU General Public License for more details.
20 *
21 * You should have received a copy of the GNU General Public License
22 * along with this program; if not, see <http://www.gnu.org/licenses/>.
23 */
24
80c71a24 25#include "qemu/osdep.h"
31dce3cc 26#include "sysemu/block-backend.h"
2ff1f2e3 27#include "block/throttle-groups.h"
432d889e 28#include "qemu/throttle-options.h"
76f4afb4
AG
29#include "qemu/queue.h"
30#include "qemu/thread.h"
31#include "sysemu/qtest.h"
432d889e 32#include "qapi/error.h"
9af23989 33#include "qapi/qapi-visit-block-core.h"
432d889e
MP
34#include "qom/object.h"
35#include "qom/object_interfaces.h"
36
37static void throttle_group_obj_init(Object *obj);
38static void throttle_group_obj_complete(UserCreatable *obj, Error **errp);
25b8e4db 39static void timer_cb(ThrottleGroupMember *tgm, bool is_write);
2ff1f2e3
AG
40
41/* The ThrottleGroup structure (with its ThrottleState) is shared
022cdc9f 42 * among different ThrottleGroupMembers and it's independent from
2ff1f2e3
AG
43 * AioContext, so in order to use it from different threads it needs
44 * its own locking.
45 *
46 * This locking is however handled internally in this file, so it's
d87d01e1 47 * transparent to outside users.
2ff1f2e3
AG
48 *
49 * The whole ThrottleGroup structure is private and invisible to
50 * outside users, that only use it through its ThrottleState.
51 *
022cdc9f 52 * In addition to the ThrottleGroup structure, ThrottleGroupMember has
2ff1f2e3 53 * fields that need to be accessed by other members of the group and
27ccdd52 54 * therefore also need to be protected by this lock. Once a
022cdc9f 55 * ThrottleGroupMember is registered in a group those fields can be accessed
27ccdd52 56 * by other threads any time.
2ff1f2e3
AG
57 *
58 * Again, all this is handled internally and is mostly transparent to
59 * the outside. The 'throttle_timers' field however has an additional
60 * constraint because it may be temporarily invalid (see for example
0d2fac8e 61 * blk_set_aio_context()). Therefore in this file a thread will
022cdc9f
MP
62 * access some other ThrottleGroupMember's timers only after verifying that
63 * that ThrottleGroupMember has throttled requests in the queue.
2ff1f2e3
AG
64 */
65typedef struct ThrottleGroup {
432d889e
MP
66 Object parent_obj;
67
68 /* refuse individual property change if initialization is complete */
69 bool is_initialized;
2ff1f2e3
AG
70 char *name; /* This is constant during the lifetime of the group */
71
72 QemuMutex lock; /* This lock protects the following four fields */
73 ThrottleState ts;
022cdc9f
MP
74 QLIST_HEAD(, ThrottleGroupMember) head;
75 ThrottleGroupMember *tokens[2];
2ff1f2e3 76 bool any_timer_armed[2];
dbe824cc 77 QEMUClockType clock_type;
2ff1f2e3 78
432d889e 79 /* This field is protected by the global QEMU mutex */
2ff1f2e3
AG
80 QTAILQ_ENTRY(ThrottleGroup) list;
81} ThrottleGroup;
82
432d889e 83/* This is protected by the global QEMU mutex */
2ff1f2e3
AG
84static QTAILQ_HEAD(, ThrottleGroup) throttle_groups =
85 QTAILQ_HEAD_INITIALIZER(throttle_groups);
86
432d889e
MP
87
88/* This function reads throttle_groups and must be called under the global
89 * mutex.
90 */
91static ThrottleGroup *throttle_group_by_name(const char *name)
92{
93 ThrottleGroup *iter;
94
95 /* Look for an existing group with that name */
96 QTAILQ_FOREACH(iter, &throttle_groups, list) {
97 if (!g_strcmp0(name, iter->name)) {
98 return iter;
99 }
100 }
101
102 return NULL;
103}
104
d8e7d87e
MP
105/* This function reads throttle_groups and must be called under the global
106 * mutex.
107 */
108bool throttle_group_exists(const char *name)
109{
110 return throttle_group_by_name(name) != NULL;
111}
112
2ff1f2e3
AG
113/* Increments the reference count of a ThrottleGroup given its name.
114 *
115 * If no ThrottleGroup is found with the given name a new one is
116 * created.
117 *
432d889e
MP
118 * This function edits throttle_groups and must be called under the global
119 * mutex.
120 *
2ff1f2e3 121 * @name: the name of the ThrottleGroup
973f2ddf 122 * @ret: the ThrottleState member of the ThrottleGroup
2ff1f2e3 123 */
973f2ddf 124ThrottleState *throttle_group_incref(const char *name)
2ff1f2e3
AG
125{
126 ThrottleGroup *tg = NULL;
2ff1f2e3
AG
127
128 /* Look for an existing group with that name */
432d889e
MP
129 tg = throttle_group_by_name(name);
130
131 if (tg) {
132 object_ref(OBJECT(tg));
133 } else {
134 /* Create a new one if not found */
135 /* new ThrottleGroup obj will have a refcnt = 1 */
136 tg = THROTTLE_GROUP(object_new(TYPE_THROTTLE_GROUP));
2ff1f2e3 137 tg->name = g_strdup(name);
432d889e 138 throttle_group_obj_complete(USER_CREATABLE(tg), &error_abort);
2ff1f2e3
AG
139 }
140
973f2ddf 141 return &tg->ts;
2ff1f2e3
AG
142}
143
144/* Decrease the reference count of a ThrottleGroup.
145 *
146 * When the reference count reaches zero the ThrottleGroup is
147 * destroyed.
148 *
432d889e
MP
149 * This function edits throttle_groups and must be called under the global
150 * mutex.
151 *
973f2ddf 152 * @ts: The ThrottleGroup to unref, given by its ThrottleState member
2ff1f2e3 153 */
973f2ddf 154void throttle_group_unref(ThrottleState *ts)
2ff1f2e3 155{
973f2ddf 156 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
432d889e 157 object_unref(OBJECT(tg));
2ff1f2e3
AG
158}
159
022cdc9f 160/* Get the name from a ThrottleGroupMember's group. The name (and the pointer)
49d2165d 161 * is guaranteed to remain constant during the lifetime of the group.
2ff1f2e3 162 *
022cdc9f 163 * @tgm: a ThrottleGroupMember
2ff1f2e3
AG
164 * @ret: the name of the group.
165 */
022cdc9f 166const char *throttle_group_get_name(ThrottleGroupMember *tgm)
2ff1f2e3 167{
022cdc9f 168 ThrottleGroup *tg = container_of(tgm->throttle_state, ThrottleGroup, ts);
2ff1f2e3
AG
169 return tg->name;
170}
171
022cdc9f
MP
172/* Return the next ThrottleGroupMember in the round-robin sequence, simulating
173 * a circular list.
2ff1f2e3
AG
174 *
175 * This assumes that tg->lock is held.
176 *
022cdc9f
MP
177 * @tgm: the current ThrottleGroupMember
178 * @ret: the next ThrottleGroupMember in the sequence
2ff1f2e3 179 */
022cdc9f 180static ThrottleGroupMember *throttle_group_next_tgm(ThrottleGroupMember *tgm)
2ff1f2e3 181{
022cdc9f 182 ThrottleState *ts = tgm->throttle_state;
2ff1f2e3 183 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
022cdc9f 184 ThrottleGroupMember *next = QLIST_NEXT(tgm, round_robin);
2ff1f2e3
AG
185
186 if (!next) {
31dce3cc 187 next = QLIST_FIRST(&tg->head);
2ff1f2e3
AG
188 }
189
022cdc9f 190 return next;
2ff1f2e3
AG
191}
192
6bf77e1c 193/*
022cdc9f 194 * Return whether a ThrottleGroupMember has pending requests.
6bf77e1c
AG
195 *
196 * This assumes that tg->lock is held.
197 *
022cdc9f
MP
198 * @tgm: the ThrottleGroupMember
199 * @is_write: the type of operation (read/write)
200 * @ret: whether the ThrottleGroupMember has pending requests.
6bf77e1c 201 */
022cdc9f 202static inline bool tgm_has_pending_reqs(ThrottleGroupMember *tgm,
6bf77e1c
AG
203 bool is_write)
204{
022cdc9f 205 return tgm->pending_reqs[is_write];
6bf77e1c
AG
206}
207
022cdc9f
MP
208/* Return the next ThrottleGroupMember in the round-robin sequence with pending
209 * I/O requests.
76f4afb4
AG
210 *
211 * This assumes that tg->lock is held.
212 *
022cdc9f 213 * @tgm: the current ThrottleGroupMember
76f4afb4 214 * @is_write: the type of operation (read/write)
022cdc9f
MP
215 * @ret: the next ThrottleGroupMember with pending requests, or tgm if
216 * there is none.
76f4afb4 217 */
022cdc9f
MP
218static ThrottleGroupMember *next_throttle_token(ThrottleGroupMember *tgm,
219 bool is_write)
76f4afb4 220{
022cdc9f
MP
221 ThrottleState *ts = tgm->throttle_state;
222 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
223 ThrottleGroupMember *token, *start;
76f4afb4 224
5d8e4ca0
AG
225 /* If this member has its I/O limits disabled then it means that
226 * it's being drained. Skip the round-robin search and return tgm
227 * immediately if it has pending requests. Otherwise we could be
228 * forcing it to wait for other member's throttled requests. */
229 if (tgm_has_pending_reqs(tgm, is_write) &&
230 atomic_read(&tgm->io_limits_disabled)) {
231 return tgm;
232 }
233
76f4afb4
AG
234 start = token = tg->tokens[is_write];
235
236 /* get next bs round in round robin style */
022cdc9f
MP
237 token = throttle_group_next_tgm(token);
238 while (token != start && !tgm_has_pending_reqs(token, is_write)) {
239 token = throttle_group_next_tgm(token);
76f4afb4
AG
240 }
241
242 /* If no IO are queued for scheduling on the next round robin token
022cdc9f
MP
243 * then decide the token is the current tgm because chances are
244 * the current tgm got the current request queued.
76f4afb4 245 */
022cdc9f
MP
246 if (token == start && !tgm_has_pending_reqs(token, is_write)) {
247 token = tgm;
76f4afb4
AG
248 }
249
022cdc9f
MP
250 /* Either we return the original TGM, or one with pending requests */
251 assert(token == tgm || tgm_has_pending_reqs(token, is_write));
6bf77e1c 252
76f4afb4
AG
253 return token;
254}
255
022cdc9f
MP
256/* Check if the next I/O request for a ThrottleGroupMember needs to be
257 * throttled or not. If there's no timer set in this group, set one and update
258 * the token accordingly.
76f4afb4
AG
259 *
260 * This assumes that tg->lock is held.
261 *
022cdc9f 262 * @tgm: the current ThrottleGroupMember
76f4afb4
AG
263 * @is_write: the type of operation (read/write)
264 * @ret: whether the I/O request needs to be throttled or not
265 */
022cdc9f
MP
266static bool throttle_group_schedule_timer(ThrottleGroupMember *tgm,
267 bool is_write)
76f4afb4 268{
022cdc9f 269 ThrottleState *ts = tgm->throttle_state;
76f4afb4 270 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
022cdc9f 271 ThrottleTimers *tt = &tgm->throttle_timers;
76f4afb4
AG
272 bool must_wait;
273
022cdc9f 274 if (atomic_read(&tgm->io_limits_disabled)) {
ce0f1412
PB
275 return false;
276 }
277
76f4afb4
AG
278 /* Check if any of the timers in this group is already armed */
279 if (tg->any_timer_armed[is_write]) {
280 return true;
281 }
282
283 must_wait = throttle_schedule_timer(ts, tt, is_write);
284
022cdc9f 285 /* If a timer just got armed, set tgm as the current token */
76f4afb4 286 if (must_wait) {
022cdc9f 287 tg->tokens[is_write] = tgm;
76f4afb4
AG
288 tg->any_timer_armed[is_write] = true;
289 }
290
291 return must_wait;
292}
293
022cdc9f 294/* Start the next pending I/O request for a ThrottleGroupMember. Return whether
3b170dc8
PB
295 * any request was actually pending.
296 *
022cdc9f 297 * @tgm: the current ThrottleGroupMember
3b170dc8
PB
298 * @is_write: the type of operation (read/write)
299 */
022cdc9f 300static bool coroutine_fn throttle_group_co_restart_queue(ThrottleGroupMember *tgm,
3b170dc8
PB
301 bool is_write)
302{
93001e9d 303 bool ret;
3b170dc8 304
022cdc9f
MP
305 qemu_co_mutex_lock(&tgm->throttled_reqs_lock);
306 ret = qemu_co_queue_next(&tgm->throttled_reqs[is_write]);
307 qemu_co_mutex_unlock(&tgm->throttled_reqs_lock);
93001e9d
PB
308
309 return ret;
3b170dc8
PB
310}
311
76f4afb4
AG
312/* Look for the next pending I/O request and schedule it.
313 *
314 * This assumes that tg->lock is held.
315 *
022cdc9f 316 * @tgm: the current ThrottleGroupMember
76f4afb4
AG
317 * @is_write: the type of operation (read/write)
318 */
022cdc9f 319static void schedule_next_request(ThrottleGroupMember *tgm, bool is_write)
76f4afb4 320{
022cdc9f
MP
321 ThrottleState *ts = tgm->throttle_state;
322 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
76f4afb4 323 bool must_wait;
022cdc9f 324 ThrottleGroupMember *token;
76f4afb4
AG
325
326 /* Check if there's any pending request to schedule next */
022cdc9f
MP
327 token = next_throttle_token(tgm, is_write);
328 if (!tgm_has_pending_reqs(token, is_write)) {
76f4afb4
AG
329 return;
330 }
331
332 /* Set a timer for the request if it needs to be throttled */
333 must_wait = throttle_group_schedule_timer(token, is_write);
334
335 /* If it doesn't have to wait, queue it for immediate execution */
336 if (!must_wait) {
022cdc9f 337 /* Give preference to requests from the current tgm */
76f4afb4 338 if (qemu_in_coroutine() &&
022cdc9f
MP
339 throttle_group_co_restart_queue(tgm, is_write)) {
340 token = tgm;
76f4afb4 341 } else {
022cdc9f 342 ThrottleTimers *tt = &token->throttle_timers;
dbe824cc 343 int64_t now = qemu_clock_get_ns(tg->clock_type);
7258ed93 344 timer_mod(tt->timers[is_write], now);
76f4afb4
AG
345 tg->any_timer_armed[is_write] = true;
346 }
347 tg->tokens[is_write] = token;
348 }
349}
350
351/* Check if an I/O request needs to be throttled, wait and set a timer
352 * if necessary, and schedule the next request using a round robin
353 * algorithm.
354 *
022cdc9f 355 * @tgm: the current ThrottleGroupMember
76f4afb4
AG
356 * @bytes: the number of bytes for this I/O
357 * @is_write: the type of operation (read/write)
358 */
022cdc9f 359void coroutine_fn throttle_group_co_io_limits_intercept(ThrottleGroupMember *tgm,
76f4afb4
AG
360 unsigned int bytes,
361 bool is_write)
362{
363 bool must_wait;
022cdc9f
MP
364 ThrottleGroupMember *token;
365 ThrottleGroup *tg = container_of(tgm->throttle_state, ThrottleGroup, ts);
76f4afb4
AG
366 qemu_mutex_lock(&tg->lock);
367
368 /* First we check if this I/O has to be throttled. */
022cdc9f 369 token = next_throttle_token(tgm, is_write);
76f4afb4
AG
370 must_wait = throttle_group_schedule_timer(token, is_write);
371
372 /* Wait if there's a timer set or queued requests of this type */
022cdc9f
MP
373 if (must_wait || tgm->pending_reqs[is_write]) {
374 tgm->pending_reqs[is_write]++;
76f4afb4 375 qemu_mutex_unlock(&tg->lock);
022cdc9f
MP
376 qemu_co_mutex_lock(&tgm->throttled_reqs_lock);
377 qemu_co_queue_wait(&tgm->throttled_reqs[is_write],
378 &tgm->throttled_reqs_lock);
379 qemu_co_mutex_unlock(&tgm->throttled_reqs_lock);
76f4afb4 380 qemu_mutex_lock(&tg->lock);
022cdc9f 381 tgm->pending_reqs[is_write]--;
76f4afb4
AG
382 }
383
384 /* The I/O will be executed, so do the accounting */
022cdc9f 385 throttle_account(tgm->throttle_state, is_write, bytes);
76f4afb4
AG
386
387 /* Schedule the next request */
022cdc9f 388 schedule_next_request(tgm, is_write);
76f4afb4
AG
389
390 qemu_mutex_unlock(&tg->lock);
391}
392
3b170dc8 393typedef struct {
022cdc9f 394 ThrottleGroupMember *tgm;
3b170dc8
PB
395 bool is_write;
396} RestartData;
397
398static void coroutine_fn throttle_group_restart_queue_entry(void *opaque)
7258ed93 399{
3b170dc8 400 RestartData *data = opaque;
022cdc9f
MP
401 ThrottleGroupMember *tgm = data->tgm;
402 ThrottleState *ts = tgm->throttle_state;
403 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
3b170dc8 404 bool is_write = data->is_write;
7258ed93
PB
405 bool empty_queue;
406
022cdc9f 407 empty_queue = !throttle_group_co_restart_queue(tgm, is_write);
7258ed93
PB
408
409 /* If the request queue was empty then we have to take care of
410 * scheduling the next one */
411 if (empty_queue) {
412 qemu_mutex_lock(&tg->lock);
022cdc9f 413 schedule_next_request(tgm, is_write);
7258ed93
PB
414 qemu_mutex_unlock(&tg->lock);
415 }
43a5dc02
MP
416
417 g_free(data);
bc19a0a6
SH
418
419 atomic_dec(&tgm->restart_pending);
420 aio_wait_kick();
7258ed93
PB
421}
422
022cdc9f 423static void throttle_group_restart_queue(ThrottleGroupMember *tgm, bool is_write)
3b170dc8
PB
424{
425 Coroutine *co;
43a5dc02
MP
426 RestartData *rd = g_new0(RestartData, 1);
427
428 rd->tgm = tgm;
429 rd->is_write = is_write;
3b170dc8 430
25b8e4db
AG
431 /* This function is called when a timer is fired or when
432 * throttle_group_restart_tgm() is called. Either way, there can
433 * be no timer pending on this tgm at this point */
434 assert(!timer_pending(tgm->throttle_timers.timers[is_write]));
435
bc19a0a6
SH
436 atomic_inc(&tgm->restart_pending);
437
43a5dc02 438 co = qemu_coroutine_create(throttle_group_restart_queue_entry, rd);
c61791fc 439 aio_co_enter(tgm->aio_context, co);
3b170dc8
PB
440}
441
022cdc9f 442void throttle_group_restart_tgm(ThrottleGroupMember *tgm)
a72f6414 443{
25b8e4db
AG
444 int i;
445
022cdc9f 446 if (tgm->throttle_state) {
25b8e4db
AG
447 for (i = 0; i < 2; i++) {
448 QEMUTimer *t = tgm->throttle_timers.timers[i];
449 if (timer_pending(t)) {
450 /* If there's a pending timer on this tgm, fire it now */
451 timer_del(t);
452 timer_cb(tgm, i);
453 } else {
454 /* Else run the next request from the queue manually */
455 throttle_group_restart_queue(tgm, i);
456 }
457 }
a72f6414
PB
458 }
459}
460
2ff1f2e3
AG
461/* Update the throttle configuration for a particular group. Similar
462 * to throttle_config(), but guarantees atomicity within the
463 * throttling group.
464 *
022cdc9f 465 * @tgm: a ThrottleGroupMember that is a member of the group
2ff1f2e3
AG
466 * @cfg: the configuration to set
467 */
022cdc9f 468void throttle_group_config(ThrottleGroupMember *tgm, ThrottleConfig *cfg)
2ff1f2e3 469{
022cdc9f 470 ThrottleState *ts = tgm->throttle_state;
2ff1f2e3
AG
471 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
472 qemu_mutex_lock(&tg->lock);
27e4cf13 473 throttle_config(ts, tg->clock_type, cfg);
2ff1f2e3 474 qemu_mutex_unlock(&tg->lock);
a72f6414 475
022cdc9f 476 throttle_group_restart_tgm(tgm);
2ff1f2e3
AG
477}
478
479/* Get the throttle configuration from a particular group. Similar to
480 * throttle_get_config(), but guarantees atomicity within the
481 * throttling group.
482 *
022cdc9f 483 * @tgm: a ThrottleGroupMember that is a member of the group
2ff1f2e3
AG
484 * @cfg: the configuration will be written here
485 */
022cdc9f 486void throttle_group_get_config(ThrottleGroupMember *tgm, ThrottleConfig *cfg)
2ff1f2e3 487{
022cdc9f 488 ThrottleState *ts = tgm->throttle_state;
2ff1f2e3
AG
489 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
490 qemu_mutex_lock(&tg->lock);
491 throttle_get_config(ts, cfg);
492 qemu_mutex_unlock(&tg->lock);
493}
494
76f4afb4
AG
495/* ThrottleTimers callback. This wakes up a request that was waiting
496 * because it had been throttled.
497 *
c61791fc 498 * @tgm: the ThrottleGroupMember whose request had been throttled
76f4afb4
AG
499 * @is_write: the type of operation (read/write)
500 */
c61791fc 501static void timer_cb(ThrottleGroupMember *tgm, bool is_write)
76f4afb4 502{
022cdc9f 503 ThrottleState *ts = tgm->throttle_state;
76f4afb4 504 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
76f4afb4
AG
505
506 /* The timer has just been fired, so we can update the flag */
507 qemu_mutex_lock(&tg->lock);
508 tg->any_timer_armed[is_write] = false;
509 qemu_mutex_unlock(&tg->lock);
510
511 /* Run the request that was waiting for this timer */
022cdc9f 512 throttle_group_restart_queue(tgm, is_write);
76f4afb4
AG
513}
514
515static void read_timer_cb(void *opaque)
516{
517 timer_cb(opaque, false);
518}
519
520static void write_timer_cb(void *opaque)
521{
522 timer_cb(opaque, true);
523}
524
022cdc9f
MP
525/* Register a ThrottleGroupMember from the throttling group, also initializing
526 * its timers and updating its throttle_state pointer to point to it. If a
31dce3cc 527 * throttling group with that name does not exist yet, it will be created.
2ff1f2e3 528 *
432d889e
MP
529 * This function edits throttle_groups and must be called under the global
530 * mutex.
531 *
022cdc9f 532 * @tgm: the ThrottleGroupMember to insert
2ff1f2e3 533 * @groupname: the name of the group
c61791fc 534 * @ctx: the AioContext to use
2ff1f2e3 535 */
022cdc9f 536void throttle_group_register_tgm(ThrottleGroupMember *tgm,
c61791fc
MP
537 const char *groupname,
538 AioContext *ctx)
2ff1f2e3
AG
539{
540 int i;
973f2ddf
HR
541 ThrottleState *ts = throttle_group_incref(groupname);
542 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
022cdc9f
MP
543
544 tgm->throttle_state = ts;
c61791fc 545 tgm->aio_context = ctx;
bc19a0a6 546 atomic_set(&tgm->restart_pending, 0);
2ff1f2e3
AG
547
548 qemu_mutex_lock(&tg->lock);
022cdc9f 549 /* If the ThrottleGroup is new set this ThrottleGroupMember as the token */
2ff1f2e3
AG
550 for (i = 0; i < 2; i++) {
551 if (!tg->tokens[i]) {
022cdc9f 552 tg->tokens[i] = tgm;
2ff1f2e3
AG
553 }
554 }
555
022cdc9f 556 QLIST_INSERT_HEAD(&tg->head, tgm, round_robin);
76f4afb4 557
022cdc9f 558 throttle_timers_init(&tgm->throttle_timers,
c61791fc 559 tgm->aio_context,
dbe824cc 560 tg->clock_type,
76f4afb4
AG
561 read_timer_cb,
562 write_timer_cb,
c61791fc 563 tgm);
f738cfc8
MP
564 qemu_co_mutex_init(&tgm->throttled_reqs_lock);
565 qemu_co_queue_init(&tgm->throttled_reqs[0]);
566 qemu_co_queue_init(&tgm->throttled_reqs[1]);
76f4afb4 567
2ff1f2e3
AG
568 qemu_mutex_unlock(&tg->lock);
569}
570
022cdc9f 571/* Unregister a ThrottleGroupMember from its group, removing it from the list,
31dce3cc 572 * destroying the timers and setting the throttle_state pointer to NULL.
2ff1f2e3 573 *
022cdc9f
MP
574 * The ThrottleGroupMember must not have pending throttled requests, so the
575 * caller has to drain them first.
5ac72418 576 *
2ff1f2e3
AG
577 * The group will be destroyed if it's empty after this operation.
578 *
022cdc9f 579 * @tgm the ThrottleGroupMember to remove
2ff1f2e3 580 */
022cdc9f 581void throttle_group_unregister_tgm(ThrottleGroupMember *tgm)
2ff1f2e3 582{
022cdc9f
MP
583 ThrottleState *ts = tgm->throttle_state;
584 ThrottleGroup *tg = container_of(ts, ThrottleGroup, ts);
585 ThrottleGroupMember *token;
2ff1f2e3
AG
586 int i;
587
d8e7d87e
MP
588 if (!ts) {
589 /* Discard already unregistered tgm */
590 return;
591 }
592
bc19a0a6
SH
593 /* Wait for throttle_group_restart_queue_entry() coroutines to finish */
594 AIO_WAIT_WHILE(tgm->aio_context, atomic_read(&tgm->restart_pending) > 0);
595
2ff1f2e3
AG
596 qemu_mutex_lock(&tg->lock);
597 for (i = 0; i < 2; i++) {
25b8e4db
AG
598 assert(tgm->pending_reqs[i] == 0);
599 assert(qemu_co_queue_empty(&tgm->throttled_reqs[i]));
600 assert(!timer_pending(tgm->throttle_timers.timers[i]));
022cdc9f
MP
601 if (tg->tokens[i] == tgm) {
602 token = throttle_group_next_tgm(tgm);
603 /* Take care of the case where this is the last tgm in the group */
604 if (token == tgm) {
2ff1f2e3
AG
605 token = NULL;
606 }
607 tg->tokens[i] = token;
608 }
609 }
610
022cdc9f
MP
611 /* remove the current tgm from the list */
612 QLIST_REMOVE(tgm, round_robin);
613 throttle_timers_destroy(&tgm->throttle_timers);
2ff1f2e3
AG
614 qemu_mutex_unlock(&tg->lock);
615
973f2ddf 616 throttle_group_unref(&tg->ts);
022cdc9f 617 tgm->throttle_state = NULL;
2ff1f2e3
AG
618}
619
c61791fc
MP
620void throttle_group_attach_aio_context(ThrottleGroupMember *tgm,
621 AioContext *new_context)
622{
623 ThrottleTimers *tt = &tgm->throttle_timers;
624 throttle_timers_attach_aio_context(tt, new_context);
625 tgm->aio_context = new_context;
626}
627
628void throttle_group_detach_aio_context(ThrottleGroupMember *tgm)
629{
341e0b56 630 ThrottleGroup *tg = container_of(tgm->throttle_state, ThrottleGroup, ts);
c61791fc 631 ThrottleTimers *tt = &tgm->throttle_timers;
341e0b56 632 int i;
dc868fb0
SH
633
634 /* Requests must have been drained */
635 assert(tgm->pending_reqs[0] == 0 && tgm->pending_reqs[1] == 0);
636 assert(qemu_co_queue_empty(&tgm->throttled_reqs[0]));
637 assert(qemu_co_queue_empty(&tgm->throttled_reqs[1]));
638
341e0b56
SH
639 /* Kick off next ThrottleGroupMember, if necessary */
640 qemu_mutex_lock(&tg->lock);
641 for (i = 0; i < 2; i++) {
642 if (timer_pending(tt->timers[i])) {
643 tg->any_timer_armed[i] = false;
644 schedule_next_request(tgm, i);
645 }
646 }
647 qemu_mutex_unlock(&tg->lock);
648
c61791fc
MP
649 throttle_timers_detach_aio_context(tt);
650 tgm->aio_context = NULL;
651}
652
432d889e
MP
653#undef THROTTLE_OPT_PREFIX
654#define THROTTLE_OPT_PREFIX "x-"
655
656/* Helper struct and array for QOM property setter/getter */
657typedef struct {
658 const char *name;
659 BucketType type;
660 enum {
661 AVG,
662 MAX,
663 BURST_LENGTH,
664 IOPS_SIZE,
665 } category;
666} ThrottleParamInfo;
667
668static ThrottleParamInfo properties[] = {
669 {
670 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_TOTAL,
671 THROTTLE_OPS_TOTAL, AVG,
672 },
673 {
674 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_TOTAL_MAX,
675 THROTTLE_OPS_TOTAL, MAX,
676 },
677 {
678 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_TOTAL_MAX_LENGTH,
679 THROTTLE_OPS_TOTAL, BURST_LENGTH,
680 },
681 {
682 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_READ,
683 THROTTLE_OPS_READ, AVG,
684 },
685 {
686 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_READ_MAX,
687 THROTTLE_OPS_READ, MAX,
688 },
689 {
690 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_READ_MAX_LENGTH,
691 THROTTLE_OPS_READ, BURST_LENGTH,
692 },
693 {
694 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_WRITE,
695 THROTTLE_OPS_WRITE, AVG,
696 },
697 {
698 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_WRITE_MAX,
699 THROTTLE_OPS_WRITE, MAX,
700 },
701 {
702 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_WRITE_MAX_LENGTH,
703 THROTTLE_OPS_WRITE, BURST_LENGTH,
704 },
705 {
706 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_TOTAL,
707 THROTTLE_BPS_TOTAL, AVG,
708 },
709 {
710 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_TOTAL_MAX,
711 THROTTLE_BPS_TOTAL, MAX,
712 },
713 {
714 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_TOTAL_MAX_LENGTH,
715 THROTTLE_BPS_TOTAL, BURST_LENGTH,
716 },
717 {
718 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_READ,
719 THROTTLE_BPS_READ, AVG,
720 },
721 {
722 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_READ_MAX,
723 THROTTLE_BPS_READ, MAX,
724 },
725 {
726 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_READ_MAX_LENGTH,
727 THROTTLE_BPS_READ, BURST_LENGTH,
728 },
729 {
730 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_WRITE,
731 THROTTLE_BPS_WRITE, AVG,
732 },
733 {
734 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_WRITE_MAX,
735 THROTTLE_BPS_WRITE, MAX,
736 },
737 {
738 THROTTLE_OPT_PREFIX QEMU_OPT_BPS_WRITE_MAX_LENGTH,
739 THROTTLE_BPS_WRITE, BURST_LENGTH,
740 },
741 {
742 THROTTLE_OPT_PREFIX QEMU_OPT_IOPS_SIZE,
743 0, IOPS_SIZE,
744 }
745};
746
747/* This function edits throttle_groups and must be called under the global
748 * mutex */
749static void throttle_group_obj_init(Object *obj)
750{
751 ThrottleGroup *tg = THROTTLE_GROUP(obj);
752
753 tg->clock_type = QEMU_CLOCK_REALTIME;
754 if (qtest_enabled()) {
755 /* For testing block IO throttling only */
756 tg->clock_type = QEMU_CLOCK_VIRTUAL;
757 }
758 tg->is_initialized = false;
759 qemu_mutex_init(&tg->lock);
760 throttle_init(&tg->ts);
761 QLIST_INIT(&tg->head);
762}
763
764/* This function edits throttle_groups and must be called under the global
765 * mutex */
766static void throttle_group_obj_complete(UserCreatable *obj, Error **errp)
767{
768 ThrottleGroup *tg = THROTTLE_GROUP(obj);
769 ThrottleConfig cfg;
770
771 /* set group name to object id if it exists */
772 if (!tg->name && tg->parent_obj.parent) {
773 tg->name = object_get_canonical_path_component(OBJECT(obj));
774 }
775 /* We must have a group name at this point */
776 assert(tg->name);
777
778 /* error if name is duplicate */
d8e7d87e 779 if (throttle_group_exists(tg->name)) {
432d889e
MP
780 error_setg(errp, "A group with this name already exists");
781 return;
782 }
783
784 /* check validity */
785 throttle_get_config(&tg->ts, &cfg);
786 if (!throttle_is_valid(&cfg, errp)) {
787 return;
788 }
789 throttle_config(&tg->ts, tg->clock_type, &cfg);
790 QTAILQ_INSERT_TAIL(&throttle_groups, tg, list);
791 tg->is_initialized = true;
792}
793
794/* This function edits throttle_groups and must be called under the global
795 * mutex */
796static void throttle_group_obj_finalize(Object *obj)
797{
798 ThrottleGroup *tg = THROTTLE_GROUP(obj);
799 if (tg->is_initialized) {
800 QTAILQ_REMOVE(&throttle_groups, tg, list);
801 }
802 qemu_mutex_destroy(&tg->lock);
803 g_free(tg->name);
804}
805
806static void throttle_group_set(Object *obj, Visitor *v, const char * name,
807 void *opaque, Error **errp)
808
809{
810 ThrottleGroup *tg = THROTTLE_GROUP(obj);
811 ThrottleConfig *cfg;
812 ThrottleParamInfo *info = opaque;
813 Error *local_err = NULL;
814 int64_t value;
815
816 /* If we have finished initialization, don't accept individual property
817 * changes through QOM. Throttle configuration limits must be set in one
818 * transaction, as certain combinations are invalid.
819 */
820 if (tg->is_initialized) {
821 error_setg(&local_err, "Property cannot be set after initialization");
822 goto ret;
823 }
824
825 visit_type_int64(v, name, &value, &local_err);
826 if (local_err) {
827 goto ret;
828 }
829 if (value < 0) {
830 error_setg(&local_err, "Property values cannot be negative");
831 goto ret;
832 }
833
834 cfg = &tg->ts.cfg;
835 switch (info->category) {
836 case AVG:
837 cfg->buckets[info->type].avg = value;
838 break;
839 case MAX:
840 cfg->buckets[info->type].max = value;
841 break;
842 case BURST_LENGTH:
843 if (value > UINT_MAX) {
844 error_setg(&local_err, "%s value must be in the"
845 "range [0, %u]", info->name, UINT_MAX);
846 goto ret;
847 }
848 cfg->buckets[info->type].burst_length = value;
849 break;
850 case IOPS_SIZE:
851 cfg->op_size = value;
852 break;
853 }
854
855ret:
856 error_propagate(errp, local_err);
857 return;
858
859}
860
861static void throttle_group_get(Object *obj, Visitor *v, const char *name,
862 void *opaque, Error **errp)
863{
864 ThrottleGroup *tg = THROTTLE_GROUP(obj);
865 ThrottleConfig cfg;
866 ThrottleParamInfo *info = opaque;
867 int64_t value;
868
869 throttle_get_config(&tg->ts, &cfg);
870 switch (info->category) {
871 case AVG:
872 value = cfg.buckets[info->type].avg;
873 break;
874 case MAX:
875 value = cfg.buckets[info->type].max;
876 break;
877 case BURST_LENGTH:
878 value = cfg.buckets[info->type].burst_length;
879 break;
880 case IOPS_SIZE:
881 value = cfg.op_size;
882 break;
883 }
884
885 visit_type_int64(v, name, &value, errp);
886}
887
888static void throttle_group_set_limits(Object *obj, Visitor *v,
889 const char *name, void *opaque,
890 Error **errp)
891
892{
893 ThrottleGroup *tg = THROTTLE_GROUP(obj);
894 ThrottleConfig cfg;
895 ThrottleLimits arg = { 0 };
896 ThrottleLimits *argp = &arg;
897 Error *local_err = NULL;
898
899 visit_type_ThrottleLimits(v, name, &argp, &local_err);
900 if (local_err) {
901 goto ret;
902 }
903 qemu_mutex_lock(&tg->lock);
904 throttle_get_config(&tg->ts, &cfg);
905 throttle_limits_to_config(argp, &cfg, &local_err);
906 if (local_err) {
907 goto unlock;
908 }
909 throttle_config(&tg->ts, tg->clock_type, &cfg);
910
911unlock:
912 qemu_mutex_unlock(&tg->lock);
913ret:
914 error_propagate(errp, local_err);
915 return;
916}
917
918static void throttle_group_get_limits(Object *obj, Visitor *v,
919 const char *name, void *opaque,
920 Error **errp)
921{
922 ThrottleGroup *tg = THROTTLE_GROUP(obj);
923 ThrottleConfig cfg;
924 ThrottleLimits arg = { 0 };
925 ThrottleLimits *argp = &arg;
926
927 qemu_mutex_lock(&tg->lock);
928 throttle_get_config(&tg->ts, &cfg);
929 qemu_mutex_unlock(&tg->lock);
930
931 throttle_config_to_limits(&cfg, argp);
932
933 visit_type_ThrottleLimits(v, name, &argp, errp);
934}
935
936static bool throttle_group_can_be_deleted(UserCreatable *uc)
937{
938 return OBJECT(uc)->ref == 1;
939}
940
941static void throttle_group_obj_class_init(ObjectClass *klass, void *class_data)
942{
943 size_t i = 0;
944 UserCreatableClass *ucc = USER_CREATABLE_CLASS(klass);
945
946 ucc->complete = throttle_group_obj_complete;
947 ucc->can_be_deleted = throttle_group_can_be_deleted;
948
949 /* individual properties */
950 for (i = 0; i < sizeof(properties) / sizeof(ThrottleParamInfo); i++) {
951 object_class_property_add(klass,
952 properties[i].name,
953 "int",
954 throttle_group_get,
955 throttle_group_set,
956 NULL, &properties[i],
957 &error_abort);
958 }
959
960 /* ThrottleLimits */
961 object_class_property_add(klass,
962 "limits", "ThrottleLimits",
963 throttle_group_get_limits,
964 throttle_group_set_limits,
965 NULL, NULL,
966 &error_abort);
967}
968
969static const TypeInfo throttle_group_info = {
970 .name = TYPE_THROTTLE_GROUP,
971 .parent = TYPE_OBJECT,
972 .class_init = throttle_group_obj_class_init,
973 .instance_size = sizeof(ThrottleGroup),
974 .instance_init = throttle_group_obj_init,
975 .instance_finalize = throttle_group_obj_finalize,
976 .interfaces = (InterfaceInfo[]) {
977 { TYPE_USER_CREATABLE },
978 { }
979 },
980};
981
2ff1f2e3
AG
982static void throttle_groups_init(void)
983{
432d889e 984 type_register_static(&throttle_group_info);
2ff1f2e3
AG
985}
986
432d889e 987type_init(throttle_groups_init);