]> git.proxmox.com Git - mirror_qemu.git/blame - block/blkdebug.c
block/accounting: Use lock guard macros
[mirror_qemu.git] / block / blkdebug.c
CommitLineData
6a143727
KW
1/*
2 * Block protocol for I/O error injection
3 *
63188c24 4 * Copyright (C) 2016-2017 Red Hat, Inc.
6a143727
KW
5 * Copyright (c) 2010 Kevin Wolf <kwolf@redhat.com>
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 * THE SOFTWARE.
24 */
25
80c71a24 26#include "qemu/osdep.h"
da34e65c 27#include "qapi/error.h"
f348b6d1 28#include "qemu/cutils.h"
1de7afc9 29#include "qemu/config-file.h"
737e150e 30#include "block/block_int.h"
69c6449f 31#include "block/qdict.h"
1de7afc9 32#include "qemu/module.h"
922a01a0 33#include "qemu/option.h"
69c6449f 34#include "qapi/qapi-visit-block-core.h"
2c31b04c 35#include "qapi/qmp/qdict.h"
69c6449f 36#include "qapi/qmp/qlist.h"
2c31b04c 37#include "qapi/qmp/qstring.h"
69c6449f 38#include "qapi/qobject-input-visitor.h"
20873526 39#include "sysemu/qtest.h"
6a143727
KW
40
41typedef struct BDRVBlkdebugState {
571cd43e 42 int state;
8f96b5be 43 int new_state;
3dc834f8 44 uint64_t align;
430b26a8
EB
45 uint64_t max_transfer;
46 uint64_t opt_write_zero;
47 uint64_t max_write_zero;
48 uint64_t opt_discard;
49 uint64_t max_discard;
3c90c65d 50
69c6449f
HR
51 uint64_t take_child_perms;
52 uint64_t unshare_child_perms;
53
036990d7
HR
54 /* For blkdebug_refresh_filename() */
55 char *config_file;
56
7fb1cf16 57 QLIST_HEAD(, BlkdebugRule) rules[BLKDBG__MAX];
571cd43e 58 QSIMPLEQ_HEAD(, BlkdebugRule) active_rules;
3c90c65d 59 QLIST_HEAD(, BlkdebugSuspendedReq) suspended_reqs;
6a143727
KW
60} BDRVBlkdebugState;
61
b9f66d96 62typedef struct BlkdebugAIOCB {
7c84b1b8 63 BlockAIOCB common;
b9f66d96
KW
64 int ret;
65} BlkdebugAIOCB;
66
3c90c65d
KW
67typedef struct BlkdebugSuspendedReq {
68 Coroutine *co;
69 char *tag;
70 QLIST_ENTRY(BlkdebugSuspendedReq) next;
71} BlkdebugSuspendedReq;
72
8b9b0cc2
KW
73enum {
74 ACTION_INJECT_ERROR,
75 ACTION_SET_STATE,
3c90c65d 76 ACTION_SUSPEND,
8b9b0cc2
KW
77};
78
79typedef struct BlkdebugRule {
a31939e6 80 BlkdebugEvent event;
8b9b0cc2
KW
81 int action;
82 int state;
83 union {
84 struct {
16789db3 85 uint64_t iotype_mask;
8b9b0cc2
KW
86 int error;
87 int immediately;
88 int once;
7c3a9985 89 int64_t offset;
8b9b0cc2
KW
90 } inject;
91 struct {
92 int new_state;
93 } set_state;
3c90c65d
KW
94 struct {
95 char *tag;
96 } suspend;
8b9b0cc2
KW
97 } options;
98 QLIST_ENTRY(BlkdebugRule) next;
571cd43e 99 QSIMPLEQ_ENTRY(BlkdebugRule) active_next;
8b9b0cc2
KW
100} BlkdebugRule;
101
16789db3
HR
102QEMU_BUILD_BUG_MSG(BLKDEBUG_IO_TYPE__MAX > 64,
103 "BlkdebugIOType mask does not fit into an uint64_t");
104
8b9b0cc2
KW
105static QemuOptsList inject_error_opts = {
106 .name = "inject-error",
107 .head = QTAILQ_HEAD_INITIALIZER(inject_error_opts.head),
108 .desc = {
109 {
110 .name = "event",
111 .type = QEMU_OPT_STRING,
112 },
113 {
114 .name = "state",
115 .type = QEMU_OPT_NUMBER,
116 },
16789db3
HR
117 {
118 .name = "iotype",
119 .type = QEMU_OPT_STRING,
120 },
8b9b0cc2
KW
121 {
122 .name = "errno",
123 .type = QEMU_OPT_NUMBER,
124 },
e4780db4
PB
125 {
126 .name = "sector",
127 .type = QEMU_OPT_NUMBER,
128 },
8b9b0cc2
KW
129 {
130 .name = "once",
131 .type = QEMU_OPT_BOOL,
132 },
133 {
134 .name = "immediately",
135 .type = QEMU_OPT_BOOL,
136 },
137 { /* end of list */ }
138 },
139};
140
141static QemuOptsList set_state_opts = {
142 .name = "set-state",
327cdad4 143 .head = QTAILQ_HEAD_INITIALIZER(set_state_opts.head),
8b9b0cc2
KW
144 .desc = {
145 {
146 .name = "event",
147 .type = QEMU_OPT_STRING,
148 },
149 {
150 .name = "state",
151 .type = QEMU_OPT_NUMBER,
152 },
153 {
154 .name = "new_state",
155 .type = QEMU_OPT_NUMBER,
156 },
157 { /* end of list */ }
158 },
159};
160
161static QemuOptsList *config_groups[] = {
162 &inject_error_opts,
163 &set_state_opts,
164 NULL
165};
166
8b9b0cc2
KW
167struct add_rule_data {
168 BDRVBlkdebugState *s;
169 int action;
170};
171
28d0de7a 172static int add_rule(void *opaque, QemuOpts *opts, Error **errp)
8b9b0cc2
KW
173{
174 struct add_rule_data *d = opaque;
175 BDRVBlkdebugState *s = d->s;
5f14f31d 176 const char *event_name;
f9509d15 177 int event;
8b9b0cc2 178 struct BlkdebugRule *rule;
7c3a9985 179 int64_t sector;
16789db3
HR
180 BlkdebugIOType iotype;
181 Error *local_error = NULL;
8b9b0cc2
KW
182
183 /* Find the right event for the rule */
184 event_name = qemu_opt_get(opts, "event");
d4362d64 185 if (!event_name) {
8809cfc3 186 error_setg(errp, "Missing event name for rule");
d4362d64 187 return -1;
f9509d15 188 }
f7abe0ec 189 event = qapi_enum_parse(&BlkdebugEvent_lookup, event_name, -1, errp);
f9509d15 190 if (event < 0) {
8b9b0cc2
KW
191 return -1;
192 }
193
194 /* Set attributes common for all actions */
7267c094 195 rule = g_malloc0(sizeof(*rule));
8b9b0cc2
KW
196 *rule = (struct BlkdebugRule) {
197 .event = event,
198 .action = d->action,
199 .state = qemu_opt_get_number(opts, "state", 0),
200 };
201
202 /* Parse action-specific options */
203 switch (d->action) {
204 case ACTION_INJECT_ERROR:
205 rule->options.inject.error = qemu_opt_get_number(opts, "errno", EIO);
206 rule->options.inject.once = qemu_opt_get_bool(opts, "once", 0);
207 rule->options.inject.immediately =
208 qemu_opt_get_bool(opts, "immediately", 0);
7c3a9985
KW
209 sector = qemu_opt_get_number(opts, "sector", -1);
210 rule->options.inject.offset =
211 sector == -1 ? -1 : sector * BDRV_SECTOR_SIZE;
16789db3
HR
212
213 iotype = qapi_enum_parse(&BlkdebugIOType_lookup,
214 qemu_opt_get(opts, "iotype"),
215 BLKDEBUG_IO_TYPE__MAX, &local_error);
216 if (local_error) {
217 error_propagate(errp, local_error);
5b4c95d0 218 g_free(rule);
16789db3
HR
219 return -1;
220 }
221 if (iotype != BLKDEBUG_IO_TYPE__MAX) {
222 rule->options.inject.iotype_mask = (1ull << iotype);
223 } else {
224 /* Apply the default */
225 rule->options.inject.iotype_mask =
226 (1ull << BLKDEBUG_IO_TYPE_READ)
227 | (1ull << BLKDEBUG_IO_TYPE_WRITE)
228 | (1ull << BLKDEBUG_IO_TYPE_WRITE_ZEROES)
229 | (1ull << BLKDEBUG_IO_TYPE_DISCARD)
230 | (1ull << BLKDEBUG_IO_TYPE_FLUSH);
231 }
232
8b9b0cc2
KW
233 break;
234
235 case ACTION_SET_STATE:
236 rule->options.set_state.new_state =
237 qemu_opt_get_number(opts, "new_state", 0);
238 break;
3c90c65d
KW
239
240 case ACTION_SUSPEND:
241 rule->options.suspend.tag =
242 g_strdup(qemu_opt_get(opts, "tag"));
243 break;
8b9b0cc2
KW
244 };
245
246 /* Add the rule */
247 QLIST_INSERT_HEAD(&s->rules[event], rule, next);
248
249 return 0;
250}
251
9e35542b
KW
252static void remove_rule(BlkdebugRule *rule)
253{
254 switch (rule->action) {
255 case ACTION_INJECT_ERROR:
256 case ACTION_SET_STATE:
257 break;
3c90c65d
KW
258 case ACTION_SUSPEND:
259 g_free(rule->options.suspend.tag);
260 break;
9e35542b
KW
261 }
262
263 QLIST_REMOVE(rule, next);
264 g_free(rule);
265}
266
89f2b21e
HR
267static int read_config(BDRVBlkdebugState *s, const char *filename,
268 QDict *options, Error **errp)
8b9b0cc2 269{
85a040e5 270 FILE *f = NULL;
8b9b0cc2
KW
271 int ret;
272 struct add_rule_data d;
89f2b21e 273 Error *local_err = NULL;
8b9b0cc2 274
85a040e5
HR
275 if (filename) {
276 f = fopen(filename, "r");
277 if (f == NULL) {
278 error_setg_errno(errp, errno, "Could not read blkdebug config file");
279 return -errno;
280 }
8b9b0cc2 281
85a040e5
HR
282 ret = qemu_config_parse(f, config_groups, filename);
283 if (ret < 0) {
284 error_setg(errp, "Could not parse blkdebug config file");
85a040e5
HR
285 goto fail;
286 }
8b9b0cc2
KW
287 }
288
89f2b21e 289 qemu_config_parse_qdict(options, config_groups, &local_err);
84d18f06 290 if (local_err) {
89f2b21e
HR
291 error_propagate(errp, local_err);
292 ret = -EINVAL;
293 goto fail;
294 }
295
8b9b0cc2
KW
296 d.s = s;
297 d.action = ACTION_INJECT_ERROR;
8809cfc3 298 qemu_opts_foreach(&inject_error_opts, add_rule, &d, &local_err);
d4362d64
SH
299 if (local_err) {
300 error_propagate(errp, local_err);
301 ret = -EINVAL;
302 goto fail;
303 }
8b9b0cc2
KW
304
305 d.action = ACTION_SET_STATE;
8809cfc3 306 qemu_opts_foreach(&set_state_opts, add_rule, &d, &local_err);
d4362d64
SH
307 if (local_err) {
308 error_propagate(errp, local_err);
309 ret = -EINVAL;
310 goto fail;
311 }
8b9b0cc2
KW
312
313 ret = 0;
314fail:
698f0d52
KW
315 qemu_opts_reset(&inject_error_opts);
316 qemu_opts_reset(&set_state_opts);
85a040e5
HR
317 if (f) {
318 fclose(f);
319 }
8b9b0cc2
KW
320 return ret;
321}
322
323/* Valid blkdebug filenames look like blkdebug:path/to/config:path/to/image */
f4681212
KW
324static void blkdebug_parse_filename(const char *filename, QDict *options,
325 Error **errp)
6a143727 326{
f4681212 327 const char *c;
6a143727 328
8b9b0cc2 329 /* Parse the blkdebug: prefix */
f4681212 330 if (!strstart(filename, "blkdebug:", &filename)) {
d4881b9b
HR
331 /* There was no prefix; therefore, all options have to be already
332 present in the QDict (except for the filename) */
46f5ac20 333 qdict_put_str(options, "x-image", filename);
f4681212 334 return;
6a143727 335 }
6a143727 336
f4681212 337 /* Parse config file path */
8b9b0cc2
KW
338 c = strchr(filename, ':');
339 if (c == NULL) {
f4681212
KW
340 error_setg(errp, "blkdebug requires both config file and image path");
341 return;
8b9b0cc2
KW
342 }
343
f4681212
KW
344 if (c != filename) {
345 QString *config_path;
ba891d68 346 config_path = qstring_from_substr(filename, 0, c - filename);
f4681212 347 qdict_put(options, "config", config_path);
8b9b0cc2 348 }
f4681212
KW
349
350 /* TODO Allow multi-level nesting and set file.filename here */
8b9b0cc2 351 filename = c + 1;
46f5ac20 352 qdict_put_str(options, "x-image", filename);
f4681212
KW
353}
354
69c6449f
HR
355static int blkdebug_parse_perm_list(uint64_t *dest, QDict *options,
356 const char *prefix, Error **errp)
357{
358 int ret = 0;
359 QDict *subqdict = NULL;
360 QObject *crumpled_subqdict = NULL;
361 Visitor *v = NULL;
362 BlockPermissionList *perm_list = NULL, *element;
69c6449f
HR
363
364 *dest = 0;
365
366 qdict_extract_subqdict(options, &subqdict, prefix);
367 if (!qdict_size(subqdict)) {
368 goto out;
369 }
370
371 crumpled_subqdict = qdict_crumple(subqdict, errp);
372 if (!crumpled_subqdict) {
373 ret = -EINVAL;
374 goto out;
375 }
376
377 v = qobject_input_visitor_new(crumpled_subqdict);
af175e85 378 if (!visit_type_BlockPermissionList(v, NULL, &perm_list, errp)) {
69c6449f
HR
379 ret = -EINVAL;
380 goto out;
381 }
382
383 for (element = perm_list; element; element = element->next) {
384 *dest |= bdrv_qapi_perm_to_blk_perm(element->value);
385 }
386
387out:
388 qapi_free_BlockPermissionList(perm_list);
389 visit_free(v);
390 qobject_unref(subqdict);
391 qobject_unref(crumpled_subqdict);
392 return ret;
393}
394
395static int blkdebug_parse_perms(BDRVBlkdebugState *s, QDict *options,
396 Error **errp)
397{
398 int ret;
399
400 ret = blkdebug_parse_perm_list(&s->take_child_perms, options,
401 "take-child-perms.", errp);
402 if (ret < 0) {
403 return ret;
404 }
405
406 ret = blkdebug_parse_perm_list(&s->unshare_child_perms, options,
407 "unshare-child-perms.", errp);
408 if (ret < 0) {
409 return ret;
410 }
411
412 return 0;
413}
414
f4681212
KW
415static QemuOptsList runtime_opts = {
416 .name = "blkdebug",
417 .head = QTAILQ_HEAD_INITIALIZER(runtime_opts.head),
418 .desc = {
419 {
420 .name = "config",
421 .type = QEMU_OPT_STRING,
422 .help = "Path to the configuration file",
423 },
424 {
425 .name = "x-image",
426 .type = QEMU_OPT_STRING,
427 .help = "[internal use only, will be removed]",
428 },
b35ee7fb
KW
429 {
430 .name = "align",
431 .type = QEMU_OPT_SIZE,
432 .help = "Required alignment in bytes",
433 },
430b26a8
EB
434 {
435 .name = "max-transfer",
436 .type = QEMU_OPT_SIZE,
437 .help = "Maximum transfer size in bytes",
438 },
439 {
440 .name = "opt-write-zero",
441 .type = QEMU_OPT_SIZE,
442 .help = "Optimum write zero alignment in bytes",
443 },
444 {
445 .name = "max-write-zero",
446 .type = QEMU_OPT_SIZE,
447 .help = "Maximum write zero size in bytes",
448 },
449 {
450 .name = "opt-discard",
451 .type = QEMU_OPT_SIZE,
452 .help = "Optimum discard alignment in bytes",
453 },
454 {
455 .name = "max-discard",
456 .type = QEMU_OPT_SIZE,
457 .help = "Maximum discard size in bytes",
458 },
f4681212
KW
459 { /* end of list */ }
460 },
461};
462
015a1036
HR
463static int blkdebug_open(BlockDriverState *bs, QDict *options, int flags,
464 Error **errp)
f4681212
KW
465{
466 BDRVBlkdebugState *s = bs->opaque;
467 QemuOpts *opts;
468 Error *local_err = NULL;
f4681212 469 int ret;
430b26a8 470 uint64_t align;
f4681212 471
87ea75d5 472 opts = qemu_opts_create(&runtime_opts, NULL, 0, &error_abort);
af175e85 473 if (!qemu_opts_absorb_qdict(opts, options, errp)) {
f4681212 474 ret = -EINVAL;
eaf944a4 475 goto out;
f4681212
KW
476 }
477
89f2b21e 478 /* Read rules from config file or command line options */
036990d7
HR
479 s->config_file = g_strdup(qemu_opt_get(opts, "config"));
480 ret = read_config(s, s->config_file, options, errp);
85a040e5 481 if (ret) {
eaf944a4 482 goto out;
f4681212 483 }
8b9b0cc2 484
8db520ce 485 /* Set initial state */
571cd43e 486 s->state = 1;
8db520ce 487
69c6449f
HR
488 /* Parse permissions modifiers before opening the image file */
489 ret = blkdebug_parse_perms(s, options, errp);
490 if (ret < 0) {
491 goto out;
492 }
493
6b826af7 494 /* Open the image file */
9a4f4c31 495 bs->file = bdrv_open_child(qemu_opt_get(opts, "x-image"), options, "image",
b3af2af4
HR
496 bs, &child_of_bds,
497 BDRV_CHILD_FILTERED | BDRV_CHILD_PRIMARY,
498 false, &local_err);
9a4f4c31
KW
499 if (local_err) {
500 ret = -EINVAL;
10ffa72f 501 error_propagate(errp, local_err);
eaf944a4 502 goto out;
8b9b0cc2
KW
503 }
504
228345bf
HR
505 bs->supported_write_flags = BDRV_REQ_WRITE_UNCHANGED |
506 (BDRV_REQ_FUA & bs->file->bs->supported_write_flags);
507 bs->supported_zero_flags = BDRV_REQ_WRITE_UNCHANGED |
80f5c33f 508 ((BDRV_REQ_FUA | BDRV_REQ_MAY_UNMAP | BDRV_REQ_NO_FALLBACK) &
228345bf 509 bs->file->bs->supported_zero_flags);
3dc834f8 510 ret = -EINVAL;
63188c24 511
430b26a8 512 /* Set alignment overrides */
3dc834f8
EB
513 s->align = qemu_opt_get_size(opts, "align", 0);
514 if (s->align && (s->align >= INT_MAX || !is_power_of_2(s->align))) {
515 error_setg(errp, "Cannot meet constraints with align %" PRIu64,
516 s->align);
de234897 517 goto out;
b35ee7fb 518 }
430b26a8
EB
519 align = MAX(s->align, bs->file->bs->bl.request_alignment);
520
521 s->max_transfer = qemu_opt_get_size(opts, "max-transfer", 0);
522 if (s->max_transfer &&
523 (s->max_transfer >= INT_MAX ||
524 !QEMU_IS_ALIGNED(s->max_transfer, align))) {
525 error_setg(errp, "Cannot meet constraints with max-transfer %" PRIu64,
526 s->max_transfer);
527 goto out;
528 }
529
530 s->opt_write_zero = qemu_opt_get_size(opts, "opt-write-zero", 0);
531 if (s->opt_write_zero &&
532 (s->opt_write_zero >= INT_MAX ||
533 !QEMU_IS_ALIGNED(s->opt_write_zero, align))) {
534 error_setg(errp, "Cannot meet constraints with opt-write-zero %" PRIu64,
535 s->opt_write_zero);
536 goto out;
537 }
538
539 s->max_write_zero = qemu_opt_get_size(opts, "max-write-zero", 0);
540 if (s->max_write_zero &&
541 (s->max_write_zero >= INT_MAX ||
542 !QEMU_IS_ALIGNED(s->max_write_zero,
543 MAX(s->opt_write_zero, align)))) {
544 error_setg(errp, "Cannot meet constraints with max-write-zero %" PRIu64,
545 s->max_write_zero);
546 goto out;
547 }
548
549 s->opt_discard = qemu_opt_get_size(opts, "opt-discard", 0);
550 if (s->opt_discard &&
551 (s->opt_discard >= INT_MAX ||
552 !QEMU_IS_ALIGNED(s->opt_discard, align))) {
553 error_setg(errp, "Cannot meet constraints with opt-discard %" PRIu64,
554 s->opt_discard);
555 goto out;
556 }
557
558 s->max_discard = qemu_opt_get_size(opts, "max-discard", 0);
559 if (s->max_discard &&
560 (s->max_discard >= INT_MAX ||
561 !QEMU_IS_ALIGNED(s->max_discard,
562 MAX(s->opt_discard, align)))) {
563 error_setg(errp, "Cannot meet constraints with max-discard %" PRIu64,
564 s->max_discard);
565 goto out;
566 }
b35ee7fb 567
f8cec157
HR
568 bdrv_debug_event(bs, BLKDBG_NONE);
569
f4681212 570 ret = 0;
eaf944a4 571out:
036990d7
HR
572 if (ret < 0) {
573 g_free(s->config_file);
574 }
f4681212
KW
575 qemu_opts_del(opts);
576 return ret;
6a143727
KW
577}
578
16789db3
HR
579static int rule_check(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
580 BlkdebugIOType iotype)
b9f66d96
KW
581{
582 BDRVBlkdebugState *s = bs->opaque;
d157ed5f
EB
583 BlkdebugRule *rule = NULL;
584 int error;
585 bool immediately;
586
587 QSIMPLEQ_FOREACH(rule, &s->active_rules, active_next) {
588 uint64_t inject_offset = rule->options.inject.offset;
589
16789db3
HR
590 if ((inject_offset == -1 ||
591 (bytes && inject_offset >= offset &&
592 inject_offset < offset + bytes)) &&
593 (rule->options.inject.iotype_mask & (1ull << iotype)))
d157ed5f
EB
594 {
595 break;
596 }
597 }
598
599 if (!rule || !rule->options.inject.error) {
600 return 0;
601 }
602
603 immediately = rule->options.inject.immediately;
604 error = rule->options.inject.error;
b9f66d96 605
571cd43e 606 if (rule->options.inject.once) {
a069e2f1
JS
607 QSIMPLEQ_REMOVE(&s->active_rules, rule, BlkdebugRule, active_next);
608 remove_rule(rule);
b9f66d96
KW
609 }
610
7c3a9985 611 if (!immediately) {
e5c67ab5 612 aio_co_schedule(qemu_get_current_aio_context(), qemu_coroutine_self());
7c3a9985 613 qemu_coroutine_yield();
b9f66d96
KW
614 }
615
7c3a9985 616 return -error;
b9f66d96
KW
617}
618
7c3a9985
KW
619static int coroutine_fn
620blkdebug_co_preadv(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
621 QEMUIOVector *qiov, int flags)
6a143727 622{
d157ed5f 623 int err;
e4780db4 624
e0ef4395
EB
625 /* Sanity check block layer guarantees */
626 assert(QEMU_IS_ALIGNED(offset, bs->bl.request_alignment));
627 assert(QEMU_IS_ALIGNED(bytes, bs->bl.request_alignment));
628 if (bs->bl.max_transfer) {
629 assert(bytes <= bs->bl.max_transfer);
630 }
631
16789db3 632 err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_READ);
d157ed5f
EB
633 if (err) {
634 return err;
b9f66d96
KW
635 }
636
7c3a9985 637 return bdrv_co_preadv(bs->file, offset, bytes, qiov, flags);
6a143727
KW
638}
639
7c3a9985
KW
640static int coroutine_fn
641blkdebug_co_pwritev(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
642 QEMUIOVector *qiov, int flags)
6a143727 643{
d157ed5f 644 int err;
e4780db4 645
e0ef4395
EB
646 /* Sanity check block layer guarantees */
647 assert(QEMU_IS_ALIGNED(offset, bs->bl.request_alignment));
648 assert(QEMU_IS_ALIGNED(bytes, bs->bl.request_alignment));
649 if (bs->bl.max_transfer) {
650 assert(bytes <= bs->bl.max_transfer);
651 }
652
16789db3 653 err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_WRITE);
d157ed5f
EB
654 if (err) {
655 return err;
b9f66d96
KW
656 }
657
7c3a9985 658 return bdrv_co_pwritev(bs->file, offset, bytes, qiov, flags);
6a143727
KW
659}
660
7c3a9985 661static int blkdebug_co_flush(BlockDriverState *bs)
9e52c53b 662{
16789db3 663 int err = rule_check(bs, 0, 0, BLKDEBUG_IO_TYPE_FLUSH);
9e52c53b 664
d157ed5f
EB
665 if (err) {
666 return err;
9e52c53b
PB
667 }
668
7c3a9985 669 return bdrv_co_flush(bs->file->bs);
9e52c53b
PB
670}
671
63188c24 672static int coroutine_fn blkdebug_co_pwrite_zeroes(BlockDriverState *bs,
f5a5ca79 673 int64_t offset, int bytes,
63188c24
EB
674 BdrvRequestFlags flags)
675{
676 uint32_t align = MAX(bs->bl.request_alignment,
677 bs->bl.pwrite_zeroes_alignment);
678 int err;
679
680 /* Only pass through requests that are larger than requested
681 * preferred alignment (so that we test the fallback to writes on
682 * unaligned portions), and check that the block layer never hands
683 * us anything unaligned that crosses an alignment boundary. */
f5a5ca79 684 if (bytes < align) {
63188c24 685 assert(QEMU_IS_ALIGNED(offset, align) ||
f5a5ca79 686 QEMU_IS_ALIGNED(offset + bytes, align) ||
63188c24 687 DIV_ROUND_UP(offset, align) ==
f5a5ca79 688 DIV_ROUND_UP(offset + bytes, align));
63188c24
EB
689 return -ENOTSUP;
690 }
691 assert(QEMU_IS_ALIGNED(offset, align));
f5a5ca79 692 assert(QEMU_IS_ALIGNED(bytes, align));
63188c24 693 if (bs->bl.max_pwrite_zeroes) {
f5a5ca79 694 assert(bytes <= bs->bl.max_pwrite_zeroes);
63188c24
EB
695 }
696
16789db3 697 err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_WRITE_ZEROES);
63188c24
EB
698 if (err) {
699 return err;
700 }
701
f5a5ca79 702 return bdrv_co_pwrite_zeroes(bs->file, offset, bytes, flags);
63188c24
EB
703}
704
705static int coroutine_fn blkdebug_co_pdiscard(BlockDriverState *bs,
f5a5ca79 706 int64_t offset, int bytes)
63188c24
EB
707{
708 uint32_t align = bs->bl.pdiscard_alignment;
709 int err;
710
711 /* Only pass through requests that are larger than requested
712 * minimum alignment, and ensure that unaligned requests do not
713 * cross optimum discard boundaries. */
f5a5ca79 714 if (bytes < bs->bl.request_alignment) {
63188c24 715 assert(QEMU_IS_ALIGNED(offset, align) ||
f5a5ca79 716 QEMU_IS_ALIGNED(offset + bytes, align) ||
63188c24 717 DIV_ROUND_UP(offset, align) ==
f5a5ca79 718 DIV_ROUND_UP(offset + bytes, align));
63188c24
EB
719 return -ENOTSUP;
720 }
721 assert(QEMU_IS_ALIGNED(offset, bs->bl.request_alignment));
f5a5ca79
MP
722 assert(QEMU_IS_ALIGNED(bytes, bs->bl.request_alignment));
723 if (align && bytes >= align) {
63188c24 724 assert(QEMU_IS_ALIGNED(offset, align));
f5a5ca79 725 assert(QEMU_IS_ALIGNED(bytes, align));
63188c24
EB
726 }
727 if (bs->bl.max_pdiscard) {
f5a5ca79 728 assert(bytes <= bs->bl.max_pdiscard);
63188c24
EB
729 }
730
16789db3 731 err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_DISCARD);
63188c24
EB
732 if (err) {
733 return err;
734 }
735
0b9fd3f4 736 return bdrv_co_pdiscard(bs->file, offset, bytes);
63188c24 737}
3c90c65d 738
3e4d0e72
EB
739static int coroutine_fn blkdebug_co_block_status(BlockDriverState *bs,
740 bool want_zero,
741 int64_t offset,
742 int64_t bytes,
743 int64_t *pnum,
744 int64_t *map,
745 BlockDriverState **file)
efa6e2ed 746{
1adb0b5e
HR
747 int err;
748
3e4d0e72 749 assert(QEMU_IS_ALIGNED(offset | bytes, bs->bl.request_alignment));
1adb0b5e
HR
750
751 err = rule_check(bs, offset, bytes, BLKDEBUG_IO_TYPE_BLOCK_STATUS);
752 if (err) {
753 return err;
754 }
755
549ec0d9
HR
756 assert(bs->file && bs->file->bs);
757 *pnum = bytes;
758 *map = offset;
759 *file = bs->file->bs;
760 return BDRV_BLOCK_RAW | BDRV_BLOCK_OFFSET_VALID;
efa6e2ed
EB
761}
762
6a143727
KW
763static void blkdebug_close(BlockDriverState *bs)
764{
765 BDRVBlkdebugState *s = bs->opaque;
8b9b0cc2
KW
766 BlkdebugRule *rule, *next;
767 int i;
768
7fb1cf16 769 for (i = 0; i < BLKDBG__MAX; i++) {
8b9b0cc2 770 QLIST_FOREACH_SAFE(rule, &s->rules[i], next, next) {
9e35542b 771 remove_rule(rule);
8b9b0cc2
KW
772 }
773 }
036990d7
HR
774
775 g_free(s->config_file);
6a143727
KW
776}
777
3c90c65d
KW
778static void suspend_request(BlockDriverState *bs, BlkdebugRule *rule)
779{
780 BDRVBlkdebugState *s = bs->opaque;
781 BlkdebugSuspendedReq r;
782
783 r = (BlkdebugSuspendedReq) {
784 .co = qemu_coroutine_self(),
785 .tag = g_strdup(rule->options.suspend.tag),
786 };
787
788 remove_rule(rule);
789 QLIST_INSERT_HEAD(&s->suspended_reqs, &r, next);
790
20873526
MT
791 if (!qtest_enabled()) {
792 printf("blkdebug: Suspended request '%s'\n", r.tag);
793 }
3c90c65d 794 qemu_coroutine_yield();
20873526
MT
795 if (!qtest_enabled()) {
796 printf("blkdebug: Resuming request '%s'\n", r.tag);
797 }
3c90c65d
KW
798
799 QLIST_REMOVE(&r, next);
800 g_free(r.tag);
801}
802
571cd43e 803static bool process_rule(BlockDriverState *bs, struct BlkdebugRule *rule,
8f96b5be 804 bool injected)
8b9b0cc2
KW
805{
806 BDRVBlkdebugState *s = bs->opaque;
8b9b0cc2
KW
807
808 /* Only process rules for the current state */
8f96b5be 809 if (rule->state && rule->state != s->state) {
571cd43e 810 return injected;
8b9b0cc2
KW
811 }
812
813 /* Take the action */
814 switch (rule->action) {
815 case ACTION_INJECT_ERROR:
571cd43e
PB
816 if (!injected) {
817 QSIMPLEQ_INIT(&s->active_rules);
818 injected = true;
819 }
820 QSIMPLEQ_INSERT_HEAD(&s->active_rules, rule, active_next);
8b9b0cc2
KW
821 break;
822
823 case ACTION_SET_STATE:
8f96b5be 824 s->new_state = rule->options.set_state.new_state;
8b9b0cc2 825 break;
3c90c65d
KW
826
827 case ACTION_SUSPEND:
828 suspend_request(bs, rule);
829 break;
8b9b0cc2 830 }
571cd43e 831 return injected;
8b9b0cc2
KW
832}
833
a31939e6 834static void blkdebug_debug_event(BlockDriverState *bs, BlkdebugEvent event)
8b9b0cc2
KW
835{
836 BDRVBlkdebugState *s = bs->opaque;
3c90c65d 837 struct BlkdebugRule *rule, *next;
571cd43e 838 bool injected;
8b9b0cc2 839
7fb1cf16 840 assert((int)event >= 0 && event < BLKDBG__MAX);
8b9b0cc2 841
571cd43e 842 injected = false;
8f96b5be 843 s->new_state = s->state;
3c90c65d 844 QLIST_FOREACH_SAFE(rule, &s->rules[event], next, next) {
8f96b5be 845 injected = process_rule(bs, rule, injected);
8b9b0cc2 846 }
8f96b5be 847 s->state = s->new_state;
8b9b0cc2
KW
848}
849
3c90c65d
KW
850static int blkdebug_debug_breakpoint(BlockDriverState *bs, const char *event,
851 const char *tag)
852{
853 BDRVBlkdebugState *s = bs->opaque;
854 struct BlkdebugRule *rule;
f9509d15 855 int blkdebug_event;
3c90c65d 856
f7abe0ec 857 blkdebug_event = qapi_enum_parse(&BlkdebugEvent_lookup, event, -1, NULL);
f9509d15 858 if (blkdebug_event < 0) {
3c90c65d
KW
859 return -ENOENT;
860 }
861
3c90c65d
KW
862 rule = g_malloc(sizeof(*rule));
863 *rule = (struct BlkdebugRule) {
864 .event = blkdebug_event,
865 .action = ACTION_SUSPEND,
866 .state = 0,
867 .options.suspend.tag = g_strdup(tag),
868 };
869
870 QLIST_INSERT_HEAD(&s->rules[blkdebug_event], rule, next);
871
872 return 0;
873}
874
875static int blkdebug_debug_resume(BlockDriverState *bs, const char *tag)
876{
877 BDRVBlkdebugState *s = bs->opaque;
c547e564 878 BlkdebugSuspendedReq *r, *next;
3c90c65d 879
c547e564 880 QLIST_FOREACH_SAFE(r, &s->suspended_reqs, next, next) {
3c90c65d 881 if (!strcmp(r->tag, tag)) {
0b8b8753 882 qemu_coroutine_enter(r->co);
3c90c65d
KW
883 return 0;
884 }
885 }
886 return -ENOENT;
887}
888
4cc70e93
FZ
889static int blkdebug_debug_remove_breakpoint(BlockDriverState *bs,
890 const char *tag)
891{
892 BDRVBlkdebugState *s = bs->opaque;
c547e564 893 BlkdebugSuspendedReq *r, *r_next;
4cc70e93
FZ
894 BlkdebugRule *rule, *next;
895 int i, ret = -ENOENT;
896
7fb1cf16 897 for (i = 0; i < BLKDBG__MAX; i++) {
4cc70e93
FZ
898 QLIST_FOREACH_SAFE(rule, &s->rules[i], next, next) {
899 if (rule->action == ACTION_SUSPEND &&
900 !strcmp(rule->options.suspend.tag, tag)) {
901 remove_rule(rule);
902 ret = 0;
903 }
904 }
905 }
c547e564 906 QLIST_FOREACH_SAFE(r, &s->suspended_reqs, next, r_next) {
4cc70e93 907 if (!strcmp(r->tag, tag)) {
0b8b8753 908 qemu_coroutine_enter(r->co);
4cc70e93
FZ
909 ret = 0;
910 }
911 }
912 return ret;
913}
3c90c65d
KW
914
915static bool blkdebug_debug_is_suspended(BlockDriverState *bs, const char *tag)
916{
917 BDRVBlkdebugState *s = bs->opaque;
918 BlkdebugSuspendedReq *r;
919
920 QLIST_FOREACH(r, &s->suspended_reqs, next) {
921 if (!strcmp(r->tag, tag)) {
922 return true;
923 }
924 }
925 return false;
926}
927
e1302255
PB
928static int64_t blkdebug_getlength(BlockDriverState *bs)
929{
9a4f4c31 930 return bdrv_getlength(bs->file->bs);
e1302255
PB
931}
932
998b3a1e 933static void blkdebug_refresh_filename(BlockDriverState *bs)
2c31b04c 934{
036990d7 935 BDRVBlkdebugState *s = bs->opaque;
8779441b 936 const QDictEntry *e;
998b3a1e 937 int ret;
2c31b04c 938
998b3a1e 939 if (!bs->file->bs->exact_filename[0]) {
2c31b04c
HR
940 return;
941 }
942
998b3a1e
HR
943 for (e = qdict_first(bs->full_open_options); e;
944 e = qdict_next(bs->full_open_options, e))
945 {
946 /* Real child options are under "image", but "x-image" may
947 * contain a filename */
948 if (strcmp(qdict_entry_key(e), "config") &&
949 strcmp(qdict_entry_key(e), "image") &&
950 strcmp(qdict_entry_key(e), "x-image") &&
951 strcmp(qdict_entry_key(e), "driver"))
952 {
953 return;
de81d72d 954 }
8779441b
HR
955 }
956
998b3a1e
HR
957 ret = snprintf(bs->exact_filename, sizeof(bs->exact_filename),
958 "blkdebug:%s:%s",
959 s->config_file ?: "", bs->file->bs->exact_filename);
960 if (ret >= sizeof(bs->exact_filename)) {
961 /* An overflow makes the filename unusable, so do not report any */
962 bs->exact_filename[0] = 0;
2c31b04c 963 }
2c31b04c
HR
964}
965
835db3ee
EB
966static void blkdebug_refresh_limits(BlockDriverState *bs, Error **errp)
967{
968 BDRVBlkdebugState *s = bs->opaque;
969
970 if (s->align) {
a5b8dd2c 971 bs->bl.request_alignment = s->align;
835db3ee 972 }
430b26a8
EB
973 if (s->max_transfer) {
974 bs->bl.max_transfer = s->max_transfer;
975 }
976 if (s->opt_write_zero) {
977 bs->bl.pwrite_zeroes_alignment = s->opt_write_zero;
978 }
979 if (s->max_write_zero) {
980 bs->bl.max_pwrite_zeroes = s->max_write_zero;
981 }
982 if (s->opt_discard) {
983 bs->bl.pdiscard_alignment = s->opt_discard;
984 }
985 if (s->max_discard) {
986 bs->bl.max_pdiscard = s->max_discard;
987 }
835db3ee
EB
988}
989
c5e8bfb7
KW
990static int blkdebug_reopen_prepare(BDRVReopenState *reopen_state,
991 BlockReopenQueue *queue, Error **errp)
992{
993 return 0;
994}
995
69c6449f 996static void blkdebug_child_perm(BlockDriverState *bs, BdrvChild *c,
bf8e925e 997 BdrvChildRole role,
69c6449f
HR
998 BlockReopenQueue *reopen_queue,
999 uint64_t perm, uint64_t shared,
1000 uint64_t *nperm, uint64_t *nshared)
1001{
1002 BDRVBlkdebugState *s = bs->opaque;
1003
e5d8a406 1004 bdrv_default_perms(bs, c, role, reopen_queue,
69dca43d 1005 perm, shared, nperm, nshared);
69c6449f
HR
1006
1007 *nperm |= s->take_child_perms;
1008 *nshared &= ~s->unshare_child_perms;
1009}
1010
2654267c
HR
1011static const char *const blkdebug_strong_runtime_opts[] = {
1012 "config",
1013 "inject-error.",
1014 "set-state.",
1015 "align",
1016 "max-transfer",
1017 "opt-write-zero",
1018 "max-write-zero",
1019 "opt-discard",
1020 "max-discard",
1021
1022 NULL
1023};
1024
6a143727 1025static BlockDriver bdrv_blkdebug = {
f4681212
KW
1026 .format_name = "blkdebug",
1027 .protocol_name = "blkdebug",
1028 .instance_size = sizeof(BDRVBlkdebugState),
d8e12cd3 1029 .is_filter = true,
6a143727 1030
f4681212
KW
1031 .bdrv_parse_filename = blkdebug_parse_filename,
1032 .bdrv_file_open = blkdebug_open,
1033 .bdrv_close = blkdebug_close,
c5e8bfb7 1034 .bdrv_reopen_prepare = blkdebug_reopen_prepare,
69c6449f 1035 .bdrv_child_perm = blkdebug_child_perm,
d7010dfb 1036
f4681212 1037 .bdrv_getlength = blkdebug_getlength,
2c31b04c 1038 .bdrv_refresh_filename = blkdebug_refresh_filename,
835db3ee 1039 .bdrv_refresh_limits = blkdebug_refresh_limits,
6a143727 1040
7c3a9985
KW
1041 .bdrv_co_preadv = blkdebug_co_preadv,
1042 .bdrv_co_pwritev = blkdebug_co_pwritev,
1043 .bdrv_co_flush_to_disk = blkdebug_co_flush,
63188c24
EB
1044 .bdrv_co_pwrite_zeroes = blkdebug_co_pwrite_zeroes,
1045 .bdrv_co_pdiscard = blkdebug_co_pdiscard,
3e4d0e72 1046 .bdrv_co_block_status = blkdebug_co_block_status,
8b9b0cc2 1047
3c90c65d
KW
1048 .bdrv_debug_event = blkdebug_debug_event,
1049 .bdrv_debug_breakpoint = blkdebug_debug_breakpoint,
4cc70e93
FZ
1050 .bdrv_debug_remove_breakpoint
1051 = blkdebug_debug_remove_breakpoint,
3c90c65d
KW
1052 .bdrv_debug_resume = blkdebug_debug_resume,
1053 .bdrv_debug_is_suspended = blkdebug_debug_is_suspended,
2654267c
HR
1054
1055 .strong_runtime_opts = blkdebug_strong_runtime_opts,
6a143727
KW
1056};
1057
1058static void bdrv_blkdebug_init(void)
1059{
1060 bdrv_register(&bdrv_blkdebug);
1061}
1062
1063block_init(bdrv_blkdebug_init);