]> git.proxmox.com Git - mirror_qemu.git/blob - block.c
block: Remove bdrv_make_anon()
[mirror_qemu.git] / block.c
1 /*
2 * QEMU System Emulator block driver
3 *
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24 #include "qemu/osdep.h"
25 #include "trace.h"
26 #include "block/block_int.h"
27 #include "block/blockjob.h"
28 #include "qemu/error-report.h"
29 #include "qemu/module.h"
30 #include "qapi/qmp/qerror.h"
31 #include "qapi/qmp/qbool.h"
32 #include "qapi/qmp/qjson.h"
33 #include "sysemu/block-backend.h"
34 #include "sysemu/sysemu.h"
35 #include "qemu/notify.h"
36 #include "qemu/coroutine.h"
37 #include "block/qapi.h"
38 #include "qmp-commands.h"
39 #include "qemu/timer.h"
40 #include "qapi-event.h"
41 #include "block/throttle-groups.h"
42 #include "qemu/cutils.h"
43 #include "qemu/id.h"
44
45 #ifdef CONFIG_BSD
46 #include <sys/ioctl.h>
47 #include <sys/queue.h>
48 #ifndef __DragonFly__
49 #include <sys/disk.h>
50 #endif
51 #endif
52
53 #ifdef _WIN32
54 #include <windows.h>
55 #endif
56
/*
 * Sentinel stored in a result field while a synchronous wrapper is still
 * waiting for its coroutine to finish (see the polling loop in bdrv_create()).
 */
#define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */

/* Nodes that have been given a node name; linked through 'node_list'
 * by bdrv_assign_node_name(). */
static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
    QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);

/* Every BlockDriverState created by bdrv_new(); linked through 'bs_list'. */
static QTAILQ_HEAD(, BlockDriverState) all_bdrv_states =
    QTAILQ_HEAD_INITIALIZER(all_bdrv_states);

/* All block drivers registered through bdrv_register(). */
static QLIST_HEAD(, BlockDriver) bdrv_drivers =
    QLIST_HEAD_INITIALIZER(bdrv_drivers);

/* Forward declaration; the definition is not part of this section. */
static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
                             const char *reference, QDict *options, int flags,
                             BlockDriverState *parent,
                             const BdrvChildRole *child_role, Error **errp);

/* If non-zero, use only whitelisted block drivers */
static int use_bdrv_whitelist;

/* Forward declaration; the definition is not part of this section. */
static void bdrv_close(BlockDriverState *bs);
77
78 #ifdef _WIN32
/*
 * Return 1 if @filename starts with an ASCII letter immediately followed
 * by ':' (e.g. "c:"), 0 otherwise.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char letter = filename[0];
    int is_lower = (letter >= 'a' && letter <= 'z');
    int is_upper = (letter >= 'A' && letter <= 'Z');

    if (!is_lower && !is_upper) {
        /* filename[1] is deliberately not inspected in this case */
        return 0;
    }
    return filename[1] == ':';
}
85
86 int is_windows_drive(const char *filename)
87 {
88 if (is_windows_drive_prefix(filename) &&
89 filename[2] == '\0')
90 return 1;
91 if (strstart(filename, "\\\\.\\", NULL) ||
92 strstart(filename, "//./", NULL))
93 return 1;
94 return 0;
95 }
96 #endif
97
98 size_t bdrv_opt_mem_align(BlockDriverState *bs)
99 {
100 if (!bs || !bs->drv) {
101 /* page size or 4k (hdd sector size) should be on the safe side */
102 return MAX(4096, getpagesize());
103 }
104
105 return bs->bl.opt_mem_alignment;
106 }
107
108 size_t bdrv_min_mem_align(BlockDriverState *bs)
109 {
110 if (!bs || !bs->drv) {
111 /* page size or 4k (hdd sector size) should be on the safe side */
112 return MAX(4096, getpagesize());
113 }
114
115 return bs->bl.min_mem_alignment;
116 }
117
/*
 * Check if @path starts with "<protocol>:", i.e. whether a ':' appears
 * before any path separator.  On Windows, drive specifications are never
 * treated as protocols.
 *
 * Returns 1 if a protocol prefix is present, 0 otherwise.
 */
int path_has_protocol(const char *path)
{
#ifdef _WIN32
    const char *stop_chars = ":/\\";
#else
    const char *stop_chars = ":/";
#endif
    size_t prefix_len;

#ifdef _WIN32
    if (is_windows_drive(path) ||
        is_windows_drive_prefix(path)) {
        return 0;
    }
#endif

    /* Length of the leading run that contains neither ':' nor a separator */
    prefix_len = strcspn(path, stop_chars);

    return path[prefix_len] == ':';
}
135
/*
 * Return 1 if @path is absolute, 0 otherwise.  A path is absolute when it
 * starts with '/'; on Windows a leading '\\' or any drive specification
 * also counts.
 */
int path_is_absolute(const char *path)
{
    const char first = path[0];

#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    if (first == '\\') {
        return 1;
    }
#endif
    return first == '/';
}
148
/*
 * Build the path of @filename into @dest (at most @dest_size bytes,
 * including the terminating NUL).
 *
 * If @filename is absolute it is copied as is.  Otherwise the "directory"
 * part of @base_path is kept and @filename is appended to it.  The
 * directory part ends after the last path separator, or after the first
 * ':' when that comes later (so URL-like bases are supported).
 *
 * Nothing is written when @dest_size is not positive.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *after_colon, *after_sep, *sep, *dir_end;
    int dir_len;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /* Position just past the first ':' of the base, if there is one */
    after_colon = strchr(base_path, ':');
    after_colon = after_colon ? after_colon + 1 : base_path;

    /* Position just past the last path separator of the base, if any */
    sep = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');
        if (!sep || backslash > sep) {
            sep = backslash;
        }
    }
#endif
    after_sep = sep ? sep + 1 : base_path;

    /* Keep whichever prefix is longer, truncated to fit @dest */
    dir_end = after_sep > after_colon ? after_sep : after_colon;
    dir_len = dir_end - base_path;
    if (dir_len > dest_size - 1) {
        dir_len = dest_size - 1;
    }
    memcpy(dest, base_path, dir_len);
    dest[dir_len] = '\0';
    pstrcat(dest, dest_size, filename);
}
192
193 void bdrv_get_full_backing_filename_from_filename(const char *backed,
194 const char *backing,
195 char *dest, size_t sz,
196 Error **errp)
197 {
198 if (backing[0] == '\0' || path_has_protocol(backing) ||
199 path_is_absolute(backing))
200 {
201 pstrcpy(dest, sz, backing);
202 } else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
203 error_setg(errp, "Cannot use relative backing file names for '%s'",
204 backed);
205 } else {
206 path_combine(dest, sz, backed, backing);
207 }
208 }
209
210 void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
211 Error **errp)
212 {
213 char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
214
215 bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
216 dest, sz, errp);
217 }
218
/*
 * Register block driver @bdrv: let bdrv_setup_io_funcs() prepare it, then
 * add it at the head of the global driver list, where the lookup functions
 * in this file (e.g. bdrv_find_format()) can find it.
 */
void bdrv_register(BlockDriver *bdrv)
{
    bdrv_setup_io_funcs(bdrv);

    QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
}
225
/*
 * Create a new BlockDriverState.  Currently identical to bdrv_new(); the
 * returned object is whatever bdrv_new() returns.
 */
BlockDriverState *bdrv_new_root(void)
{
    return bdrv_new();
}
230
231 BlockDriverState *bdrv_new(void)
232 {
233 BlockDriverState *bs;
234 int i;
235
236 bs = g_new0(BlockDriverState, 1);
237 QLIST_INIT(&bs->dirty_bitmaps);
238 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
239 QLIST_INIT(&bs->op_blockers[i]);
240 }
241 notifier_with_return_list_init(&bs->before_write_notifiers);
242 qemu_co_queue_init(&bs->throttled_reqs[0]);
243 qemu_co_queue_init(&bs->throttled_reqs[1]);
244 bs->refcnt = 1;
245 bs->aio_context = qemu_get_aio_context();
246
247 QTAILQ_INSERT_TAIL(&all_bdrv_states, bs, bs_list);
248
249 return bs;
250 }
251
252 BlockDriver *bdrv_find_format(const char *format_name)
253 {
254 BlockDriver *drv1;
255 QLIST_FOREACH(drv1, &bdrv_drivers, list) {
256 if (!strcmp(drv1->format_name, format_name)) {
257 return drv1;
258 }
259 }
260 return NULL;
261 }
262
263 static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
264 {
265 static const char *whitelist_rw[] = {
266 CONFIG_BDRV_RW_WHITELIST
267 };
268 static const char *whitelist_ro[] = {
269 CONFIG_BDRV_RO_WHITELIST
270 };
271 const char **p;
272
273 if (!whitelist_rw[0] && !whitelist_ro[0]) {
274 return 1; /* no whitelist, anything goes */
275 }
276
277 for (p = whitelist_rw; *p; p++) {
278 if (!strcmp(drv->format_name, *p)) {
279 return 1;
280 }
281 }
282 if (read_only) {
283 for (p = whitelist_ro; *p; p++) {
284 if (!strcmp(drv->format_name, *p)) {
285 return 1;
286 }
287 }
288 }
289 return 0;
290 }
291
/* Arguments and results passed between bdrv_create() and its coroutine */
typedef struct CreateCo {
    BlockDriver *drv;   /* driver whose bdrv_create callback is invoked */
    char *filename;     /* private copy of the file name, freed by bdrv_create() */
    QemuOpts *opts;     /* creation options, passed through to the driver */
    int ret;            /* NOT_DONE until the coroutine stores the driver's result */
    Error *err;         /* error reported by the driver, if any */
} CreateCo;
299
300 static void coroutine_fn bdrv_create_co_entry(void *opaque)
301 {
302 Error *local_err = NULL;
303 int ret;
304
305 CreateCo *cco = opaque;
306 assert(cco->drv);
307
308 ret = cco->drv->bdrv_create(cco->filename, cco->opts, &local_err);
309 if (local_err) {
310 error_propagate(&cco->err, local_err);
311 }
312 cco->ret = ret;
313 }
314
315 int bdrv_create(BlockDriver *drv, const char* filename,
316 QemuOpts *opts, Error **errp)
317 {
318 int ret;
319
320 Coroutine *co;
321 CreateCo cco = {
322 .drv = drv,
323 .filename = g_strdup(filename),
324 .opts = opts,
325 .ret = NOT_DONE,
326 .err = NULL,
327 };
328
329 if (!drv->bdrv_create) {
330 error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
331 ret = -ENOTSUP;
332 goto out;
333 }
334
335 if (qemu_in_coroutine()) {
336 /* Fast-path if already in coroutine context */
337 bdrv_create_co_entry(&cco);
338 } else {
339 co = qemu_coroutine_create(bdrv_create_co_entry);
340 qemu_coroutine_enter(co, &cco);
341 while (cco.ret == NOT_DONE) {
342 aio_poll(qemu_get_aio_context(), true);
343 }
344 }
345
346 ret = cco.ret;
347 if (ret < 0) {
348 if (cco.err) {
349 error_propagate(errp, cco.err);
350 } else {
351 error_setg_errno(errp, -ret, "Could not create image");
352 }
353 }
354
355 out:
356 g_free(cco.filename);
357 return ret;
358 }
359
360 int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
361 {
362 BlockDriver *drv;
363 Error *local_err = NULL;
364 int ret;
365
366 drv = bdrv_find_protocol(filename, true, errp);
367 if (drv == NULL) {
368 return -ENOENT;
369 }
370
371 ret = bdrv_create(drv, filename, opts, &local_err);
372 if (local_err) {
373 error_propagate(errp, local_err);
374 }
375 return ret;
376 }
377
378 /**
379 * Try to get @bs's logical and physical block size.
380 * On success, store them in @bsz struct and return 0.
381 * On failure return -errno.
382 * @bs must not be empty.
383 */
384 int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
385 {
386 BlockDriver *drv = bs->drv;
387
388 if (drv && drv->bdrv_probe_blocksizes) {
389 return drv->bdrv_probe_blocksizes(bs, bsz);
390 }
391
392 return -ENOTSUP;
393 }
394
395 /**
396 * Try to get @bs's geometry (cyls, heads, sectors).
397 * On success, store them in @geo struct and return 0.
398 * On failure return -errno.
399 * @bs must not be empty.
400 */
401 int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
402 {
403 BlockDriver *drv = bs->drv;
404
405 if (drv && drv->bdrv_probe_geometry) {
406 return drv->bdrv_probe_geometry(bs, geo);
407 }
408
409 return -ENOTSUP;
410 }
411
/*
 * Create a uniquely-named empty temporary file.
 *
 * @filename receives the name of the file; @size is the size of that
 * buffer in bytes.  On POSIX hosts the file is created in $TMPDIR, or in
 * /var/tmp when TMPDIR is unset.
 *
 * Return 0 upon success, otherwise a negative errno value (-EOVERFLOW if
 * the name does not fit into @filename).
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    /* NOTE(review): GetLastError() yields a Windows error code rather than
     * an errno value -- confirm that callers only test for "< 0". */
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    int fd;
    int len;
    int saved_errno;
    const char *tmpdir;

    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }
    len = snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
    if (len < 0 || len >= size) {
        /* formatting failed or the template was truncated */
        return -EOVERFLOW;
    }
    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }
    if (close(fd) != 0) {
        /* Save errno first: unlink() may overwrite it */
        saved_errno = errno;
        unlink(filename);
        return -saved_errno;
    }
    return 0;
#endif
}
447
448 /*
449 * Detect host devices. By convention, /dev/cdrom[N] is always
450 * recognized as a host CDROM.
451 */
452 static BlockDriver *find_hdev_driver(const char *filename)
453 {
454 int score_max = 0, score;
455 BlockDriver *drv = NULL, *d;
456
457 QLIST_FOREACH(d, &bdrv_drivers, list) {
458 if (d->bdrv_probe_device) {
459 score = d->bdrv_probe_device(filename);
460 if (score > score_max) {
461 score_max = score;
462 drv = d;
463 }
464 }
465 }
466
467 return drv;
468 }
469
470 BlockDriver *bdrv_find_protocol(const char *filename,
471 bool allow_protocol_prefix,
472 Error **errp)
473 {
474 BlockDriver *drv1;
475 char protocol[128];
476 int len;
477 const char *p;
478
479 /* TODO Drivers without bdrv_file_open must be specified explicitly */
480
481 /*
482 * XXX(hch): we really should not let host device detection
483 * override an explicit protocol specification, but moving this
484 * later breaks access to device names with colons in them.
485 * Thanks to the brain-dead persistent naming schemes on udev-
486 * based Linux systems those actually are quite common.
487 */
488 drv1 = find_hdev_driver(filename);
489 if (drv1) {
490 return drv1;
491 }
492
493 if (!path_has_protocol(filename) || !allow_protocol_prefix) {
494 return &bdrv_file;
495 }
496
497 p = strchr(filename, ':');
498 assert(p != NULL);
499 len = p - filename;
500 if (len > sizeof(protocol) - 1)
501 len = sizeof(protocol) - 1;
502 memcpy(protocol, filename, len);
503 protocol[len] = '\0';
504 QLIST_FOREACH(drv1, &bdrv_drivers, list) {
505 if (drv1->protocol_name &&
506 !strcmp(drv1->protocol_name, protocol)) {
507 return drv1;
508 }
509 }
510
511 error_setg(errp, "Unknown protocol '%s'", protocol);
512 return NULL;
513 }
514
515 /*
516 * Guess image format by probing its contents.
517 * This is not a good idea when your image is raw (CVE-2008-2004), but
518 * we do it anyway for backward compatibility.
519 *
520 * @buf contains the image's first @buf_size bytes.
521 * @buf_size is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
522 * but can be smaller if the image file is smaller)
523 * @filename is its filename.
524 *
525 * For all block drivers, call the bdrv_probe() method to get its
526 * probing score.
527 * Return the first block driver with the highest probing score.
528 */
529 BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
530 const char *filename)
531 {
532 int score_max = 0, score;
533 BlockDriver *drv = NULL, *d;
534
535 QLIST_FOREACH(d, &bdrv_drivers, list) {
536 if (d->bdrv_probe) {
537 score = d->bdrv_probe(buf, buf_size, filename);
538 if (score > score_max) {
539 score_max = score;
540 drv = d;
541 }
542 }
543 }
544
545 return drv;
546 }
547
548 static int find_image_format(BlockDriverState *bs, const char *filename,
549 BlockDriver **pdrv, Error **errp)
550 {
551 BlockDriver *drv;
552 uint8_t buf[BLOCK_PROBE_BUF_SIZE];
553 int ret = 0;
554
555 /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
556 if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
557 *pdrv = &bdrv_raw;
558 return ret;
559 }
560
561 ret = bdrv_pread(bs, 0, buf, sizeof(buf));
562 if (ret < 0) {
563 error_setg_errno(errp, -ret, "Could not read image for determining its "
564 "format");
565 *pdrv = NULL;
566 return ret;
567 }
568
569 drv = bdrv_probe_all(buf, ret, filename);
570 if (!drv) {
571 error_setg(errp, "Could not determine image format: No compatible "
572 "driver found");
573 ret = -ENOENT;
574 }
575 *pdrv = drv;
576 return ret;
577 }
578
579 /**
580 * Set the current 'total_sectors' value
581 * Return 0 on success, -errno on error.
582 */
583 static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
584 {
585 BlockDriver *drv = bs->drv;
586
587 /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
588 if (bdrv_is_sg(bs))
589 return 0;
590
591 /* query actual device if possible, otherwise just trust the hint */
592 if (drv->bdrv_getlength) {
593 int64_t length = drv->bdrv_getlength(bs);
594 if (length < 0) {
595 return length;
596 }
597 hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
598 }
599
600 bs->total_sectors = hint;
601 return 0;
602 }
603
604 /**
605 * Combines a QDict of new block driver @options with any missing options taken
606 * from @old_options, so that leaving out an option defaults to its old value.
607 */
608 static void bdrv_join_options(BlockDriverState *bs, QDict *options,
609 QDict *old_options)
610 {
611 if (bs->drv && bs->drv->bdrv_join_options) {
612 bs->drv->bdrv_join_options(options, old_options);
613 } else {
614 qdict_join(options, old_options, false);
615 }
616 }
617
618 /**
619 * Set open flags for a given discard mode
620 *
621 * Return 0 on success, -1 if the discard mode was invalid.
622 */
623 int bdrv_parse_discard_flags(const char *mode, int *flags)
624 {
625 *flags &= ~BDRV_O_UNMAP;
626
627 if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
628 /* do nothing */
629 } else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
630 *flags |= BDRV_O_UNMAP;
631 } else {
632 return -1;
633 }
634
635 return 0;
636 }
637
638 /**
639 * Set open flags for a given cache mode
640 *
641 * Return 0 on success, -1 if the cache mode was invalid.
642 */
643 int bdrv_parse_cache_flags(const char *mode, int *flags)
644 {
645 *flags &= ~BDRV_O_CACHE_MASK;
646
647 if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
648 *flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
649 } else if (!strcmp(mode, "directsync")) {
650 *flags |= BDRV_O_NOCACHE;
651 } else if (!strcmp(mode, "writeback")) {
652 *flags |= BDRV_O_CACHE_WB;
653 } else if (!strcmp(mode, "unsafe")) {
654 *flags |= BDRV_O_CACHE_WB;
655 *flags |= BDRV_O_NO_FLUSH;
656 } else if (!strcmp(mode, "writethrough")) {
657 /* this is the default */
658 } else {
659 return -1;
660 }
661
662 return 0;
663 }
664
665 /*
666 * Returns the options and flags that a temporary snapshot should get, based on
667 * the originally requested flags (the originally requested image will have
668 * flags like a backing file)
669 */
670 static void bdrv_temp_snapshot_options(int *child_flags, QDict *child_options,
671 int parent_flags, QDict *parent_options)
672 {
673 *child_flags = (parent_flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
674
675 /* For temporary files, unconditional cache=unsafe is fine */
676 qdict_set_default_str(child_options, BDRV_OPT_CACHE_WB, "on");
677 qdict_set_default_str(child_options, BDRV_OPT_CACHE_DIRECT, "off");
678 qdict_set_default_str(child_options, BDRV_OPT_CACHE_NO_FLUSH, "on");
679 }
680
681 /*
682 * Returns the options and flags that bs->file should get if a protocol driver
683 * is expected, based on the given options and flags for the parent BDS
684 */
685 static void bdrv_inherited_options(int *child_flags, QDict *child_options,
686 int parent_flags, QDict *parent_options)
687 {
688 int flags = parent_flags;
689
690 /* Enable protocol handling, disable format probing for bs->file */
691 flags |= BDRV_O_PROTOCOL;
692
693 /* If the cache mode isn't explicitly set, inherit direct and no-flush from
694 * the parent. */
695 qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
696 qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
697
698 /* Our block drivers take care to send flushes and respect unmap policy,
699 * so we can default to enable both on lower layers regardless of the
700 * corresponding parent options. */
701 qdict_set_default_str(child_options, BDRV_OPT_CACHE_WB, "on");
702 flags |= BDRV_O_UNMAP;
703
704 /* Clear flags that only apply to the top layer */
705 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ);
706
707 *child_flags = flags;
708 }
709
710 const BdrvChildRole child_file = {
711 .inherit_options = bdrv_inherited_options,
712 };
713
714 /*
715 * Returns the options and flags that bs->file should get if the use of formats
716 * (and not only protocols) is permitted for it, based on the given options and
717 * flags for the parent BDS
718 */
719 static void bdrv_inherited_fmt_options(int *child_flags, QDict *child_options,
720 int parent_flags, QDict *parent_options)
721 {
722 child_file.inherit_options(child_flags, child_options,
723 parent_flags, parent_options);
724
725 *child_flags &= ~BDRV_O_PROTOCOL;
726 }
727
728 const BdrvChildRole child_format = {
729 .inherit_options = bdrv_inherited_fmt_options,
730 };
731
732 /*
733 * Returns the options and flags that bs->backing should get, based on the
734 * given options and flags for the parent BDS
735 */
736 static void bdrv_backing_options(int *child_flags, QDict *child_options,
737 int parent_flags, QDict *parent_options)
738 {
739 int flags = parent_flags;
740
741 /* The cache mode is inherited unmodified for backing files */
742 qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_WB);
743 qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
744 qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
745
746 /* backing files always opened read-only */
747 flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
748
749 /* snapshot=on is handled on the top layer */
750 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
751
752 *child_flags = flags;
753 }
754
755 static const BdrvChildRole child_backing = {
756 .inherit_options = bdrv_backing_options,
757 };
758
759 static int bdrv_open_flags(BlockDriverState *bs, int flags)
760 {
761 int open_flags = flags | BDRV_O_CACHE_WB;
762
763 /*
764 * Clear flags that are internal to the block layer before opening the
765 * image.
766 */
767 open_flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL);
768
769 /*
770 * Snapshots should be writable.
771 */
772 if (flags & BDRV_O_TEMPORARY) {
773 open_flags |= BDRV_O_RDWR;
774 }
775
776 return open_flags;
777 }
778
779 static void update_flags_from_options(int *flags, QemuOpts *opts)
780 {
781 *flags &= ~BDRV_O_CACHE_MASK;
782
783 assert(qemu_opt_find(opts, BDRV_OPT_CACHE_WB));
784 if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, false)) {
785 *flags |= BDRV_O_CACHE_WB;
786 }
787
788 assert(qemu_opt_find(opts, BDRV_OPT_CACHE_NO_FLUSH));
789 if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_NO_FLUSH, false)) {
790 *flags |= BDRV_O_NO_FLUSH;
791 }
792
793 assert(qemu_opt_find(opts, BDRV_OPT_CACHE_DIRECT));
794 if (qemu_opt_get_bool(opts, BDRV_OPT_CACHE_DIRECT, false)) {
795 *flags |= BDRV_O_NOCACHE;
796 }
797 }
798
799 static void update_options_from_flags(QDict *options, int flags)
800 {
801 if (!qdict_haskey(options, BDRV_OPT_CACHE_WB)) {
802 qdict_put(options, BDRV_OPT_CACHE_WB,
803 qbool_from_bool(flags & BDRV_O_CACHE_WB));
804 }
805 if (!qdict_haskey(options, BDRV_OPT_CACHE_DIRECT)) {
806 qdict_put(options, BDRV_OPT_CACHE_DIRECT,
807 qbool_from_bool(flags & BDRV_O_NOCACHE));
808 }
809 if (!qdict_haskey(options, BDRV_OPT_CACHE_NO_FLUSH)) {
810 qdict_put(options, BDRV_OPT_CACHE_NO_FLUSH,
811 qbool_from_bool(flags & BDRV_O_NO_FLUSH));
812 }
813 }
814
815 static void bdrv_assign_node_name(BlockDriverState *bs,
816 const char *node_name,
817 Error **errp)
818 {
819 char *gen_node_name = NULL;
820
821 if (!node_name) {
822 node_name = gen_node_name = id_generate(ID_BLOCK);
823 } else if (!id_wellformed(node_name)) {
824 /*
825 * Check for empty string or invalid characters, but not if it is
826 * generated (generated names use characters not available to the user)
827 */
828 error_setg(errp, "Invalid node name");
829 return;
830 }
831
832 /* takes care of avoiding namespaces collisions */
833 if (blk_by_name(node_name)) {
834 error_setg(errp, "node-name=%s is conflicting with a device id",
835 node_name);
836 goto out;
837 }
838
839 /* takes care of avoiding duplicates node names */
840 if (bdrv_find_node(node_name)) {
841 error_setg(errp, "Duplicate node name");
842 goto out;
843 }
844
845 /* copy node name into the bs and insert it into the graph list */
846 pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
847 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
848 out:
849 g_free(gen_node_name);
850 }
851
/*
 * Options that are common to all block drivers.  bdrv_open_common()
 * absorbs these from the options QDict before the driver's open function
 * sees the remainder.
 */
static QemuOptsList bdrv_runtime_opts = {
    .name = "bdrv_common",
    .head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
    .desc = {
        {
            .name = "node-name",
            .type = QEMU_OPT_STRING,
            .help = "Node name of the block device node",
        },
        {
            .name = "driver",
            .type = QEMU_OPT_STRING,
            .help = "Block driver to use for the node",
        },
        {
            .name = BDRV_OPT_CACHE_WB,
            .type = QEMU_OPT_BOOL,
            .help = "Enable writeback mode",
        },
        {
            .name = BDRV_OPT_CACHE_DIRECT,
            .type = QEMU_OPT_BOOL,
            .help = "Bypass software writeback cache on the host",
        },
        {
            .name = BDRV_OPT_CACHE_NO_FLUSH,
            .type = QEMU_OPT_BOOL,
            .help = "Ignore flush requests",
        },
        { /* end of list */ }
    },
};
884
/*
 * Common part for opening disk images and files
 *
 * @bs is the node being opened; it must not have a file child yet, and
 * bs->open_flags is read here as the requested flags.
 * @file is the already opened protocol-level child, or NULL when the
 * driver opens the file itself (bdrv_file_open).
 * @options must name a registered driver under "driver".
 *
 * Removes all processed options from *options.
 *
 * Returns 0 on success.  On failure returns -errno and sets @errp;
 * bs->drv, bs->opaque and bs->file are reset if they had been set.
 */
static int bdrv_open_common(BlockDriverState *bs, BdrvChild *file,
                            QDict *options, Error **errp)
{
    int ret, open_flags;
    const char *filename;
    const char *driver_name = NULL;
    const char *node_name = NULL;
    QemuOpts *opts;
    BlockDriver *drv;
    Error *local_err = NULL;

    assert(bs->file == NULL);
    assert(options != NULL && bs->options != options);

    /* Move the common options (see bdrv_runtime_opts) out of @options */
    opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
    qemu_opts_absorb_qdict(opts, options, &local_err);
    if (local_err) {
        error_propagate(errp, local_err);
        ret = -EINVAL;
        goto fail_opts;
    }

    /* The caller is expected to have resolved the driver already */
    driver_name = qemu_opt_get(opts, "driver");
    drv = bdrv_find_format(driver_name);
    assert(drv != NULL);

    /* The file name comes from the child if there is one */
    if (file != NULL) {
        filename = file->bs->filename;
    } else {
        filename = qdict_get_try_str(options, "filename");
    }

    if (drv->bdrv_needs_filename && !filename) {
        error_setg(errp, "The '%s' block driver requires a file name",
                   drv->format_name);
        ret = -EINVAL;
        goto fail_opts;
    }

    trace_bdrv_open_common(bs, filename ?: "", bs->open_flags,
                           drv->format_name);

    node_name = qemu_opt_get(opts, "node-name");
    bdrv_assign_node_name(bs, node_name, &local_err);
    if (local_err) {
        error_propagate(errp, local_err);
        ret = -EINVAL;
        goto fail_opts;
    }

    /* Defaults that are in place before the driver's open function runs */
    bs->request_alignment = 512;
    bs->zero_beyond_eof = true;
    bs->read_only = !(bs->open_flags & BDRV_O_RDWR);

    if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
        /* Tell the user whether opening read-only would have been allowed */
        error_setg(errp,
                   !bs->read_only && bdrv_is_whitelisted(drv, true)
                        ? "Driver '%s' can only be used for read-only devices"
                        : "Driver '%s' is not whitelisted",
                   drv->format_name);
        ret = -ENOTSUP;
        goto fail_opts;
    }

    assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
    if (bs->open_flags & BDRV_O_COPY_ON_READ) {
        if (!bs->read_only) {
            bdrv_enable_copy_on_read(bs);
        } else {
            error_setg(errp, "Can't use copy-on-read on read-only device");
            ret = -EINVAL;
            goto fail_opts;
        }
    }

    if (filename != NULL) {
        pstrcpy(bs->filename, sizeof(bs->filename), filename);
    } else {
        bs->filename[0] = '\0';
    }
    pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);

    /* From here on, failures must go through free_and_fail */
    bs->drv = drv;
    bs->opaque = g_malloc0(drv->instance_size);

    /* Apply cache mode options */
    update_flags_from_options(&bs->open_flags, opts);
    bdrv_set_enable_write_cache(bs, bs->open_flags & BDRV_O_CACHE_WB);

    /* Open the image, either directly or using a protocol */
    open_flags = bdrv_open_flags(bs, bs->open_flags);
    if (drv->bdrv_file_open) {
        assert(file == NULL);
        assert(!drv->bdrv_needs_filename || filename != NULL);
        ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
    } else {
        if (file == NULL) {
            error_setg(errp, "Can't use '%s' as a block driver for the "
                       "protocol level", drv->format_name);
            ret = -EINVAL;
            goto free_and_fail;
        }
        bs->file = file;
        ret = drv->bdrv_open(bs, options, open_flags, &local_err);
    }

    if (ret < 0) {
        /* Prefer the driver's own error, else build a generic message */
        if (local_err) {
            error_propagate(errp, local_err);
        } else if (bs->filename[0]) {
            error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
        } else {
            error_setg_errno(errp, -ret, "Could not open image");
        }
        goto free_and_fail;
    }

    if (bs->encrypted) {
        error_report("Encrypted images are deprecated");
        error_printf("Support for them will be removed in a future release.\n"
                     "You can use 'qemu-img convert' to convert your image"
                     " to an unencrypted one.\n");
    }

    ret = refresh_total_sectors(bs, bs->total_sectors);
    if (ret < 0) {
        error_setg_errno(errp, -ret, "Could not refresh total sector count");
        goto free_and_fail;
    }

    bdrv_refresh_limits(bs, &local_err);
    if (local_err) {
        error_propagate(errp, local_err);
        ret = -EINVAL;
        goto free_and_fail;
    }

    assert(bdrv_opt_mem_align(bs) != 0);
    assert(bdrv_min_mem_align(bs) != 0);
    assert((bs->request_alignment != 0) || bdrv_is_sg(bs));

    qemu_opts_del(opts);
    return 0;

free_and_fail:
    /* Undo the driver attachment; @file itself is not released here */
    bs->file = NULL;
    g_free(bs->opaque);
    bs->opaque = NULL;
    bs->drv = NULL;
fail_opts:
    qemu_opts_del(opts);
    return ret;
}
1043
1044 static QDict *parse_json_filename(const char *filename, Error **errp)
1045 {
1046 QObject *options_obj;
1047 QDict *options;
1048 int ret;
1049
1050 ret = strstart(filename, "json:", &filename);
1051 assert(ret);
1052
1053 options_obj = qobject_from_json(filename);
1054 if (!options_obj) {
1055 error_setg(errp, "Could not parse the JSON options");
1056 return NULL;
1057 }
1058
1059 if (qobject_type(options_obj) != QTYPE_QDICT) {
1060 qobject_decref(options_obj);
1061 error_setg(errp, "Invalid JSON object given");
1062 return NULL;
1063 }
1064
1065 options = qobject_to_qdict(options_obj);
1066 qdict_flatten(options);
1067
1068 return options;
1069 }
1070
1071 static void parse_json_protocol(QDict *options, const char **pfilename,
1072 Error **errp)
1073 {
1074 QDict *json_options;
1075 Error *local_err = NULL;
1076
1077 /* Parse json: pseudo-protocol */
1078 if (!*pfilename || !g_str_has_prefix(*pfilename, "json:")) {
1079 return;
1080 }
1081
1082 json_options = parse_json_filename(*pfilename, &local_err);
1083 if (local_err) {
1084 error_propagate(errp, local_err);
1085 return;
1086 }
1087
1088 /* Options given in the filename have lower priority than options
1089 * specified directly */
1090 qdict_join(options, json_options, false);
1091 QDECREF(json_options);
1092 *pfilename = NULL;
1093 }
1094
1095 /*
1096 * Fills in default options for opening images and converts the legacy
1097 * filename/flags pair to option QDict entries.
1098 * The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
1099 * block driver has been specified explicitly.
1100 */
1101 static int bdrv_fill_options(QDict **options, const char *filename,
1102 int *flags, Error **errp)
1103 {
1104 const char *drvname;
1105 bool protocol = *flags & BDRV_O_PROTOCOL;
1106 bool parse_filename = false;
1107 BlockDriver *drv = NULL;
1108 Error *local_err = NULL;
1109
1110 drvname = qdict_get_try_str(*options, "driver");
1111 if (drvname) {
1112 drv = bdrv_find_format(drvname);
1113 if (!drv) {
1114 error_setg(errp, "Unknown driver '%s'", drvname);
1115 return -ENOENT;
1116 }
1117 /* If the user has explicitly specified the driver, this choice should
1118 * override the BDRV_O_PROTOCOL flag */
1119 protocol = drv->bdrv_file_open;
1120 }
1121
1122 if (protocol) {
1123 *flags |= BDRV_O_PROTOCOL;
1124 } else {
1125 *flags &= ~BDRV_O_PROTOCOL;
1126 }
1127
1128 /* Translate cache options from flags into options */
1129 update_options_from_flags(*options, *flags);
1130
1131 /* Fetch the file name from the options QDict if necessary */
1132 if (protocol && filename) {
1133 if (!qdict_haskey(*options, "filename")) {
1134 qdict_put(*options, "filename", qstring_from_str(filename));
1135 parse_filename = true;
1136 } else {
1137 error_setg(errp, "Can't specify 'file' and 'filename' options at "
1138 "the same time");
1139 return -EINVAL;
1140 }
1141 }
1142
1143 /* Find the right block driver */
1144 filename = qdict_get_try_str(*options, "filename");
1145
1146 if (!drvname && protocol) {
1147 if (filename) {
1148 drv = bdrv_find_protocol(filename, parse_filename, errp);
1149 if (!drv) {
1150 return -EINVAL;
1151 }
1152
1153 drvname = drv->format_name;
1154 qdict_put(*options, "driver", qstring_from_str(drvname));
1155 } else {
1156 error_setg(errp, "Must specify either driver or file");
1157 return -EINVAL;
1158 }
1159 }
1160
1161 assert(drv || !protocol);
1162
1163 /* Driver-specific filename parsing */
1164 if (drv && drv->bdrv_parse_filename && parse_filename) {
1165 drv->bdrv_parse_filename(filename, *options, &local_err);
1166 if (local_err) {
1167 error_propagate(errp, local_err);
1168 return -EINVAL;
1169 }
1170
1171 if (!drv->bdrv_needs_filename) {
1172 qdict_del(*options, "filename");
1173 }
1174 }
1175
1176 return 0;
1177 }
1178
1179 BdrvChild *bdrv_root_attach_child(BlockDriverState *child_bs,
1180 const char *child_name,
1181 const BdrvChildRole *child_role)
1182 {
1183 BdrvChild *child = g_new(BdrvChild, 1);
1184 *child = (BdrvChild) {
1185 .bs = child_bs,
1186 .name = g_strdup(child_name),
1187 .role = child_role,
1188 };
1189
1190 QLIST_INSERT_HEAD(&child_bs->parents, child, next_parent);
1191
1192 return child;
1193 }
1194
1195 static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
1196 BlockDriverState *child_bs,
1197 const char *child_name,
1198 const BdrvChildRole *child_role)
1199 {
1200 BdrvChild *child = bdrv_root_attach_child(child_bs, child_name, child_role);
1201 QLIST_INSERT_HEAD(&parent_bs->children, child, next);
1202 return child;
1203 }
1204
1205 static void bdrv_detach_child(BdrvChild *child)
1206 {
1207 if (child->next.le_prev) {
1208 QLIST_REMOVE(child, next);
1209 child->next.le_prev = NULL;
1210 }
1211 QLIST_REMOVE(child, next_parent);
1212 g_free(child->name);
1213 g_free(child);
1214 }
1215
1216 void bdrv_root_unref_child(BdrvChild *child)
1217 {
1218 BlockDriverState *child_bs;
1219
1220 child_bs = child->bs;
1221 bdrv_detach_child(child);
1222 bdrv_unref(child_bs);
1223 }
1224
1225 void bdrv_unref_child(BlockDriverState *parent, BdrvChild *child)
1226 {
1227 if (child == NULL) {
1228 return;
1229 }
1230
1231 if (child->bs->inherits_from == parent) {
1232 child->bs->inherits_from = NULL;
1233 }
1234
1235 bdrv_root_unref_child(child);
1236 }
1237
1238 /*
1239 * Sets the backing file link of a BDS. A new reference is created; callers
1240 * which don't need their own reference any more must call bdrv_unref().
1241 */
1242 void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
1243 {
1244 if (backing_hd) {
1245 bdrv_ref(backing_hd);
1246 }
1247
1248 if (bs->backing) {
1249 assert(bs->backing_blocker);
1250 bdrv_op_unblock_all(bs->backing->bs, bs->backing_blocker);
1251 bdrv_unref_child(bs, bs->backing);
1252 } else if (backing_hd) {
1253 error_setg(&bs->backing_blocker,
1254 "node is used as backing hd of '%s'",
1255 bdrv_get_device_or_node_name(bs));
1256 }
1257
1258 if (!backing_hd) {
1259 error_free(bs->backing_blocker);
1260 bs->backing_blocker = NULL;
1261 bs->backing = NULL;
1262 goto out;
1263 }
1264 bs->backing = bdrv_attach_child(bs, backing_hd, "backing", &child_backing);
1265 bs->open_flags &= ~BDRV_O_NO_BACKING;
1266 pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
1267 pstrcpy(bs->backing_format, sizeof(bs->backing_format),
1268 backing_hd->drv ? backing_hd->drv->format_name : "");
1269
1270 bdrv_op_block_all(backing_hd, bs->backing_blocker);
1271 /* Otherwise we won't be able to commit due to check in bdrv_commit */
1272 bdrv_op_unblock(backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
1273 bs->backing_blocker);
1274 out:
1275 bdrv_refresh_limits(bs, NULL);
1276 }
1277
1278 /*
1279 * Opens the backing file for a BlockDriverState if not yet open
1280 *
1281 * bdref_key specifies the key for the image's BlockdevRef in the options QDict.
1282 * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1283 * itself, all options starting with "${bdref_key}." are considered part of the
1284 * BlockdevRef.
1285 *
1286 * TODO Can this be unified with bdrv_open_image()?
1287 */
1288 int bdrv_open_backing_file(BlockDriverState *bs, QDict *parent_options,
1289 const char *bdref_key, Error **errp)
1290 {
1291 char *backing_filename = g_malloc0(PATH_MAX);
1292 char *bdref_key_dot;
1293 const char *reference = NULL;
1294 int ret = 0;
1295 BlockDriverState *backing_hd;
1296 QDict *options;
1297 QDict *tmp_parent_options = NULL;
1298 Error *local_err = NULL;
1299
1300 if (bs->backing != NULL) {
1301 goto free_exit;
1302 }
1303
1304 /* NULL means an empty set of options */
1305 if (parent_options == NULL) {
1306 tmp_parent_options = qdict_new();
1307 parent_options = tmp_parent_options;
1308 }
1309
1310 bs->open_flags &= ~BDRV_O_NO_BACKING;
1311
1312 bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1313 qdict_extract_subqdict(parent_options, &options, bdref_key_dot);
1314 g_free(bdref_key_dot);
1315
1316 reference = qdict_get_try_str(parent_options, bdref_key);
1317 if (reference || qdict_haskey(options, "file.filename")) {
1318 backing_filename[0] = '\0';
1319 } else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
1320 QDECREF(options);
1321 goto free_exit;
1322 } else {
1323 bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
1324 &local_err);
1325 if (local_err) {
1326 ret = -EINVAL;
1327 error_propagate(errp, local_err);
1328 QDECREF(options);
1329 goto free_exit;
1330 }
1331 }
1332
1333 if (!bs->drv || !bs->drv->supports_backing) {
1334 ret = -EINVAL;
1335 error_setg(errp, "Driver doesn't support backing files");
1336 QDECREF(options);
1337 goto free_exit;
1338 }
1339
1340 if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
1341 qdict_put(options, "driver", qstring_from_str(bs->backing_format));
1342 }
1343
1344 backing_hd = NULL;
1345 ret = bdrv_open_inherit(&backing_hd,
1346 *backing_filename ? backing_filename : NULL,
1347 reference, options, 0, bs, &child_backing,
1348 errp);
1349 if (ret < 0) {
1350 bs->open_flags |= BDRV_O_NO_BACKING;
1351 error_prepend(errp, "Could not open backing file: ");
1352 goto free_exit;
1353 }
1354
1355 /* Hook up the backing file link; drop our reference, bs owns the
1356 * backing_hd reference now */
1357 bdrv_set_backing_hd(bs, backing_hd);
1358 bdrv_unref(backing_hd);
1359
1360 qdict_del(parent_options, bdref_key);
1361
1362 free_exit:
1363 g_free(backing_filename);
1364 QDECREF(tmp_parent_options);
1365 return ret;
1366 }
1367
1368 /*
1369 * Opens a disk image whose options are given as BlockdevRef in another block
1370 * device's options.
1371 *
1372 * If allow_none is true, no image will be opened if filename is false and no
1373 * BlockdevRef is given. NULL will be returned, but errp remains unset.
1374 *
1375 * bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
1376 * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1377 * itself, all options starting with "${bdref_key}." are considered part of the
1378 * BlockdevRef.
1379 *
1380 * The BlockdevRef will be removed from the options QDict.
1381 */
1382 BdrvChild *bdrv_open_child(const char *filename,
1383 QDict *options, const char *bdref_key,
1384 BlockDriverState* parent,
1385 const BdrvChildRole *child_role,
1386 bool allow_none, Error **errp)
1387 {
1388 BdrvChild *c = NULL;
1389 BlockDriverState *bs;
1390 QDict *image_options;
1391 int ret;
1392 char *bdref_key_dot;
1393 const char *reference;
1394
1395 assert(child_role != NULL);
1396
1397 bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1398 qdict_extract_subqdict(options, &image_options, bdref_key_dot);
1399 g_free(bdref_key_dot);
1400
1401 reference = qdict_get_try_str(options, bdref_key);
1402 if (!filename && !reference && !qdict_size(image_options)) {
1403 if (!allow_none) {
1404 error_setg(errp, "A block device must be specified for \"%s\"",
1405 bdref_key);
1406 }
1407 QDECREF(image_options);
1408 goto done;
1409 }
1410
1411 bs = NULL;
1412 ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
1413 parent, child_role, errp);
1414 if (ret < 0) {
1415 goto done;
1416 }
1417
1418 c = bdrv_attach_child(parent, bs, bdref_key, child_role);
1419
1420 done:
1421 qdict_del(options, bdref_key);
1422 return c;
1423 }
1424
1425 static int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags,
1426 QDict *snapshot_options, Error **errp)
1427 {
1428 /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
1429 char *tmp_filename = g_malloc0(PATH_MAX + 1);
1430 int64_t total_size;
1431 QemuOpts *opts = NULL;
1432 BlockDriverState *bs_snapshot;
1433 Error *local_err = NULL;
1434 int ret;
1435
1436 /* if snapshot, we create a temporary backing file and open it
1437 instead of opening 'filename' directly */
1438
1439 /* Get the required size from the image */
1440 total_size = bdrv_getlength(bs);
1441 if (total_size < 0) {
1442 ret = total_size;
1443 error_setg_errno(errp, -total_size, "Could not get image size");
1444 goto out;
1445 }
1446
1447 /* Create the temporary image */
1448 ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
1449 if (ret < 0) {
1450 error_setg_errno(errp, -ret, "Could not get temporary filename");
1451 goto out;
1452 }
1453
1454 opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
1455 &error_abort);
1456 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
1457 ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, errp);
1458 qemu_opts_del(opts);
1459 if (ret < 0) {
1460 error_prepend(errp, "Could not create temporary overlay '%s': ",
1461 tmp_filename);
1462 goto out;
1463 }
1464
1465 /* Prepare options QDict for the temporary file */
1466 qdict_put(snapshot_options, "file.driver",
1467 qstring_from_str("file"));
1468 qdict_put(snapshot_options, "file.filename",
1469 qstring_from_str(tmp_filename));
1470 qdict_put(snapshot_options, "driver",
1471 qstring_from_str("qcow2"));
1472
1473 bs_snapshot = bdrv_new();
1474
1475 ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
1476 flags, &local_err);
1477 snapshot_options = NULL;
1478 if (ret < 0) {
1479 error_propagate(errp, local_err);
1480 goto out;
1481 }
1482
1483 bdrv_append(bs_snapshot, bs);
1484
1485 out:
1486 QDECREF(snapshot_options);
1487 g_free(tmp_filename);
1488 return ret;
1489 }
1490
1491 /*
1492 * Opens a disk image (raw, qcow2, vmdk, ...)
1493 *
1494 * options is a QDict of options to pass to the block drivers, or NULL for an
1495 * empty set of options. The reference to the QDict belongs to the block layer
1496 * after the call (even on failure), so if the caller intends to reuse the
1497 * dictionary, it needs to use QINCREF() before calling bdrv_open.
1498 *
1499 * If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
1500 * If it is not NULL, the referenced BDS will be reused.
1501 *
1502 * The reference parameter may be used to specify an existing block device which
1503 * should be opened. If specified, neither options nor a filename may be given,
1504 * nor can an existing BDS be reused (that is, *pbs has to be NULL).
1505 */
1506 static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
1507 const char *reference, QDict *options, int flags,
1508 BlockDriverState *parent,
1509 const BdrvChildRole *child_role, Error **errp)
1510 {
1511 int ret;
1512 BdrvChild *file = NULL;
1513 BlockDriverState *bs;
1514 BlockDriver *drv = NULL;
1515 const char *drvname;
1516 const char *backing;
1517 Error *local_err = NULL;
1518 QDict *snapshot_options = NULL;
1519 int snapshot_flags = 0;
1520
1521 assert(pbs);
1522 assert(!child_role || !flags);
1523 assert(!child_role == !parent);
1524
1525 if (reference) {
1526 bool options_non_empty = options ? qdict_size(options) : false;
1527 QDECREF(options);
1528
1529 if (*pbs) {
1530 error_setg(errp, "Cannot reuse an existing BDS when referencing "
1531 "another block device");
1532 return -EINVAL;
1533 }
1534
1535 if (filename || options_non_empty) {
1536 error_setg(errp, "Cannot reference an existing block device with "
1537 "additional options or a new filename");
1538 return -EINVAL;
1539 }
1540
1541 bs = bdrv_lookup_bs(reference, reference, errp);
1542 if (!bs) {
1543 return -ENODEV;
1544 }
1545 bdrv_ref(bs);
1546 *pbs = bs;
1547 return 0;
1548 }
1549
1550 if (*pbs) {
1551 bs = *pbs;
1552 } else {
1553 bs = bdrv_new();
1554 }
1555
1556 /* NULL means an empty set of options */
1557 if (options == NULL) {
1558 options = qdict_new();
1559 }
1560
1561 /* json: syntax counts as explicit options, as if in the QDict */
1562 parse_json_protocol(options, &filename, &local_err);
1563 if (local_err) {
1564 ret = -EINVAL;
1565 goto fail;
1566 }
1567
1568 bs->explicit_options = qdict_clone_shallow(options);
1569
1570 if (child_role) {
1571 bs->inherits_from = parent;
1572 child_role->inherit_options(&flags, options,
1573 parent->open_flags, parent->options);
1574 }
1575
1576 ret = bdrv_fill_options(&options, filename, &flags, &local_err);
1577 if (local_err) {
1578 goto fail;
1579 }
1580
1581 bs->open_flags = flags;
1582 bs->options = options;
1583 options = qdict_clone_shallow(options);
1584
1585 /* Find the right image format driver */
1586 drvname = qdict_get_try_str(options, "driver");
1587 if (drvname) {
1588 drv = bdrv_find_format(drvname);
1589 if (!drv) {
1590 error_setg(errp, "Unknown driver: '%s'", drvname);
1591 ret = -EINVAL;
1592 goto fail;
1593 }
1594 }
1595
1596 assert(drvname || !(flags & BDRV_O_PROTOCOL));
1597
1598 backing = qdict_get_try_str(options, "backing");
1599 if (backing && *backing == '\0') {
1600 flags |= BDRV_O_NO_BACKING;
1601 qdict_del(options, "backing");
1602 }
1603
1604 /* Open image file without format layer */
1605 if ((flags & BDRV_O_PROTOCOL) == 0) {
1606 if (flags & BDRV_O_RDWR) {
1607 flags |= BDRV_O_ALLOW_RDWR;
1608 }
1609 if (flags & BDRV_O_SNAPSHOT) {
1610 snapshot_options = qdict_new();
1611 bdrv_temp_snapshot_options(&snapshot_flags, snapshot_options,
1612 flags, options);
1613 bdrv_backing_options(&flags, options, flags, options);
1614 }
1615
1616 bs->open_flags = flags;
1617
1618 file = bdrv_open_child(filename, options, "file", bs,
1619 &child_file, true, &local_err);
1620 if (local_err) {
1621 ret = -EINVAL;
1622 goto fail;
1623 }
1624 }
1625
1626 /* Image format probing */
1627 bs->probed = !drv;
1628 if (!drv && file) {
1629 ret = find_image_format(file->bs, filename, &drv, &local_err);
1630 if (ret < 0) {
1631 goto fail;
1632 }
1633 /*
1634 * This option update would logically belong in bdrv_fill_options(),
1635 * but we first need to open bs->file for the probing to work, while
1636 * opening bs->file already requires the (mostly) final set of options
1637 * so that cache mode etc. can be inherited.
1638 *
1639 * Adding the driver later is somewhat ugly, but it's not an option
1640 * that would ever be inherited, so it's correct. We just need to make
1641 * sure to update both bs->options (which has the full effective
1642 * options for bs) and options (which has file.* already removed).
1643 */
1644 qdict_put(bs->options, "driver", qstring_from_str(drv->format_name));
1645 qdict_put(options, "driver", qstring_from_str(drv->format_name));
1646 } else if (!drv) {
1647 error_setg(errp, "Must specify either driver or file");
1648 ret = -EINVAL;
1649 goto fail;
1650 }
1651
1652 /* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
1653 assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
1654 /* file must be NULL if a protocol BDS is about to be created
1655 * (the inverse results in an error message from bdrv_open_common()) */
1656 assert(!(flags & BDRV_O_PROTOCOL) || !file);
1657
1658 /* Open the image */
1659 ret = bdrv_open_common(bs, file, options, &local_err);
1660 if (ret < 0) {
1661 goto fail;
1662 }
1663
1664 if (file && (bs->file != file)) {
1665 bdrv_unref_child(bs, file);
1666 file = NULL;
1667 }
1668
1669 /* If there is a backing file, use it */
1670 if ((flags & BDRV_O_NO_BACKING) == 0) {
1671 ret = bdrv_open_backing_file(bs, options, "backing", &local_err);
1672 if (ret < 0) {
1673 goto close_and_fail;
1674 }
1675 }
1676
1677 bdrv_refresh_filename(bs);
1678
1679 /* Check if any unknown options were used */
1680 if (options && (qdict_size(options) != 0)) {
1681 const QDictEntry *entry = qdict_first(options);
1682 if (flags & BDRV_O_PROTOCOL) {
1683 error_setg(errp, "Block protocol '%s' doesn't support the option "
1684 "'%s'", drv->format_name, entry->key);
1685 } else {
1686 error_setg(errp,
1687 "Block format '%s' does not support the option '%s'",
1688 drv->format_name, entry->key);
1689 }
1690
1691 ret = -EINVAL;
1692 goto close_and_fail;
1693 }
1694
1695 if (!bdrv_key_required(bs)) {
1696 if (bs->blk) {
1697 blk_dev_change_media_cb(bs->blk, true);
1698 }
1699 } else if (!runstate_check(RUN_STATE_PRELAUNCH)
1700 && !runstate_check(RUN_STATE_INMIGRATE)
1701 && !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
1702 error_setg(errp,
1703 "Guest must be stopped for opening of encrypted image");
1704 ret = -EBUSY;
1705 goto close_and_fail;
1706 }
1707
1708 QDECREF(options);
1709 *pbs = bs;
1710
1711 /* For snapshot=on, create a temporary qcow2 overlay. bs points to the
1712 * temporary snapshot afterwards. */
1713 if (snapshot_flags) {
1714 ret = bdrv_append_temp_snapshot(bs, snapshot_flags, snapshot_options,
1715 &local_err);
1716 snapshot_options = NULL;
1717 if (local_err) {
1718 goto close_and_fail;
1719 }
1720 }
1721
1722 return 0;
1723
1724 fail:
1725 if (file != NULL) {
1726 bdrv_unref_child(bs, file);
1727 }
1728 QDECREF(snapshot_options);
1729 QDECREF(bs->explicit_options);
1730 QDECREF(bs->options);
1731 QDECREF(options);
1732 bs->options = NULL;
1733 if (!*pbs) {
1734 /* If *pbs is NULL, a new BDS has been created in this function and
1735 needs to be freed now. Otherwise, it does not need to be closed,
1736 since it has not really been opened yet. */
1737 bdrv_unref(bs);
1738 }
1739 if (local_err) {
1740 error_propagate(errp, local_err);
1741 }
1742 return ret;
1743
1744 close_and_fail:
1745 /* See fail path, but now the BDS has to be always closed */
1746 if (*pbs) {
1747 bdrv_close(bs);
1748 } else {
1749 bdrv_unref(bs);
1750 }
1751 QDECREF(snapshot_options);
1752 QDECREF(options);
1753 if (local_err) {
1754 error_propagate(errp, local_err);
1755 }
1756 return ret;
1757 }
1758
1759 int bdrv_open(BlockDriverState **pbs, const char *filename,
1760 const char *reference, QDict *options, int flags, Error **errp)
1761 {
1762 return bdrv_open_inherit(pbs, filename, reference, options, flags, NULL,
1763 NULL, errp);
1764 }
1765
/* One element of a BlockReopenQueue: the pending reopen of a single node */
typedef struct BlockReopenQueueEntry {
    /* Set by bdrv_reopen_multiple() once bdrv_reopen_prepare() succeeded */
    bool prepared;
    /* Node to reopen together with its staged options and flags */
    BDRVReopenState state;
    /* Linkage within the queue */
    QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
} BlockReopenQueueEntry;
1771
1772 /*
1773 * Adds a BlockDriverState to a simple queue for an atomic, transactional
1774 * reopen of multiple devices.
1775 *
1776 * bs_queue can either be an existing BlockReopenQueue that has had QSIMPLE_INIT
1777 * already performed, or alternatively may be NULL a new BlockReopenQueue will
1778 * be created and initialized. This newly created BlockReopenQueue should be
1779 * passed back in for subsequent calls that are intended to be of the same
1780 * atomic 'set'.
1781 *
1782 * bs is the BlockDriverState to add to the reopen queue.
1783 *
1784 * options contains the changed options for the associated bs
1785 * (the BlockReopenQueue takes ownership)
1786 *
1787 * flags contains the open flags for the associated bs
1788 *
1789 * returns a pointer to bs_queue, which is either the newly allocated
1790 * bs_queue, or the existing bs_queue being used.
1791 *
1792 */
1793 static BlockReopenQueue *bdrv_reopen_queue_child(BlockReopenQueue *bs_queue,
1794 BlockDriverState *bs,
1795 QDict *options,
1796 int flags,
1797 const BdrvChildRole *role,
1798 QDict *parent_options,
1799 int parent_flags)
1800 {
1801 assert(bs != NULL);
1802
1803 BlockReopenQueueEntry *bs_entry;
1804 BdrvChild *child;
1805 QDict *old_options, *explicit_options;
1806
1807 if (bs_queue == NULL) {
1808 bs_queue = g_new0(BlockReopenQueue, 1);
1809 QSIMPLEQ_INIT(bs_queue);
1810 }
1811
1812 if (!options) {
1813 options = qdict_new();
1814 }
1815
1816 /*
1817 * Precedence of options:
1818 * 1. Explicitly passed in options (highest)
1819 * 2. Set in flags (only for top level)
1820 * 3. Retained from explicitly set options of bs
1821 * 4. Inherited from parent node
1822 * 5. Retained from effective options of bs
1823 */
1824
1825 if (!parent_options) {
1826 /*
1827 * Any setting represented by flags is always updated. If the
1828 * corresponding QDict option is set, it takes precedence. Otherwise
1829 * the flag is translated into a QDict option. The old setting of bs is
1830 * not considered.
1831 */
1832 update_options_from_flags(options, flags);
1833 }
1834
1835 /* Old explicitly set values (don't overwrite by inherited value) */
1836 old_options = qdict_clone_shallow(bs->explicit_options);
1837 bdrv_join_options(bs, options, old_options);
1838 QDECREF(old_options);
1839
1840 explicit_options = qdict_clone_shallow(options);
1841
1842 /* Inherit from parent node */
1843 if (parent_options) {
1844 assert(!flags);
1845 role->inherit_options(&flags, options, parent_flags, parent_options);
1846 }
1847
1848 /* Old values are used for options that aren't set yet */
1849 old_options = qdict_clone_shallow(bs->options);
1850 bdrv_join_options(bs, options, old_options);
1851 QDECREF(old_options);
1852
1853 /* bdrv_open() masks this flag out */
1854 flags &= ~BDRV_O_PROTOCOL;
1855
1856 QLIST_FOREACH(child, &bs->children, next) {
1857 QDict *new_child_options;
1858 char *child_key_dot;
1859
1860 /* reopen can only change the options of block devices that were
1861 * implicitly created and inherited options. For other (referenced)
1862 * block devices, a syntax like "backing.foo" results in an error. */
1863 if (child->bs->inherits_from != bs) {
1864 continue;
1865 }
1866
1867 child_key_dot = g_strdup_printf("%s.", child->name);
1868 qdict_extract_subqdict(options, &new_child_options, child_key_dot);
1869 g_free(child_key_dot);
1870
1871 bdrv_reopen_queue_child(bs_queue, child->bs, new_child_options, 0,
1872 child->role, options, flags);
1873 }
1874
1875 bs_entry = g_new0(BlockReopenQueueEntry, 1);
1876 QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
1877
1878 bs_entry->state.bs = bs;
1879 bs_entry->state.options = options;
1880 bs_entry->state.explicit_options = explicit_options;
1881 bs_entry->state.flags = flags;
1882
1883 return bs_queue;
1884 }
1885
1886 BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
1887 BlockDriverState *bs,
1888 QDict *options, int flags)
1889 {
1890 return bdrv_reopen_queue_child(bs_queue, bs, options, flags,
1891 NULL, NULL, 0);
1892 }
1893
1894 /*
1895 * Reopen multiple BlockDriverStates atomically & transactionally.
1896 *
1897 * The queue passed in (bs_queue) must have been built up previous
1898 * via bdrv_reopen_queue().
1899 *
1900 * Reopens all BDS specified in the queue, with the appropriate
1901 * flags. All devices are prepared for reopen, and failure of any
1902 * device will cause all device changes to be abandonded, and intermediate
1903 * data cleaned up.
1904 *
1905 * If all devices prepare successfully, then the changes are committed
1906 * to all devices.
1907 *
1908 */
1909 int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
1910 {
1911 int ret = -1;
1912 BlockReopenQueueEntry *bs_entry, *next;
1913 Error *local_err = NULL;
1914
1915 assert(bs_queue != NULL);
1916
1917 bdrv_drain_all();
1918
1919 QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1920 if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
1921 error_propagate(errp, local_err);
1922 goto cleanup;
1923 }
1924 bs_entry->prepared = true;
1925 }
1926
1927 /* If we reach this point, we have success and just need to apply the
1928 * changes
1929 */
1930 QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1931 bdrv_reopen_commit(&bs_entry->state);
1932 }
1933
1934 ret = 0;
1935
1936 cleanup:
1937 QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
1938 if (ret && bs_entry->prepared) {
1939 bdrv_reopen_abort(&bs_entry->state);
1940 } else if (ret) {
1941 QDECREF(bs_entry->state.explicit_options);
1942 }
1943 QDECREF(bs_entry->state.options);
1944 g_free(bs_entry);
1945 }
1946 g_free(bs_queue);
1947 return ret;
1948 }
1949
1950
1951 /* Reopen a single BlockDriverState with the specified flags. */
1952 int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
1953 {
1954 int ret = -1;
1955 Error *local_err = NULL;
1956 BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, NULL, bdrv_flags);
1957
1958 ret = bdrv_reopen_multiple(queue, &local_err);
1959 if (local_err != NULL) {
1960 error_propagate(errp, local_err);
1961 }
1962 return ret;
1963 }
1964
1965
1966 /*
1967 * Prepares a BlockDriverState for reopen. All changes are staged in the
1968 * 'opaque' field of the BDRVReopenState, which is used and allocated by
1969 * the block driver layer .bdrv_reopen_prepare()
1970 *
1971 * bs is the BlockDriverState to reopen
1972 * flags are the new open flags
1973 * queue is the reopen queue
1974 *
1975 * Returns 0 on success, non-zero on error. On error errp will be set
1976 * as well.
1977 *
1978 * On failure, bdrv_reopen_abort() will be called to clean up any data.
1979 * It is the responsibility of the caller to then call the abort() or
1980 * commit() for any other BDS that have been left in a prepare() state
1981 *
1982 */
1983 int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
1984 Error **errp)
1985 {
1986 int ret = -1;
1987 Error *local_err = NULL;
1988 BlockDriver *drv;
1989 QemuOpts *opts;
1990 const char *value;
1991
1992 assert(reopen_state != NULL);
1993 assert(reopen_state->bs->drv != NULL);
1994 drv = reopen_state->bs->drv;
1995
1996 /* Process generic block layer options */
1997 opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
1998 qemu_opts_absorb_qdict(opts, reopen_state->options, &local_err);
1999 if (local_err) {
2000 error_propagate(errp, local_err);
2001 ret = -EINVAL;
2002 goto error;
2003 }
2004
2005 update_flags_from_options(&reopen_state->flags, opts);
2006
2007 /* If a guest device is attached, it owns WCE */
2008 if (reopen_state->bs->blk && blk_get_attached_dev(reopen_state->bs->blk)) {
2009 bool old_wce = bdrv_enable_write_cache(reopen_state->bs);
2010 bool new_wce = (reopen_state->flags & BDRV_O_CACHE_WB);
2011 if (old_wce != new_wce) {
2012 error_setg(errp, "Cannot change cache.writeback: Device attached");
2013 ret = -EINVAL;
2014 goto error;
2015 }
2016 }
2017
2018 /* node-name and driver must be unchanged. Put them back into the QDict, so
2019 * that they are checked at the end of this function. */
2020 value = qemu_opt_get(opts, "node-name");
2021 if (value) {
2022 qdict_put(reopen_state->options, "node-name", qstring_from_str(value));
2023 }
2024
2025 value = qemu_opt_get(opts, "driver");
2026 if (value) {
2027 qdict_put(reopen_state->options, "driver", qstring_from_str(value));
2028 }
2029
2030 /* if we are to stay read-only, do not allow permission change
2031 * to r/w */
2032 if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
2033 reopen_state->flags & BDRV_O_RDWR) {
2034 error_setg(errp, "Node '%s' is read only",
2035 bdrv_get_device_or_node_name(reopen_state->bs));
2036 goto error;
2037 }
2038
2039
2040 ret = bdrv_flush(reopen_state->bs);
2041 if (ret) {
2042 error_setg_errno(errp, -ret, "Error flushing drive");
2043 goto error;
2044 }
2045
2046 if (drv->bdrv_reopen_prepare) {
2047 ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
2048 if (ret) {
2049 if (local_err != NULL) {
2050 error_propagate(errp, local_err);
2051 } else {
2052 error_setg(errp, "failed while preparing to reopen image '%s'",
2053 reopen_state->bs->filename);
2054 }
2055 goto error;
2056 }
2057 } else {
2058 /* It is currently mandatory to have a bdrv_reopen_prepare()
2059 * handler for each supported drv. */
2060 error_setg(errp, "Block format '%s' used by node '%s' "
2061 "does not support reopening files", drv->format_name,
2062 bdrv_get_device_or_node_name(reopen_state->bs));
2063 ret = -1;
2064 goto error;
2065 }
2066
2067 /* Options that are not handled are only okay if they are unchanged
2068 * compared to the old state. It is expected that some options are only
2069 * used for the initial open, but not reopen (e.g. filename) */
2070 if (qdict_size(reopen_state->options)) {
2071 const QDictEntry *entry = qdict_first(reopen_state->options);
2072
2073 do {
2074 QString *new_obj = qobject_to_qstring(entry->value);
2075 const char *new = qstring_get_str(new_obj);
2076 const char *old = qdict_get_try_str(reopen_state->bs->options,
2077 entry->key);
2078
2079 if (!old || strcmp(new, old)) {
2080 error_setg(errp, "Cannot change the option '%s'", entry->key);
2081 ret = -EINVAL;
2082 goto error;
2083 }
2084 } while ((entry = qdict_next(reopen_state->options, entry)));
2085 }
2086
2087 ret = 0;
2088
2089 error:
2090 qemu_opts_del(opts);
2091 return ret;
2092 }
2093
2094 /*
2095 * Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
2096 * makes them final by swapping the staging BlockDriverState contents into
2097 * the active BlockDriverState contents.
2098 */
2099 void bdrv_reopen_commit(BDRVReopenState *reopen_state)
2100 {
2101 BlockDriver *drv;
2102
2103 assert(reopen_state != NULL);
2104 drv = reopen_state->bs->drv;
2105 assert(drv != NULL);
2106
2107 /* If there are any driver level actions to take */
2108 if (drv->bdrv_reopen_commit) {
2109 drv->bdrv_reopen_commit(reopen_state);
2110 }
2111
2112 /* set BDS specific flags now */
2113 QDECREF(reopen_state->bs->explicit_options);
2114
2115 reopen_state->bs->explicit_options = reopen_state->explicit_options;
2116 reopen_state->bs->open_flags = reopen_state->flags;
2117 reopen_state->bs->enable_write_cache = !!(reopen_state->flags &
2118 BDRV_O_CACHE_WB);
2119 reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
2120
2121 bdrv_refresh_limits(reopen_state->bs, NULL);
2122 }
2123
2124 /*
2125 * Abort the reopen, and delete and free the staged changes in
2126 * reopen_state
2127 */
2128 void bdrv_reopen_abort(BDRVReopenState *reopen_state)
2129 {
2130 BlockDriver *drv;
2131
2132 assert(reopen_state != NULL);
2133 drv = reopen_state->bs->drv;
2134 assert(drv != NULL);
2135
2136 if (drv->bdrv_reopen_abort) {
2137 drv->bdrv_reopen_abort(reopen_state);
2138 }
2139
2140 QDECREF(reopen_state->explicit_options);
2141 }
2142
2143
2144 static void bdrv_close(BlockDriverState *bs)
2145 {
2146 BdrvAioNotifier *ban, *ban_next;
2147
2148 assert(!bs->job);
2149
2150 /* Disable I/O limits and drain all pending throttled requests */
2151 if (bs->throttle_state) {
2152 bdrv_io_limits_disable(bs);
2153 }
2154
2155 bdrv_drained_begin(bs); /* complete I/O */
2156 bdrv_flush(bs);
2157 bdrv_drain(bs); /* in case flush left pending I/O */
2158
2159 bdrv_release_named_dirty_bitmaps(bs);
2160 assert(QLIST_EMPTY(&bs->dirty_bitmaps));
2161
2162 if (bs->blk) {
2163 blk_dev_change_media_cb(bs->blk, false);
2164 }
2165
2166 if (bs->drv) {
2167 BdrvChild *child, *next;
2168
2169 bs->drv->bdrv_close(bs);
2170 bs->drv = NULL;
2171
2172 bdrv_set_backing_hd(bs, NULL);
2173
2174 if (bs->file != NULL) {
2175 bdrv_unref_child(bs, bs->file);
2176 bs->file = NULL;
2177 }
2178
2179 QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
2180 /* TODO Remove bdrv_unref() from drivers' close function and use
2181 * bdrv_unref_child() here */
2182 if (child->bs->inherits_from == bs) {
2183 child->bs->inherits_from = NULL;
2184 }
2185 bdrv_detach_child(child);
2186 }
2187
2188 g_free(bs->opaque);
2189 bs->opaque = NULL;
2190 bs->copy_on_read = 0;
2191 bs->backing_file[0] = '\0';
2192 bs->backing_format[0] = '\0';
2193 bs->total_sectors = 0;
2194 bs->encrypted = 0;
2195 bs->valid_key = 0;
2196 bs->sg = 0;
2197 bs->zero_beyond_eof = false;
2198 QDECREF(bs->options);
2199 QDECREF(bs->explicit_options);
2200 bs->options = NULL;
2201 QDECREF(bs->full_open_options);
2202 bs->full_open_options = NULL;
2203 }
2204
2205 QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
2206 g_free(ban);
2207 }
2208 QLIST_INIT(&bs->aio_notifiers);
2209 bdrv_drained_end(bs);
2210 }
2211
2212 void bdrv_close_all(void)
2213 {
2214 BlockDriverState *bs;
2215 AioContext *aio_context;
2216
2217 /* Drop references from requests still in flight, such as canceled block
2218 * jobs whose AIO context has not been polled yet */
2219 bdrv_drain_all();
2220
2221 blk_remove_all_bs();
2222 blockdev_close_all_bdrv_states();
2223
2224 /* Cancel all block jobs */
2225 while (!QTAILQ_EMPTY(&all_bdrv_states)) {
2226 QTAILQ_FOREACH(bs, &all_bdrv_states, bs_list) {
2227 aio_context = bdrv_get_aio_context(bs);
2228
2229 aio_context_acquire(aio_context);
2230 if (bs->job) {
2231 block_job_cancel_sync(bs->job);
2232 aio_context_release(aio_context);
2233 break;
2234 }
2235 aio_context_release(aio_context);
2236 }
2237
2238 /* All the remaining BlockDriverStates are referenced directly or
2239 * indirectly from block jobs, so there needs to be at least one BDS
2240 * directly used by a block job */
2241 assert(bs);
2242 }
2243 }
2244
2245 /* Fields that need to stay with the top-level BDS */
2246 static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
2247 BlockDriverState *bs_src)
2248 {
2249 /* move some fields that need to stay attached to the device */
2250
2251 /* dev info */
2252 bs_dest->copy_on_read = bs_src->copy_on_read;
2253
2254 bs_dest->enable_write_cache = bs_src->enable_write_cache;
2255
2256 /* dirty bitmap */
2257 bs_dest->dirty_bitmaps = bs_src->dirty_bitmaps;
2258 }
2259
2260 static void change_parent_backing_link(BlockDriverState *from,
2261 BlockDriverState *to)
2262 {
2263 BdrvChild *c, *next;
2264
2265 if (from->blk) {
2266 /* FIXME We bypass blk_set_bs(), so we need to make these updates
2267 * manually. The root problem is not in this change function, but the
2268 * existence of BlockDriverState.blk. */
2269 to->blk = from->blk;
2270 from->blk = NULL;
2271 }
2272
2273 QLIST_FOREACH_SAFE(c, &from->parents, next_parent, next) {
2274 assert(c->role != &child_backing);
2275 c->bs = to;
2276 QLIST_REMOVE(c, next_parent);
2277 QLIST_INSERT_HEAD(&to->parents, c, next_parent);
2278 bdrv_ref(to);
2279 bdrv_unref(from);
2280 }
2281 }
2282
2283 static void swap_feature_fields(BlockDriverState *bs_top,
2284 BlockDriverState *bs_new)
2285 {
2286 BlockDriverState tmp;
2287
2288 bdrv_move_feature_fields(&tmp, bs_top);
2289 bdrv_move_feature_fields(bs_top, bs_new);
2290 bdrv_move_feature_fields(bs_new, &tmp);
2291
2292 assert(!bs_new->throttle_state);
2293 if (bs_top->throttle_state) {
2294 assert(bs_top->io_limits_enabled);
2295 bdrv_io_limits_enable(bs_new, throttle_group_get_name(bs_top));
2296 bdrv_io_limits_disable(bs_top);
2297 }
2298 }
2299
2300 /*
2301 * Add new bs contents at the top of an image chain while the chain is
2302 * live, while keeping required fields on the top layer.
2303 *
2304 * This will modify the BlockDriverState fields, and swap contents
2305 * between bs_new and bs_top. Both bs_new and bs_top are modified.
2306 *
2307 * bs_new must not be attached to a BlockBackend.
2308 *
2309 * This function does not create any image files.
2310 *
2311 * bdrv_append() takes ownership of a bs_new reference and unrefs it because
2312 * that's what the callers commonly need. bs_new will be referenced by the old
2313 * parents of bs_top after bdrv_append() returns. If the caller needs to keep a
2314 * reference of its own, it must call bdrv_ref().
2315 */
2316 void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
2317 {
2318 assert(!bdrv_requests_pending(bs_top));
2319 assert(!bdrv_requests_pending(bs_new));
2320
2321 bdrv_ref(bs_top);
2322 change_parent_backing_link(bs_top, bs_new);
2323
2324 /* Some fields always stay on top of the backing file chain */
2325 swap_feature_fields(bs_top, bs_new);
2326
2327 bdrv_set_backing_hd(bs_new, bs_top);
2328 bdrv_unref(bs_top);
2329
2330 /* bs_new is now referenced by its new parents, we don't need the
2331 * additional reference any more. */
2332 bdrv_unref(bs_new);
2333 }
2334
2335 void bdrv_replace_in_backing_chain(BlockDriverState *old, BlockDriverState *new)
2336 {
2337 assert(!bdrv_requests_pending(old));
2338 assert(!bdrv_requests_pending(new));
2339
2340 bdrv_ref(old);
2341
2342 if (old->blk) {
2343 /* As long as these fields aren't in BlockBackend, but in the top-level
2344 * BlockDriverState, it's not possible for a BDS to have two BBs.
2345 *
2346 * We really want to copy the fields from old to new, but we go for a
2347 * swap instead so that pointers aren't duplicated and cause trouble.
2348 * (Also, bdrv_swap() used to do the same.) */
2349 assert(!new->blk);
2350 swap_feature_fields(old, new);
2351 }
2352 change_parent_backing_link(old, new);
2353
2354 /* Change backing files if a previously independent node is added to the
2355 * chain. For active commit, we replace top by its own (indirect) backing
2356 * file and don't do anything here so we don't build a loop. */
2357 if (new->backing == NULL && !bdrv_chain_contains(backing_bs(old), new)) {
2358 bdrv_set_backing_hd(new, backing_bs(old));
2359 bdrv_set_backing_hd(old, NULL);
2360 }
2361
2362 bdrv_unref(old);
2363 }
2364
2365 static void bdrv_delete(BlockDriverState *bs)
2366 {
2367 assert(!bs->job);
2368 assert(bdrv_op_blocker_is_empty(bs));
2369 assert(!bs->refcnt);
2370
2371 bdrv_close(bs);
2372
2373 /* remove from list, if necessary */
2374 if (bs->node_name[0] != '\0') {
2375 QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
2376 }
2377 QTAILQ_REMOVE(&all_bdrv_states, bs, bs_list);
2378
2379 g_free(bs);
2380 }
2381
2382 /*
2383 * Run consistency checks on an image
2384 *
2385 * Returns 0 if the check could be completed (it doesn't mean that the image is
2386 * free of errors) or -errno when an internal error occurred. The results of the
2387 * check are stored in res.
2388 */
2389 int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
2390 {
2391 if (bs->drv == NULL) {
2392 return -ENOMEDIUM;
2393 }
2394 if (bs->drv->bdrv_check == NULL) {
2395 return -ENOTSUP;
2396 }
2397
2398 memset(res, 0, sizeof(*res));
2399 return bs->drv->bdrv_check(bs, res, fix);
2400 }
2401
2402 #define COMMIT_BUF_SECTORS 2048
2403
2404 /* commit COW file into the raw image */
2405 int bdrv_commit(BlockDriverState *bs)
2406 {
2407 BlockDriver *drv = bs->drv;
2408 int64_t sector, total_sectors, length, backing_length;
2409 int n, ro, open_flags;
2410 int ret = 0;
2411 uint8_t *buf = NULL;
2412
2413 if (!drv)
2414 return -ENOMEDIUM;
2415
2416 if (!bs->backing) {
2417 return -ENOTSUP;
2418 }
2419
2420 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
2421 bdrv_op_is_blocked(bs->backing->bs, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
2422 return -EBUSY;
2423 }
2424
2425 ro = bs->backing->bs->read_only;
2426 open_flags = bs->backing->bs->open_flags;
2427
2428 if (ro) {
2429 if (bdrv_reopen(bs->backing->bs, open_flags | BDRV_O_RDWR, NULL)) {
2430 return -EACCES;
2431 }
2432 }
2433
2434 length = bdrv_getlength(bs);
2435 if (length < 0) {
2436 ret = length;
2437 goto ro_cleanup;
2438 }
2439
2440 backing_length = bdrv_getlength(bs->backing->bs);
2441 if (backing_length < 0) {
2442 ret = backing_length;
2443 goto ro_cleanup;
2444 }
2445
2446 /* If our top snapshot is larger than the backing file image,
2447 * grow the backing file image if possible. If not possible,
2448 * we must return an error */
2449 if (length > backing_length) {
2450 ret = bdrv_truncate(bs->backing->bs, length);
2451 if (ret < 0) {
2452 goto ro_cleanup;
2453 }
2454 }
2455
2456 total_sectors = length >> BDRV_SECTOR_BITS;
2457
2458 /* qemu_try_blockalign() for bs will choose an alignment that works for
2459 * bs->backing->bs as well, so no need to compare the alignment manually. */
2460 buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
2461 if (buf == NULL) {
2462 ret = -ENOMEM;
2463 goto ro_cleanup;
2464 }
2465
2466 for (sector = 0; sector < total_sectors; sector += n) {
2467 ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
2468 if (ret < 0) {
2469 goto ro_cleanup;
2470 }
2471 if (ret) {
2472 ret = bdrv_read(bs, sector, buf, n);
2473 if (ret < 0) {
2474 goto ro_cleanup;
2475 }
2476
2477 ret = bdrv_write(bs->backing->bs, sector, buf, n);
2478 if (ret < 0) {
2479 goto ro_cleanup;
2480 }
2481 }
2482 }
2483
2484 if (drv->bdrv_make_empty) {
2485 ret = drv->bdrv_make_empty(bs);
2486 if (ret < 0) {
2487 goto ro_cleanup;
2488 }
2489 bdrv_flush(bs);
2490 }
2491
2492 /*
2493 * Make sure all data we wrote to the backing device is actually
2494 * stable on disk.
2495 */
2496 if (bs->backing) {
2497 bdrv_flush(bs->backing->bs);
2498 }
2499
2500 ret = 0;
2501 ro_cleanup:
2502 qemu_vfree(buf);
2503
2504 if (ro) {
2505 /* ignoring error return here */
2506 bdrv_reopen(bs->backing->bs, open_flags & ~BDRV_O_RDWR, NULL);
2507 }
2508
2509 return ret;
2510 }
2511
2512 /*
2513 * Return values:
2514 * 0 - success
2515 * -EINVAL - backing format specified, but no file
2516 * -ENOSPC - can't update the backing file because no space is left in the
2517 * image file header
2518 * -ENOTSUP - format driver doesn't support changing the backing file
2519 */
2520 int bdrv_change_backing_file(BlockDriverState *bs,
2521 const char *backing_file, const char *backing_fmt)
2522 {
2523 BlockDriver *drv = bs->drv;
2524 int ret;
2525
2526 /* Backing file format doesn't make sense without a backing file */
2527 if (backing_fmt && !backing_file) {
2528 return -EINVAL;
2529 }
2530
2531 if (drv->bdrv_change_backing_file != NULL) {
2532 ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
2533 } else {
2534 ret = -ENOTSUP;
2535 }
2536
2537 if (ret == 0) {
2538 pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
2539 pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
2540 }
2541 return ret;
2542 }
2543
2544 /*
2545 * Finds the image layer in the chain that has 'bs' as its backing file.
2546 *
2547 * active is the current topmost image.
2548 *
2549 * Returns NULL if bs is not found in active's image chain,
2550 * or if active == bs.
2551 *
2552 * Returns the bottommost base image if bs == NULL.
2553 */
2554 BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
2555 BlockDriverState *bs)
2556 {
2557 while (active && bs != backing_bs(active)) {
2558 active = backing_bs(active);
2559 }
2560
2561 return active;
2562 }
2563
2564 /* Given a BDS, searches for the base layer. */
2565 BlockDriverState *bdrv_find_base(BlockDriverState *bs)
2566 {
2567 return bdrv_find_overlay(bs, NULL);
2568 }
2569
2570 /*
2571 * Drops images above 'base' up to and including 'top', and sets the image
2572 * above 'top' to have base as its backing file.
2573 *
2574 * Requires that the overlay to 'top' is opened r/w, so that the backing file
2575 * information in 'bs' can be properly updated.
2576 *
2577 * E.g., this will convert the following chain:
2578 * bottom <- base <- intermediate <- top <- active
2579 *
2580 * to
2581 *
2582 * bottom <- base <- active
2583 *
2584 * It is allowed for bottom==base, in which case it converts:
2585 *
2586 * base <- intermediate <- top <- active
2587 *
2588 * to
2589 *
2590 * base <- active
2591 *
2592 * If backing_file_str is non-NULL, it will be used when modifying top's
2593 * overlay image metadata.
2594 *
2595 * Error conditions:
2596 * if active == top, that is considered an error
2597 *
2598 */
2599 int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
2600 BlockDriverState *base, const char *backing_file_str)
2601 {
2602 BlockDriverState *new_top_bs = NULL;
2603 int ret = -EIO;
2604
2605 if (!top->drv || !base->drv) {
2606 goto exit;
2607 }
2608
2609 new_top_bs = bdrv_find_overlay(active, top);
2610
2611 if (new_top_bs == NULL) {
2612 /* we could not find the image above 'top', this is an error */
2613 goto exit;
2614 }
2615
2616 /* special case of new_top_bs->backing->bs already pointing to base - nothing
2617 * to do, no intermediate images */
2618 if (backing_bs(new_top_bs) == base) {
2619 ret = 0;
2620 goto exit;
2621 }
2622
2623 /* Make sure that base is in the backing chain of top */
2624 if (!bdrv_chain_contains(top, base)) {
2625 goto exit;
2626 }
2627
2628 /* success - we can delete the intermediate states, and link top->base */
2629 backing_file_str = backing_file_str ? backing_file_str : base->filename;
2630 ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
2631 base->drv ? base->drv->format_name : "");
2632 if (ret) {
2633 goto exit;
2634 }
2635 bdrv_set_backing_hd(new_top_bs, base);
2636
2637 ret = 0;
2638 exit:
2639 return ret;
2640 }
2641
2642 /**
2643 * Truncate file to 'offset' bytes (needed only for file protocols)
2644 */
2645 int bdrv_truncate(BlockDriverState *bs, int64_t offset)
2646 {
2647 BlockDriver *drv = bs->drv;
2648 int ret;
2649 if (!drv)
2650 return -ENOMEDIUM;
2651 if (!drv->bdrv_truncate)
2652 return -ENOTSUP;
2653 if (bs->read_only)
2654 return -EACCES;
2655
2656 ret = drv->bdrv_truncate(bs, offset);
2657 if (ret == 0) {
2658 ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
2659 bdrv_dirty_bitmap_truncate(bs);
2660 if (bs->blk) {
2661 blk_dev_resize_cb(bs->blk);
2662 }
2663 }
2664 return ret;
2665 }
2666
2667 /**
2668 * Length of a allocated file in bytes. Sparse files are counted by actual
2669 * allocated space. Return < 0 if error or unknown.
2670 */
2671 int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
2672 {
2673 BlockDriver *drv = bs->drv;
2674 if (!drv) {
2675 return -ENOMEDIUM;
2676 }
2677 if (drv->bdrv_get_allocated_file_size) {
2678 return drv->bdrv_get_allocated_file_size(bs);
2679 }
2680 if (bs->file) {
2681 return bdrv_get_allocated_file_size(bs->file->bs);
2682 }
2683 return -ENOTSUP;
2684 }
2685
2686 /**
2687 * Return number of sectors on success, -errno on error.
2688 */
2689 int64_t bdrv_nb_sectors(BlockDriverState *bs)
2690 {
2691 BlockDriver *drv = bs->drv;
2692
2693 if (!drv)
2694 return -ENOMEDIUM;
2695
2696 if (drv->has_variable_length) {
2697 int ret = refresh_total_sectors(bs, bs->total_sectors);
2698 if (ret < 0) {
2699 return ret;
2700 }
2701 }
2702 return bs->total_sectors;
2703 }
2704
2705 /**
2706 * Return length in bytes on success, -errno on error.
2707 * The length is always a multiple of BDRV_SECTOR_SIZE.
2708 */
2709 int64_t bdrv_getlength(BlockDriverState *bs)
2710 {
2711 int64_t ret = bdrv_nb_sectors(bs);
2712
2713 ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
2714 return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
2715 }
2716
2717 /* return 0 as number of sectors if no device present or error */
2718 void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
2719 {
2720 int64_t nb_sectors = bdrv_nb_sectors(bs);
2721
2722 *nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
2723 }
2724
2725 int bdrv_is_read_only(BlockDriverState *bs)
2726 {
2727 return bs->read_only;
2728 }
2729
2730 int bdrv_is_sg(BlockDriverState *bs)
2731 {
2732 return bs->sg;
2733 }
2734
2735 int bdrv_enable_write_cache(BlockDriverState *bs)
2736 {
2737 return bs->enable_write_cache;
2738 }
2739
2740 void bdrv_set_enable_write_cache(BlockDriverState *bs, bool wce)
2741 {
2742 bs->enable_write_cache = wce;
2743
2744 /* so a reopen() will preserve wce */
2745 if (wce) {
2746 bs->open_flags |= BDRV_O_CACHE_WB;
2747 } else {
2748 bs->open_flags &= ~BDRV_O_CACHE_WB;
2749 }
2750 }
2751
2752 int bdrv_is_encrypted(BlockDriverState *bs)
2753 {
2754 if (bs->backing && bs->backing->bs->encrypted) {
2755 return 1;
2756 }
2757 return bs->encrypted;
2758 }
2759
2760 int bdrv_key_required(BlockDriverState *bs)
2761 {
2762 BdrvChild *backing = bs->backing;
2763
2764 if (backing && backing->bs->encrypted && !backing->bs->valid_key) {
2765 return 1;
2766 }
2767 return (bs->encrypted && !bs->valid_key);
2768 }
2769
2770 int bdrv_set_key(BlockDriverState *bs, const char *key)
2771 {
2772 int ret;
2773 if (bs->backing && bs->backing->bs->encrypted) {
2774 ret = bdrv_set_key(bs->backing->bs, key);
2775 if (ret < 0)
2776 return ret;
2777 if (!bs->encrypted)
2778 return 0;
2779 }
2780 if (!bs->encrypted) {
2781 return -EINVAL;
2782 } else if (!bs->drv || !bs->drv->bdrv_set_key) {
2783 return -ENOMEDIUM;
2784 }
2785 ret = bs->drv->bdrv_set_key(bs, key);
2786 if (ret < 0) {
2787 bs->valid_key = 0;
2788 } else if (!bs->valid_key) {
2789 bs->valid_key = 1;
2790 if (bs->blk) {
2791 /* call the change callback now, we skipped it on open */
2792 blk_dev_change_media_cb(bs->blk, true);
2793 }
2794 }
2795 return ret;
2796 }
2797
2798 /*
2799 * Provide an encryption key for @bs.
2800 * If @key is non-null:
2801 * If @bs is not encrypted, fail.
2802 * Else if the key is invalid, fail.
2803 * Else set @bs's key to @key, replacing the existing key, if any.
2804 * If @key is null:
2805 * If @bs is encrypted and still lacks a key, fail.
2806 * Else do nothing.
2807 * On failure, store an error object through @errp if non-null.
2808 */
2809 void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
2810 {
2811 if (key) {
2812 if (!bdrv_is_encrypted(bs)) {
2813 error_setg(errp, "Node '%s' is not encrypted",
2814 bdrv_get_device_or_node_name(bs));
2815 } else if (bdrv_set_key(bs, key) < 0) {
2816 error_setg(errp, QERR_INVALID_PASSWORD);
2817 }
2818 } else {
2819 if (bdrv_key_required(bs)) {
2820 error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
2821 "'%s' (%s) is encrypted",
2822 bdrv_get_device_or_node_name(bs),
2823 bdrv_get_encrypted_filename(bs));
2824 }
2825 }
2826 }
2827
2828 const char *bdrv_get_format_name(BlockDriverState *bs)
2829 {
2830 return bs->drv ? bs->drv->format_name : NULL;
2831 }
2832
/*
 * qsort() comparator for an array of C strings.
 *
 * qsort() hands the comparator pointers to the array elements, so for an
 * array of 'const char *' both arguments are really 'const char *const *'
 * and have to be dereferenced once before the strings can be compared.
 *
 * Returns the strcmp() result of the two strings.
 */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
2837
2838 void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
2839 void *opaque)
2840 {
2841 BlockDriver *drv;
2842 int count = 0;
2843 int i;
2844 const char **formats = NULL;
2845
2846 QLIST_FOREACH(drv, &bdrv_drivers, list) {
2847 if (drv->format_name) {
2848 bool found = false;
2849 int i = count;
2850 while (formats && i && !found) {
2851 found = !strcmp(formats[--i], drv->format_name);
2852 }
2853
2854 if (!found) {
2855 formats = g_renew(const char *, formats, count + 1);
2856 formats[count++] = drv->format_name;
2857 }
2858 }
2859 }
2860
2861 qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
2862
2863 for (i = 0; i < count; i++) {
2864 it(opaque, formats[i]);
2865 }
2866
2867 g_free(formats);
2868 }
2869
2870 /* This function is to find a node in the bs graph */
2871 BlockDriverState *bdrv_find_node(const char *node_name)
2872 {
2873 BlockDriverState *bs;
2874
2875 assert(node_name);
2876
2877 QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2878 if (!strcmp(node_name, bs->node_name)) {
2879 return bs;
2880 }
2881 }
2882 return NULL;
2883 }
2884
2885 /* Put this QMP function here so it can access the static graph_bdrv_states. */
2886 BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
2887 {
2888 BlockDeviceInfoList *list, *entry;
2889 BlockDriverState *bs;
2890
2891 list = NULL;
2892 QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2893 BlockDeviceInfo *info = bdrv_block_device_info(bs, errp);
2894 if (!info) {
2895 qapi_free_BlockDeviceInfoList(list);
2896 return NULL;
2897 }
2898 entry = g_malloc0(sizeof(*entry));
2899 entry->value = info;
2900 entry->next = list;
2901 list = entry;
2902 }
2903
2904 return list;
2905 }
2906
2907 BlockDriverState *bdrv_lookup_bs(const char *device,
2908 const char *node_name,
2909 Error **errp)
2910 {
2911 BlockBackend *blk;
2912 BlockDriverState *bs;
2913
2914 if (device) {
2915 blk = blk_by_name(device);
2916
2917 if (blk) {
2918 bs = blk_bs(blk);
2919 if (!bs) {
2920 error_setg(errp, "Device '%s' has no medium", device);
2921 }
2922
2923 return bs;
2924 }
2925 }
2926
2927 if (node_name) {
2928 bs = bdrv_find_node(node_name);
2929
2930 if (bs) {
2931 return bs;
2932 }
2933 }
2934
2935 error_setg(errp, "Cannot find device=%s nor node_name=%s",
2936 device ? device : "",
2937 node_name ? node_name : "");
2938 return NULL;
2939 }
2940
2941 /* If 'base' is in the same chain as 'top', return true. Otherwise,
2942 * return false. If either argument is NULL, return false. */
2943 bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
2944 {
2945 while (top && top != base) {
2946 top = backing_bs(top);
2947 }
2948
2949 return top != NULL;
2950 }
2951
2952 BlockDriverState *bdrv_next_node(BlockDriverState *bs)
2953 {
2954 if (!bs) {
2955 return QTAILQ_FIRST(&graph_bdrv_states);
2956 }
2957 return QTAILQ_NEXT(bs, node_list);
2958 }
2959
2960 /* Iterates over all top-level BlockDriverStates, i.e. BDSs that are owned by
2961 * the monitor or attached to a BlockBackend */
2962 BlockDriverState *bdrv_next(BlockDriverState *bs)
2963 {
2964 if (!bs || bs->blk) {
2965 bs = blk_next_root_bs(bs);
2966 if (bs) {
2967 return bs;
2968 }
2969 }
2970
2971 /* Ignore all BDSs that are attached to a BlockBackend here; they have been
2972 * handled by the above block already */
2973 do {
2974 bs = bdrv_next_monitor_owned(bs);
2975 } while (bs && bs->blk);
2976 return bs;
2977 }
2978
2979 const char *bdrv_get_node_name(const BlockDriverState *bs)
2980 {
2981 return bs->node_name;
2982 }
2983
2984 /* TODO check what callers really want: bs->node_name or blk_name() */
2985 const char *bdrv_get_device_name(const BlockDriverState *bs)
2986 {
2987 return bs->blk ? blk_name(bs->blk) : "";
2988 }
2989
2990 /* This can be used to identify nodes that might not have a device
2991 * name associated. Since node and device names live in the same
2992 * namespace, the result is unambiguous. The exception is if both are
2993 * absent, then this returns an empty (non-null) string. */
2994 const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
2995 {
2996 return bs->blk ? blk_name(bs->blk) : bs->node_name;
2997 }
2998
2999 int bdrv_get_flags(BlockDriverState *bs)
3000 {
3001 return bs->open_flags;
3002 }
3003
3004 int bdrv_has_zero_init_1(BlockDriverState *bs)
3005 {
3006 return 1;
3007 }
3008
3009 int bdrv_has_zero_init(BlockDriverState *bs)
3010 {
3011 assert(bs->drv);
3012
3013 /* If BS is a copy on write image, it is initialized to
3014 the contents of the base image, which may not be zeroes. */
3015 if (bs->backing) {
3016 return 0;
3017 }
3018 if (bs->drv->bdrv_has_zero_init) {
3019 return bs->drv->bdrv_has_zero_init(bs);
3020 }
3021
3022 /* safe default */
3023 return 0;
3024 }
3025
3026 bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
3027 {
3028 BlockDriverInfo bdi;
3029
3030 if (bs->backing) {
3031 return false;
3032 }
3033
3034 if (bdrv_get_info(bs, &bdi) == 0) {
3035 return bdi.unallocated_blocks_are_zero;
3036 }
3037
3038 return false;
3039 }
3040
3041 bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
3042 {
3043 BlockDriverInfo bdi;
3044
3045 if (bs->backing || !(bs->open_flags & BDRV_O_UNMAP)) {
3046 return false;
3047 }
3048
3049 if (bdrv_get_info(bs, &bdi) == 0) {
3050 return bdi.can_write_zeroes_with_unmap;
3051 }
3052
3053 return false;
3054 }
3055
3056 const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
3057 {
3058 if (bs->backing && bs->backing->bs->encrypted)
3059 return bs->backing_file;
3060 else if (bs->encrypted)
3061 return bs->filename;
3062 else
3063 return NULL;
3064 }
3065
3066 void bdrv_get_backing_filename(BlockDriverState *bs,
3067 char *filename, int filename_size)
3068 {
3069 pstrcpy(filename, filename_size, bs->backing_file);
3070 }
3071
3072 int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
3073 {
3074 BlockDriver *drv = bs->drv;
3075 if (!drv)
3076 return -ENOMEDIUM;
3077 if (!drv->bdrv_get_info)
3078 return -ENOTSUP;
3079 memset(bdi, 0, sizeof(*bdi));
3080 return drv->bdrv_get_info(bs, bdi);
3081 }
3082
3083 ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
3084 {
3085 BlockDriver *drv = bs->drv;
3086 if (drv && drv->bdrv_get_specific_info) {
3087 return drv->bdrv_get_specific_info(bs);
3088 }
3089 return NULL;
3090 }
3091
3092 void bdrv_debug_event(BlockDriverState *bs, BlkdebugEvent event)
3093 {
3094 if (!bs || !bs->drv || !bs->drv->bdrv_debug_event) {
3095 return;
3096 }
3097
3098 bs->drv->bdrv_debug_event(bs, event);
3099 }
3100
3101 int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
3102 const char *tag)
3103 {
3104 while (bs && bs->drv && !bs->drv->bdrv_debug_breakpoint) {
3105 bs = bs->file ? bs->file->bs : NULL;
3106 }
3107
3108 if (bs && bs->drv && bs->drv->bdrv_debug_breakpoint) {
3109 return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
3110 }
3111
3112 return -ENOTSUP;
3113 }
3114
3115 int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
3116 {
3117 while (bs && bs->drv && !bs->drv->bdrv_debug_remove_breakpoint) {
3118 bs = bs->file ? bs->file->bs : NULL;
3119 }
3120
3121 if (bs && bs->drv && bs->drv->bdrv_debug_remove_breakpoint) {
3122 return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
3123 }
3124
3125 return -ENOTSUP;
3126 }
3127
3128 int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
3129 {
3130 while (bs && (!bs->drv || !bs->drv->bdrv_debug_resume)) {
3131 bs = bs->file ? bs->file->bs : NULL;
3132 }
3133
3134 if (bs && bs->drv && bs->drv->bdrv_debug_resume) {
3135 return bs->drv->bdrv_debug_resume(bs, tag);
3136 }
3137
3138 return -ENOTSUP;
3139 }
3140
3141 bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
3142 {
3143 while (bs && bs->drv && !bs->drv->bdrv_debug_is_suspended) {
3144 bs = bs->file ? bs->file->bs : NULL;
3145 }
3146
3147 if (bs && bs->drv && bs->drv->bdrv_debug_is_suspended) {
3148 return bs->drv->bdrv_debug_is_suspended(bs, tag);
3149 }
3150
3151 return false;
3152 }
3153
3154 int bdrv_is_snapshot(BlockDriverState *bs)
3155 {
3156 return !!(bs->open_flags & BDRV_O_SNAPSHOT);
3157 }
3158
3159 /* backing_file can either be relative, or absolute, or a protocol. If it is
3160 * relative, it must be relative to the chain. So, passing in bs->filename
3161 * from a BDS as backing_file should not be done, as that may be relative to
3162 * the CWD rather than the chain. */
3163 BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
3164 const char *backing_file)
3165 {
3166 char *filename_full = NULL;
3167 char *backing_file_full = NULL;
3168 char *filename_tmp = NULL;
3169 int is_protocol = 0;
3170 BlockDriverState *curr_bs = NULL;
3171 BlockDriverState *retval = NULL;
3172
3173 if (!bs || !bs->drv || !backing_file) {
3174 return NULL;
3175 }
3176
3177 filename_full = g_malloc(PATH_MAX);
3178 backing_file_full = g_malloc(PATH_MAX);
3179 filename_tmp = g_malloc(PATH_MAX);
3180
3181 is_protocol = path_has_protocol(backing_file);
3182
3183 for (curr_bs = bs; curr_bs->backing; curr_bs = curr_bs->backing->bs) {
3184
3185 /* If either of the filename paths is actually a protocol, then
3186 * compare unmodified paths; otherwise make paths relative */
3187 if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
3188 if (strcmp(backing_file, curr_bs->backing_file) == 0) {
3189 retval = curr_bs->backing->bs;
3190 break;
3191 }
3192 } else {
3193 /* If not an absolute filename path, make it relative to the current
3194 * image's filename path */
3195 path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3196 backing_file);
3197
3198 /* We are going to compare absolute pathnames */
3199 if (!realpath(filename_tmp, filename_full)) {
3200 continue;
3201 }
3202
3203 /* We need to make sure the backing filename we are comparing against
3204 * is relative to the current image filename (or absolute) */
3205 path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3206 curr_bs->backing_file);
3207
3208 if (!realpath(filename_tmp, backing_file_full)) {
3209 continue;
3210 }
3211
3212 if (strcmp(backing_file_full, filename_full) == 0) {
3213 retval = curr_bs->backing->bs;
3214 break;
3215 }
3216 }
3217 }
3218
3219 g_free(filename_full);
3220 g_free(backing_file_full);
3221 g_free(filename_tmp);
3222 return retval;
3223 }
3224
3225 int bdrv_get_backing_file_depth(BlockDriverState *bs)
3226 {
3227 if (!bs->drv) {
3228 return 0;
3229 }
3230
3231 if (!bs->backing) {
3232 return 0;
3233 }
3234
3235 return 1 + bdrv_get_backing_file_depth(bs->backing->bs);
3236 }
3237
3238 void bdrv_init(void)
3239 {
3240 module_call_init(MODULE_INIT_BLOCK);
3241 }
3242
3243 void bdrv_init_with_whitelist(void)
3244 {
3245 use_bdrv_whitelist = 1;
3246 bdrv_init();
3247 }
3248
3249 void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
3250 {
3251 Error *local_err = NULL;
3252 int ret;
3253
3254 if (!bs->drv) {
3255 return;
3256 }
3257
3258 if (!(bs->open_flags & BDRV_O_INACTIVE)) {
3259 return;
3260 }
3261 bs->open_flags &= ~BDRV_O_INACTIVE;
3262
3263 if (bs->drv->bdrv_invalidate_cache) {
3264 bs->drv->bdrv_invalidate_cache(bs, &local_err);
3265 } else if (bs->file) {
3266 bdrv_invalidate_cache(bs->file->bs, &local_err);
3267 }
3268 if (local_err) {
3269 bs->open_flags |= BDRV_O_INACTIVE;
3270 error_propagate(errp, local_err);
3271 return;
3272 }
3273
3274 ret = refresh_total_sectors(bs, bs->total_sectors);
3275 if (ret < 0) {
3276 bs->open_flags |= BDRV_O_INACTIVE;
3277 error_setg_errno(errp, -ret, "Could not refresh total sector count");
3278 return;
3279 }
3280 }
3281
3282 void bdrv_invalidate_cache_all(Error **errp)
3283 {
3284 BlockDriverState *bs = NULL;
3285 Error *local_err = NULL;
3286
3287 while ((bs = bdrv_next(bs)) != NULL) {
3288 AioContext *aio_context = bdrv_get_aio_context(bs);
3289
3290 aio_context_acquire(aio_context);
3291 bdrv_invalidate_cache(bs, &local_err);
3292 aio_context_release(aio_context);
3293 if (local_err) {
3294 error_propagate(errp, local_err);
3295 return;
3296 }
3297 }
3298 }
3299
3300 static int bdrv_inactivate(BlockDriverState *bs)
3301 {
3302 int ret;
3303
3304 if (bs->drv->bdrv_inactivate) {
3305 ret = bs->drv->bdrv_inactivate(bs);
3306 if (ret < 0) {
3307 return ret;
3308 }
3309 }
3310
3311 bs->open_flags |= BDRV_O_INACTIVE;
3312 return 0;
3313 }
3314
3315 int bdrv_inactivate_all(void)
3316 {
3317 BlockDriverState *bs = NULL;
3318 int ret;
3319
3320 while ((bs = bdrv_next(bs)) != NULL) {
3321 AioContext *aio_context = bdrv_get_aio_context(bs);
3322
3323 aio_context_acquire(aio_context);
3324 ret = bdrv_inactivate(bs);
3325 aio_context_release(aio_context);
3326 if (ret < 0) {
3327 return ret;
3328 }
3329 }
3330
3331 return 0;
3332 }
3333
3334 /**************************************************************/
3335 /* removable device support */
3336
3337 /**
3338 * Return TRUE if the media is present
3339 */
3340 bool bdrv_is_inserted(BlockDriverState *bs)
3341 {
3342 BlockDriver *drv = bs->drv;
3343 BdrvChild *child;
3344
3345 if (!drv) {
3346 return false;
3347 }
3348 if (drv->bdrv_is_inserted) {
3349 return drv->bdrv_is_inserted(bs);
3350 }
3351 QLIST_FOREACH(child, &bs->children, next) {
3352 if (!bdrv_is_inserted(child->bs)) {
3353 return false;
3354 }
3355 }
3356 return true;
3357 }
3358
3359 /**
3360 * Return whether the media changed since the last call to this
3361 * function, or -ENOTSUP if we don't know. Most drivers don't know.
3362 */
3363 int bdrv_media_changed(BlockDriverState *bs)
3364 {
3365 BlockDriver *drv = bs->drv;
3366
3367 if (drv && drv->bdrv_media_changed) {
3368 return drv->bdrv_media_changed(bs);
3369 }
3370 return -ENOTSUP;
3371 }
3372
3373 /**
3374 * If eject_flag is TRUE, eject the media. Otherwise, close the tray
3375 */
3376 void bdrv_eject(BlockDriverState *bs, bool eject_flag)
3377 {
3378 BlockDriver *drv = bs->drv;
3379 const char *device_name;
3380
3381 if (drv && drv->bdrv_eject) {
3382 drv->bdrv_eject(bs, eject_flag);
3383 }
3384
3385 device_name = bdrv_get_device_name(bs);
3386 if (device_name[0] != '\0') {
3387 qapi_event_send_device_tray_moved(device_name,
3388 eject_flag, &error_abort);
3389 }
3390 }
3391
3392 /**
3393 * Lock or unlock the media (if it is locked, the user won't be able
3394 * to eject it manually).
3395 */
3396 void bdrv_lock_medium(BlockDriverState *bs, bool locked)
3397 {
3398 BlockDriver *drv = bs->drv;
3399
3400 trace_bdrv_lock_medium(bs, locked);
3401
3402 if (drv && drv->bdrv_lock_medium) {
3403 drv->bdrv_lock_medium(bs, locked);
3404 }
3405 }
3406
3407 /* Get a reference to bs */
3408 void bdrv_ref(BlockDriverState *bs)
3409 {
3410 bs->refcnt++;
3411 }
3412
3413 /* Release a previously grabbed reference to bs.
3414 * If after releasing, reference count is zero, the BlockDriverState is
3415 * deleted. */
3416 void bdrv_unref(BlockDriverState *bs)
3417 {
3418 if (!bs) {
3419 return;
3420 }
3421 assert(bs->refcnt > 0);
3422 if (--bs->refcnt == 0) {
3423 bdrv_delete(bs);
3424 }
3425 }
3426
/* One entry in a BlockDriverState's per-operation blocker list
 * (bs->op_blockers[op]). */
struct BdrvOpBlocker {
    /* Error supplied to bdrv_op_block(); bdrv_op_is_blocked() copies it for
     * the caller and bdrv_op_unblock() matches entries by this pointer */
    Error *reason;
    /* Linkage within bs->op_blockers[op] */
    QLIST_ENTRY(BdrvOpBlocker) list;
};
3431
3432 bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
3433 {
3434 BdrvOpBlocker *blocker;
3435 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3436 if (!QLIST_EMPTY(&bs->op_blockers[op])) {
3437 blocker = QLIST_FIRST(&bs->op_blockers[op]);
3438 if (errp) {
3439 *errp = error_copy(blocker->reason);
3440 error_prepend(errp, "Node '%s' is busy: ",
3441 bdrv_get_device_or_node_name(bs));
3442 }
3443 return true;
3444 }
3445 return false;
3446 }
3447
3448 void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
3449 {
3450 BdrvOpBlocker *blocker;
3451 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3452
3453 blocker = g_new0(BdrvOpBlocker, 1);
3454 blocker->reason = reason;
3455 QLIST_INSERT_HEAD(&bs->op_blockers[op], blocker, list);
3456 }
3457
3458 void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
3459 {
3460 BdrvOpBlocker *blocker, *next;
3461 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3462 QLIST_FOREACH_SAFE(blocker, &bs->op_blockers[op], list, next) {
3463 if (blocker->reason == reason) {
3464 QLIST_REMOVE(blocker, list);
3465 g_free(blocker);
3466 }
3467 }
3468 }
3469
3470 void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
3471 {
3472 int i;
3473 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3474 bdrv_op_block(bs, i, reason);
3475 }
3476 }
3477
3478 void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
3479 {
3480 int i;
3481 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3482 bdrv_op_unblock(bs, i, reason);
3483 }
3484 }
3485
3486 bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
3487 {
3488 int i;
3489
3490 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3491 if (!QLIST_EMPTY(&bs->op_blockers[i])) {
3492 return false;
3493 }
3494 }
3495 return true;
3496 }
3497
3498 void bdrv_img_create(const char *filename, const char *fmt,
3499 const char *base_filename, const char *base_fmt,
3500 char *options, uint64_t img_size, int flags,
3501 Error **errp, bool quiet)
3502 {
3503 QemuOptsList *create_opts = NULL;
3504 QemuOpts *opts = NULL;
3505 const char *backing_fmt, *backing_file;
3506 int64_t size;
3507 BlockDriver *drv, *proto_drv;
3508 Error *local_err = NULL;
3509 int ret = 0;
3510
3511 /* Find driver and parse its options */
3512 drv = bdrv_find_format(fmt);
3513 if (!drv) {
3514 error_setg(errp, "Unknown file format '%s'", fmt);
3515 return;
3516 }
3517
3518 proto_drv = bdrv_find_protocol(filename, true, errp);
3519 if (!proto_drv) {
3520 return;
3521 }
3522
3523 if (!drv->create_opts) {
3524 error_setg(errp, "Format driver '%s' does not support image creation",
3525 drv->format_name);
3526 return;
3527 }
3528
3529 if (!proto_drv->create_opts) {
3530 error_setg(errp, "Protocol driver '%s' does not support image creation",
3531 proto_drv->format_name);
3532 return;
3533 }
3534
3535 create_opts = qemu_opts_append(create_opts, drv->create_opts);
3536 create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
3537
3538 /* Create parameter list with default values */
3539 opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
3540 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
3541
3542 /* Parse -o options */
3543 if (options) {
3544 qemu_opts_do_parse(opts, options, NULL, &local_err);
3545 if (local_err) {
3546 error_report_err(local_err);
3547 local_err = NULL;
3548 error_setg(errp, "Invalid options for file format '%s'", fmt);
3549 goto out;
3550 }
3551 }
3552
3553 if (base_filename) {
3554 qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
3555 if (local_err) {
3556 error_setg(errp, "Backing file not supported for file format '%s'",
3557 fmt);
3558 goto out;
3559 }
3560 }
3561
3562 if (base_fmt) {
3563 qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
3564 if (local_err) {
3565 error_setg(errp, "Backing file format not supported for file "
3566 "format '%s'", fmt);
3567 goto out;
3568 }
3569 }
3570
3571 backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
3572 if (backing_file) {
3573 if (!strcmp(filename, backing_file)) {
3574 error_setg(errp, "Error: Trying to create an image with the "
3575 "same filename as the backing file");
3576 goto out;
3577 }
3578 }
3579
3580 backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
3581
3582 // The size for the image must always be specified, with one exception:
3583 // If we are using a backing file, we can obtain the size from there
3584 size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
3585 if (size == -1) {
3586 if (backing_file) {
3587 BlockDriverState *bs;
3588 char *full_backing = g_new0(char, PATH_MAX);
3589 int64_t size;
3590 int back_flags;
3591 QDict *backing_options = NULL;
3592
3593 bdrv_get_full_backing_filename_from_filename(filename, backing_file,
3594 full_backing, PATH_MAX,
3595 &local_err);
3596 if (local_err) {
3597 g_free(full_backing);
3598 goto out;
3599 }
3600
3601 /* backing files always opened read-only */
3602 back_flags =
3603 flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
3604
3605 if (backing_fmt) {
3606 backing_options = qdict_new();
3607 qdict_put(backing_options, "driver",
3608 qstring_from_str(backing_fmt));
3609 }
3610
3611 bs = NULL;
3612 ret = bdrv_open(&bs, full_backing, NULL, backing_options,
3613 back_flags, &local_err);
3614 g_free(full_backing);
3615 if (ret < 0) {
3616 goto out;
3617 }
3618 size = bdrv_getlength(bs);
3619 if (size < 0) {
3620 error_setg_errno(errp, -size, "Could not get size of '%s'",
3621 backing_file);
3622 bdrv_unref(bs);
3623 goto out;
3624 }
3625
3626 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
3627
3628 bdrv_unref(bs);
3629 } else {
3630 error_setg(errp, "Image creation needs a size parameter");
3631 goto out;
3632 }
3633 }
3634
3635 if (!quiet) {
3636 printf("Formatting '%s', fmt=%s ", filename, fmt);
3637 qemu_opts_print(opts, " ");
3638 puts("");
3639 }
3640
3641 ret = bdrv_create(drv, filename, opts, &local_err);
3642
3643 if (ret == -EFBIG) {
3644 /* This is generally a better message than whatever the driver would
3645 * deliver (especially because of the cluster_size_hint), since that
3646 * is most probably not much different from "image too large". */
3647 const char *cluster_size_hint = "";
3648 if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
3649 cluster_size_hint = " (try using a larger cluster size)";
3650 }
3651 error_setg(errp, "The image size is too large for file format '%s'"
3652 "%s", fmt, cluster_size_hint);
3653 error_free(local_err);
3654 local_err = NULL;
3655 }
3656
3657 out:
3658 qemu_opts_del(opts);
3659 qemu_opts_free(create_opts);
3660 if (local_err) {
3661 error_propagate(errp, local_err);
3662 }
3663 }
3664
3665 AioContext *bdrv_get_aio_context(BlockDriverState *bs)
3666 {
3667 return bs->aio_context;
3668 }
3669
3670 void bdrv_detach_aio_context(BlockDriverState *bs)
3671 {
3672 BdrvAioNotifier *baf;
3673
3674 if (!bs->drv) {
3675 return;
3676 }
3677
3678 QLIST_FOREACH(baf, &bs->aio_notifiers, list) {
3679 baf->detach_aio_context(baf->opaque);
3680 }
3681
3682 if (bs->throttle_state) {
3683 throttle_timers_detach_aio_context(&bs->throttle_timers);
3684 }
3685 if (bs->drv->bdrv_detach_aio_context) {
3686 bs->drv->bdrv_detach_aio_context(bs);
3687 }
3688 if (bs->file) {
3689 bdrv_detach_aio_context(bs->file->bs);
3690 }
3691 if (bs->backing) {
3692 bdrv_detach_aio_context(bs->backing->bs);
3693 }
3694
3695 bs->aio_context = NULL;
3696 }
3697
3698 void bdrv_attach_aio_context(BlockDriverState *bs,
3699 AioContext *new_context)
3700 {
3701 BdrvAioNotifier *ban;
3702
3703 if (!bs->drv) {
3704 return;
3705 }
3706
3707 bs->aio_context = new_context;
3708
3709 if (bs->backing) {
3710 bdrv_attach_aio_context(bs->backing->bs, new_context);
3711 }
3712 if (bs->file) {
3713 bdrv_attach_aio_context(bs->file->bs, new_context);
3714 }
3715 if (bs->drv->bdrv_attach_aio_context) {
3716 bs->drv->bdrv_attach_aio_context(bs, new_context);
3717 }
3718 if (bs->throttle_state) {
3719 throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
3720 }
3721
3722 QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
3723 ban->attached_aio_context(new_context, ban->opaque);
3724 }
3725 }
3726
3727 void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
3728 {
3729 bdrv_drain(bs); /* ensure there are no in-flight requests */
3730
3731 bdrv_detach_aio_context(bs);
3732
3733 /* This function executes in the old AioContext so acquire the new one in
3734 * case it runs in a different thread.
3735 */
3736 aio_context_acquire(new_context);
3737 bdrv_attach_aio_context(bs, new_context);
3738 aio_context_release(new_context);
3739 }
3740
3741 void bdrv_add_aio_context_notifier(BlockDriverState *bs,
3742 void (*attached_aio_context)(AioContext *new_context, void *opaque),
3743 void (*detach_aio_context)(void *opaque), void *opaque)
3744 {
3745 BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
3746 *ban = (BdrvAioNotifier){
3747 .attached_aio_context = attached_aio_context,
3748 .detach_aio_context = detach_aio_context,
3749 .opaque = opaque
3750 };
3751
3752 QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
3753 }
3754
3755 void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
3756 void (*attached_aio_context)(AioContext *,
3757 void *),
3758 void (*detach_aio_context)(void *),
3759 void *opaque)
3760 {
3761 BdrvAioNotifier *ban, *ban_next;
3762
3763 QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
3764 if (ban->attached_aio_context == attached_aio_context &&
3765 ban->detach_aio_context == detach_aio_context &&
3766 ban->opaque == opaque)
3767 {
3768 QLIST_REMOVE(ban, list);
3769 g_free(ban);
3770
3771 return;
3772 }
3773 }
3774
3775 abort();
3776 }
3777
3778 int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
3779 BlockDriverAmendStatusCB *status_cb, void *cb_opaque)
3780 {
3781 if (!bs->drv->bdrv_amend_options) {
3782 return -ENOTSUP;
3783 }
3784 return bs->drv->bdrv_amend_options(bs, opts, status_cb, cb_opaque);
3785 }
3786
3787 /* This function will be called by the bdrv_recurse_is_first_non_filter method
3788 * of block filter and by bdrv_is_first_non_filter.
3789 * It is used to test if the given bs is the candidate or recurse more in the
3790 * node graph.
3791 */
3792 bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
3793 BlockDriverState *candidate)
3794 {
3795 /* return false if basic checks fails */
3796 if (!bs || !bs->drv) {
3797 return false;
3798 }
3799
3800 /* the code reached a non block filter driver -> check if the bs is
3801 * the same as the candidate. It's the recursion termination condition.
3802 */
3803 if (!bs->drv->is_filter) {
3804 return bs == candidate;
3805 }
3806 /* Down this path the driver is a block filter driver */
3807
3808 /* If the block filter recursion method is defined use it to recurse down
3809 * the node graph.
3810 */
3811 if (bs->drv->bdrv_recurse_is_first_non_filter) {
3812 return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
3813 }
3814
3815 /* the driver is a block filter but don't allow to recurse -> return false
3816 */
3817 return false;
3818 }
3819
3820 /* This function checks if the candidate is the first non filter bs down it's
3821 * bs chain. Since we don't have pointers to parents it explore all bs chains
3822 * from the top. Some filters can choose not to pass down the recursion.
3823 */
3824 bool bdrv_is_first_non_filter(BlockDriverState *candidate)
3825 {
3826 BlockDriverState *bs = NULL;
3827
3828 /* walk down the bs forest recursively */
3829 while ((bs = bdrv_next(bs)) != NULL) {
3830 bool perm;
3831
3832 /* try to recurse in this top level bs */
3833 perm = bdrv_recurse_is_first_non_filter(bs, candidate);
3834
3835 /* candidate is the first non filter */
3836 if (perm) {
3837 return true;
3838 }
3839 }
3840
3841 return false;
3842 }
3843
3844 BlockDriverState *check_to_replace_node(BlockDriverState *parent_bs,
3845 const char *node_name, Error **errp)
3846 {
3847 BlockDriverState *to_replace_bs = bdrv_find_node(node_name);
3848 AioContext *aio_context;
3849
3850 if (!to_replace_bs) {
3851 error_setg(errp, "Node name '%s' not found", node_name);
3852 return NULL;
3853 }
3854
3855 aio_context = bdrv_get_aio_context(to_replace_bs);
3856 aio_context_acquire(aio_context);
3857
3858 if (bdrv_op_is_blocked(to_replace_bs, BLOCK_OP_TYPE_REPLACE, errp)) {
3859 to_replace_bs = NULL;
3860 goto out;
3861 }
3862
3863 /* We don't want arbitrary node of the BDS chain to be replaced only the top
3864 * most non filter in order to prevent data corruption.
3865 * Another benefit is that this tests exclude backing files which are
3866 * blocked by the backing blockers.
3867 */
3868 if (!bdrv_recurse_is_first_non_filter(parent_bs, to_replace_bs)) {
3869 error_setg(errp, "Only top most non filter can be replaced");
3870 to_replace_bs = NULL;
3871 goto out;
3872 }
3873
3874 out:
3875 aio_context_release(aio_context);
3876 return to_replace_bs;
3877 }
3878
3879 static bool append_open_options(QDict *d, BlockDriverState *bs)
3880 {
3881 const QDictEntry *entry;
3882 QemuOptDesc *desc;
3883 BdrvChild *child;
3884 bool found_any = false;
3885 const char *p;
3886
3887 for (entry = qdict_first(bs->options); entry;
3888 entry = qdict_next(bs->options, entry))
3889 {
3890 /* Exclude options for children */
3891 QLIST_FOREACH(child, &bs->children, next) {
3892 if (strstart(qdict_entry_key(entry), child->name, &p)
3893 && (!*p || *p == '.'))
3894 {
3895 break;
3896 }
3897 }
3898 if (child) {
3899 continue;
3900 }
3901
3902 /* And exclude all non-driver-specific options */
3903 for (desc = bdrv_runtime_opts.desc; desc->name; desc++) {
3904 if (!strcmp(qdict_entry_key(entry), desc->name)) {
3905 break;
3906 }
3907 }
3908 if (desc->name) {
3909 continue;
3910 }
3911
3912 qobject_incref(qdict_entry_value(entry));
3913 qdict_put_obj(d, qdict_entry_key(entry), qdict_entry_value(entry));
3914 found_any = true;
3915 }
3916
3917 return found_any;
3918 }
3919
3920 /* Updates the following BDS fields:
3921 * - exact_filename: A filename which may be used for opening a block device
3922 * which (mostly) equals the given BDS (even without any
3923 * other options; so reading and writing must return the same
3924 * results, but caching etc. may be different)
3925 * - full_open_options: Options which, when given when opening a block device
3926 * (without a filename), result in a BDS (mostly)
3927 * equalling the given one
3928 * - filename: If exact_filename is set, it is copied here. Otherwise,
3929 * full_open_options is converted to a JSON object, prefixed with
3930 * "json:" (for use through the JSON pseudo protocol) and put here.
3931 */
3932 void bdrv_refresh_filename(BlockDriverState *bs)
3933 {
3934 BlockDriver *drv = bs->drv;
3935 QDict *opts;
3936
3937 if (!drv) {
3938 return;
3939 }
3940
3941 /* This BDS's file name will most probably depend on its file's name, so
3942 * refresh that first */
3943 if (bs->file) {
3944 bdrv_refresh_filename(bs->file->bs);
3945 }
3946
3947 if (drv->bdrv_refresh_filename) {
3948 /* Obsolete information is of no use here, so drop the old file name
3949 * information before refreshing it */
3950 bs->exact_filename[0] = '\0';
3951 if (bs->full_open_options) {
3952 QDECREF(bs->full_open_options);
3953 bs->full_open_options = NULL;
3954 }
3955
3956 opts = qdict_new();
3957 append_open_options(opts, bs);
3958 drv->bdrv_refresh_filename(bs, opts);
3959 QDECREF(opts);
3960 } else if (bs->file) {
3961 /* Try to reconstruct valid information from the underlying file */
3962 bool has_open_options;
3963
3964 bs->exact_filename[0] = '\0';
3965 if (bs->full_open_options) {
3966 QDECREF(bs->full_open_options);
3967 bs->full_open_options = NULL;
3968 }
3969
3970 opts = qdict_new();
3971 has_open_options = append_open_options(opts, bs);
3972
3973 /* If no specific options have been given for this BDS, the filename of
3974 * the underlying file should suffice for this one as well */
3975 if (bs->file->bs->exact_filename[0] && !has_open_options) {
3976 strcpy(bs->exact_filename, bs->file->bs->exact_filename);
3977 }
3978 /* Reconstructing the full options QDict is simple for most format block
3979 * drivers, as long as the full options are known for the underlying
3980 * file BDS. The full options QDict of that file BDS should somehow
3981 * contain a representation of the filename, therefore the following
3982 * suffices without querying the (exact_)filename of this BDS. */
3983 if (bs->file->bs->full_open_options) {
3984 qdict_put_obj(opts, "driver",
3985 QOBJECT(qstring_from_str(drv->format_name)));
3986 QINCREF(bs->file->bs->full_open_options);
3987 qdict_put_obj(opts, "file",
3988 QOBJECT(bs->file->bs->full_open_options));
3989
3990 bs->full_open_options = opts;
3991 } else {
3992 QDECREF(opts);
3993 }
3994 } else if (!bs->full_open_options && qdict_size(bs->options)) {
3995 /* There is no underlying file BDS (at least referenced by BDS.file),
3996 * so the full options QDict should be equal to the options given
3997 * specifically for this block device when it was opened (plus the
3998 * driver specification).
3999 * Because those options don't change, there is no need to update
4000 * full_open_options when it's already set. */
4001
4002 opts = qdict_new();
4003 append_open_options(opts, bs);
4004 qdict_put_obj(opts, "driver",
4005 QOBJECT(qstring_from_str(drv->format_name)));
4006
4007 if (bs->exact_filename[0]) {
4008 /* This may not work for all block protocol drivers (some may
4009 * require this filename to be parsed), but we have to find some
4010 * default solution here, so just include it. If some block driver
4011 * does not support pure options without any filename at all or
4012 * needs some special format of the options QDict, it needs to
4013 * implement the driver-specific bdrv_refresh_filename() function.
4014 */
4015 qdict_put_obj(opts, "filename",
4016 QOBJECT(qstring_from_str(bs->exact_filename)));
4017 }
4018
4019 bs->full_open_options = opts;
4020 }
4021
4022 if (bs->exact_filename[0]) {
4023 pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
4024 } else if (bs->full_open_options) {
4025 QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
4026 snprintf(bs->filename, sizeof(bs->filename), "json:%s",
4027 qstring_get_str(json));
4028 QDECREF(json);
4029 }
4030 }