]> git.proxmox.com Git - qemu.git/blob - block.c
check for bs->drv in bdrv_flush (Christoph Hellwig)
[qemu.git] / block.c
1 /*
2 * QEMU System Emulator block driver
3 *
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24 #include "config-host.h"
25 #ifdef HOST_BSD
26 /* include native header before sys-queue.h */
27 #include <sys/queue.h>
28 #endif
29
30 #include "qemu-common.h"
31 #include "monitor.h"
32 #include "block_int.h"
33
34 #ifdef HOST_BSD
35 #include <sys/types.h>
36 #include <sys/stat.h>
37 #include <sys/ioctl.h>
38 #ifndef __DragonFly__
39 #include <sys/disk.h>
40 #endif
41 #endif
42
43 #ifdef _WIN32
44 #include <windows.h>
45 #endif
46
47 #define SECTOR_BITS 9
48 #define SECTOR_SIZE (1 << SECTOR_BITS)
49
50 static AIOPool vectored_aio_pool;
51
52 typedef struct BlockDriverAIOCBSync {
53 BlockDriverAIOCB common;
54 QEMUBH *bh;
55 int ret;
56 } BlockDriverAIOCBSync;
57
58 static BlockDriverAIOCB *bdrv_aio_read_em(BlockDriverState *bs,
59 int64_t sector_num, uint8_t *buf, int nb_sectors,
60 BlockDriverCompletionFunc *cb, void *opaque);
61 static BlockDriverAIOCB *bdrv_aio_write_em(BlockDriverState *bs,
62 int64_t sector_num, const uint8_t *buf, int nb_sectors,
63 BlockDriverCompletionFunc *cb, void *opaque);
64 static void bdrv_aio_cancel_em(BlockDriverAIOCB *acb);
65 static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
66 uint8_t *buf, int nb_sectors);
67 static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
68 const uint8_t *buf, int nb_sectors);
69
70 BlockDriverState *bdrv_first;
71
72 static BlockDriver *first_drv;
73
74 int path_is_absolute(const char *path)
75 {
76 const char *p;
77 #ifdef _WIN32
78 /* specific case for names like: "\\.\d:" */
79 if (*path == '/' || *path == '\\')
80 return 1;
81 #endif
82 p = strchr(path, ':');
83 if (p)
84 p++;
85 else
86 p = path;
87 #ifdef _WIN32
88 return (*p == '/' || *p == '\\');
89 #else
90 return (*p == '/');
91 #endif
92 }
93
94 /* if filename is absolute, just copy it to dest. Otherwise, build a
95 path to it by considering it is relative to base_path. URL are
96 supported. */
97 void path_combine(char *dest, int dest_size,
98 const char *base_path,
99 const char *filename)
100 {
101 const char *p, *p1;
102 int len;
103
104 if (dest_size <= 0)
105 return;
106 if (path_is_absolute(filename)) {
107 pstrcpy(dest, dest_size, filename);
108 } else {
109 p = strchr(base_path, ':');
110 if (p)
111 p++;
112 else
113 p = base_path;
114 p1 = strrchr(base_path, '/');
115 #ifdef _WIN32
116 {
117 const char *p2;
118 p2 = strrchr(base_path, '\\');
119 if (!p1 || p2 > p1)
120 p1 = p2;
121 }
122 #endif
123 if (p1)
124 p1++;
125 else
126 p1 = base_path;
127 if (p1 > p)
128 p = p1;
129 len = p - base_path;
130 if (len > dest_size - 1)
131 len = dest_size - 1;
132 memcpy(dest, base_path, len);
133 dest[len] = '\0';
134 pstrcat(dest, dest_size, filename);
135 }
136 }
137
138
139 static void bdrv_register(BlockDriver *bdrv)
140 {
141 if (!bdrv->bdrv_aio_read) {
142 /* add AIO emulation layer */
143 bdrv->bdrv_aio_read = bdrv_aio_read_em;
144 bdrv->bdrv_aio_write = bdrv_aio_write_em;
145 bdrv->bdrv_aio_cancel = bdrv_aio_cancel_em;
146 bdrv->aiocb_size = sizeof(BlockDriverAIOCBSync);
147 } else if (!bdrv->bdrv_read) {
148 /* add synchronous IO emulation layer */
149 bdrv->bdrv_read = bdrv_read_em;
150 bdrv->bdrv_write = bdrv_write_em;
151 }
152 aio_pool_init(&bdrv->aio_pool, bdrv->aiocb_size, bdrv->bdrv_aio_cancel);
153 bdrv->next = first_drv;
154 first_drv = bdrv;
155 }
156
157 /* create a new block device (by default it is empty) */
158 BlockDriverState *bdrv_new(const char *device_name)
159 {
160 BlockDriverState **pbs, *bs;
161
162 bs = qemu_mallocz(sizeof(BlockDriverState));
163 pstrcpy(bs->device_name, sizeof(bs->device_name), device_name);
164 if (device_name[0] != '\0') {
165 /* insert at the end */
166 pbs = &bdrv_first;
167 while (*pbs != NULL)
168 pbs = &(*pbs)->next;
169 *pbs = bs;
170 }
171 return bs;
172 }
173
174 BlockDriver *bdrv_find_format(const char *format_name)
175 {
176 BlockDriver *drv1;
177 for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
178 if (!strcmp(drv1->format_name, format_name))
179 return drv1;
180 }
181 return NULL;
182 }
183
184 int bdrv_create2(BlockDriver *drv,
185 const char *filename, int64_t size_in_sectors,
186 const char *backing_file, const char *backing_format,
187 int flags)
188 {
189 if (drv->bdrv_create2)
190 return drv->bdrv_create2(filename, size_in_sectors, backing_file,
191 backing_format, flags);
192 if (drv->bdrv_create)
193 return drv->bdrv_create(filename, size_in_sectors, backing_file,
194 flags);
195 return -ENOTSUP;
196 }
197
198 int bdrv_create(BlockDriver *drv,
199 const char *filename, int64_t size_in_sectors,
200 const char *backing_file, int flags)
201 {
202 if (!drv->bdrv_create)
203 return -ENOTSUP;
204 return drv->bdrv_create(filename, size_in_sectors, backing_file, flags);
205 }
206
207 #ifdef _WIN32
208 void get_tmp_filename(char *filename, int size)
209 {
210 char temp_dir[MAX_PATH];
211
212 GetTempPath(MAX_PATH, temp_dir);
213 GetTempFileName(temp_dir, "qem", 0, filename);
214 }
215 #else
216 void get_tmp_filename(char *filename, int size)
217 {
218 int fd;
219 const char *tmpdir;
220 /* XXX: race condition possible */
221 tmpdir = getenv("TMPDIR");
222 if (!tmpdir)
223 tmpdir = "/tmp";
224 snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
225 fd = mkstemp(filename);
226 close(fd);
227 }
228 #endif
229
230 #ifdef _WIN32
231 static int is_windows_drive_prefix(const char *filename)
232 {
233 return (((filename[0] >= 'a' && filename[0] <= 'z') ||
234 (filename[0] >= 'A' && filename[0] <= 'Z')) &&
235 filename[1] == ':');
236 }
237
238 static int is_windows_drive(const char *filename)
239 {
240 if (is_windows_drive_prefix(filename) &&
241 filename[2] == '\0')
242 return 1;
243 if (strstart(filename, "\\\\.\\", NULL) ||
244 strstart(filename, "//./", NULL))
245 return 1;
246 return 0;
247 }
248 #endif
249
250 static BlockDriver *find_protocol(const char *filename)
251 {
252 BlockDriver *drv1;
253 char protocol[128];
254 int len;
255 const char *p;
256
257 #ifdef _WIN32
258 if (is_windows_drive(filename) ||
259 is_windows_drive_prefix(filename))
260 return &bdrv_raw;
261 #endif
262 p = strchr(filename, ':');
263 if (!p)
264 return &bdrv_raw;
265 len = p - filename;
266 if (len > sizeof(protocol) - 1)
267 len = sizeof(protocol) - 1;
268 memcpy(protocol, filename, len);
269 protocol[len] = '\0';
270 for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
271 if (drv1->protocol_name &&
272 !strcmp(drv1->protocol_name, protocol))
273 return drv1;
274 }
275 return NULL;
276 }
277
278 /* XXX: force raw format if block or character device ? It would
279 simplify the BSD case */
280 static BlockDriver *find_image_format(const char *filename)
281 {
282 int ret, score, score_max;
283 BlockDriver *drv1, *drv;
284 uint8_t buf[2048];
285 BlockDriverState *bs;
286
287 /* detect host devices. By convention, /dev/cdrom[N] is always
288 recognized as a host CDROM */
289 if (strstart(filename, "/dev/cdrom", NULL))
290 return &bdrv_host_device;
291 #ifdef _WIN32
292 if (is_windows_drive(filename))
293 return &bdrv_host_device;
294 #else
295 {
296 struct stat st;
297 if (stat(filename, &st) >= 0 &&
298 (S_ISCHR(st.st_mode) || S_ISBLK(st.st_mode))) {
299 return &bdrv_host_device;
300 }
301 }
302 #endif
303
304 drv = find_protocol(filename);
305 /* no need to test disk image formats for vvfat */
306 if (drv == &bdrv_vvfat)
307 return drv;
308
309 ret = bdrv_file_open(&bs, filename, BDRV_O_RDONLY);
310 if (ret < 0)
311 return NULL;
312 ret = bdrv_pread(bs, 0, buf, sizeof(buf));
313 bdrv_delete(bs);
314 if (ret < 0) {
315 return NULL;
316 }
317
318 score_max = 0;
319 for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
320 if (drv1->bdrv_probe) {
321 score = drv1->bdrv_probe(buf, ret, filename);
322 if (score > score_max) {
323 score_max = score;
324 drv = drv1;
325 }
326 }
327 }
328 return drv;
329 }
330
331 int bdrv_file_open(BlockDriverState **pbs, const char *filename, int flags)
332 {
333 BlockDriverState *bs;
334 int ret;
335
336 bs = bdrv_new("");
337 ret = bdrv_open2(bs, filename, flags | BDRV_O_FILE, NULL);
338 if (ret < 0) {
339 bdrv_delete(bs);
340 return ret;
341 }
342 bs->growable = 1;
343 *pbs = bs;
344 return 0;
345 }
346
347 int bdrv_open(BlockDriverState *bs, const char *filename, int flags)
348 {
349 return bdrv_open2(bs, filename, flags, NULL);
350 }
351
352 int bdrv_open2(BlockDriverState *bs, const char *filename, int flags,
353 BlockDriver *drv)
354 {
355 int ret, open_flags;
356 char tmp_filename[PATH_MAX];
357 char backing_filename[PATH_MAX];
358
359 bs->read_only = 0;
360 bs->is_temporary = 0;
361 bs->encrypted = 0;
362 bs->valid_key = 0;
363
364 if (flags & BDRV_O_SNAPSHOT) {
365 BlockDriverState *bs1;
366 int64_t total_size;
367 int is_protocol = 0;
368
369 /* if snapshot, we create a temporary backing file and open it
370 instead of opening 'filename' directly */
371
372 /* if there is a backing file, use it */
373 bs1 = bdrv_new("");
374 ret = bdrv_open2(bs1, filename, 0, drv);
375 if (ret < 0) {
376 bdrv_delete(bs1);
377 return ret;
378 }
379 total_size = bdrv_getlength(bs1) >> SECTOR_BITS;
380
381 if (bs1->drv && bs1->drv->protocol_name)
382 is_protocol = 1;
383
384 bdrv_delete(bs1);
385
386 get_tmp_filename(tmp_filename, sizeof(tmp_filename));
387
388 /* Real path is meaningless for protocols */
389 if (is_protocol)
390 snprintf(backing_filename, sizeof(backing_filename),
391 "%s", filename);
392 else
393 realpath(filename, backing_filename);
394
395 ret = bdrv_create2(&bdrv_qcow2, tmp_filename,
396 total_size, backing_filename,
397 (drv ? drv->format_name : NULL), 0);
398 if (ret < 0) {
399 return ret;
400 }
401 filename = tmp_filename;
402 drv = &bdrv_qcow2;
403 bs->is_temporary = 1;
404 }
405
406 pstrcpy(bs->filename, sizeof(bs->filename), filename);
407 if (flags & BDRV_O_FILE) {
408 drv = find_protocol(filename);
409 } else if (!drv) {
410 drv = find_image_format(filename);
411 }
412 if (!drv) {
413 ret = -ENOENT;
414 goto unlink_and_fail;
415 }
416 bs->drv = drv;
417 bs->opaque = qemu_mallocz(drv->instance_size);
418 /* Note: for compatibility, we open disk image files as RDWR, and
419 RDONLY as fallback */
420 if (!(flags & BDRV_O_FILE))
421 open_flags = BDRV_O_RDWR | (flags & BDRV_O_CACHE_MASK);
422 else
423 open_flags = flags & ~(BDRV_O_FILE | BDRV_O_SNAPSHOT);
424 ret = drv->bdrv_open(bs, filename, open_flags);
425 if ((ret == -EACCES || ret == -EPERM) && !(flags & BDRV_O_FILE)) {
426 ret = drv->bdrv_open(bs, filename, open_flags & ~BDRV_O_RDWR);
427 bs->read_only = 1;
428 }
429 if (ret < 0) {
430 qemu_free(bs->opaque);
431 bs->opaque = NULL;
432 bs->drv = NULL;
433 unlink_and_fail:
434 if (bs->is_temporary)
435 unlink(filename);
436 return ret;
437 }
438 if (drv->bdrv_getlength) {
439 bs->total_sectors = bdrv_getlength(bs) >> SECTOR_BITS;
440 }
441 #ifndef _WIN32
442 if (bs->is_temporary) {
443 unlink(filename);
444 }
445 #endif
446 if (bs->backing_file[0] != '\0') {
447 /* if there is a backing file, use it */
448 BlockDriver *back_drv = NULL;
449 bs->backing_hd = bdrv_new("");
450 path_combine(backing_filename, sizeof(backing_filename),
451 filename, bs->backing_file);
452 if (bs->backing_format[0] != '\0')
453 back_drv = bdrv_find_format(bs->backing_format);
454 ret = bdrv_open2(bs->backing_hd, backing_filename, open_flags,
455 back_drv);
456 if (ret < 0) {
457 bdrv_close(bs);
458 return ret;
459 }
460 }
461
462 if (!bdrv_key_required(bs)) {
463 /* call the change callback */
464 bs->media_changed = 1;
465 if (bs->change_cb)
466 bs->change_cb(bs->change_opaque);
467 }
468 return 0;
469 }
470
471 void bdrv_close(BlockDriverState *bs)
472 {
473 if (bs->drv) {
474 if (bs->backing_hd)
475 bdrv_delete(bs->backing_hd);
476 bs->drv->bdrv_close(bs);
477 qemu_free(bs->opaque);
478 #ifdef _WIN32
479 if (bs->is_temporary) {
480 unlink(bs->filename);
481 }
482 #endif
483 bs->opaque = NULL;
484 bs->drv = NULL;
485
486 /* call the change callback */
487 bs->media_changed = 1;
488 if (bs->change_cb)
489 bs->change_cb(bs->change_opaque);
490 }
491 }
492
493 void bdrv_delete(BlockDriverState *bs)
494 {
495 BlockDriverState **pbs;
496
497 pbs = &bdrv_first;
498 while (*pbs != bs && *pbs != NULL)
499 pbs = &(*pbs)->next;
500 if (*pbs == bs)
501 *pbs = bs->next;
502
503 bdrv_close(bs);
504 qemu_free(bs);
505 }
506
507 /* commit COW file into the raw image */
508 int bdrv_commit(BlockDriverState *bs)
509 {
510 BlockDriver *drv = bs->drv;
511 int64_t i, total_sectors;
512 int n, j;
513 unsigned char sector[512];
514
515 if (!drv)
516 return -ENOMEDIUM;
517
518 if (bs->read_only) {
519 return -EACCES;
520 }
521
522 if (!bs->backing_hd) {
523 return -ENOTSUP;
524 }
525
526 total_sectors = bdrv_getlength(bs) >> SECTOR_BITS;
527 for (i = 0; i < total_sectors;) {
528 if (drv->bdrv_is_allocated(bs, i, 65536, &n)) {
529 for(j = 0; j < n; j++) {
530 if (bdrv_read(bs, i, sector, 1) != 0) {
531 return -EIO;
532 }
533
534 if (bdrv_write(bs->backing_hd, i, sector, 1) != 0) {
535 return -EIO;
536 }
537 i++;
538 }
539 } else {
540 i += n;
541 }
542 }
543
544 if (drv->bdrv_make_empty)
545 return drv->bdrv_make_empty(bs);
546
547 return 0;
548 }
549
550 static int bdrv_check_byte_request(BlockDriverState *bs, int64_t offset,
551 size_t size)
552 {
553 int64_t len;
554
555 if (!bdrv_is_inserted(bs))
556 return -ENOMEDIUM;
557
558 if (bs->growable)
559 return 0;
560
561 len = bdrv_getlength(bs);
562
563 if ((offset + size) > len)
564 return -EIO;
565
566 return 0;
567 }
568
569 static int bdrv_check_request(BlockDriverState *bs, int64_t sector_num,
570 int nb_sectors)
571 {
572 return bdrv_check_byte_request(bs, sector_num * 512, nb_sectors * 512);
573 }
574
575 /* return < 0 if error. See bdrv_write() for the return codes */
576 int bdrv_read(BlockDriverState *bs, int64_t sector_num,
577 uint8_t *buf, int nb_sectors)
578 {
579 BlockDriver *drv = bs->drv;
580
581 if (!drv)
582 return -ENOMEDIUM;
583 if (bdrv_check_request(bs, sector_num, nb_sectors))
584 return -EIO;
585
586 return drv->bdrv_read(bs, sector_num, buf, nb_sectors);
587 }
588
589 /* Return < 0 if error. Important errors are:
590 -EIO generic I/O error (may happen for all errors)
591 -ENOMEDIUM No media inserted.
592 -EINVAL Invalid sector number or nb_sectors
593 -EACCES Trying to write a read-only device
594 */
595 int bdrv_write(BlockDriverState *bs, int64_t sector_num,
596 const uint8_t *buf, int nb_sectors)
597 {
598 BlockDriver *drv = bs->drv;
599 if (!bs->drv)
600 return -ENOMEDIUM;
601 if (bs->read_only)
602 return -EACCES;
603 if (bdrv_check_request(bs, sector_num, nb_sectors))
604 return -EIO;
605
606 return drv->bdrv_write(bs, sector_num, buf, nb_sectors);
607 }
608
609 int bdrv_pread(BlockDriverState *bs, int64_t offset,
610 void *buf, int count1)
611 {
612 uint8_t tmp_buf[SECTOR_SIZE];
613 int len, nb_sectors, count;
614 int64_t sector_num;
615
616 count = count1;
617 /* first read to align to sector start */
618 len = (SECTOR_SIZE - offset) & (SECTOR_SIZE - 1);
619 if (len > count)
620 len = count;
621 sector_num = offset >> SECTOR_BITS;
622 if (len > 0) {
623 if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
624 return -EIO;
625 memcpy(buf, tmp_buf + (offset & (SECTOR_SIZE - 1)), len);
626 count -= len;
627 if (count == 0)
628 return count1;
629 sector_num++;
630 buf += len;
631 }
632
633 /* read the sectors "in place" */
634 nb_sectors = count >> SECTOR_BITS;
635 if (nb_sectors > 0) {
636 if (bdrv_read(bs, sector_num, buf, nb_sectors) < 0)
637 return -EIO;
638 sector_num += nb_sectors;
639 len = nb_sectors << SECTOR_BITS;
640 buf += len;
641 count -= len;
642 }
643
644 /* add data from the last sector */
645 if (count > 0) {
646 if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
647 return -EIO;
648 memcpy(buf, tmp_buf, count);
649 }
650 return count1;
651 }
652
653 int bdrv_pwrite(BlockDriverState *bs, int64_t offset,
654 const void *buf, int count1)
655 {
656 uint8_t tmp_buf[SECTOR_SIZE];
657 int len, nb_sectors, count;
658 int64_t sector_num;
659
660 count = count1;
661 /* first write to align to sector start */
662 len = (SECTOR_SIZE - offset) & (SECTOR_SIZE - 1);
663 if (len > count)
664 len = count;
665 sector_num = offset >> SECTOR_BITS;
666 if (len > 0) {
667 if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
668 return -EIO;
669 memcpy(tmp_buf + (offset & (SECTOR_SIZE - 1)), buf, len);
670 if (bdrv_write(bs, sector_num, tmp_buf, 1) < 0)
671 return -EIO;
672 count -= len;
673 if (count == 0)
674 return count1;
675 sector_num++;
676 buf += len;
677 }
678
679 /* write the sectors "in place" */
680 nb_sectors = count >> SECTOR_BITS;
681 if (nb_sectors > 0) {
682 if (bdrv_write(bs, sector_num, buf, nb_sectors) < 0)
683 return -EIO;
684 sector_num += nb_sectors;
685 len = nb_sectors << SECTOR_BITS;
686 buf += len;
687 count -= len;
688 }
689
690 /* add data from the last sector */
691 if (count > 0) {
692 if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
693 return -EIO;
694 memcpy(tmp_buf, buf, count);
695 if (bdrv_write(bs, sector_num, tmp_buf, 1) < 0)
696 return -EIO;
697 }
698 return count1;
699 }
700
701 /**
702 * Truncate file to 'offset' bytes (needed only for file protocols)
703 */
704 int bdrv_truncate(BlockDriverState *bs, int64_t offset)
705 {
706 BlockDriver *drv = bs->drv;
707 if (!drv)
708 return -ENOMEDIUM;
709 if (!drv->bdrv_truncate)
710 return -ENOTSUP;
711 return drv->bdrv_truncate(bs, offset);
712 }
713
714 /**
715 * Length of a file in bytes. Return < 0 if error or unknown.
716 */
717 int64_t bdrv_getlength(BlockDriverState *bs)
718 {
719 BlockDriver *drv = bs->drv;
720 if (!drv)
721 return -ENOMEDIUM;
722 if (!drv->bdrv_getlength) {
723 /* legacy mode */
724 return bs->total_sectors * SECTOR_SIZE;
725 }
726 return drv->bdrv_getlength(bs);
727 }
728
729 /* return 0 as number of sectors if no device present or error */
730 void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
731 {
732 int64_t length;
733 length = bdrv_getlength(bs);
734 if (length < 0)
735 length = 0;
736 else
737 length = length >> SECTOR_BITS;
738 *nb_sectors_ptr = length;
739 }
740
741 struct partition {
742 uint8_t boot_ind; /* 0x80 - active */
743 uint8_t head; /* starting head */
744 uint8_t sector; /* starting sector */
745 uint8_t cyl; /* starting cylinder */
746 uint8_t sys_ind; /* What partition type */
747 uint8_t end_head; /* end head */
748 uint8_t end_sector; /* end sector */
749 uint8_t end_cyl; /* end cylinder */
750 uint32_t start_sect; /* starting sector counting from 0 */
751 uint32_t nr_sects; /* nr of sectors in partition */
752 } __attribute__((packed));
753
754 /* try to guess the disk logical geometry from the MSDOS partition table. Return 0 if OK, -1 if could not guess */
755 static int guess_disk_lchs(BlockDriverState *bs,
756 int *pcylinders, int *pheads, int *psectors)
757 {
758 uint8_t buf[512];
759 int ret, i, heads, sectors, cylinders;
760 struct partition *p;
761 uint32_t nr_sects;
762 uint64_t nb_sectors;
763
764 bdrv_get_geometry(bs, &nb_sectors);
765
766 ret = bdrv_read(bs, 0, buf, 1);
767 if (ret < 0)
768 return -1;
769 /* test msdos magic */
770 if (buf[510] != 0x55 || buf[511] != 0xaa)
771 return -1;
772 for(i = 0; i < 4; i++) {
773 p = ((struct partition *)(buf + 0x1be)) + i;
774 nr_sects = le32_to_cpu(p->nr_sects);
775 if (nr_sects && p->end_head) {
776 /* We make the assumption that the partition terminates on
777 a cylinder boundary */
778 heads = p->end_head + 1;
779 sectors = p->end_sector & 63;
780 if (sectors == 0)
781 continue;
782 cylinders = nb_sectors / (heads * sectors);
783 if (cylinders < 1 || cylinders > 16383)
784 continue;
785 *pheads = heads;
786 *psectors = sectors;
787 *pcylinders = cylinders;
788 #if 0
789 printf("guessed geometry: LCHS=%d %d %d\n",
790 cylinders, heads, sectors);
791 #endif
792 return 0;
793 }
794 }
795 return -1;
796 }
797
798 void bdrv_guess_geometry(BlockDriverState *bs, int *pcyls, int *pheads, int *psecs)
799 {
800 int translation, lba_detected = 0;
801 int cylinders, heads, secs;
802 uint64_t nb_sectors;
803
804 /* if a geometry hint is available, use it */
805 bdrv_get_geometry(bs, &nb_sectors);
806 bdrv_get_geometry_hint(bs, &cylinders, &heads, &secs);
807 translation = bdrv_get_translation_hint(bs);
808 if (cylinders != 0) {
809 *pcyls = cylinders;
810 *pheads = heads;
811 *psecs = secs;
812 } else {
813 if (guess_disk_lchs(bs, &cylinders, &heads, &secs) == 0) {
814 if (heads > 16) {
815 /* if heads > 16, it means that a BIOS LBA
816 translation was active, so the default
817 hardware geometry is OK */
818 lba_detected = 1;
819 goto default_geometry;
820 } else {
821 *pcyls = cylinders;
822 *pheads = heads;
823 *psecs = secs;
824 /* disable any translation to be in sync with
825 the logical geometry */
826 if (translation == BIOS_ATA_TRANSLATION_AUTO) {
827 bdrv_set_translation_hint(bs,
828 BIOS_ATA_TRANSLATION_NONE);
829 }
830 }
831 } else {
832 default_geometry:
833 /* if no geometry, use a standard physical disk geometry */
834 cylinders = nb_sectors / (16 * 63);
835
836 if (cylinders > 16383)
837 cylinders = 16383;
838 else if (cylinders < 2)
839 cylinders = 2;
840 *pcyls = cylinders;
841 *pheads = 16;
842 *psecs = 63;
843 if ((lba_detected == 1) && (translation == BIOS_ATA_TRANSLATION_AUTO)) {
844 if ((*pcyls * *pheads) <= 131072) {
845 bdrv_set_translation_hint(bs,
846 BIOS_ATA_TRANSLATION_LARGE);
847 } else {
848 bdrv_set_translation_hint(bs,
849 BIOS_ATA_TRANSLATION_LBA);
850 }
851 }
852 }
853 bdrv_set_geometry_hint(bs, *pcyls, *pheads, *psecs);
854 }
855 }
856
857 void bdrv_set_geometry_hint(BlockDriverState *bs,
858 int cyls, int heads, int secs)
859 {
860 bs->cyls = cyls;
861 bs->heads = heads;
862 bs->secs = secs;
863 }
864
865 void bdrv_set_type_hint(BlockDriverState *bs, int type)
866 {
867 bs->type = type;
868 bs->removable = ((type == BDRV_TYPE_CDROM ||
869 type == BDRV_TYPE_FLOPPY));
870 }
871
872 void bdrv_set_translation_hint(BlockDriverState *bs, int translation)
873 {
874 bs->translation = translation;
875 }
876
877 void bdrv_get_geometry_hint(BlockDriverState *bs,
878 int *pcyls, int *pheads, int *psecs)
879 {
880 *pcyls = bs->cyls;
881 *pheads = bs->heads;
882 *psecs = bs->secs;
883 }
884
885 int bdrv_get_type_hint(BlockDriverState *bs)
886 {
887 return bs->type;
888 }
889
890 int bdrv_get_translation_hint(BlockDriverState *bs)
891 {
892 return bs->translation;
893 }
894
895 int bdrv_is_removable(BlockDriverState *bs)
896 {
897 return bs->removable;
898 }
899
900 int bdrv_is_read_only(BlockDriverState *bs)
901 {
902 return bs->read_only;
903 }
904
905 int bdrv_is_sg(BlockDriverState *bs)
906 {
907 return bs->sg;
908 }
909
910 /* XXX: no longer used */
911 void bdrv_set_change_cb(BlockDriverState *bs,
912 void (*change_cb)(void *opaque), void *opaque)
913 {
914 bs->change_cb = change_cb;
915 bs->change_opaque = opaque;
916 }
917
918 int bdrv_is_encrypted(BlockDriverState *bs)
919 {
920 if (bs->backing_hd && bs->backing_hd->encrypted)
921 return 1;
922 return bs->encrypted;
923 }
924
925 int bdrv_key_required(BlockDriverState *bs)
926 {
927 BlockDriverState *backing_hd = bs->backing_hd;
928
929 if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key)
930 return 1;
931 return (bs->encrypted && !bs->valid_key);
932 }
933
934 int bdrv_set_key(BlockDriverState *bs, const char *key)
935 {
936 int ret;
937 if (bs->backing_hd && bs->backing_hd->encrypted) {
938 ret = bdrv_set_key(bs->backing_hd, key);
939 if (ret < 0)
940 return ret;
941 if (!bs->encrypted)
942 return 0;
943 }
944 if (!bs->encrypted || !bs->drv || !bs->drv->bdrv_set_key)
945 return -1;
946 ret = bs->drv->bdrv_set_key(bs, key);
947 if (ret < 0) {
948 bs->valid_key = 0;
949 } else if (!bs->valid_key) {
950 bs->valid_key = 1;
951 /* call the change callback now, we skipped it on open */
952 bs->media_changed = 1;
953 if (bs->change_cb)
954 bs->change_cb(bs->change_opaque);
955 }
956 return ret;
957 }
958
959 void bdrv_get_format(BlockDriverState *bs, char *buf, int buf_size)
960 {
961 if (!bs->drv) {
962 buf[0] = '\0';
963 } else {
964 pstrcpy(buf, buf_size, bs->drv->format_name);
965 }
966 }
967
968 void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
969 void *opaque)
970 {
971 BlockDriver *drv;
972
973 for (drv = first_drv; drv != NULL; drv = drv->next) {
974 it(opaque, drv->format_name);
975 }
976 }
977
978 BlockDriverState *bdrv_find(const char *name)
979 {
980 BlockDriverState *bs;
981
982 for (bs = bdrv_first; bs != NULL; bs = bs->next) {
983 if (!strcmp(name, bs->device_name))
984 return bs;
985 }
986 return NULL;
987 }
988
989 void bdrv_iterate(void (*it)(void *opaque, BlockDriverState *bs), void *opaque)
990 {
991 BlockDriverState *bs;
992
993 for (bs = bdrv_first; bs != NULL; bs = bs->next) {
994 it(opaque, bs);
995 }
996 }
997
998 const char *bdrv_get_device_name(BlockDriverState *bs)
999 {
1000 return bs->device_name;
1001 }
1002
1003 void bdrv_flush(BlockDriverState *bs)
1004 {
1005 if (!bs->drv)
1006 return;
1007 if (bs->drv->bdrv_flush)
1008 bs->drv->bdrv_flush(bs);
1009 if (bs->backing_hd)
1010 bdrv_flush(bs->backing_hd);
1011 }
1012
1013 void bdrv_flush_all(void)
1014 {
1015 BlockDriverState *bs;
1016
1017 for (bs = bdrv_first; bs != NULL; bs = bs->next)
1018 if (bs->drv && !bdrv_is_read_only(bs) &&
1019 (!bdrv_is_removable(bs) || bdrv_is_inserted(bs)))
1020 bdrv_flush(bs);
1021 }
1022
1023 /*
1024 * Returns true iff the specified sector is present in the disk image. Drivers
1025 * not implementing the functionality are assumed to not support backing files,
1026 * hence all their sectors are reported as allocated.
1027 *
1028 * 'pnum' is set to the number of sectors (including and immediately following
1029 * the specified sector) that are known to be in the same
1030 * allocated/unallocated state.
1031 *
1032 * 'nb_sectors' is the max value 'pnum' should be set to.
1033 */
1034 int bdrv_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors,
1035 int *pnum)
1036 {
1037 int64_t n;
1038 if (!bs->drv->bdrv_is_allocated) {
1039 if (sector_num >= bs->total_sectors) {
1040 *pnum = 0;
1041 return 0;
1042 }
1043 n = bs->total_sectors - sector_num;
1044 *pnum = (n < nb_sectors) ? (n) : (nb_sectors);
1045 return 1;
1046 }
1047 return bs->drv->bdrv_is_allocated(bs, sector_num, nb_sectors, pnum);
1048 }
1049
1050 void bdrv_info(Monitor *mon)
1051 {
1052 BlockDriverState *bs;
1053
1054 for (bs = bdrv_first; bs != NULL; bs = bs->next) {
1055 monitor_printf(mon, "%s:", bs->device_name);
1056 monitor_printf(mon, " type=");
1057 switch(bs->type) {
1058 case BDRV_TYPE_HD:
1059 monitor_printf(mon, "hd");
1060 break;
1061 case BDRV_TYPE_CDROM:
1062 monitor_printf(mon, "cdrom");
1063 break;
1064 case BDRV_TYPE_FLOPPY:
1065 monitor_printf(mon, "floppy");
1066 break;
1067 }
1068 monitor_printf(mon, " removable=%d", bs->removable);
1069 if (bs->removable) {
1070 monitor_printf(mon, " locked=%d", bs->locked);
1071 }
1072 if (bs->drv) {
1073 monitor_printf(mon, " file=");
1074 monitor_print_filename(mon, bs->filename);
1075 if (bs->backing_file[0] != '\0') {
1076 monitor_printf(mon, " backing_file=");
1077 monitor_print_filename(mon, bs->backing_file);
1078 }
1079 monitor_printf(mon, " ro=%d", bs->read_only);
1080 monitor_printf(mon, " drv=%s", bs->drv->format_name);
1081 monitor_printf(mon, " encrypted=%d", bdrv_is_encrypted(bs));
1082 } else {
1083 monitor_printf(mon, " [not inserted]");
1084 }
1085 monitor_printf(mon, "\n");
1086 }
1087 }
1088
1089 /* The "info blockstats" command. */
1090 void bdrv_info_stats(Monitor *mon)
1091 {
1092 BlockDriverState *bs;
1093
1094 for (bs = bdrv_first; bs != NULL; bs = bs->next) {
1095 monitor_printf(mon, "%s:"
1096 " rd_bytes=%" PRIu64
1097 " wr_bytes=%" PRIu64
1098 " rd_operations=%" PRIu64
1099 " wr_operations=%" PRIu64
1100 "\n",
1101 bs->device_name,
1102 bs->rd_bytes, bs->wr_bytes,
1103 bs->rd_ops, bs->wr_ops);
1104 }
1105 }
1106
1107 const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
1108 {
1109 if (bs->backing_hd && bs->backing_hd->encrypted)
1110 return bs->backing_file;
1111 else if (bs->encrypted)
1112 return bs->filename;
1113 else
1114 return NULL;
1115 }
1116
1117 void bdrv_get_backing_filename(BlockDriverState *bs,
1118 char *filename, int filename_size)
1119 {
1120 if (!bs->backing_hd) {
1121 pstrcpy(filename, filename_size, "");
1122 } else {
1123 pstrcpy(filename, filename_size, bs->backing_file);
1124 }
1125 }
1126
1127 int bdrv_write_compressed(BlockDriverState *bs, int64_t sector_num,
1128 const uint8_t *buf, int nb_sectors)
1129 {
1130 BlockDriver *drv = bs->drv;
1131 if (!drv)
1132 return -ENOMEDIUM;
1133 if (!drv->bdrv_write_compressed)
1134 return -ENOTSUP;
1135 return drv->bdrv_write_compressed(bs, sector_num, buf, nb_sectors);
1136 }
1137
1138 int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
1139 {
1140 BlockDriver *drv = bs->drv;
1141 if (!drv)
1142 return -ENOMEDIUM;
1143 if (!drv->bdrv_get_info)
1144 return -ENOTSUP;
1145 memset(bdi, 0, sizeof(*bdi));
1146 return drv->bdrv_get_info(bs, bdi);
1147 }
1148
1149 /**************************************************************/
1150 /* handling of snapshots */
1151
1152 int bdrv_snapshot_create(BlockDriverState *bs,
1153 QEMUSnapshotInfo *sn_info)
1154 {
1155 BlockDriver *drv = bs->drv;
1156 if (!drv)
1157 return -ENOMEDIUM;
1158 if (!drv->bdrv_snapshot_create)
1159 return -ENOTSUP;
1160 return drv->bdrv_snapshot_create(bs, sn_info);
1161 }
1162
1163 int bdrv_snapshot_goto(BlockDriverState *bs,
1164 const char *snapshot_id)
1165 {
1166 BlockDriver *drv = bs->drv;
1167 if (!drv)
1168 return -ENOMEDIUM;
1169 if (!drv->bdrv_snapshot_goto)
1170 return -ENOTSUP;
1171 return drv->bdrv_snapshot_goto(bs, snapshot_id);
1172 }
1173
1174 int bdrv_snapshot_delete(BlockDriverState *bs, const char *snapshot_id)
1175 {
1176 BlockDriver *drv = bs->drv;
1177 if (!drv)
1178 return -ENOMEDIUM;
1179 if (!drv->bdrv_snapshot_delete)
1180 return -ENOTSUP;
1181 return drv->bdrv_snapshot_delete(bs, snapshot_id);
1182 }
1183
1184 int bdrv_snapshot_list(BlockDriverState *bs,
1185 QEMUSnapshotInfo **psn_info)
1186 {
1187 BlockDriver *drv = bs->drv;
1188 if (!drv)
1189 return -ENOMEDIUM;
1190 if (!drv->bdrv_snapshot_list)
1191 return -ENOTSUP;
1192 return drv->bdrv_snapshot_list(bs, psn_info);
1193 }
1194
1195 #define NB_SUFFIXES 4
1196
1197 char *get_human_readable_size(char *buf, int buf_size, int64_t size)
1198 {
1199 static const char suffixes[NB_SUFFIXES] = "KMGT";
1200 int64_t base;
1201 int i;
1202
1203 if (size <= 999) {
1204 snprintf(buf, buf_size, "%" PRId64, size);
1205 } else {
1206 base = 1024;
1207 for(i = 0; i < NB_SUFFIXES; i++) {
1208 if (size < (10 * base)) {
1209 snprintf(buf, buf_size, "%0.1f%c",
1210 (double)size / base,
1211 suffixes[i]);
1212 break;
1213 } else if (size < (1000 * base) || i == (NB_SUFFIXES - 1)) {
1214 snprintf(buf, buf_size, "%" PRId64 "%c",
1215 ((size + (base >> 1)) / base),
1216 suffixes[i]);
1217 break;
1218 }
1219 base = base * 1024;
1220 }
1221 }
1222 return buf;
1223 }
1224
1225 char *bdrv_snapshot_dump(char *buf, int buf_size, QEMUSnapshotInfo *sn)
1226 {
1227 char buf1[128], date_buf[128], clock_buf[128];
1228 #ifdef _WIN32
1229 struct tm *ptm;
1230 #else
1231 struct tm tm;
1232 #endif
1233 time_t ti;
1234 int64_t secs;
1235
1236 if (!sn) {
1237 snprintf(buf, buf_size,
1238 "%-10s%-20s%7s%20s%15s",
1239 "ID", "TAG", "VM SIZE", "DATE", "VM CLOCK");
1240 } else {
1241 ti = sn->date_sec;
1242 #ifdef _WIN32
1243 ptm = localtime(&ti);
1244 strftime(date_buf, sizeof(date_buf),
1245 "%Y-%m-%d %H:%M:%S", ptm);
1246 #else
1247 localtime_r(&ti, &tm);
1248 strftime(date_buf, sizeof(date_buf),
1249 "%Y-%m-%d %H:%M:%S", &tm);
1250 #endif
1251 secs = sn->vm_clock_nsec / 1000000000;
1252 snprintf(clock_buf, sizeof(clock_buf),
1253 "%02d:%02d:%02d.%03d",
1254 (int)(secs / 3600),
1255 (int)((secs / 60) % 60),
1256 (int)(secs % 60),
1257 (int)((sn->vm_clock_nsec / 1000000) % 1000));
1258 snprintf(buf, buf_size,
1259 "%-10s%-20s%7s%20s%15s",
1260 sn->id_str, sn->name,
1261 get_human_readable_size(buf1, sizeof(buf1), sn->vm_state_size),
1262 date_buf,
1263 clock_buf);
1264 }
1265 return buf;
1266 }
1267
1268
1269 /**************************************************************/
1270 /* async I/Os */
1271
1272 typedef struct VectorTranslationAIOCB {
1273 BlockDriverAIOCB common;
1274 QEMUIOVector *iov;
1275 uint8_t *bounce;
1276 int is_write;
1277 BlockDriverAIOCB *aiocb;
1278 } VectorTranslationAIOCB;
1279
1280 static void bdrv_aio_cancel_vector(BlockDriverAIOCB *_acb)
1281 {
1282 VectorTranslationAIOCB *acb
1283 = container_of(_acb, VectorTranslationAIOCB, common);
1284
1285 bdrv_aio_cancel(acb->aiocb);
1286 }
1287
1288 static void bdrv_aio_rw_vector_cb(void *opaque, int ret)
1289 {
1290 VectorTranslationAIOCB *s = (VectorTranslationAIOCB *)opaque;
1291
1292 if (!s->is_write) {
1293 qemu_iovec_from_buffer(s->iov, s->bounce, s->iov->size);
1294 }
1295 qemu_vfree(s->bounce);
1296 s->common.cb(s->common.opaque, ret);
1297 qemu_aio_release(s);
1298 }
1299
1300 static BlockDriverAIOCB *bdrv_aio_rw_vector(BlockDriverState *bs,
1301 int64_t sector_num,
1302 QEMUIOVector *iov,
1303 int nb_sectors,
1304 BlockDriverCompletionFunc *cb,
1305 void *opaque,
1306 int is_write)
1307
1308 {
1309 VectorTranslationAIOCB *s = qemu_aio_get_pool(&vectored_aio_pool, bs,
1310 cb, opaque);
1311
1312 s->iov = iov;
1313 s->bounce = qemu_memalign(512, nb_sectors * 512);
1314 s->is_write = is_write;
1315 if (is_write) {
1316 qemu_iovec_to_buffer(s->iov, s->bounce);
1317 s->aiocb = bdrv_aio_write(bs, sector_num, s->bounce, nb_sectors,
1318 bdrv_aio_rw_vector_cb, s);
1319 } else {
1320 s->aiocb = bdrv_aio_read(bs, sector_num, s->bounce, nb_sectors,
1321 bdrv_aio_rw_vector_cb, s);
1322 }
1323 if (!s->aiocb) {
1324 qemu_vfree(s->bounce);
1325 qemu_aio_release(s);
1326 return NULL;
1327 }
1328 return &s->common;
1329 }
1330
1331 BlockDriverAIOCB *bdrv_aio_readv(BlockDriverState *bs, int64_t sector_num,
1332 QEMUIOVector *iov, int nb_sectors,
1333 BlockDriverCompletionFunc *cb, void *opaque)
1334 {
1335 if (bdrv_check_request(bs, sector_num, nb_sectors))
1336 return NULL;
1337
1338 return bdrv_aio_rw_vector(bs, sector_num, iov, nb_sectors,
1339 cb, opaque, 0);
1340 }
1341
1342 BlockDriverAIOCB *bdrv_aio_writev(BlockDriverState *bs, int64_t sector_num,
1343 QEMUIOVector *iov, int nb_sectors,
1344 BlockDriverCompletionFunc *cb, void *opaque)
1345 {
1346 if (bdrv_check_request(bs, sector_num, nb_sectors))
1347 return NULL;
1348
1349 return bdrv_aio_rw_vector(bs, sector_num, iov, nb_sectors,
1350 cb, opaque, 1);
1351 }
1352
1353 BlockDriverAIOCB *bdrv_aio_read(BlockDriverState *bs, int64_t sector_num,
1354 uint8_t *buf, int nb_sectors,
1355 BlockDriverCompletionFunc *cb, void *opaque)
1356 {
1357 BlockDriver *drv = bs->drv;
1358 BlockDriverAIOCB *ret;
1359
1360 if (!drv)
1361 return NULL;
1362 if (bdrv_check_request(bs, sector_num, nb_sectors))
1363 return NULL;
1364
1365 ret = drv->bdrv_aio_read(bs, sector_num, buf, nb_sectors, cb, opaque);
1366
1367 if (ret) {
1368 /* Update stats even though technically transfer has not happened. */
1369 bs->rd_bytes += (unsigned) nb_sectors * SECTOR_SIZE;
1370 bs->rd_ops ++;
1371 }
1372
1373 return ret;
1374 }
1375
1376 BlockDriverAIOCB *bdrv_aio_write(BlockDriverState *bs, int64_t sector_num,
1377 const uint8_t *buf, int nb_sectors,
1378 BlockDriverCompletionFunc *cb, void *opaque)
1379 {
1380 BlockDriver *drv = bs->drv;
1381 BlockDriverAIOCB *ret;
1382
1383 if (!drv)
1384 return NULL;
1385 if (bs->read_only)
1386 return NULL;
1387 if (bdrv_check_request(bs, sector_num, nb_sectors))
1388 return NULL;
1389
1390 ret = drv->bdrv_aio_write(bs, sector_num, buf, nb_sectors, cb, opaque);
1391
1392 if (ret) {
1393 /* Update stats even though technically transfer has not happened. */
1394 bs->wr_bytes += (unsigned) nb_sectors * SECTOR_SIZE;
1395 bs->wr_ops ++;
1396 }
1397
1398 return ret;
1399 }
1400
1401 void bdrv_aio_cancel(BlockDriverAIOCB *acb)
1402 {
1403 acb->pool->cancel(acb);
1404 }
1405
1406
1407 /**************************************************************/
1408 /* async block device emulation */
1409
1410 static void bdrv_aio_bh_cb(void *opaque)
1411 {
1412 BlockDriverAIOCBSync *acb = opaque;
1413 acb->common.cb(acb->common.opaque, acb->ret);
1414 qemu_aio_release(acb);
1415 }
1416
1417 static BlockDriverAIOCB *bdrv_aio_read_em(BlockDriverState *bs,
1418 int64_t sector_num, uint8_t *buf, int nb_sectors,
1419 BlockDriverCompletionFunc *cb, void *opaque)
1420 {
1421 BlockDriverAIOCBSync *acb;
1422 int ret;
1423
1424 acb = qemu_aio_get(bs, cb, opaque);
1425 if (!acb->bh)
1426 acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
1427 ret = bdrv_read(bs, sector_num, buf, nb_sectors);
1428 acb->ret = ret;
1429 qemu_bh_schedule(acb->bh);
1430 return &acb->common;
1431 }
1432
1433 static BlockDriverAIOCB *bdrv_aio_write_em(BlockDriverState *bs,
1434 int64_t sector_num, const uint8_t *buf, int nb_sectors,
1435 BlockDriverCompletionFunc *cb, void *opaque)
1436 {
1437 BlockDriverAIOCBSync *acb;
1438 int ret;
1439
1440 acb = qemu_aio_get(bs, cb, opaque);
1441 if (!acb->bh)
1442 acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
1443 ret = bdrv_write(bs, sector_num, buf, nb_sectors);
1444 acb->ret = ret;
1445 qemu_bh_schedule(acb->bh);
1446 return &acb->common;
1447 }
1448
1449 static void bdrv_aio_cancel_em(BlockDriverAIOCB *blockacb)
1450 {
1451 BlockDriverAIOCBSync *acb = (BlockDriverAIOCBSync *)blockacb;
1452 qemu_bh_cancel(acb->bh);
1453 qemu_aio_release(acb);
1454 }
1455
1456 /**************************************************************/
1457 /* sync block device emulation */
1458
1459 static void bdrv_rw_em_cb(void *opaque, int ret)
1460 {
1461 *(int *)opaque = ret;
1462 }
1463
1464 #define NOT_DONE 0x7fffffff
1465
1466 static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
1467 uint8_t *buf, int nb_sectors)
1468 {
1469 int async_ret;
1470 BlockDriverAIOCB *acb;
1471
1472 async_ret = NOT_DONE;
1473 acb = bdrv_aio_read(bs, sector_num, buf, nb_sectors,
1474 bdrv_rw_em_cb, &async_ret);
1475 if (acb == NULL)
1476 return -1;
1477
1478 while (async_ret == NOT_DONE) {
1479 qemu_aio_wait();
1480 }
1481
1482 return async_ret;
1483 }
1484
1485 static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
1486 const uint8_t *buf, int nb_sectors)
1487 {
1488 int async_ret;
1489 BlockDriverAIOCB *acb;
1490
1491 async_ret = NOT_DONE;
1492 acb = bdrv_aio_write(bs, sector_num, buf, nb_sectors,
1493 bdrv_rw_em_cb, &async_ret);
1494 if (acb == NULL)
1495 return -1;
1496 while (async_ret == NOT_DONE) {
1497 qemu_aio_wait();
1498 }
1499 return async_ret;
1500 }
1501
1502 void bdrv_init(void)
1503 {
1504 aio_pool_init(&vectored_aio_pool, sizeof(VectorTranslationAIOCB),
1505 bdrv_aio_cancel_vector);
1506
1507 bdrv_register(&bdrv_raw);
1508 bdrv_register(&bdrv_host_device);
1509 #ifndef _WIN32
1510 bdrv_register(&bdrv_cow);
1511 #endif
1512 bdrv_register(&bdrv_qcow);
1513 bdrv_register(&bdrv_vmdk);
1514 bdrv_register(&bdrv_cloop);
1515 bdrv_register(&bdrv_dmg);
1516 bdrv_register(&bdrv_bochs);
1517 bdrv_register(&bdrv_vpc);
1518 bdrv_register(&bdrv_vvfat);
1519 bdrv_register(&bdrv_qcow2);
1520 bdrv_register(&bdrv_parallels);
1521 bdrv_register(&bdrv_nbd);
1522 }
1523
1524 void aio_pool_init(AIOPool *pool, int aiocb_size,
1525 void (*cancel)(BlockDriverAIOCB *acb))
1526 {
1527 pool->aiocb_size = aiocb_size;
1528 pool->cancel = cancel;
1529 pool->free_aiocb = NULL;
1530 }
1531
1532 void *qemu_aio_get_pool(AIOPool *pool, BlockDriverState *bs,
1533 BlockDriverCompletionFunc *cb, void *opaque)
1534 {
1535 BlockDriverAIOCB *acb;
1536
1537 if (pool->free_aiocb) {
1538 acb = pool->free_aiocb;
1539 pool->free_aiocb = acb->next;
1540 } else {
1541 acb = qemu_mallocz(pool->aiocb_size);
1542 acb->pool = pool;
1543 }
1544 acb->bs = bs;
1545 acb->cb = cb;
1546 acb->opaque = opaque;
1547 return acb;
1548 }
1549
1550 void *qemu_aio_get(BlockDriverState *bs, BlockDriverCompletionFunc *cb,
1551 void *opaque)
1552 {
1553 return qemu_aio_get_pool(&bs->drv->aio_pool, bs, cb, opaque);
1554 }
1555
1556 void qemu_aio_release(void *p)
1557 {
1558 BlockDriverAIOCB *acb = (BlockDriverAIOCB *)p;
1559 AIOPool *pool = acb->pool;
1560 acb->next = pool->free_aiocb;
1561 pool->free_aiocb = acb;
1562 }
1563
1564 /**************************************************************/
1565 /* removable device support */
1566
1567 /**
1568 * Return TRUE if the media is present
1569 */
1570 int bdrv_is_inserted(BlockDriverState *bs)
1571 {
1572 BlockDriver *drv = bs->drv;
1573 int ret;
1574 if (!drv)
1575 return 0;
1576 if (!drv->bdrv_is_inserted)
1577 return 1;
1578 ret = drv->bdrv_is_inserted(bs);
1579 return ret;
1580 }
1581
1582 /**
1583 * Return TRUE if the media changed since the last call to this
1584 * function. It is currently only used for floppy disks
1585 */
1586 int bdrv_media_changed(BlockDriverState *bs)
1587 {
1588 BlockDriver *drv = bs->drv;
1589 int ret;
1590
1591 if (!drv || !drv->bdrv_media_changed)
1592 ret = -ENOTSUP;
1593 else
1594 ret = drv->bdrv_media_changed(bs);
1595 if (ret == -ENOTSUP)
1596 ret = bs->media_changed;
1597 bs->media_changed = 0;
1598 return ret;
1599 }
1600
1601 /**
1602 * If eject_flag is TRUE, eject the media. Otherwise, close the tray
1603 */
1604 void bdrv_eject(BlockDriverState *bs, int eject_flag)
1605 {
1606 BlockDriver *drv = bs->drv;
1607 int ret;
1608
1609 if (!drv || !drv->bdrv_eject) {
1610 ret = -ENOTSUP;
1611 } else {
1612 ret = drv->bdrv_eject(bs, eject_flag);
1613 }
1614 if (ret == -ENOTSUP) {
1615 if (eject_flag)
1616 bdrv_close(bs);
1617 }
1618 }
1619
1620 int bdrv_is_locked(BlockDriverState *bs)
1621 {
1622 return bs->locked;
1623 }
1624
1625 /**
1626 * Lock or unlock the media (if it is locked, the user won't be able
1627 * to eject it manually).
1628 */
1629 void bdrv_set_locked(BlockDriverState *bs, int locked)
1630 {
1631 BlockDriver *drv = bs->drv;
1632
1633 bs->locked = locked;
1634 if (drv && drv->bdrv_set_locked) {
1635 drv->bdrv_set_locked(bs, locked);
1636 }
1637 }
1638
1639 /* needed for generic scsi interface */
1640
1641 int bdrv_ioctl(BlockDriverState *bs, unsigned long int req, void *buf)
1642 {
1643 BlockDriver *drv = bs->drv;
1644
1645 if (drv && drv->bdrv_ioctl)
1646 return drv->bdrv_ioctl(bs, req, buf);
1647 return -ENOTSUP;
1648 }
1649
1650 BlockDriverAIOCB *bdrv_aio_ioctl(BlockDriverState *bs,
1651 unsigned long int req, void *buf,
1652 BlockDriverCompletionFunc *cb, void *opaque)
1653 {
1654 BlockDriver *drv = bs->drv;
1655
1656 if (drv && drv->bdrv_aio_ioctl)
1657 return drv->bdrv_aio_ioctl(bs, req, buf, cb, opaque);
1658 return NULL;
1659 }