]> git.proxmox.com Git - mirror_qemu.git/blame - block/vpc.c
block/vpc: Pad VHDFooter, replace uint8_t[] buffers
[mirror_qemu.git] / block / vpc.c
CommitLineData
6a0f9e82 1/*
cc2040f8 2 * Block driver for Connectix / Microsoft Virtual PC images
5fafdf24 3 *
6a0f9e82 4 * Copyright (c) 2005 Alex Beregszaszi
15d35bc5 5 * Copyright (c) 2009 Kevin Wolf <kwolf@suse.de>
5fafdf24 6 *
6a0f9e82
FB
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 * THE SOFTWARE.
24 */
922a01a0 25
80c71a24 26#include "qemu/osdep.h"
da34e65c 27#include "qapi/error.h"
737e150e 28#include "block/block_int.h"
609f45ea 29#include "block/qdict.h"
b8f45cdf 30#include "sysemu/block-backend.h"
1de7afc9 31#include "qemu/module.h"
922a01a0 32#include "qemu/option.h"
795c40b8 33#include "migration/blocker.h"
58369e22 34#include "qemu/bswap.h"
38440a21 35#include "qemu/uuid.h"
182c8835
KW
36#include "qapi/qmp/qdict.h"
37#include "qapi/qobject-input-visitor.h"
38#include "qapi/qapi-visit-block-core.h"
6a0f9e82
FB
39
40/**************************************************************/
41
/* Size in bytes of one on-disk VHD footer (see the VHDFooter size check) */
#define HEADER_SIZE 512

//#define CACHE

/* Values of the footer's 'type' field */
enum vhd_type {
    VHD_FIXED        = 2,
    VHD_DYNAMIC      = 3,
    VHD_DIFFERENCING = 4,
};

/* Unix time of Jan 1, 2000 0:00:00 (UTC), the epoch of VHD timestamps */
#define VHD_TIMESTAMP_BASE 946684800

/* Largest cylinder / head / sector values used for the CHS geometry */
#define VHD_CHS_MAX_C   65535LL
#define VHD_CHS_MAX_H   16
#define VHD_CHS_MAX_S   255

#define VHD_MAX_SECTORS       0xff000000    /* 2040 GiB max image size */
/* Sector count of the largest CHS geometry (C * H * S) */
#define VHD_MAX_GEOMETRY      (VHD_CHS_MAX_C * VHD_CHS_MAX_H * VHD_CHS_MAX_S)

/* Name of the creation option that forces the use of the exact size */
#define VPC_OPT_FORCE_SIZE "force_size"
97f1c45c 63
9c057d0b 64/* always big-endian */
e54835c0 65typedef struct vhd_footer {
9c057d0b 66 char creator[8]; /* "conectix" */
2cfacb62
AL
67 uint32_t features;
68 uint32_t version;
69
9c057d0b 70 /* Offset of next header structure, 0xFFFFFFFF if none */
2cfacb62
AL
71 uint64_t data_offset;
72
9c057d0b 73 /* Seconds since Jan 1, 2000 0:00:00 (UTC) */
2cfacb62
AL
74 uint32_t timestamp;
75
9c057d0b 76 char creator_app[4]; /* e.g., "vpc " */
2cfacb62
AL
77 uint16_t major;
78 uint16_t minor;
9c057d0b 79 char creator_os[4]; /* "Wi2k" */
2cfacb62
AL
80
81 uint64_t orig_size;
03671ded 82 uint64_t current_size;
2cfacb62
AL
83
84 uint16_t cyls;
85 uint8_t heads;
86 uint8_t secs_per_cyl;
87
88 uint32_t type;
89
9c057d0b
JC
90 /* Checksum of the Hard Disk Footer ("one's complement of the sum of all
91 the bytes in the footer without the checksum field") */
2cfacb62
AL
92 uint32_t checksum;
93
9c057d0b 94 /* UUID used to identify a parent hard disk (backing file) */
38440a21 95 QemuUUID uuid;
2cfacb62
AL
96
97 uint8_t in_saved_state;
275734e4 98 uint8_t reserved[427];
e54835c0 99} QEMU_PACKED VHDFooter;
b9fa33a6 100
275734e4
MA
101QEMU_BUILD_BUG_ON(sizeof(VHDFooter) != 512);
102
e54835c0 103typedef struct vhd_dyndisk_header {
9c057d0b 104 char magic[8]; /* "cxsparse" */
2cfacb62 105
9c057d0b 106 /* Offset of next header structure, 0xFFFFFFFF if none */
2cfacb62
AL
107 uint64_t data_offset;
108
9c057d0b 109 /* Offset of the Block Allocation Table (BAT) */
2cfacb62
AL
110 uint64_t table_offset;
111
112 uint32_t version;
9c057d0b 113 uint32_t max_table_entries; /* 32bit/entry */
2cfacb62 114
9c057d0b 115 /* 2 MB by default, must be a power of two */
2cfacb62
AL
116 uint32_t block_size;
117
118 uint32_t checksum;
119 uint8_t parent_uuid[16];
120 uint32_t parent_timestamp;
121 uint32_t reserved;
122
9c057d0b 123 /* Backing file name (in UTF-16) */
2cfacb62
AL
124 uint8_t parent_name[512];
125
126 struct {
127 uint32_t platform;
128 uint32_t data_space;
129 uint32_t data_length;
130 uint32_t reserved;
131 uint64_t data_offset;
132 } parent_locator[8];
e326f078 133 uint8_t reserved2[256];
e54835c0 134} QEMU_PACKED VHDDynDiskHeader;
6a0f9e82 135
e326f078
MA
136QEMU_BUILD_BUG_ON(sizeof(VHDDynDiskHeader) != 1024);
137
6a0f9e82 138typedef struct BDRVVPCState {
848c66e8 139 CoMutex lock;
275734e4 140 VHDFooter footer;
15d35bc5 141 uint64_t free_data_block_offset;
2cfacb62 142 int max_table_entries;
6a0f9e82 143 uint32_t *pagetable;
15d35bc5
AL
144 uint64_t bat_offset;
145 uint64_t last_bitmap_offset;
6a0f9e82 146
2cfacb62 147 uint32_t block_size;
15d35bc5 148 uint32_t bitmap_size;
c540d53a
JC
149 bool force_use_chs;
150 bool force_use_sz;
15d35bc5 151
6a0f9e82
FB
152#ifdef CACHE
153 uint8_t *pageentry_u8;
154 uint32_t *pageentry_u32;
155 uint16_t *pageentry_u16;
3b46e624 156
6a0f9e82
FB
157 uint64_t last_bitmap;
158#endif
612ff3d8
KW
159
160 Error *migration_blocker;
6a0f9e82
FB
161} BDRVVPCState;
162
c540d53a
JC
163#define VPC_OPT_SIZE_CALC "force_size_calc"
164static QemuOptsList vpc_runtime_opts = {
165 .name = "vpc-runtime-opts",
166 .head = QTAILQ_HEAD_INITIALIZER(vpc_runtime_opts.head),
167 .desc = {
168 {
169 .name = VPC_OPT_SIZE_CALC,
170 .type = QEMU_OPT_STRING,
171 .help = "Force disk size calculation to use either CHS geometry, "
172 "or use the disk current_size specified in the VHD footer. "
173 "{chs, current_size}"
174 },
175 { /* end of list */ }
176 }
177};
178
182c8835
KW
179static QemuOptsList vpc_create_opts;
180
/*
 * Computes the VHD checksum of a buffer: the one's complement of the
 * (32-bit, wrapping) sum of all of its bytes.
 *
 * @p:    start of the buffer; it is only read
 * @size: number of bytes to sum
 *
 * Returns the checksum in host byte order.  An empty buffer yields
 * 0xFFFFFFFF.
 */
static uint32_t vpc_checksum(const void *p, size_t size)
{
    const uint8_t *buf = p;
    uint32_t res = 0;
    size_t i;   /* same type as @size, so the comparison cannot overflow */

    for (i = 0; i < size; i++) {
        res += buf[i];
    }

    return ~res;
}
192
193
6a0f9e82
FB
/*
 * Format probe: returns 100 when the buffer starts with the "conectix"
 * footer signature, 0 otherwise.  @filename is not used.
 */
static int vpc_probe(const uint8_t *buf, int buf_size, const char *filename)
{
    static const char signature[] = "conectix";

    if (buf_size < 8) {
        return 0;
    }

    return strncmp((char *)buf, signature, 8) == 0 ? 100 : 0;
}
200
c540d53a
JC
201static void vpc_parse_options(BlockDriverState *bs, QemuOpts *opts,
202 Error **errp)
203{
204 BDRVVPCState *s = bs->opaque;
205 const char *size_calc;
206
207 size_calc = qemu_opt_get(opts, VPC_OPT_SIZE_CALC);
208
209 if (!size_calc) {
210 /* no override, use autodetect only */
211 } else if (!strcmp(size_calc, "current_size")) {
212 s->force_use_sz = true;
213 } else if (!strcmp(size_calc, "chs")) {
214 s->force_use_chs = true;
215 } else {
216 error_setg(errp, "Invalid size calculation mode: '%s'", size_calc);
217 }
218}
219
015a1036
HR
220static int vpc_open(BlockDriverState *bs, QDict *options, int flags,
221 Error **errp)
6a0f9e82
FB
222{
223 BDRVVPCState *s = bs->opaque;
66f82cee 224 int i;
e54835c0 225 VHDFooter *footer;
c540d53a
JC
226 QemuOpts *opts = NULL;
227 Error *local_err = NULL;
228 bool use_chs;
e326f078 229 VHDDynDiskHeader dyndisk_header;
57c7d9e5 230 uint32_t checksum;
97f1c45c 231 uint64_t computed_size;
b15deac7 232 uint64_t pagetable_size;
24da78db 233 int disk_type = VHD_DYNAMIC;
59294e46 234 int ret;
81caa3cc 235 int64_t bs_size;
6a0f9e82 236
8b1869da
HR
237 bs->file = bdrv_open_child(NULL, options, "file", bs, &child_of_bds,
238 BDRV_CHILD_IMAGE, false, errp);
4e4bf5c4
KW
239 if (!bs->file) {
240 return -EINVAL;
241 }
242
c540d53a 243 opts = qemu_opts_create(&vpc_runtime_opts, NULL, 0, &error_abort);
af175e85 244 if (!qemu_opts_absorb_qdict(opts, options, errp)) {
c540d53a
JC
245 ret = -EINVAL;
246 goto fail;
247 }
248
249 vpc_parse_options(bs, opts, &local_err);
250 if (local_err) {
251 error_propagate(errp, local_err);
252 ret = -EINVAL;
253 goto fail;
254 }
255
275734e4 256 ret = bdrv_pread(bs->file, 0, &s->footer, HEADER_SIZE);
59294e46 257 if (ret < 0) {
32f6439c 258 error_setg(errp, "Unable to read VHD header");
6a0f9e82 259 goto fail;
59294e46 260 }
6a0f9e82 261
275734e4 262 footer = &s->footer;
24da78db 263 if (strncmp(footer->creator, "conectix", 8)) {
9a4f4c31 264 int64_t offset = bdrv_getlength(bs->file->bs);
59294e46
KW
265 if (offset < 0) {
266 ret = offset;
32f6439c 267 error_setg(errp, "Invalid file size");
59294e46
KW
268 goto fail;
269 } else if (offset < HEADER_SIZE) {
270 ret = -EINVAL;
32f6439c 271 error_setg(errp, "File too small for a VHD header");
24da78db
CA
272 goto fail;
273 }
59294e46 274
24da78db 275 /* If a fixed disk, the footer is found only at the end of the file */
275734e4 276 ret = bdrv_pread(bs->file, offset - HEADER_SIZE, footer,
59294e46
KW
277 HEADER_SIZE);
278 if (ret < 0) {
24da78db
CA
279 goto fail;
280 }
281 if (strncmp(footer->creator, "conectix", 8)) {
76abe407
PB
282 error_setg(errp, "invalid VPC image");
283 ret = -EINVAL;
24da78db
CA
284 goto fail;
285 }
286 disk_type = VHD_FIXED;
287 }
6a0f9e82 288
57c7d9e5
AL
289 checksum = be32_to_cpu(footer->checksum);
290 footer->checksum = 0;
275734e4 291 if (vpc_checksum(footer, HEADER_SIZE) != checksum) {
04788ba2
MA
292 error_setg(errp, "Incorrect header checksum");
293 ret = -EINVAL;
294 goto fail;
295 }
57c7d9e5 296
c088b691 297 /* Write 'checksum' back to footer, or else will leave it with zero. */
a4127c42 298 footer->checksum = cpu_to_be32(checksum);
c088b691 299
9c057d0b
JC
300 /* The visible size of a image in Virtual PC depends on the geometry
301 rather than on the size stored in the footer (the size in the footer
302 is too large usually) */
33ccf667
SH
303 bs->total_sectors = (int64_t)
304 be16_to_cpu(footer->cyls) * footer->heads * footer->secs_per_cyl;
1fa79228 305
c540d53a
JC
306 /* Microsoft Virtual PC and Microsoft Hyper-V produce and read
307 * VHD image sizes differently. VPC will rely on CHS geometry,
308 * while Hyper-V and disk2vhd use the size specified in the footer.
309 *
310 * We use a couple of approaches to try and determine the correct method:
311 * look at the Creator App field, and look for images that have CHS
312 * geometry that is the maximum value.
313 *
314 * If the CHS geometry is the maximum CHS geometry, then we assume that
315 * the size is the footer->current_size to avoid truncation. Otherwise,
316 * we follow the table based on footer->creator_app:
317 *
318 * Known creator apps:
319 * 'vpc ' : CHS Virtual PC (uses disk geometry)
320 * 'qemu' : CHS QEMU (uses disk geometry)
fb9245c2 321 * 'qem2' : current_size QEMU (uses current_size)
c540d53a
JC
322 * 'win ' : current_size Hyper-V
323 * 'd2v ' : current_size Disk2vhd
9bdfb9e8 324 * 'tap\0' : current_size XenServer
bab246db 325 * 'CTXS' : current_size XenConverter
c540d53a
JC
326 *
327 * The user can override the table values via drive options, however
328 * even with an override we will still use current_size for images
329 * that have CHS geometry of the maximum size.
330 */
331 use_chs = (!!strncmp(footer->creator_app, "win ", 4) &&
fb9245c2 332 !!strncmp(footer->creator_app, "qem2", 4) &&
9bdfb9e8 333 !!strncmp(footer->creator_app, "d2v ", 4) &&
bab246db 334 !!strncmp(footer->creator_app, "CTXS", 4) &&
9bdfb9e8 335 !!memcmp(footer->creator_app, "tap", 4)) || s->force_use_chs;
c540d53a
JC
336
337 if (!use_chs || bs->total_sectors == VHD_MAX_GEOMETRY || s->force_use_sz) {
03671ded 338 bs->total_sectors = be64_to_cpu(footer->current_size) /
c540d53a 339 BDRV_SECTOR_SIZE;
0173e7bb
PL
340 }
341
c23fb11b
JC
342 /* Allow a maximum disk size of 2040 GiB */
343 if (bs->total_sectors > VHD_MAX_SECTORS) {
59294e46 344 ret = -EFBIG;
efc8243d
SH
345 goto fail;
346 }
347
24da78db 348 if (disk_type == VHD_DYNAMIC) {
02df95c4 349 ret = bdrv_pread(bs->file, be64_to_cpu(footer->data_offset),
3d6101a3 350 &dyndisk_header, sizeof(dyndisk_header));
59294e46 351 if (ret < 0) {
32f6439c 352 error_setg(errp, "Error reading dynamic VHD header");
24da78db
CA
353 goto fail;
354 }
b9fa33a6 355
e326f078 356 if (strncmp(dyndisk_header.magic, "cxsparse", 8)) {
32f6439c 357 error_setg(errp, "Invalid header magic");
59294e46 358 ret = -EINVAL;
24da78db
CA
359 goto fail;
360 }
6a0f9e82 361
e326f078 362 s->block_size = be32_to_cpu(dyndisk_header.block_size);
5e71dfad
KW
363 if (!is_power_of_2(s->block_size) || s->block_size < BDRV_SECTOR_SIZE) {
364 error_setg(errp, "Invalid block size %" PRIu32, s->block_size);
365 ret = -EINVAL;
366 goto fail;
367 }
24da78db 368 s->bitmap_size = ((s->block_size / (8 * 512)) + 511) & ~511;
15d35bc5 369
e326f078 370 s->max_table_entries = be32_to_cpu(dyndisk_header.max_table_entries);
97f1c45c
JC
371
372 if ((bs->total_sectors * 512) / s->block_size > 0xffffffffU) {
32f6439c 373 error_setg(errp, "Too many blocks");
97f1c45c
JC
374 ret = -EINVAL;
375 goto fail;
376 }
97f1c45c
JC
377
378 computed_size = (uint64_t) s->max_table_entries * s->block_size;
379 if (computed_size < bs->total_sectors * 512) {
32f6439c 380 error_setg(errp, "Page table too small");
97f1c45c
JC
381 ret = -EINVAL;
382 goto fail;
383 }
384
b15deac7
JC
385 if (s->max_table_entries > SIZE_MAX / 4 ||
386 s->max_table_entries > (int) INT_MAX / 4) {
387 error_setg(errp, "Max Table Entries too large (%" PRId32 ")",
388 s->max_table_entries);
389 ret = -EINVAL;
390 goto fail;
391 }
392
393 pagetable_size = (uint64_t) s->max_table_entries * 4;
394
9a4f4c31 395 s->pagetable = qemu_try_blockalign(bs->file->bs, pagetable_size);
5fb09cd5 396 if (s->pagetable == NULL) {
32f6439c 397 error_setg(errp, "Unable to allocate memory for page table");
5fb09cd5
KW
398 ret = -ENOMEM;
399 goto fail;
400 }
b71d1c2e 401
e326f078 402 s->bat_offset = be64_to_cpu(dyndisk_header.table_offset);
59294e46 403
cf2ab8fc 404 ret = bdrv_pread(bs->file, s->bat_offset, s->pagetable,
9a4f4c31 405 pagetable_size);
59294e46 406 if (ret < 0) {
32f6439c 407 error_setg(errp, "Error reading pagetable");
24da78db
CA
408 goto fail;
409 }
b71d1c2e 410
24da78db 411 s->free_data_block_offset =
b15deac7 412 ROUND_UP(s->bat_offset + pagetable_size, 512);
15d35bc5 413
24da78db
CA
414 for (i = 0; i < s->max_table_entries; i++) {
415 be32_to_cpus(&s->pagetable[i]);
416 if (s->pagetable[i] != 0xFFFFFFFF) {
417 int64_t next = (512 * (int64_t) s->pagetable[i]) +
418 s->bitmap_size + s->block_size;
15d35bc5 419
24da78db
CA
420 if (next > s->free_data_block_offset) {
421 s->free_data_block_offset = next;
422 }
423 }
15d35bc5 424 }
15d35bc5 425
81caa3cc
EB
426 bs_size = bdrv_getlength(bs->file->bs);
427 if (bs_size < 0) {
428 error_setg_errno(errp, -bs_size, "Unable to learn image size");
429 ret = bs_size;
430 goto fail;
431 }
432 if (s->free_data_block_offset > bs_size) {
fb8fe35f
PL
433 error_setg(errp, "block-vpc: free_data_block_offset points after "
434 "the end of file. The image has been truncated.");
435 ret = -EINVAL;
436 goto fail;
437 }
438
24da78db 439 s->last_bitmap_offset = (int64_t) -1;
6a0f9e82 440
6a0f9e82 441#ifdef CACHE
24da78db
CA
442 s->pageentry_u8 = g_malloc(512);
443 s->pageentry_u32 = s->pageentry_u8;
444 s->pageentry_u16 = s->pageentry_u8;
445 s->last_pagetable = -1;
6a0f9e82 446#endif
24da78db 447 }
6a0f9e82 448
612ff3d8 449 /* Disable migration when VHD images are used */
81e5f78a
AG
450 error_setg(&s->migration_blocker, "The vpc format used by node '%s' "
451 "does not support live migration",
452 bdrv_get_device_or_node_name(bs));
386f6c07
MA
453 ret = migrate_add_blocker(s->migration_blocker, errp);
454 if (ret < 0) {
fe44dc91
AA
455 error_free(s->migration_blocker);
456 goto fail;
457 }
458
459 qemu_co_mutex_init(&s->lock);
c317b646 460 qemu_opts_del(opts);
612ff3d8 461
6a0f9e82 462 return 0;
59294e46
KW
463
464fail:
c317b646 465 qemu_opts_del(opts);
97f1c45c 466 qemu_vfree(s->pagetable);
59294e46
KW
467#ifdef CACHE
468 g_free(s->pageentry_u8);
469#endif
470 return ret;
6a0f9e82
FB
471}
472
3fe4b700
JC
473static int vpc_reopen_prepare(BDRVReopenState *state,
474 BlockReopenQueue *queue, Error **errp)
475{
476 return 0;
477}
478
b71d1c2e
AL
479/*
480 * Returns the absolute byte offset of the given sector in the image file.
481 * If the sector is not allocated, -1 is returned instead.
cfc87e00
PM
482 * If an error occurred trying to write an updated block bitmap back to
483 * the file, -2 is returned, and the error value is written to *err.
484 * This can only happen for a write operation.
15d35bc5
AL
485 *
486 * The parameter write must be 1 if the offset will be used for a write
487 * operation (the block bitmaps is updated then), 0 otherwise.
cfc87e00 488 * If write is true then err must not be NULL.
b71d1c2e 489 */
d46b7cc6 490static inline int64_t get_image_offset(BlockDriverState *bs, uint64_t offset,
cfc87e00 491 bool write, int *err)
6a0f9e82
FB
492{
493 BDRVVPCState *s = bs->opaque;
6a0f9e82 494 uint64_t bitmap_offset, block_offset;
d46b7cc6 495 uint32_t pagetable_index, offset_in_block;
6a0f9e82 496
cfc87e00
PM
497 assert(!(write && err == NULL));
498
2cfacb62 499 pagetable_index = offset / s->block_size;
d46b7cc6 500 offset_in_block = offset % s->block_size;
3b46e624 501
15d35bc5 502 if (pagetable_index >= s->max_table_entries || s->pagetable[pagetable_index] == 0xffffffff)
9c057d0b 503 return -1; /* not allocated */
6a0f9e82 504
378e2aea 505 bitmap_offset = 512 * (uint64_t) s->pagetable[pagetable_index];
d46b7cc6 506 block_offset = bitmap_offset + s->bitmap_size + offset_in_block;
15d35bc5 507
9c057d0b
JC
508 /* We must ensure that we don't write to any sectors which are marked as
509 unused in the bitmap. We get away with setting all bits in the block
510 bitmap each time we write to a new block. This might cause Virtual PC to
511 miss sparse read optimization, but it's not a problem in terms of
512 correctness. */
15d35bc5
AL
513 if (write && (s->last_bitmap_offset != bitmap_offset)) {
514 uint8_t bitmap[s->bitmap_size];
cfc87e00 515 int r;
15d35bc5
AL
516
517 s->last_bitmap_offset = bitmap_offset;
518 memset(bitmap, 0xff, s->bitmap_size);
cfc87e00
PM
519 r = bdrv_pwrite_sync(bs->file, bitmap_offset, bitmap, s->bitmap_size);
520 if (r < 0) {
521 *err = r;
522 return -2;
523 }
15d35bc5 524 }
3b46e624 525
b71d1c2e 526 return block_offset;
6a0f9e82
FB
527}
528
15d35bc5
AL
529/*
530 * Writes the footer to the end of the image file. This is needed when the
531 * file grows as it overwrites the old footer
532 *
533 * Returns 0 on success and < 0 on error
534 */
5f14f31d 535static int rewrite_footer(BlockDriverState *bs)
15d35bc5
AL
536{
537 int ret;
538 BDRVVPCState *s = bs->opaque;
539 int64_t offset = s->free_data_block_offset;
540
275734e4 541 ret = bdrv_pwrite_sync(bs->file, offset, &s->footer, HEADER_SIZE);
15d35bc5
AL
542 if (ret < 0)
543 return ret;
544
545 return 0;
546}
547
548/*
549 * Allocates a new block. This involves writing a new footer and updating
550 * the Block Allocation Table to use the space at the old end of the image
551 * file (overwriting the old footer)
552 *
553 * Returns the sectors' offset in the image file on success and < 0 on error
554 */
5f14f31d 555static int64_t alloc_block(BlockDriverState *bs, int64_t offset)
15d35bc5
AL
556{
557 BDRVVPCState *s = bs->opaque;
558 int64_t bat_offset;
559 uint32_t index, bat_value;
560 int ret;
561 uint8_t bitmap[s->bitmap_size];
562
9c057d0b 563 /* Check if sector_num is valid */
513b0f02
KW
564 if ((offset < 0) || (offset > bs->total_sectors * BDRV_SECTOR_SIZE)) {
565 return -EINVAL;
566 }
15d35bc5 567
9c057d0b 568 /* Write entry into in-memory BAT */
513b0f02
KW
569 index = offset / s->block_size;
570 assert(s->pagetable[index] == 0xFFFFFFFF);
15d35bc5
AL
571 s->pagetable[index] = s->free_data_block_offset / 512;
572
9c057d0b 573 /* Initialize the block's bitmap */
15d35bc5 574 memset(bitmap, 0xff, s->bitmap_size);
d9ca2ea2 575 ret = bdrv_pwrite_sync(bs->file, s->free_data_block_offset, bitmap,
078a458e 576 s->bitmap_size);
5bb1cbac
KW
577 if (ret < 0) {
578 return ret;
579 }
15d35bc5 580
9c057d0b 581 /* Write new footer (the old one will be overwritten) */
15d35bc5
AL
582 s->free_data_block_offset += s->block_size + s->bitmap_size;
583 ret = rewrite_footer(bs);
584 if (ret < 0)
585 goto fail;
586
9c057d0b 587 /* Write BAT entry to disk */
15d35bc5 588 bat_offset = s->bat_offset + (4 * index);
a4127c42 589 bat_value = cpu_to_be32(s->pagetable[index]);
d9ca2ea2 590 ret = bdrv_pwrite_sync(bs->file, bat_offset, &bat_value, 4);
15d35bc5
AL
591 if (ret < 0)
592 goto fail;
593
cfc87e00 594 return get_image_offset(bs, offset, false, NULL);
15d35bc5
AL
595
596fail:
597 s->free_data_block_offset -= (s->block_size + s->bitmap_size);
513b0f02 598 return ret;
15d35bc5
AL
599}
600
97b00e28
PB
601static int vpc_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
602{
603 BDRVVPCState *s = (BDRVVPCState *)bs->opaque;
97b00e28 604
275734e4 605 if (be32_to_cpu(s->footer.type) != VHD_FIXED) {
97b00e28
PB
606 bdi->cluster_size = s->block_size;
607 }
608
609 return 0;
610}
611
d46b7cc6
KW
612static int coroutine_fn
613vpc_co_preadv(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
614 QEMUIOVector *qiov, int flags)
6a0f9e82 615{
6c6ea921 616 BDRVVPCState *s = bs->opaque;
6a0f9e82 617 int ret;
d46b7cc6
KW
618 int64_t image_offset;
619 int64_t n_bytes;
620 int64_t bytes_done = 0;
d46b7cc6 621 QEMUIOVector local_qiov;
6a0f9e82 622
275734e4 623 if (be32_to_cpu(s->footer.type) == VHD_FIXED) {
a03ef88f 624 return bdrv_co_preadv(bs->file, offset, bytes, qiov, 0);
24da78db 625 }
b71d1c2e 626
d46b7cc6
KW
627 qemu_co_mutex_lock(&s->lock);
628 qemu_iovec_init(&local_qiov, qiov->niov);
6c6ea921 629
d46b7cc6 630 while (bytes > 0) {
cfc87e00 631 image_offset = get_image_offset(bs, offset, false, NULL);
d46b7cc6
KW
632 n_bytes = MIN(bytes, s->block_size - (offset % s->block_size));
633
634 if (image_offset == -1) {
635 qemu_iovec_memset(qiov, bytes_done, 0, n_bytes);
b71d1c2e 636 } else {
d46b7cc6
KW
637 qemu_iovec_reset(&local_qiov);
638 qemu_iovec_concat(&local_qiov, qiov, bytes_done, n_bytes);
639
126734c4 640 qemu_co_mutex_unlock(&s->lock);
a03ef88f 641 ret = bdrv_co_preadv(bs->file, image_offset, n_bytes,
d46b7cc6 642 &local_qiov, 0);
126734c4 643 qemu_co_mutex_lock(&s->lock);
d46b7cc6
KW
644 if (ret < 0) {
645 goto fail;
6c6ea921 646 }
b71d1c2e
AL
647 }
648
d46b7cc6
KW
649 bytes -= n_bytes;
650 offset += n_bytes;
651 bytes_done += n_bytes;
6a0f9e82 652 }
6a0f9e82 653
d46b7cc6
KW
654 ret = 0;
655fail:
656 qemu_iovec_destroy(&local_qiov);
2914caa0 657 qemu_co_mutex_unlock(&s->lock);
d46b7cc6 658
2914caa0
PB
659 return ret;
660}
661
513b0f02
KW
662static int coroutine_fn
663vpc_co_pwritev(BlockDriverState *bs, uint64_t offset, uint64_t bytes,
664 QEMUIOVector *qiov, int flags)
15d35bc5 665{
6c6ea921 666 BDRVVPCState *s = bs->opaque;
513b0f02
KW
667 int64_t image_offset;
668 int64_t n_bytes;
669 int64_t bytes_done = 0;
c8115f8e 670 int ret = 0;
513b0f02 671 QEMUIOVector local_qiov;
15d35bc5 672
275734e4 673 if (be32_to_cpu(s->footer.type) == VHD_FIXED) {
a03ef88f 674 return bdrv_co_pwritev(bs->file, offset, bytes, qiov, 0);
24da78db 675 }
15d35bc5 676
513b0f02
KW
677 qemu_co_mutex_lock(&s->lock);
678 qemu_iovec_init(&local_qiov, qiov->niov);
679
680 while (bytes > 0) {
cfc87e00
PM
681 image_offset = get_image_offset(bs, offset, true, &ret);
682 if (image_offset == -2) {
683 /* Failed to write block bitmap: can't proceed with write */
684 goto fail;
685 }
513b0f02 686 n_bytes = MIN(bytes, s->block_size - (offset % s->block_size));
6c6ea921 687
513b0f02
KW
688 if (image_offset == -1) {
689 image_offset = alloc_block(bs, offset);
690 if (image_offset < 0) {
691 ret = image_offset;
692 goto fail;
693 }
15d35bc5
AL
694 }
695
513b0f02
KW
696 qemu_iovec_reset(&local_qiov);
697 qemu_iovec_concat(&local_qiov, qiov, bytes_done, n_bytes);
698
126734c4 699 qemu_co_mutex_unlock(&s->lock);
a03ef88f 700 ret = bdrv_co_pwritev(bs->file, image_offset, n_bytes,
513b0f02 701 &local_qiov, 0);
126734c4 702 qemu_co_mutex_lock(&s->lock);
513b0f02
KW
703 if (ret < 0) {
704 goto fail;
6c6ea921 705 }
15d35bc5 706
513b0f02
KW
707 bytes -= n_bytes;
708 offset += n_bytes;
709 bytes_done += n_bytes;
15d35bc5
AL
710 }
711
513b0f02
KW
712 ret = 0;
713fail:
714 qemu_iovec_destroy(&local_qiov);
e183ef75 715 qemu_co_mutex_unlock(&s->lock);
513b0f02 716
e183ef75
PB
717 return ret;
718}
719
2f83673b
EB
720static int coroutine_fn vpc_co_block_status(BlockDriverState *bs,
721 bool want_zero,
722 int64_t offset, int64_t bytes,
723 int64_t *pnum, int64_t *map,
724 BlockDriverState **file)
0cc84887
KW
725{
726 BDRVVPCState *s = bs->opaque;
2f83673b 727 int64_t image_offset;
0cc84887 728 bool allocated;
2f83673b
EB
729 int ret;
730 int64_t n;
0cc84887 731
275734e4 732 if (be32_to_cpu(s->footer.type) == VHD_FIXED) {
2f83673b
EB
733 *pnum = bytes;
734 *map = offset;
7429e207 735 *file = bs->file->bs;
fbc8e1b7 736 return BDRV_BLOCK_DATA | BDRV_BLOCK_OFFSET_VALID | BDRV_BLOCK_RECURSE;
0cc84887
KW
737 }
738
778b087e
PB
739 qemu_co_mutex_lock(&s->lock);
740
2f83673b
EB
741 image_offset = get_image_offset(bs, offset, false, NULL);
742 allocated = (image_offset != -1);
0cc84887 743 *pnum = 0;
2c060c0f 744 ret = BDRV_BLOCK_ZERO;
0cc84887
KW
745
746 do {
747 /* All sectors in a block are contiguous (without using the bitmap) */
2f83673b
EB
748 n = ROUND_UP(offset + 1, s->block_size) - offset;
749 n = MIN(n, bytes);
0cc84887
KW
750
751 *pnum += n;
2f83673b
EB
752 offset += n;
753 bytes -= n;
2ec711dc
PL
754 /* *pnum can't be greater than one block for allocated
755 * sectors since there is always a bitmap in between. */
756 if (allocated) {
7429e207 757 *file = bs->file->bs;
2f83673b
EB
758 *map = image_offset;
759 ret = BDRV_BLOCK_DATA | BDRV_BLOCK_OFFSET_VALID;
778b087e 760 break;
2ec711dc 761 }
2f83673b 762 if (bytes == 0) {
0cc84887
KW
763 break;
764 }
2f83673b
EB
765 image_offset = get_image_offset(bs, offset, false, NULL);
766 } while (image_offset == -1);
0cc84887 767
778b087e
PB
768 qemu_co_mutex_unlock(&s->lock);
769 return ret;
0cc84887
KW
770}
771
57c7d9e5
AL
772/*
773 * Calculates the number of cylinders, heads and sectors per cylinder
774 * based on a given number of sectors. This is the algorithm described
775 * in the VHD specification.
776 *
777 * Note that the geometry doesn't always exactly match total_sectors but
778 * may round it down.
6e9ea0c0 779 *
c23fb11b 780 * Returns 0 on success, -EFBIG if the size is larger than 2040 GiB. Override
258d2edb
CA
781 * the hardware EIDE and ATA-2 limit of 16 heads (max disk size of 127 GB)
782 * and instead allow up to 255 heads.
57c7d9e5 783 */
5f14f31d 784static int calculate_geometry(int64_t total_sectors, uint16_t *cyls,
785 uint8_t *heads, uint8_t *secs_per_cyl)
57c7d9e5
AL
786{
787 uint32_t cyls_times_heads;
788
690cbb09 789 total_sectors = MIN(total_sectors, VHD_MAX_GEOMETRY);
57c7d9e5 790
690cbb09 791 if (total_sectors >= 65535LL * 16 * 63) {
57c7d9e5 792 *secs_per_cyl = 255;
690cbb09 793 *heads = 16;
57c7d9e5
AL
794 cyls_times_heads = total_sectors / *secs_per_cyl;
795 } else {
796 *secs_per_cyl = 17;
797 cyls_times_heads = total_sectors / *secs_per_cyl;
13f1493f 798 *heads = DIV_ROUND_UP(cyls_times_heads, 1024);
57c7d9e5 799
690cbb09 800 if (*heads < 4) {
57c7d9e5 801 *heads = 4;
690cbb09 802 }
57c7d9e5
AL
803
804 if (cyls_times_heads >= (*heads * 1024) || *heads > 16) {
805 *secs_per_cyl = 31;
806 *heads = 16;
807 cyls_times_heads = total_sectors / *secs_per_cyl;
808 }
809
810 if (cyls_times_heads >= (*heads * 1024)) {
811 *secs_per_cyl = 63;
812 *heads = 16;
813 cyls_times_heads = total_sectors / *secs_per_cyl;
814 }
815 }
816
dede4188 817 *cyls = cyls_times_heads / *heads;
6e9ea0c0
AJ
818
819 return 0;
57c7d9e5
AL
820}
821
b8f45cdf 822static int create_dynamic_disk(BlockBackend *blk, uint8_t *buf,
fef6070e 823 int64_t total_sectors)
57c7d9e5 824{
e326f078 825 VHDDynDiskHeader dyndisk_header;
b0ce8cb0 826 uint8_t bat_sector[512];
57c7d9e5 827 size_t block_size, num_bat_entries;
24da78db 828 int i;
fef6070e
JC
829 int ret;
830 int64_t offset = 0;
57c7d9e5 831
9c057d0b 832 /* Write the footer (twice: at the beginning and at the end) */
57c7d9e5 833 block_size = 0x200000;
3f6de653 834 num_bat_entries = DIV_ROUND_UP(total_sectors, block_size / 512);
57c7d9e5 835
8341f00d 836 ret = blk_pwrite(blk, offset, buf, HEADER_SIZE, 0);
40a99aac 837 if (ret < 0) {
f0ff243a
BS
838 goto fail;
839 }
57c7d9e5 840
fef6070e 841 offset = 1536 + ((num_bat_entries * 4 + 511) & ~511);
8341f00d 842 ret = blk_pwrite(blk, offset, buf, HEADER_SIZE, 0);
fef6070e 843 if (ret < 0) {
f0ff243a
BS
844 goto fail;
845 }
57c7d9e5 846
9c057d0b 847 /* Write the initial BAT */
fef6070e 848 offset = 3 * 512;
57c7d9e5 849
b0ce8cb0 850 memset(bat_sector, 0xFF, 512);
13f1493f 851 for (i = 0; i < DIV_ROUND_UP(num_bat_entries * 4, 512); i++) {
b0ce8cb0 852 ret = blk_pwrite(blk, offset, bat_sector, 512, 0);
fef6070e 853 if (ret < 0) {
f0ff243a
BS
854 goto fail;
855 }
fef6070e 856 offset += 512;
f0ff243a 857 }
57c7d9e5 858
9c057d0b 859 /* Prepare the Dynamic Disk Header */
3d6101a3 860 memset(&dyndisk_header, 0, sizeof(dyndisk_header));
57c7d9e5 861
e326f078 862 memcpy(dyndisk_header.magic, "cxsparse", 8);
57c7d9e5 863
78439f6a
CA
864 /*
865 * Note: The spec is actually wrong here for data_offset, it says
866 * 0xFFFFFFFF, but MS tools expect all 64 bits to be set.
867 */
e326f078
MA
868 dyndisk_header.data_offset = cpu_to_be64(0xFFFFFFFFFFFFFFFFULL);
869 dyndisk_header.table_offset = cpu_to_be64(3 * 512);
870 dyndisk_header.version = cpu_to_be32(0x00010000);
871 dyndisk_header.block_size = cpu_to_be32(block_size);
872 dyndisk_header.max_table_entries = cpu_to_be32(num_bat_entries);
57c7d9e5 873
3d6101a3
MA
874 dyndisk_header.checksum = cpu_to_be32(
875 vpc_checksum(&dyndisk_header, sizeof(dyndisk_header)));
57c7d9e5 876
9c057d0b 877 /* Write the header */
fef6070e 878 offset = 512;
57c7d9e5 879
3d6101a3 880 ret = blk_pwrite(blk, offset, &dyndisk_header, sizeof(dyndisk_header), 0);
fef6070e 881 if (ret < 0) {
f0ff243a
BS
882 goto fail;
883 }
f0ff243a 884
1a37e312 885 ret = 0;
24da78db
CA
886 fail:
887 return ret;
888}
889
b8f45cdf 890static int create_fixed_disk(BlockBackend *blk, uint8_t *buf,
ed3d2ec9 891 int64_t total_size, Error **errp)
24da78db 892{
fef6070e 893 int ret;
24da78db
CA
894
895 /* Add footer to total size */
fef6070e
JC
896 total_size += HEADER_SIZE;
897
8c6242b6 898 ret = blk_truncate(blk, total_size, false, PREALLOC_MODE_OFF, 0, errp);
fef6070e
JC
899 if (ret < 0) {
900 return ret;
24da78db
CA
901 }
902
8341f00d 903 ret = blk_pwrite(blk, total_size - HEADER_SIZE, buf, HEADER_SIZE, 0);
fef6070e 904 if (ret < 0) {
ed3d2ec9 905 error_setg_errno(errp, -ret, "Unable to write VHD header");
fef6070e
JC
906 return ret;
907 }
24da78db 908
1a37e312 909 return 0;
24da78db
CA
910}
911
1cfeaf38
KW
912static int calculate_rounded_image_size(BlockdevCreateOptionsVpc *vpc_opts,
913 uint16_t *out_cyls,
914 uint8_t *out_heads,
915 uint8_t *out_secs_per_cyl,
916 int64_t *out_total_sectors,
917 Error **errp)
918{
919 int64_t total_size = vpc_opts->size;
920 uint16_t cyls = 0;
921 uint8_t heads = 0;
922 uint8_t secs_per_cyl = 0;
923 int64_t total_sectors;
924 int i;
925
926 /*
927 * Calculate matching total_size and geometry. Increase the number of
928 * sectors requested until we get enough (or fail). This ensures that
929 * qemu-img convert doesn't truncate images, but rather rounds up.
930 *
931 * If the image size can't be represented by a spec conformant CHS geometry,
932 * we set the geometry to 65535 x 16 x 255 (CxHxS) sectors and use
933 * the image size from the VHD footer to calculate total_sectors.
934 */
935 if (vpc_opts->force_size) {
936 /* This will force the use of total_size for sector count, below */
937 cyls = VHD_CHS_MAX_C;
938 heads = VHD_CHS_MAX_H;
939 secs_per_cyl = VHD_CHS_MAX_S;
940 } else {
941 total_sectors = MIN(VHD_MAX_GEOMETRY, total_size / BDRV_SECTOR_SIZE);
942 for (i = 0; total_sectors > (int64_t)cyls * heads * secs_per_cyl; i++) {
943 calculate_geometry(total_sectors + i, &cyls, &heads, &secs_per_cyl);
944 }
945 }
946
947 if ((int64_t)cyls * heads * secs_per_cyl == VHD_MAX_GEOMETRY) {
948 total_sectors = total_size / BDRV_SECTOR_SIZE;
949 /* Allow a maximum disk size of 2040 GiB */
950 if (total_sectors > VHD_MAX_SECTORS) {
951 error_setg(errp, "Disk size is too large, max size is 2040 GiB");
952 return -EFBIG;
953 }
954 } else {
955 total_sectors = (int64_t) cyls * heads * secs_per_cyl;
956 }
957
958 *out_total_sectors = total_sectors;
959 if (out_cyls) {
960 *out_cyls = cyls;
961 *out_heads = heads;
962 *out_secs_per_cyl = secs_per_cyl;
963 }
964
965 return 0;
966}
967
182c8835
KW
968static int coroutine_fn vpc_co_create(BlockdevCreateOptions *opts,
969 Error **errp)
24da78db 970{
182c8835
KW
971 BlockdevCreateOptionsVpc *vpc_opts;
972 BlockBackend *blk = NULL;
973 BlockDriverState *bs = NULL;
974
275734e4 975 VHDFooter footer;
24da78db
CA
976 uint16_t cyls = 0;
977 uint8_t heads = 0;
978 uint8_t secs_per_cyl = 0;
979 int64_t total_sectors;
980 int64_t total_size;
981 int disk_type;
982 int ret = -EIO;
0dbaaa79 983 QemuUUID uuid;
24da78db 984
182c8835
KW
985 assert(opts->driver == BLOCKDEV_DRIVER_VPC);
986 vpc_opts = &opts->u.vpc;
987
988 /* Validate options and set default values */
989 total_size = vpc_opts->size;
990
991 if (!vpc_opts->has_subformat) {
992 vpc_opts->subformat = BLOCKDEV_VPC_SUBFORMAT_DYNAMIC;
993 }
994 switch (vpc_opts->subformat) {
995 case BLOCKDEV_VPC_SUBFORMAT_DYNAMIC:
24da78db 996 disk_type = VHD_DYNAMIC;
182c8835
KW
997 break;
998 case BLOCKDEV_VPC_SUBFORMAT_FIXED:
999 disk_type = VHD_FIXED;
1000 break;
1001 default:
1002 g_assert_not_reached();
24da78db
CA
1003 }
1004
182c8835
KW
1005 /* Create BlockBackend to write to the image */
1006 bs = bdrv_open_blockdev_ref(vpc_opts->file, errp);
1007 if (bs == NULL) {
1008 return -EIO;
24da78db 1009 }
b8f45cdf 1010
a3aeeab5
EB
1011 blk = blk_new_with_bs(bs, BLK_PERM_WRITE | BLK_PERM_RESIZE, BLK_PERM_ALL,
1012 errp);
1013 if (!blk) {
1014 ret = -EPERM;
fef6070e 1015 goto out;
4ab15590 1016 }
b8f45cdf
KW
1017 blk_set_allow_write_beyond_eof(blk, true);
1018
1cfeaf38
KW
1019 /* Get geometry and check that it matches the image size*/
1020 ret = calculate_rounded_image_size(vpc_opts, &cyls, &heads, &secs_per_cyl,
1021 &total_sectors, errp);
1022 if (ret < 0) {
1023 goto out;
690cbb09
PL
1024 }
1025
1cfeaf38
KW
1026 if (total_size != total_sectors * BDRV_SECTOR_SIZE) {
1027 error_setg(errp, "The requested image size cannot be represented in "
1028 "CHS geometry");
1029 error_append_hint(errp, "Try size=%llu or force-size=on (the "
1030 "latter makes the image incompatible with "
1031 "Virtual PC)",
1032 total_sectors * BDRV_SECTOR_SIZE);
1033 ret = -EINVAL;
1034 goto out;
24da78db 1035 }
ecd880d9 1036
24da78db 1037 /* Prepare the Hard Disk Footer */
275734e4 1038 memset(&footer, 0, HEADER_SIZE);
24da78db 1039
275734e4 1040 memcpy(footer.creator, "conectix", 8);
182c8835 1041 if (vpc_opts->force_size) {
275734e4 1042 memcpy(footer.creator_app, "qem2", 4);
fb9245c2 1043 } else {
275734e4 1044 memcpy(footer.creator_app, "qemu", 4);
fb9245c2 1045 }
275734e4 1046 memcpy(footer.creator_os, "Wi2k", 4);
24da78db 1047
275734e4
MA
1048 footer.features = cpu_to_be32(0x02);
1049 footer.version = cpu_to_be32(0x00010000);
24da78db 1050 if (disk_type == VHD_DYNAMIC) {
275734e4 1051 footer.data_offset = cpu_to_be64(HEADER_SIZE);
24da78db 1052 } else {
275734e4 1053 footer.data_offset = cpu_to_be64(0xFFFFFFFFFFFFFFFFULL);
24da78db 1054 }
275734e4 1055 footer.timestamp = cpu_to_be32(time(NULL) - VHD_TIMESTAMP_BASE);
24da78db
CA
1056
1057 /* Version of Virtual PC 2007 */
275734e4
MA
1058 footer.major = cpu_to_be16(0x0005);
1059 footer.minor = cpu_to_be16(0x0003);
1060 footer.orig_size = cpu_to_be64(total_size);
1061 footer.current_size = cpu_to_be64(total_size);
1062 footer.cyls = cpu_to_be16(cyls);
1063 footer.heads = heads;
1064 footer.secs_per_cyl = secs_per_cyl;
24da78db 1065
275734e4 1066 footer.type = cpu_to_be32(disk_type);
24da78db 1067
0dbaaa79 1068 qemu_uuid_generate(&uuid);
275734e4 1069 footer.uuid = uuid;
24da78db 1070
275734e4 1071 footer.checksum = cpu_to_be32(vpc_checksum(&footer, HEADER_SIZE));
24da78db
CA
1072
1073 if (disk_type == VHD_DYNAMIC) {
275734e4 1074 ret = create_dynamic_disk(blk, (uint8_t *)&footer, total_sectors);
ed3d2ec9
HR
1075 if (ret < 0) {
1076 error_setg(errp, "Unable to create or write VHD header");
1077 }
24da78db 1078 } else {
275734e4 1079 ret = create_fixed_disk(blk, (uint8_t *)&footer, total_size, errp);
0211b9be 1080 }
24da78db 1081
fec9921f 1082out:
b8f45cdf 1083 blk_unref(blk);
182c8835
KW
1084 bdrv_unref(bs);
1085 return ret;
1086}
1087
b92902df
ML
1088static int coroutine_fn vpc_co_create_opts(BlockDriver *drv,
1089 const char *filename,
1090 QemuOpts *opts,
1091 Error **errp)
182c8835
KW
1092{
1093 BlockdevCreateOptions *create_options = NULL;
92adf9db 1094 QDict *qdict;
182c8835
KW
1095 Visitor *v;
1096 BlockDriverState *bs = NULL;
182c8835
KW
1097 int ret;
1098
1099 static const QDictRenames opt_renames[] = {
1100 { VPC_OPT_FORCE_SIZE, "force-size" },
1101 { NULL, NULL },
1102 };
1103
1104 /* Parse options and convert legacy syntax */
1105 qdict = qemu_opts_to_qdict_filtered(opts, NULL, &vpc_create_opts, true);
1106
1107 if (!qdict_rename_keys(qdict, opt_renames, errp)) {
1108 ret = -EINVAL;
1109 goto fail;
1110 }
1111
1112 /* Create and open the file (protocol layer) */
668f62ec 1113 ret = bdrv_create_file(filename, opts, errp);
182c8835 1114 if (ret < 0) {
182c8835
KW
1115 goto fail;
1116 }
1117
1118 bs = bdrv_open(filename, NULL, NULL,
1119 BDRV_O_RDWR | BDRV_O_RESIZE | BDRV_O_PROTOCOL, errp);
1120 if (bs == NULL) {
1121 ret = -EIO;
1122 goto fail;
1123 }
1124
1125 /* Now get the QAPI type BlockdevCreateOptions */
1126 qdict_put_str(qdict, "driver", "vpc");
1127 qdict_put_str(qdict, "file", bs->node_name);
1128
af91062e
MA
1129 v = qobject_input_visitor_new_flat_confused(qdict, errp);
1130 if (!v) {
182c8835
KW
1131 ret = -EINVAL;
1132 goto fail;
1133 }
1134
b11a093c 1135 visit_type_BlockdevCreateOptions(v, NULL, &create_options, errp);
182c8835 1136 visit_free(v);
b11a093c 1137 if (!create_options) {
182c8835
KW
1138 ret = -EINVAL;
1139 goto fail;
1140 }
1141
1142 /* Silently round up size */
1143 assert(create_options->driver == BLOCKDEV_DRIVER_VPC);
1144 create_options->u.vpc.size =
1145 ROUND_UP(create_options->u.vpc.size, BDRV_SECTOR_SIZE);
1146
1cfeaf38
KW
1147 if (!create_options->u.vpc.force_size) {
1148 int64_t total_sectors;
1149 ret = calculate_rounded_image_size(&create_options->u.vpc, NULL, NULL,
1150 NULL, &total_sectors, errp);
1151 if (ret < 0) {
1152 goto fail;
1153 }
1154
1155 create_options->u.vpc.size = total_sectors * BDRV_SECTOR_SIZE;
1156 }
1157
1158
182c8835
KW
1159 /* Create the vpc image (format layer) */
1160 ret = vpc_co_create(create_options, errp);
1161
1162fail:
cb3e7f08 1163 qobject_unref(qdict);
182c8835
KW
1164 bdrv_unref(bs);
1165 qapi_free_BlockdevCreateOptions(create_options);
f0ff243a 1166 return ret;
57c7d9e5
AL
1167}
1168
182c8835 1169
72c6cc94
KW
1170static int vpc_has_zero_init(BlockDriverState *bs)
1171{
1172 BDRVVPCState *s = bs->opaque;
72c6cc94 1173
275734e4 1174 if (be32_to_cpu(s->footer.type) == VHD_FIXED) {
9a4f4c31 1175 return bdrv_has_zero_init(bs->file->bs);
72c6cc94
KW
1176 } else {
1177 return 1;
1178 }
1179}
1180
6a0f9e82
FB
1181static void vpc_close(BlockDriverState *bs)
1182{
1183 BDRVVPCState *s = bs->opaque;
97f1c45c 1184 qemu_vfree(s->pagetable);
6a0f9e82 1185#ifdef CACHE
7267c094 1186 g_free(s->pageentry_u8);
6a0f9e82 1187#endif
612ff3d8
KW
1188
1189 migrate_del_blocker(s->migration_blocker);
1190 error_free(s->migration_blocker);
6a0f9e82
FB
1191}
1192
fec9921f
CL
1193static QemuOptsList vpc_create_opts = {
1194 .name = "vpc-create-opts",
1195 .head = QTAILQ_HEAD_INITIALIZER(vpc_create_opts.head),
1196 .desc = {
1197 {
1198 .name = BLOCK_OPT_SIZE,
1199 .type = QEMU_OPT_SIZE,
1200 .help = "Virtual disk size"
1201 },
1202 {
1203 .name = BLOCK_OPT_SUBFMT,
1204 .type = QEMU_OPT_STRING,
1205 .help =
1206 "Type of virtual hard disk format. Supported formats are "
1207 "{dynamic (default) | fixed} "
1208 },
fb9245c2
JC
1209 {
1210 .name = VPC_OPT_FORCE_SIZE,
1211 .type = QEMU_OPT_BOOL,
1212 .help = "Force disk size calculation to use the actual size "
1213 "specified, rather than using the nearest CHS-based "
1214 "calculation"
1215 },
fec9921f
CL
1216 { /* end of list */ }
1217 }
0e7e1989
KW
1218};
1219
2654267c
HR
1220static const char *const vpc_strong_runtime_opts[] = {
1221 VPC_OPT_SIZE_CALC,
1222
1223 NULL
1224};
1225
5efa9d5a 1226static BlockDriver bdrv_vpc = {
4a411185
KW
1227 .format_name = "vpc",
1228 .instance_size = sizeof(BDRVVPCState),
c68b89ac 1229
72c6cc94
KW
1230 .bdrv_probe = vpc_probe,
1231 .bdrv_open = vpc_open,
1232 .bdrv_close = vpc_close,
1233 .bdrv_reopen_prepare = vpc_reopen_prepare,
69dca43d 1234 .bdrv_child_perm = bdrv_default_perms,
182c8835 1235 .bdrv_co_create = vpc_co_create,
efc75e2a 1236 .bdrv_co_create_opts = vpc_co_create_opts,
0e7e1989 1237
d46b7cc6 1238 .bdrv_co_preadv = vpc_co_preadv,
513b0f02 1239 .bdrv_co_pwritev = vpc_co_pwritev,
2f83673b 1240 .bdrv_co_block_status = vpc_co_block_status,
c68b89ac 1241
97b00e28
PB
1242 .bdrv_get_info = vpc_get_info,
1243
d67066d8 1244 .is_format = true,
fec9921f 1245 .create_opts = &vpc_create_opts,
72c6cc94 1246 .bdrv_has_zero_init = vpc_has_zero_init,
2654267c 1247 .strong_runtime_opts = vpc_strong_runtime_opts,
6a0f9e82 1248};
5efa9d5a
AL
1249
1250static void bdrv_vpc_init(void)
1251{
1252 bdrv_register(&bdrv_vpc);
1253}
1254
1255block_init(bdrv_vpc_init);